Token | . |
Token ID | 13 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Run | +0.046 |
sorts | +0.046 |
ites | +0.046 |
ang | +0.046 |
atch | +0.046 |
Neg logit contributions | |
sob | -0.028 |
Nib | -0.028 |
dentist | -0.027 |
babys | -0.026 |
ache | -0.026 |
Token | He |
Token ID | 679 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
ites | +0.029 |
ang | +0.029 |
cer | +0.029 |
Run | +0.029 |
mer | +0.029 |
Neg logit contributions | |
Her | -0.014 |
dentist | -0.013 |
Nib | -0.012 |
sob | -0.012 |
doctor | -0.012 |
Token | was |
Token ID | 373 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
ites | +0.047 |
Run | +0.046 |
akes | +0.046 |
atch | +0.046 |
about | +0.046 |
Neg logit contributions | |
sob | -0.053 |
Nib | -0.051 |
dentist | -0.050 |
Her | -0.049 |
throat | -0.049 |
Token | the |
Token ID | 262 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
sob | +0.018 |
dentist | +0.017 |
ache | +0.017 |
grandmother | +0.017 |
forgiveness | +0.017 |
Neg logit contributions | |
sorts | -0.023 |
ang | -0.023 |
ab | -0.021 |
atch | -0.020 |
blows | -0.020 |
Token | most |
Token ID | 749 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
OK | +0.037 |
ang | +0.036 |
sorts | +0.036 |
atch | +0.036 |
Wow | +0.036 |
Neg logit contributions | |
sob | -0.043 |
Nib | -0.039 |
Her | -0.039 |
babys | -0.039 |
ache | -0.039 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
Mine | +0.065 |
Run | +0.065 |
Wow | +0.064 |
atch | +0.064 |
akes | +0.063 |
Neg logit contributions | |
ache | -0.037 |
doctor | -0.037 |
Nib | -0.037 |
sob | -0.036 |
dentist | -0.036 |
Token | cy |
Token ID | 948 |
Feature activation | +3.29e+00 |
Pos logit contributions | |
Run | +0.105 |
Pull | +0.105 |
Quick | +0.098 |
AW | +0.096 |
Uh | +0.092 |
Neg logit contributions | |
anywhere | -0.319 |
Nib | -0.313 |
tooth | -0.308 |
stomach | -0.305 |
doctor | -0.305 |
Token | , |
Token ID | 11 |
Feature activation | -8.11e-02 |
Pos logit contributions | |
ites | +0.076 |
akes | +0.076 |
ised | +0.074 |
atch | +0.074 |
Run | +0.073 |
Neg logit contributions | |
anywhere | -0.057 |
doctor | -0.054 |
tooth | -0.053 |
sob | -0.053 |
maid | -0.053 |
Token | happiest |
Token ID | 49414 |
Feature activation | +4.15e+00 |
Pos logit contributions | |
sob | +0.001 |
Nib | +0.001 |
anywhere | +0.001 |
dentist | +0.001 |
doctor | +0.001 |
Neg logit contributions | |
ites | -0.002 |
Run | -0.002 |
akes | -0.002 |
atch | -0.002 |
about | -0.002 |
Token | inch |
Token ID | 11111 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
atch | +0.099 |
akes | +0.099 |
acked | +0.099 |
ites | +0.098 |
Mine | +0.096 |
Neg logit contributions | |
doctor | -0.075 |
tooth | -0.070 |
Nib | -0.069 |
throat | -0.067 |
maid | -0.066 |
Token | worm |
Token ID | 25323 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
Run | +0.082 |
Wow | +0.082 |
Uh | +0.080 |
akes | +0.079 |
atch | +0.079 |
Neg logit contributions | |
Nib | -0.046 |
anywhere | -0.046 |
sob | -0.045 |
dentist | -0.044 |
doctor | -0.044 |
Token | It |
Token ID | 632 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
sob | +0.011 |
Nib | +0.011 |
dentist | +0.011 |
ache | +0.011 |
babys | +0.011 |
Neg logit contributions | |
Run | -0.016 |
sorts | -0.016 |
Wow | -0.016 |
ites | -0.016 |
OK | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ites | +0.037 |
akes | +0.037 |
atch | +0.036 |
Wow | +0.036 |
Run | +0.035 |
Neg logit contributions | |
sob | -0.026 |
Nib | -0.023 |
Her | -0.023 |
dentist | -0.022 |
anywhere | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
sob | +0.002 |
Nib | +0.002 |
dentist | +0.002 |
ache | +0.002 |
ppa | +0.002 |
Neg logit contributions | |
sorts | -0.003 |
Run | -0.003 |
Wow | -0.003 |
atch | -0.003 |
about | -0.003 |
Token | big |
Token ID | 1263 |
Feature activation | +5.85e+00 |
Pos logit contributions | |
ites | +0.034 |
akes | +0.034 |
atch | +0.033 |
acked | +0.033 |
Run | +0.033 |
Neg logit contributions | |
sob | -0.030 |
dentist | -0.029 |
doctor | -0.029 |
babys | -0.029 |
Nib | -0.029 |
Token | , |
Token ID | 11 |
Feature activation | +8.56e-01 |
Pos logit contributions | |
ites | +0.167 |
akes | +0.166 |
acked | +0.164 |
Quick | +0.155 |
ang | +0.155 |
Neg logit contributions | |
doctor | -0.079 |
throat | -0.076 |
dentist | -0.075 |
sob | -0.075 |
stomach | -0.075 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
akes | +0.019 |
ites | +0.019 |
atch | +0.018 |
ang | +0.018 |
cer | +0.018 |
Neg logit contributions | |
sob | -0.017 |
Nib | -0.015 |
dentist | -0.015 |
anywhere | -0.015 |
doctor | -0.015 |
Token | cy |
Token ID | 948 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
Pull | +0.135 |
Run | +0.126 |
blows | +0.123 |
Quick | +0.122 |
AW | +0.121 |
Neg logit contributions | |
anywhere | -0.263 |
costume | -0.259 |
tooth | -0.251 |
Nib | -0.247 |
mask | -0.246 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
ites | +0.002 |
akes | +0.002 |
Uh | +0.002 |
OK | +0.002 |
sorts | +0.002 |
Neg logit contributions | |
sob | -0.002 |
anywhere | -0.002 |
stomach | -0.002 |
throat | -0.002 |
crown | -0.002 |
Token | ! |
Token ID | 0 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
Wow | +0.042 |
OK | +0.042 |
Uh | +0.042 |
Quick | +0.041 |
akes | +0.041 |
Neg logit contributions | |
sob | -0.019 |
anywhere | -0.019 |
Nib | -0.018 |
doctor | -0.018 |
Her | -0.018 |
Token | When |
Token ID | 1649 |
Feature activation | +8.77e-01 |
Pos logit contributions | |
sob | +0.003 |
Nib | +0.003 |
dentist | +0.003 |
Her | +0.003 |
babys | +0.003 |
Neg logit contributions | |
Run | -0.005 |
sorts | -0.005 |
atch | -0.005 |
ites | -0.005 |
cer | -0.005 |
Token | she |
Token ID | 673 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
Run | +0.024 |
Wow | +0.023 |
sorts | +0.023 |
OK | +0.023 |
ites | +0.023 |
Neg logit contributions | |
sob | -0.011 |
Nib | -0.011 |
ache | -0.011 |
dentist | -0.011 |
babys | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
sorts | +0.021 |
Run | +0.021 |
ites | +0.021 |
OK | +0.021 |
atch | +0.021 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.015 |
dentist | -0.015 |
babys | -0.015 |
ache | -0.015 |
Token | It |
Token ID | 632 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
Run | +0.020 |
ites | +0.019 |
atch | +0.019 |
ang | +0.019 |
cer | +0.019 |
Neg logit contributions | |
Her | -0.012 |
Nib | -0.012 |
dentist | -0.012 |
sob | -0.012 |
doctor | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
ites | +0.047 |
Run | +0.047 |
akes | +0.047 |
atch | +0.046 |
ang | +0.046 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.028 |
dentist | -0.028 |
doctor | -0.027 |
Her | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
sob | +0.005 |
ache | +0.005 |
ppa | +0.005 |
babys | +0.005 |
maid | +0.004 |
Neg logit contributions | |
sorts | -0.007 |
Wow | -0.006 |
cer | -0.006 |
cy | -0.006 |
atch | -0.006 |
Token | big |
Token ID | 1263 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
Run | +0.032 |
sorts | +0.031 |
ites | +0.031 |
Wow | +0.031 |
OK | +0.031 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
dentist | -0.026 |
babys | -0.025 |
throat | -0.025 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
ites | +0.155 |
ang | +0.150 |
akes | +0.150 |
Run | +0.149 |
acked | +0.146 |
Neg logit contributions | |
dentist | -0.078 |
grandmother | -0.075 |
doctor | -0.074 |
sob | -0.074 |
throat | -0.073 |
Token | cy |
Token ID | 948 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
Run | +0.110 |
Pull | +0.106 |
blows | +0.096 |
Quick | +0.096 |
AW | +0.093 |
Neg logit contributions | |
tooth | -0.303 |
anywhere | -0.302 |
Nib | -0.299 |
costume | -0.298 |
doctor | -0.298 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
ites | +0.014 |
ang | +0.014 |
Run | +0.014 |
atch | +0.014 |
akes | +0.013 |
Neg logit contributions | |
sob | -0.009 |
anywhere | -0.009 |
babys | -0.009 |
grandmother | -0.009 |
throat | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
Run | +0.044 |
Wow | +0.044 |
OK | +0.044 |
ites | +0.043 |
Quick | +0.043 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.030 |
anywhere | -0.029 |
dentist | -0.029 |
doctor | -0.029 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e-02 |
Pos logit contributions | |
Run | +0.011 |
atch | +0.011 |
ites | +0.011 |
ang | +0.011 |
cer | +0.011 |
Neg logit contributions | |
Her | -0.007 |
Nib | -0.007 |
dentist | -0.007 |
sob | -0.007 |
doctor | -0.006 |
Token | 3 |
Token ID | 513 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
ites | +0.001 |
akes | +0.001 |
Run | +0.001 |
atch | +0.001 |
sorts | +0.001 |
Neg logit contributions | |
sob | -0.001 |
dentist | -0.001 |
Nib | -0.001 |
doctor | -0.001 |
babys | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
sorts | +0.021 |
Run | +0.021 |
ites | +0.021 |
OK | +0.021 |
atch | +0.021 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.015 |
dentist | -0.015 |
babys | -0.015 |
ache | -0.015 |
Token | It |
Token ID | 632 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
Run | +0.020 |
ites | +0.019 |
atch | +0.019 |
ang | +0.019 |
cer | +0.019 |
Neg logit contributions | |
Her | -0.012 |
Nib | -0.012 |
dentist | -0.012 |
sob | -0.012 |
doctor | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
ites | +0.047 |
Run | +0.047 |
akes | +0.047 |
atch | +0.046 |
ang | +0.046 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.028 |
dentist | -0.028 |
doctor | -0.027 |
Her | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
sob | +0.005 |
ache | +0.005 |
ppa | +0.005 |
babys | +0.005 |
maid | +0.004 |
Neg logit contributions | |
sorts | -0.007 |
Wow | -0.006 |
cer | -0.006 |
cy | -0.006 |
atch | -0.006 |
Token | big |
Token ID | 1263 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
Run | +0.032 |
sorts | +0.031 |
ites | +0.031 |
Wow | +0.031 |
OK | +0.031 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
dentist | -0.026 |
babys | -0.025 |
throat | -0.025 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
ites | +0.155 |
ang | +0.150 |
akes | +0.150 |
Run | +0.149 |
acked | +0.146 |
Neg logit contributions | |
dentist | -0.078 |
grandmother | -0.075 |
doctor | -0.074 |
sob | -0.074 |
throat | -0.073 |
Token | cy |
Token ID | 948 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
Run | +0.110 |
Pull | +0.106 |
blows | +0.096 |
Quick | +0.096 |
AW | +0.093 |
Neg logit contributions | |
tooth | -0.303 |
anywhere | -0.302 |
Nib | -0.299 |
costume | -0.298 |
doctor | -0.298 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
ites | +0.014 |
ang | +0.014 |
Run | +0.014 |
atch | +0.014 |
akes | +0.013 |
Neg logit contributions | |
sob | -0.009 |
anywhere | -0.009 |
babys | -0.009 |
grandmother | -0.009 |
throat | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
Run | +0.044 |
Wow | +0.044 |
OK | +0.044 |
ites | +0.043 |
Quick | +0.043 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.030 |
anywhere | -0.029 |
dentist | -0.029 |
doctor | -0.029 |
Token | The |
Token ID | 383 |
Feature activation | +5.40e-02 |
Pos logit contributions | |
Run | +0.011 |
atch | +0.011 |
ites | +0.011 |
ang | +0.011 |
cer | +0.011 |
Neg logit contributions | |
Her | -0.007 |
Nib | -0.007 |
dentist | -0.007 |
sob | -0.007 |
doctor | -0.006 |
Token | 3 |
Token ID | 513 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
ites | +0.001 |
akes | +0.001 |
Run | +0.001 |
atch | +0.001 |
sorts | +0.001 |
Neg logit contributions | |
sob | -0.001 |
dentist | -0.001 |
Nib | -0.001 |
doctor | -0.001 |
babys | -0.001 |
Token | then |
Token ID | 788 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Run | +0.007 |
Wow | +0.007 |
cer | +0.007 |
OK | +0.007 |
cy | +0.006 |
Neg logit contributions | |
ache | -0.008 |
dentist | -0.008 |
sob | -0.008 |
babys | -0.008 |
anywhere | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
Run | +0.030 |
Wow | +0.029 |
OK | +0.028 |
cer | +0.028 |
cy | +0.027 |
Neg logit contributions | |
sob | -0.023 |
ache | -0.023 |
dentist | -0.023 |
babys | -0.023 |
ppa | -0.023 |
Token | a |
Token ID | 257 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
sob | +0.000 |
ache | +0.000 |
dentist | +0.000 |
ppa | +0.000 |
babys | +0.000 |
Neg logit contributions | |
Run | -0.000 |
Wow | -0.000 |
cer | -0.000 |
OK | -0.000 |
cy | -0.000 |
Token | big |
Token ID | 1263 |
Feature activation | +5.70e+00 |
Pos logit contributions | |
Run | +0.037 |
OK | +0.036 |
Wow | +0.036 |
sorts | +0.036 |
about | +0.035 |
Neg logit contributions | |
sob | -0.037 |
Nib | -0.036 |
Her | -0.035 |
dentist | -0.035 |
anywhere | -0.035 |
Token | , |
Token ID | 11 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
akes | +0.125 |
ites | +0.124 |
atch | +0.118 |
Wow | +0.118 |
sorts | +0.118 |
Neg logit contributions | |
sob | -0.111 |
doctor | -0.107 |
Nib | -0.107 |
dentist | -0.107 |
throat | -0.105 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
akes | +0.042 |
ites | +0.040 |
acked | +0.039 |
iling | +0.039 |
atch | +0.039 |
Neg logit contributions | |
sob | -0.024 |
sorry | -0.023 |
crying | -0.022 |
dentist | -0.022 |
doctor | -0.022 |
Token | cy |
Token ID | 948 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Pull | +0.101 |
AW | +0.098 |
sizes | +0.096 |
Run | +0.093 |
OK | +0.092 |
Neg logit contributions | |
Nib | -0.288 |
doctor | -0.288 |
anywhere | -0.286 |
stomach | -0.285 |
costume | -0.285 |
Token | ball |
Token ID | 2613 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
Wow | +0.022 |
akes | +0.022 |
ites | +0.021 |
ised | +0.021 |
OK | +0.021 |
Neg logit contributions | |
sob | -0.021 |
stomach | -0.020 |
throat | -0.020 |
doctor | -0.020 |
anywhere | -0.020 |
Token | floated |
Token ID | 29742 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
akes | +0.066 |
ised | +0.065 |
Wow | +0.065 |
sorts | +0.064 |
OK | +0.064 |
Neg logit contributions | |
sob | -0.040 |
anywhere | -0.040 |
doctor | -0.039 |
crying | -0.038 |
Nib | -0.038 |
Token | by |
Token ID | 416 |
Feature activation | -5.50e-01 |
Pos logit contributions | |
akes | +0.065 |
sorts | +0.064 |
iling | +0.063 |
ites | +0.063 |
ang | +0.063 |
Neg logit contributions | |
anywhere | -0.042 |
sob | -0.040 |
Nib | -0.039 |
back | -0.036 |
not | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
sob | +0.009 |
Nib | +0.009 |
anywhere | +0.008 |
dentist | +0.008 |
throat | +0.008 |
Neg logit contributions | |
ites | -0.013 |
akes | -0.013 |
Run | -0.013 |
Wow | -0.013 |
OK | -0.013 |
Token | It |
Token ID | 1026 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
akes | +0.011 |
cer | +0.011 |
sorts | +0.011 |
cy | +0.011 |
mer | +0.010 |
Neg logit contributions | |
Her | -0.008 |
Her | -0.008 |
sob | -0.007 |
not | -0.007 |
doctor | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
ites | +0.060 |
akes | +0.059 |
ang | +0.058 |
atch | +0.057 |
Run | +0.056 |
Neg logit contributions | |
sob | -0.032 |
Nib | -0.029 |
dentist | -0.028 |
doctor | -0.028 |
ache | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
sob | +0.007 |
ache | +0.007 |
ppa | +0.006 |
maid | +0.006 |
throat | +0.006 |
Neg logit contributions | |
sorts | -0.009 |
Wow | -0.009 |
Mine | -0.008 |
Run | -0.008 |
about | -0.008 |
Token | big |
Token ID | 1263 |
Feature activation | +5.54e+00 |
Pos logit contributions | |
Run | +0.030 |
sorts | +0.030 |
ites | +0.030 |
Wow | +0.030 |
atch | +0.029 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
dentist | -0.026 |
babys | -0.025 |
throat | -0.025 |
Token | , |
Token ID | 11 |
Feature activation | +9.88e-01 |
Pos logit contributions | |
ites | +0.145 |
akes | +0.142 |
acked | +0.141 |
ang | +0.141 |
Run | +0.140 |
Neg logit contributions | |
doctor | -0.087 |
dentist | -0.087 |
babys | -0.087 |
sob | -0.084 |
throat | -0.084 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
akes | +0.020 |
ites | +0.020 |
atch | +0.019 |
ang | +0.019 |
Run | +0.019 |
Neg logit contributions | |
sob | -0.020 |
Nib | -0.019 |
dentist | -0.019 |
babys | -0.019 |
doctor | -0.019 |
Token | cy |
Token ID | 948 |
Feature activation | +5.23e-01 |
Pos logit contributions | |
Pull | +0.124 |
Run | +0.123 |
AW | +0.115 |
Quick | +0.112 |
Further | +0.110 |
Neg logit contributions | |
anywhere | -0.275 |
doctor | -0.274 |
costume | -0.273 |
babys | -0.270 |
tooth | -0.270 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
ites | +0.011 |
Run | +0.011 |
Wow | +0.011 |
akes | +0.011 |
sorts | +0.011 |
Neg logit contributions | |
sob | -0.010 |
doctor | -0.010 |
anywhere | -0.010 |
babys | -0.010 |
throat | -0.010 |
Token | ! |
Token ID | 0 |
Feature activation | +6.72e-01 |
Pos logit contributions | |
Wow | +0.054 |
OK | +0.054 |
Quick | +0.053 |
Uh | +0.053 |
Run | +0.053 |
Neg logit contributions | |
anywhere | -0.023 |
doctor | -0.023 |
sob | -0.022 |
Nib | -0.022 |
dentist | -0.021 |
Token | The |
Token ID | 383 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
atch | +0.014 |
cer | +0.014 |
Run | +0.014 |
ites | +0.014 |
sorts | +0.014 |
Neg logit contributions | |
Her | -0.014 |
Nib | -0.013 |
sob | -0.013 |
babys | -0.013 |
throat | -0.012 |
Token | kid |
Token ID | 5141 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
sob | +0.003 |
babys | +0.003 |
dentist | +0.003 |
doctor | +0.003 |
Nib | +0.003 |
Neg logit contributions | |
akes | -0.005 |
ites | -0.005 |
sorts | -0.005 |
Run | -0.005 |
atch | -0.005 |
Token | she |
Token ID | 673 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
Run | +0.019 |
Wow | +0.019 |
OK | +0.018 |
cy | +0.018 |
sorts | +0.018 |
Neg logit contributions | |
ache | -0.011 |
ppa | -0.010 |
throat | -0.010 |
sob | -0.010 |
urger | -0.010 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
sorts | +0.017 |
cy | +0.017 |
cer | +0.017 |
Run | +0.017 |
ang | +0.016 |
Neg logit contributions | |
Nib | -0.029 |
ache | -0.029 |
babys | -0.029 |
dentist | -0.028 |
sob | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
ache | +0.035 |
ppa | +0.034 |
throat | +0.034 |
urger | +0.033 |
gag | +0.032 |
Neg logit contributions | |
sorts | -0.032 |
Wow | -0.030 |
ised | -0.028 |
Run | -0.028 |
kinds | -0.028 |
Token | big |
Token ID | 1263 |
Feature activation | +5.21e+00 |
Pos logit contributions | |
ites | +0.020 |
atch | +0.020 |
akes | +0.020 |
Run | +0.020 |
sorts | +0.020 |
Neg logit contributions | |
sob | -0.019 |
dentist | -0.018 |
Nib | -0.018 |
babys | -0.018 |
doctor | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | +9.65e-01 |
Pos logit contributions | |
akes | +0.146 |
ites | +0.145 |
acked | +0.138 |
OK | +0.137 |
atch | +0.136 |
Neg logit contributions | |
doctor | -0.075 |
dentist | -0.074 |
sob | -0.074 |
tooth | -0.072 |
crying | -0.071 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
akes | +0.021 |
ites | +0.021 |
atch | +0.020 |
ang | +0.020 |
cer | +0.020 |
Neg logit contributions | |
sob | -0.019 |
dentist | -0.018 |
Nib | -0.018 |
babys | -0.017 |
doctor | -0.017 |
Token | cy |
Token ID | 948 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
Pull | +0.114 |
Run | +0.109 |
Quick | +0.099 |
OK | +0.098 |
AW | +0.097 |
Neg logit contributions | |
anywhere | -0.291 |
costume | -0.288 |
tooth | -0.285 |
mask | -0.282 |
doctor | -0.280 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
ites | +0.007 |
akes | +0.007 |
sorts | +0.006 |
OK | +0.006 |
atch | +0.006 |
Neg logit contributions | |
sob | -0.007 |
tooth | -0.007 |
anywhere | -0.007 |
crown | -0.006 |
mask | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | -2.87e-01 |
Pos logit contributions | |
OK | +0.055 |
akes | +0.055 |
ised | +0.055 |
Quick | +0.054 |
Wow | +0.054 |
Neg logit contributions | |
anywhere | -0.022 |
sob | -0.022 |
crying | -0.021 |
doctor | -0.020 |
Nib | -0.019 |
Token | Lily |
Token ID | 20037 |
Feature activation | +6.69e-01 |
Pos logit contributions | |
sob | +0.005 |
ache | +0.005 |
dentist | +0.005 |
anywhere | +0.005 |
ppa | +0.005 |
Neg logit contributions | |
Wow | -0.007 |
sorts | -0.006 |
Run | -0.006 |
OK | -0.006 |
about | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
akes | +0.016 |
Run | +0.016 |
ites | +0.016 |
sorts | +0.016 |
Wow | +0.016 |
Neg logit contributions | |
sob | -0.012 |
Her | -0.011 |
Nib | -0.010 |
babys | -0.010 |
throat | -0.010 |
Token | room |
Token ID | 2119 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
sob | +0.064 |
ache | +0.063 |
Nib | +0.062 |
gag | +0.060 |
hesitation | +0.060 |
Neg logit contributions | |
cy | -0.043 |
sorts | -0.043 |
cer | -0.043 |
ang | -0.042 |
ites | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
sob | +0.022 |
dentist | +0.020 |
Nib | +0.020 |
babys | +0.020 |
throat | +0.019 |
Neg logit contributions | |
Run | -0.045 |
ites | -0.045 |
Wow | -0.045 |
sorts | -0.044 |
OK | -0.044 |
Token | It |
Token ID | 632 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
ache | +0.020 |
ppa | +0.019 |
dentist | +0.019 |
sob | +0.019 |
anywhere | +0.019 |
Neg logit contributions | |
Wow | -0.014 |
Mine | -0.013 |
about | -0.013 |
sorts | -0.012 |
OK | -0.012 |
Token | was |
Token ID | 373 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
Wow | +0.020 |
sorts | +0.019 |
cy | +0.019 |
Run | +0.018 |
cer | +0.018 |
Neg logit contributions | |
dentist | -0.029 |
ache | -0.029 |
ppa | -0.029 |
hesitation | -0.028 |
throat | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
ache | +0.007 |
ppa | +0.007 |
ridge | +0.006 |
Him | +0.006 |
maid | +0.006 |
Neg logit contributions | |
sorts | -0.005 |
Wow | -0.005 |
pitch | -0.004 |
Mine | -0.004 |
than | -0.004 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Run | +0.029 |
Wow | +0.029 |
sorts | +0.029 |
OK | +0.029 |
atch | +0.029 |
Neg logit contributions | |
sob | -0.031 |
Nib | -0.030 |
dentist | -0.030 |
Her | -0.029 |
ache | -0.029 |
Token | cy |
Token ID | 948 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
Run | +0.105 |
Pull | +0.098 |
Quick | +0.092 |
pitches | +0.083 |
OK | +0.083 |
Neg logit contributions | |
anywhere | -0.310 |
tooth | -0.302 |
Nib | -0.299 |
doctor | -0.295 |
costume | -0.295 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
ites | +0.009 |
sorts | +0.009 |
Run | +0.009 |
ang | +0.009 |
OK | +0.009 |
Neg logit contributions | |
anywhere | -0.008 |
sob | -0.008 |
doctor | -0.007 |
babys | -0.007 |
tooth | -0.007 |
Token | with |
Token ID | 351 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
OK | +0.046 |
Quick | +0.046 |
Wow | +0.046 |
Run | +0.045 |
ites | +0.045 |
Neg logit contributions | |
sob | -0.020 |
anywhere | -0.020 |
Nib | -0.019 |
doctor | -0.019 |
crying | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | -8.23e-02 |
Pos logit contributions | |
sob | +0.007 |
Nib | +0.006 |
Her | +0.006 |
dentist | +0.006 |
anywhere | +0.006 |
Neg logit contributions | |
Run | -0.010 |
ites | -0.010 |
OK | -0.010 |
akes | -0.010 |
ang | -0.010 |
Token | fun |
Token ID | 1257 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
sob | +0.002 |
doctor | +0.002 |
Nib | +0.002 |
babys | +0.002 |
anywhere | +0.002 |
Neg logit contributions | |
ites | -0.002 |
sorts | -0.002 |
akes | -0.002 |
atch | -0.002 |
Run | -0.002 |
Token | there |
Token ID | 612 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
sob | +0.021 |
Nib | +0.020 |
anywhere | +0.019 |
Her | +0.019 |
dentist | +0.019 |
Neg logit contributions | |
ites | -0.031 |
sorts | -0.031 |
atch | -0.031 |
about | -0.031 |
akes | -0.031 |
Token | was |
Token ID | 373 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
Run | +0.022 |
sorts | +0.022 |
ites | +0.022 |
Wow | +0.022 |
atch | +0.022 |
Neg logit contributions | |
sob | -0.019 |
Nib | -0.019 |
dentist | -0.018 |
babys | -0.018 |
throat | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
sob | +0.022 |
Nib | +0.021 |
ache | +0.021 |
dentist | +0.021 |
babys | +0.020 |
Neg logit contributions | |
Wow | -0.041 |
sorts | -0.041 |
Run | -0.041 |
about | -0.040 |
ites | -0.040 |
Token | big |
Token ID | 1263 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
ites | +0.027 |
sorts | +0.027 |
akes | +0.027 |
atch | +0.027 |
Run | +0.027 |
Neg logit contributions | |
sob | -0.023 |
dentist | -0.023 |
Nib | -0.023 |
doctor | -0.022 |
babys | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | +8.20e-01 |
Pos logit contributions | |
acked | +0.137 |
Run | +0.136 |
ites | +0.135 |
akes | +0.134 |
Wow | +0.134 |
Neg logit contributions | |
dentist | -0.095 |
doctor | -0.094 |
stomach | -0.087 |
mom | -0.087 |
babys | -0.086 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
akes | +0.023 |
ites | +0.023 |
atch | +0.022 |
cer | +0.022 |
Mine | +0.021 |
Neg logit contributions | |
sob | -0.013 |
sorry | -0.013 |
dentist | -0.012 |
doctor | -0.012 |
crying | -0.012 |
Token | cy |
Token ID | 948 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
Run | +0.097 |
Pull | +0.097 |
Quick | +0.081 |
AW | +0.080 |
OK | +0.079 |
Neg logit contributions | |
doctor | -0.310 |
anywhere | -0.306 |
stomach | -0.305 |
Nib | -0.304 |
babys | -0.304 |
Token | ball |
Token ID | 2613 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
sorts | +0.025 |
akes | +0.024 |
ised | +0.024 |
Run | +0.024 |
Uh | +0.024 |
Neg logit contributions | |
doctor | -0.021 |
mom | -0.020 |
sob | -0.020 |
babys | -0.020 |
maid | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
Run | +0.063 |
Wow | +0.063 |
OK | +0.063 |
ites | +0.063 |
akes | +0.062 |
Neg logit contributions | |
sob | -0.024 |
Her | -0.023 |
doctor | -0.023 |
Nib | -0.022 |
dentist | -0.022 |
Token | It |
Token ID | 632 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
cer | +0.021 |
ang | +0.021 |
ites | +0.020 |
Run | +0.020 |
atch | +0.020 |
Neg logit contributions | |
Her | -0.011 |
Nib | -0.010 |
sob | -0.010 |
dentist | -0.010 |
doctor | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
akes | +0.052 |
ites | +0.051 |
ised | +0.051 |
Run | +0.051 |
about | +0.050 |
Neg logit contributions | |
sob | -0.032 |
Her | -0.031 |
Nib | -0.031 |
not | -0.029 |
doctor | -0.028 |
Token | time |
Token ID | 640 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
ites | +0.015 |
Wow | +0.014 |
Run | +0.014 |
cer | +0.014 |
about | +0.013 |
Neg logit contributions | |
sob | -0.015 |
Her | -0.014 |
dentist | -0.014 |
stomach | -0.014 |
not | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
sob | +0.002 |
dentist | +0.002 |
Nib | +0.002 |
ache | +0.002 |
throat | +0.002 |
Neg logit contributions | |
Run | -0.002 |
sorts | -0.002 |
ites | -0.002 |
Wow | -0.002 |
atch | -0.002 |
Token | there |
Token ID | 612 |
Feature activation | +9.21e-01 |
Pos logit contributions | |
sob | +0.021 |
Nib | +0.020 |
Her | +0.020 |
anywhere | +0.020 |
doctor | +0.018 |
Neg logit contributions | |
ites | -0.035 |
sorts | -0.035 |
atch | -0.034 |
about | -0.034 |
akes | -0.034 |
Token | was |
Token ID | 373 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Run | +0.020 |
ites | +0.020 |
sorts | +0.019 |
Wow | +0.019 |
atch | +0.019 |
Neg logit contributions | |
sob | -0.017 |
Nib | -0.016 |
dentist | -0.016 |
babys | -0.016 |
anywhere | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
sob | +0.019 |
Nib | +0.018 |
dentist | +0.018 |
Her | +0.017 |
babys | +0.016 |
Neg logit contributions | |
ites | -0.050 |
atch | -0.050 |
OK | -0.049 |
Run | -0.049 |
ang | -0.049 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
akes | +0.031 |
ites | +0.031 |
atch | +0.031 |
sorts | +0.031 |
acked | +0.030 |
Neg logit contributions | |
doctor | -0.023 |
dentist | -0.023 |
sob | -0.023 |
babys | -0.022 |
Nib | -0.022 |
Token | cy |
Token ID | 948 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
Pull | +0.101 |
Run | +0.097 |
Quick | +0.084 |
AW | +0.084 |
blows | +0.081 |
Neg logit contributions | |
doctor | -0.306 |
anywhere | -0.302 |
stomach | -0.301 |
Nib | -0.301 |
babys | -0.298 |
Token | rubber |
Token ID | 14239 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
sorts | +0.030 |
akes | +0.029 |
ised | +0.029 |
atch | +0.028 |
ites | +0.028 |
Neg logit contributions | |
doctor | -0.025 |
mom | -0.024 |
sob | -0.024 |
babys | -0.024 |
dentist | -0.023 |
Token | ball |
Token ID | 2613 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
sorts | +0.062 |
Run | +0.061 |
atch | +0.061 |
ised | +0.061 |
Wow | +0.060 |
Neg logit contributions | |
doctor | -0.052 |
sob | -0.050 |
Nib | -0.049 |
babys | -0.049 |
throat | -0.049 |
Token | . |
Token ID | 13 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
Run | +0.059 |
Wow | +0.059 |
OK | +0.059 |
Uh | +0.058 |
ites | +0.058 |
Neg logit contributions | |
sob | -0.022 |
Her | -0.021 |
Nib | -0.021 |
doctor | -0.020 |
dentist | -0.020 |
Token | It |
Token ID | 632 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
cer | +0.023 |
ang | +0.023 |
ites | +0.023 |
Run | +0.023 |
atch | +0.023 |
Neg logit contributions | |
Her | -0.012 |
Nib | -0.010 |
doctor | -0.009 |
dentist | -0.009 |
sob | -0.009 |
Token | loud |
Token ID | 7812 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
ppa | +0.006 |
ache | +0.006 |
Neg logit contributions | |
sorts | -0.008 |
Run | -0.008 |
Wow | -0.008 |
about | -0.007 |
atch | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
ites | +0.050 |
OK | +0.049 |
Wow | +0.049 |
Run | +0.049 |
ang | +0.049 |
Neg logit contributions | |
sob | -0.043 |
Nib | -0.041 |
dentist | -0.041 |
anywhere | -0.041 |
ache | -0.040 |
Token | there |
Token ID | 612 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
sob | +0.004 |
Nib | +0.003 |
dentist | +0.003 |
anywhere | +0.003 |
babys | +0.003 |
Neg logit contributions | |
akes | -0.004 |
ites | -0.004 |
atch | -0.004 |
about | -0.004 |
cer | -0.004 |
Token | was |
Token ID | 373 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
sorts | +0.000 |
Run | +0.000 |
about | +0.000 |
Wow | +0.000 |
OK | +0.000 |
Neg logit contributions | |
sob | -0.000 |
Nib | -0.000 |
dentist | -0.000 |
ppa | -0.000 |
ache | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | +9.64e-01 |
Pos logit contributions | |
ppa | +0.005 |
sob | +0.005 |
Nib | +0.005 |
ache | +0.005 |
babys | +0.004 |
Neg logit contributions | |
sorts | -0.007 |
Run | -0.007 |
about | -0.007 |
Wow | -0.007 |
OK | -0.007 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
ites | +0.020 |
atch | +0.020 |
akes | +0.020 |
sorts | +0.020 |
Run | +0.019 |
Neg logit contributions | |
sob | -0.019 |
babys | -0.018 |
dentist | -0.018 |
doctor | -0.018 |
Nib | -0.018 |
Token | cy |
Token ID | 948 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Pull | +0.121 |
Run | +0.112 |
Quick | +0.106 |
OK | +0.099 |
AW | +0.098 |
Neg logit contributions | |
anywhere | -0.288 |
costume | -0.282 |
babys | -0.274 |
mask | -0.273 |
tooth | -0.272 |
Token | castle |
Token ID | 16669 |
Feature activation | -5.31e-02 |
Pos logit contributions | |
atch | +0.005 |
ites | +0.005 |
sorts | +0.005 |
OK | +0.005 |
Run | +0.005 |
Neg logit contributions | |
sob | -0.005 |
anywhere | -0.005 |
babys | -0.005 |
throat | -0.005 |
doctor | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
anywhere | +0.001 |
sob | +0.001 |
dentist | +0.001 |
ache | +0.001 |
doctor | +0.001 |
Neg logit contributions | |
Wow | -0.001 |
OK | -0.001 |
Run | -0.001 |
Quick | -0.001 |
Uh | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
sob | +0.011 |
Her | +0.011 |
Nib | +0.011 |
dentist | +0.011 |
babys | +0.010 |
Neg logit contributions | |
ites | -0.017 |
cer | -0.017 |
ang | -0.017 |
Run | -0.017 |
atch | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | -8.47e-02 |
Pos logit contributions | |
ache | +0.024 |
throat | +0.023 |
Nib | +0.022 |
sob | +0.022 |
dentist | +0.022 |
Neg logit contributions | |
sorts | -0.028 |
Wow | -0.028 |
OK | -0.027 |
ites | -0.027 |
Run | -0.027 |
Token | found |
Token ID | 1043 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
sob | +0.007 |
Her | +0.006 |
anywhere | +0.006 |
babys | +0.006 |
doctor | +0.006 |
Neg logit contributions | |
Wow | -0.008 |
Run | -0.008 |
akes | -0.008 |
Uh | -0.008 |
ites | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
sob | +0.007 |
ache | +0.006 |
ppa | +0.006 |
babys | +0.006 |
dentist | +0.006 |
Neg logit contributions | |
sorts | -0.009 |
Run | -0.009 |
ites | -0.009 |
Wow | -0.009 |
cer | -0.009 |
Token | a |
Token ID | 257 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
ppa | +0.022 |
Nib | +0.021 |
sob | +0.021 |
ache | +0.021 |
maid | +0.020 |
Neg logit contributions | |
sorts | -0.029 |
pitch | -0.026 |
wins | -0.025 |
Run | -0.025 |
atch | -0.025 |
Token | big |
Token ID | 1263 |
Feature activation | +5.49e+00 |
Pos logit contributions | |
ites | +0.021 |
Run | +0.021 |
atch | +0.020 |
akes | +0.020 |
Wow | +0.020 |
Neg logit contributions | |
sob | -0.020 |
dentist | -0.019 |
Nib | -0.019 |
babys | -0.019 |
doctor | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
ites | +0.135 |
acked | +0.135 |
akes | +0.132 |
Wow | +0.132 |
Run | +0.128 |
Neg logit contributions | |
doctor | -0.096 |
dentist | -0.092 |
throat | -0.091 |
babys | -0.091 |
Nib | -0.089 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
akes | +0.039 |
ites | +0.038 |
cer | +0.038 |
atch | +0.037 |
ang | +0.037 |
Neg logit contributions | |
sob | -0.034 |
Nib | -0.032 |
dentist | -0.032 |
doctor | -0.031 |
babys | -0.031 |
Token | cy |
Token ID | 948 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Pull | +0.111 |
Run | +0.106 |
AW | +0.096 |
Quick | +0.094 |
OK | +0.090 |
Neg logit contributions | |
anywhere | -0.296 |
costume | -0.291 |
doctor | -0.285 |
tooth | -0.284 |
mask | -0.283 |
Token | tr |
Token ID | 491 |
Feature activation | +7.06e+00 |
Pos logit contributions | |
ites | +0.012 |
atch | +0.012 |
sorts | +0.012 |
akes | +0.012 |
Run | +0.012 |
Neg logit contributions | |
sob | -0.012 |
throat | -0.011 |
anywhere | -0.011 |
doctor | -0.011 |
babys | -0.011 |
Token | amp |
Token ID | 696 |
Feature activation | +5.77e+00 |
Pos logit contributions | |
OK | +0.119 |
Wow | +0.111 |
Run | +0.109 |
Uh | +0.098 |
Pull | +0.097 |
Neg logit contributions | |
anywhere | -0.169 |
dentist | -0.164 |
babys | -0.162 |
ocket | -0.160 |
ppa | -0.160 |
Token | oline |
Token ID | 14453 |
Feature activation | +2.62e+00 |
Pos logit contributions | |
OK | +0.093 |
sorts | +0.092 |
Uh | +0.092 |
ites | +0.090 |
Run | +0.089 |
Neg logit contributions | |
anywhere | -0.136 |
dentist | -0.133 |
Her | -0.130 |
sob | -0.130 |
doctor | -0.128 |
Token | . |
Token ID | 13 |
Feature activation | +2.77e-01 |
Pos logit contributions | |
Wow | +0.073 |
Run | +0.072 |
sorts | +0.072 |
OK | +0.072 |
ites | +0.072 |
Neg logit contributions | |
sob | -0.031 |
Nib | -0.029 |
anywhere | -0.029 |
dentist | -0.029 |
ache | -0.028 |
Token | time |
Token ID | 640 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ites | +0.018 |
Wow | +0.017 |
cer | +0.017 |
Run | +0.017 |
sorts | +0.017 |
Neg logit contributions | |
sob | -0.019 |
dentist | -0.018 |
Her | -0.017 |
stomach | -0.017 |
not | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Run | +0.005 |
sorts | +0.005 |
Wow | +0.005 |
atch | +0.005 |
ites | +0.005 |
Neg logit contributions | |
sob | -0.003 |
dentist | -0.003 |
Nib | -0.003 |
ache | -0.003 |
throat | -0.003 |
Token | there |
Token ID | 612 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
sob | +0.017 |
Nib | +0.017 |
anywhere | +0.016 |
Her | +0.016 |
doctor | +0.015 |
Neg logit contributions | |
ites | -0.028 |
sorts | -0.027 |
atch | -0.027 |
about | -0.027 |
akes | -0.027 |
Token | was |
Token ID | 373 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Run | +0.026 |
sorts | +0.026 |
Wow | +0.026 |
ites | +0.026 |
atch | +0.026 |
Neg logit contributions | |
sob | -0.024 |
Nib | -0.023 |
dentist | -0.023 |
babys | -0.022 |
ache | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
sob | +0.019 |
Nib | +0.018 |
dentist | +0.018 |
babys | +0.017 |
ache | +0.017 |
Neg logit contributions | |
Run | -0.040 |
sorts | -0.040 |
Wow | -0.040 |
ites | -0.040 |
atch | -0.039 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
ites | +0.032 |
akes | +0.032 |
sorts | +0.032 |
atch | +0.031 |
acked | +0.031 |
Neg logit contributions | |
sob | -0.026 |
dentist | -0.026 |
doctor | -0.026 |
Nib | -0.025 |
babys | -0.025 |
Token | cy |
Token ID | 948 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
Run | +0.093 |
Pull | +0.091 |
Quick | +0.078 |
AW | +0.077 |
blows | +0.075 |
Neg logit contributions | |
doctor | -0.312 |
Nib | -0.310 |
stomach | -0.310 |
anywhere | -0.309 |
tooth | -0.307 |
Token | little |
Token ID | 1310 |
Feature activation | +4.49e+00 |
Pos logit contributions | |
sorts | +0.026 |
akes | +0.025 |
ites | +0.025 |
atch | +0.025 |
ised | +0.024 |
Neg logit contributions | |
doctor | -0.027 |
sob | -0.027 |
mom | -0.027 |
babys | -0.027 |
stomach | -0.026 |
Token | bunny |
Token ID | 44915 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
iling | +0.101 |
acked | +0.099 |
atch | +0.099 |
Pull | +0.098 |
sorts | +0.096 |
Neg logit contributions | |
doctor | -0.083 |
mom | -0.083 |
babys | -0.082 |
throat | -0.081 |
stomach | -0.080 |
Token | called |
Token ID | 1444 |
Feature activation | -2.51e+00 |
Pos logit contributions | |
ang | +0.015 |
sorts | +0.015 |
cer | +0.015 |
ites | +0.015 |
Run | +0.015 |
Neg logit contributions | |
sob | -0.011 |
dentist | -0.011 |
Nib | -0.011 |
ache | -0.010 |
babys | -0.010 |
Token | Bob |
Token ID | 5811 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
sob | +0.039 |
dentist | +0.037 |
ache | +0.037 |
babys | +0.035 |
ppa | +0.035 |
Neg logit contributions | |
Run | -0.062 |
Wow | -0.061 |
sorts | -0.060 |
atch | -0.060 |
ites | -0.060 |
Token | blue |
Token ID | 4171 |
Feature activation | +3.97e+00 |
Pos logit contributions | |
ites | +0.109 |
akes | +0.107 |
ang | +0.106 |
Wow | +0.105 |
Run | +0.105 |
Neg logit contributions | |
sob | -0.078 |
doctor | -0.077 |
babys | -0.077 |
dentist | -0.077 |
stomach | -0.077 |
Token | balloon |
Token ID | 21190 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
ites | +0.087 |
ang | +0.087 |
Run | +0.087 |
OK | +0.087 |
atch | +0.085 |
Neg logit contributions | |
babys | -0.071 |
doctor | -0.071 |
dentist | -0.070 |
Nib | -0.070 |
anywhere | -0.069 |
Token | . |
Token ID | 13 |
Feature activation | -4.91e-02 |
Pos logit contributions | |
Run | +0.029 |
Wow | +0.029 |
OK | +0.029 |
ites | +0.029 |
akes | +0.029 |
Neg logit contributions | |
sob | -0.022 |
Nib | -0.021 |
dentist | -0.021 |
anywhere | -0.021 |
doctor | -0.020 |
Token | It |
Token ID | 632 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
Nib | +0.001 |
sob | +0.001 |
Her | +0.001 |
dentist | +0.001 |
doctor | +0.001 |
Neg logit contributions | |
ites | -0.001 |
Run | -0.001 |
cer | -0.001 |
atch | -0.001 |
ang | -0.001 |
Token | was |
Token ID | 373 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
akes | +0.041 |
ites | +0.041 |
atch | +0.041 |
Wow | +0.040 |
Run | +0.040 |
Neg logit contributions | |
sob | -0.028 |
Nib | -0.026 |
dentist | -0.025 |
anywhere | -0.025 |
Her | -0.025 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
sob | +0.003 |
dentist | +0.003 |
Nib | +0.003 |
ache | +0.003 |
ppa | +0.003 |
Neg logit contributions | |
sorts | -0.005 |
Wow | -0.004 |
Run | -0.004 |
atch | -0.004 |
about | -0.004 |
Token | cy |
Token ID | 948 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
Run | +0.109 |
blows | +0.104 |
Quick | +0.102 |
Pull | +0.100 |
OK | +0.100 |
Neg logit contributions | |
anywhere | -0.290 |
Nib | -0.274 |
ocket | -0.271 |
Her | -0.269 |
pt | -0.269 |
Token | and |
Token ID | 290 |
Feature activation | -5.42e-01 |
Pos logit contributions | |
anywhere | +0.009 |
sob | +0.009 |
Nib | +0.009 |
throat | +0.009 |
stomach | +0.009 |
Neg logit contributions | |
Run | -0.013 |
Wow | -0.012 |
Uh | -0.012 |
OK | -0.012 |
Quick | -0.012 |
Token | fun |
Token ID | 1257 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
sob | +0.010 |
not | +0.009 |
Nib | +0.009 |
Her | +0.009 |
anywhere | +0.009 |
Neg logit contributions | |
akes | -0.012 |
atch | -0.012 |
iling | -0.012 |
ites | -0.012 |
ang | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
Run | +0.046 |
Wow | +0.046 |
ang | +0.045 |
Uh | +0.045 |
OK | +0.045 |
Neg logit contributions | |
anywhere | -0.025 |
sob | -0.024 |
dentist | -0.022 |
Nib | -0.022 |
doctor | -0.022 |
Token | He |
Token ID | 679 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
Nib | +0.006 |
sob | +0.006 |
Her | +0.006 |
dentist | +0.005 |
doctor | +0.005 |
Neg logit contributions | |
Run | -0.010 |
ites | -0.010 |
cer | -0.010 |
atch | -0.009 |
sorts | -0.009 |
Token | they |
Token ID | 484 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
atch | +0.026 |
akes | +0.026 |
ites | +0.026 |
ang | +0.025 |
sorts | +0.025 |
Neg logit contributions | |
sob | -0.017 |
Nib | -0.016 |
anywhere | -0.016 |
dentist | -0.016 |
doctor | -0.015 |
Token | found |
Token ID | 1043 |
Feature activation | -6.00e-01 |
Pos logit contributions | |
Run | +0.055 |
akes | +0.055 |
atch | +0.054 |
OK | +0.054 |
Wow | +0.054 |
Neg logit contributions | |
sob | -0.039 |
Nib | -0.038 |
anywhere | -0.037 |
dentist | -0.037 |
doctor | -0.035 |
Token | a |
Token ID | 257 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
sob | +0.009 |
Nib | +0.008 |
dentist | +0.008 |
babys | +0.008 |
ache | +0.008 |
Neg logit contributions | |
sorts | -0.015 |
Run | -0.015 |
Wow | -0.015 |
ites | -0.015 |
OK | -0.015 |
Token | big |
Token ID | 1263 |
Feature activation | +4.96e+00 |
Pos logit contributions | |
Run | +0.007 |
sorts | +0.007 |
Wow | +0.007 |
ites | +0.007 |
OK | +0.007 |
Neg logit contributions | |
sob | -0.007 |
Nib | -0.007 |
dentist | -0.007 |
babys | -0.006 |
Her | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
ites | +0.125 |
akes | +0.125 |
ang | +0.119 |
acked | +0.118 |
Run | +0.116 |
Neg logit contributions | |
dentist | -0.084 |
doctor | -0.084 |
sob | -0.083 |
tooth | -0.082 |
throat | -0.081 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
akes | +0.013 |
ites | +0.012 |
atch | +0.012 |
ang | +0.012 |
cer | +0.012 |
Neg logit contributions | |
sob | -0.012 |
dentist | -0.011 |
Nib | -0.011 |
doctor | -0.011 |
babys | -0.011 |
Token | cy |
Token ID | 948 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Run | +0.119 |
Pull | +0.116 |
AW | +0.108 |
blows | +0.107 |
Quick | +0.106 |
Neg logit contributions | |
anywhere | -0.278 |
costume | -0.273 |
tooth | -0.269 |
doctor | -0.264 |
Nib | -0.262 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
ites | +0.004 |
akes | +0.004 |
ang | +0.004 |
OK | +0.004 |
sorts | +0.004 |
Neg logit contributions | |
sob | -0.004 |
anywhere | -0.004 |
tooth | -0.004 |
crown | -0.004 |
throat | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -3.32e-01 |
Pos logit contributions | |
OK | +0.048 |
Wow | +0.048 |
Uh | +0.048 |
Quick | +0.048 |
ised | +0.047 |
Neg logit contributions | |
anywhere | -0.017 |
sob | -0.017 |
Nib | -0.016 |
doctor | -0.016 |
crying | -0.015 |
Token | They |
Token ID | 1119 |
Feature activation | +2.17e+00 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
Her | +0.006 |
babys | +0.006 |
Neg logit contributions | |
Run | -0.007 |
atch | -0.007 |
sorts | -0.007 |
ites | -0.007 |
OK | -0.007 |
Token | were |
Token ID | 547 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
akes | +0.057 |
iling | +0.055 |
atch | +0.054 |
Run | +0.054 |
mer | +0.054 |
Neg logit contributions | |
sob | -0.033 |
Her | -0.031 |
Nib | -0.031 |
yes | -0.030 |
mom | -0.029 |
Token | , |
Token ID | 11 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
sob | +0.002 |
dentist | +0.002 |
ache | +0.002 |
ppa | +0.002 |
Nib | +0.002 |
Neg logit contributions | |
Run | -0.003 |
sorts | -0.003 |
Wow | -0.003 |
ang | -0.003 |
atch | -0.003 |
Token | there |
Token ID | 612 |
Feature activation | +8.73e-01 |
Pos logit contributions | |
sob | +0.023 |
Nib | +0.022 |
anywhere | +0.022 |
Her | +0.022 |
doctor | +0.020 |
Neg logit contributions | |
ites | -0.037 |
sorts | -0.037 |
atch | -0.037 |
about | -0.036 |
akes | -0.036 |
Token | was |
Token ID | 373 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
sorts | +0.017 |
Wow | +0.017 |
Run | +0.017 |
about | +0.016 |
cy | +0.016 |
Neg logit contributions | |
sob | -0.018 |
ache | -0.017 |
dentist | -0.017 |
Nib | -0.017 |
ppa | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
sob | +0.024 |
Nib | +0.023 |
dentist | +0.022 |
babys | +0.021 |
ache | +0.021 |
Neg logit contributions | |
Run | -0.050 |
sorts | -0.050 |
Wow | -0.049 |
ites | -0.049 |
atch | -0.049 |
Token | small |
Token ID | 1402 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
ites | +0.027 |
akes | +0.027 |
sorts | +0.027 |
atch | +0.027 |
acked | +0.026 |
Neg logit contributions | |
sob | -0.022 |
dentist | -0.022 |
doctor | -0.022 |
Nib | -0.022 |
babys | -0.021 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
atch | +0.139 |
ites | +0.137 |
acked | +0.136 |
Run | +0.134 |
Wow | +0.133 |
Neg logit contributions | |
doctor | -0.112 |
dentist | -0.109 |
babys | -0.107 |
throat | -0.106 |
Nib | -0.105 |
Token | cy |
Token ID | 948 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Pull | +0.095 |
Run | +0.094 |
Quick | +0.081 |
AW | +0.080 |
blows | +0.077 |
Neg logit contributions | |
doctor | -0.309 |
stomach | -0.308 |
Nib | -0.306 |
anywhere | -0.305 |
babys | -0.304 |
Token | thing |
Token ID | 1517 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
sorts | +0.026 |
ites | +0.025 |
akes | +0.025 |
atch | +0.025 |
ised | +0.024 |
Neg logit contributions | |
doctor | -0.024 |
sob | -0.024 |
babys | -0.024 |
mom | -0.024 |
stomach | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
sob | +0.016 |
Nib | +0.015 |
dentist | +0.015 |
ppa | +0.014 |
ache | +0.014 |
Neg logit contributions | |
sorts | -0.026 |
Run | -0.026 |
ites | -0.025 |
ang | -0.025 |
about | -0.025 |
Token | It |
Token ID | 632 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
cer | +0.020 |
ang | +0.020 |
ites | +0.020 |
atch | +0.019 |
mer | +0.019 |
Neg logit contributions | |
Her | -0.012 |
Nib | -0.011 |
sob | -0.011 |
dentist | -0.010 |
throat | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
ites | +0.048 |
Run | +0.047 |
akes | +0.047 |
atch | +0.047 |
about | +0.046 |
Neg logit contributions | |
sob | -0.037 |
Nib | -0.036 |
Her | -0.035 |
dentist | -0.034 |
throat | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | +8.90e-02 |
Pos logit contributions | |
throat | +0.021 |
ache | +0.021 |
babys | +0.020 |
sob | +0.020 |
Nib | +0.020 |
Neg logit contributions | |
sorts | -0.021 |
Wow | -0.021 |
OK | -0.021 |
Run | -0.021 |
ang | -0.020 |
Token | He |
Token ID | 1544 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
akes | +0.002 |
cy | +0.002 |
ites | +0.002 |
mer | +0.002 |
sorts | +0.002 |
Neg logit contributions | |
dentist | -0.002 |
doctor | -0.002 |
sob | -0.002 |
not | -0.002 |
Her | -0.002 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Run | +0.022 |
sorts | +0.022 |
ites | +0.022 |
Wow | +0.022 |
atch | +0.022 |
Neg logit contributions | |
sob | -0.025 |
Nib | -0.024 |
dentist | -0.024 |
babys | -0.023 |
throat | -0.023 |
Token | a |
Token ID | 257 |
Feature activation | +8.45e-01 |
Pos logit contributions | |
ppa | +0.037 |
ache | +0.036 |
babys | +0.034 |
sob | +0.034 |
ridge | +0.034 |
Neg logit contributions | |
sorts | -0.030 |
Wow | -0.028 |
Run | -0.027 |
about | -0.027 |
kinds | -0.027 |
Token | big |
Token ID | 1263 |
Feature activation | +4.84e+00 |
Pos logit contributions | |
Run | +0.017 |
ites | +0.017 |
sorts | +0.017 |
atch | +0.017 |
akes | +0.017 |
Neg logit contributions | |
sob | -0.017 |
Nib | -0.016 |
dentist | -0.016 |
babys | -0.016 |
doctor | -0.015 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
akes | +0.118 |
acked | +0.115 |
ites | +0.114 |
OK | +0.113 |
atch | +0.112 |
Neg logit contributions | |
dentist | -0.082 |
doctor | -0.081 |
sob | -0.080 |
Nib | -0.079 |
babys | -0.079 |
Token | cy |
Token ID | 948 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
Pull | +0.114 |
Run | +0.112 |
Quick | +0.103 |
AW | +0.099 |
OK | +0.098 |
Neg logit contributions | |
anywhere | -0.287 |
costume | -0.285 |
tooth | -0.279 |
doctor | -0.278 |
mask | -0.278 |
Token | castle |
Token ID | 16669 |
Feature activation | +4.75e-02 |
Pos logit contributions | |
ites | +0.007 |
sorts | +0.007 |
akes | +0.007 |
ang | +0.006 |
OK | +0.006 |
Neg logit contributions | |
sob | -0.007 |
babys | -0.007 |
anywhere | -0.007 |
doctor | -0.007 |
stomach | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +3.91e-01 |
Pos logit contributions | |
Wow | +0.001 |
Mine | +0.001 |
akes | +0.001 |
OK | +0.001 |
Run | +0.001 |
Neg logit contributions | |
sob | -0.001 |
anywhere | -0.001 |
dentist | -0.001 |
doctor | -0.001 |
not | -0.001 |
Token | He |
Token ID | 679 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
cer | +0.010 |
ang | +0.010 |
ites | +0.010 |
mer | +0.010 |
cy | +0.010 |
Neg logit contributions | |
dentist | -0.006 |
sob | -0.006 |
Her | -0.006 |
Nib | -0.006 |
doctor | -0.006 |
Token | wanted |
Token ID | 2227 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
akes | +0.032 |
ites | +0.029 |
cer | +0.029 |
atch | +0.028 |
mer | +0.028 |
Neg logit contributions | |
sob | -0.024 |
Her | -0.021 |
not | -0.021 |
mom | -0.021 |
dentist | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | +6.91e-01 |
Pos logit contributions | |
sorts | +0.026 |
ang | +0.026 |
cer | +0.026 |
Run | +0.026 |
ites | +0.026 |
Neg logit contributions | |
sob | -0.020 |
dentist | -0.019 |
Nib | -0.019 |
babys | -0.019 |
ache | -0.019 |
Token | He |
Token ID | 679 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
Run | +0.016 |
sorts | +0.016 |
ites | +0.016 |
Wow | +0.016 |
atch | +0.016 |
Neg logit contributions | |
sob | -0.012 |
Nib | -0.011 |
dentist | -0.011 |
babys | -0.011 |
ache | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Run | +0.037 |
sorts | +0.037 |
Wow | +0.036 |
OK | +0.036 |
ites | +0.036 |
Neg logit contributions | |
sob | -0.056 |
Nib | -0.055 |
dentist | -0.055 |
babys | -0.054 |
ache | -0.053 |
Token | a |
Token ID | 257 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
ache | +0.024 |
sob | +0.022 |
dentist | +0.022 |
grandmother | +0.021 |
forgiveness | +0.021 |
Neg logit contributions | |
sorts | -0.026 |
ang | -0.025 |
ab | -0.023 |
atch | -0.023 |
pitch | -0.023 |
Token | very |
Token ID | 845 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
Run | +0.035 |
sorts | +0.035 |
ites | +0.035 |
Wow | +0.034 |
atch | +0.034 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
dentist | -0.025 |
babys | -0.025 |
throat | -0.024 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
OK | +0.030 |
ang | +0.030 |
sorts | +0.030 |
Run | +0.030 |
ites | +0.029 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.029 |
dentist | -0.029 |
anywhere | -0.028 |
ache | -0.028 |
Token | cy |
Token ID | 948 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Pull | +0.096 |
Run | +0.095 |
AW | +0.086 |
Quick | +0.083 |
blows | +0.080 |
Neg logit contributions | |
anywhere | -0.302 |
doctor | -0.301 |
tooth | -0.299 |
Nib | -0.299 |
stomach | -0.299 |
Token | bunny |
Token ID | 44915 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
ites | +0.028 |
akes | +0.028 |
Run | +0.028 |
sorts | +0.028 |
atch | +0.028 |
Neg logit contributions | |
sob | -0.018 |
doctor | -0.017 |
throat | -0.017 |
anywhere | -0.017 |
stomach | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
sorts | +0.009 |
ang | +0.009 |
Run | +0.009 |
ites | +0.009 |
cer | +0.009 |
Neg logit contributions | |
sob | -0.006 |
dentist | -0.006 |
Nib | -0.006 |
babys | -0.006 |
ache | -0.006 |
Token | all |
Token ID | 477 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
sob | +0.013 |
Nib | +0.012 |
dentist | +0.012 |
babys | +0.012 |
throat | +0.012 |
Neg logit contributions | |
Run | -0.010 |
sorts | -0.010 |
ites | -0.010 |
Wow | -0.010 |
atch | -0.010 |
Token | day |
Token ID | 1110 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Run | +0.054 |
Uh | +0.051 |
OK | +0.051 |
atch | +0.051 |
Quick | +0.050 |
Neg logit contributions | |
Her | -0.044 |
Nib | -0.044 |
sob | -0.042 |
anywhere | -0.042 |
throat | -0.040 |
Token | to |
Token ID | 284 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
Run | +0.005 |
sorts | +0.005 |
Wow | +0.005 |
ites | +0.005 |
atch | +0.005 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
throat | -0.003 |
Token | be |
Token ID | 307 |
Feature activation | -8.00e-02 |
Pos logit contributions | |
sorts | +0.004 |
Run | +0.004 |
Wow | +0.004 |
atch | +0.004 |
OK | +0.004 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.002 |
dentist | -0.002 |
ache | -0.002 |
babys | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
babys | +0.001 |
Nib | +0.001 |
sob | +0.001 |
ache | +0.001 |
dentist | +0.001 |
Neg logit contributions | |
sorts | -0.002 |
cer | -0.002 |
about | -0.002 |
Run | -0.002 |
atch | -0.002 |
Token | big |
Token ID | 1263 |
Feature activation | +5.06e+00 |
Pos logit contributions | |
Run | +0.004 |
sorts | +0.004 |
Wow | +0.004 |
OK | +0.003 |
about | +0.003 |
Neg logit contributions | |
sob | -0.004 |
Nib | -0.004 |
dentist | -0.004 |
Her | -0.003 |
throat | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
ites | +0.125 |
akes | +0.124 |
acked | +0.121 |
ang | +0.119 |
atch | +0.117 |
Neg logit contributions | |
doctor | -0.082 |
dentist | -0.082 |
Nib | -0.082 |
sob | -0.082 |
throat | -0.079 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
akes | +0.033 |
ites | +0.033 |
atch | +0.031 |
cer | +0.031 |
ang | +0.031 |
Neg logit contributions | |
sob | -0.031 |
Nib | -0.029 |
dentist | -0.029 |
doctor | -0.028 |
babys | -0.028 |
Token | cy |
Token ID | 948 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
Pull | +0.105 |
Run | +0.104 |
Quick | +0.096 |
AW | +0.091 |
blows | +0.090 |
Neg logit contributions | |
anywhere | -0.284 |
Nib | -0.281 |
tooth | -0.279 |
doctor | -0.279 |
costume | -0.277 |
Token | rubber |
Token ID | 14239 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
ites | +0.005 |
akes | +0.005 |
atch | +0.005 |
sorts | +0.005 |
ang | +0.005 |
Neg logit contributions | |
sob | -0.005 |
throat | -0.005 |
Nib | -0.005 |
anywhere | -0.005 |
doctor | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -6.41e-01 |
Pos logit contributions | |
Wow | +0.028 |
sorts | +0.028 |
ised | +0.028 |
ites | +0.027 |
Uh | +0.027 |
Neg logit contributions | |
doctor | -0.028 |
sob | -0.028 |
Nib | -0.027 |
throat | -0.027 |
anywhere | -0.027 |
Token | He |
Token ID | 679 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
sob | +0.009 |
Her | +0.009 |
Nib | +0.009 |
dentist | +0.009 |
doctor | +0.008 |
Neg logit contributions | |
ites | -0.016 |
ang | -0.016 |
akes | -0.016 |
Run | -0.016 |
cer | -0.016 |
Token | bent |
Token ID | 17157 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
akes | +0.025 |
ites | +0.024 |
sorts | +0.024 |
atch | +0.023 |
cer | +0.023 |
Neg logit contributions | |
sob | -0.022 |
Her | -0.020 |
Nib | -0.020 |
dentist | -0.019 |
doctor | -0.019 |
Token | she |
Token ID | 673 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
sorts | +0.031 |
Run | +0.029 |
about | +0.028 |
akes | +0.028 |
cy | +0.028 |
Neg logit contributions | |
ppa | -0.036 |
ache | -0.036 |
dentist | -0.035 |
throat | -0.034 |
sob | -0.034 |
Token | found |
Token ID | 1043 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
sorts | +0.011 |
OK | +0.011 |
cy | +0.011 |
cer | +0.011 |
Run | +0.011 |
Neg logit contributions | |
Nib | -0.014 |
ache | -0.014 |
sob | -0.014 |
babys | -0.014 |
dentist | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
ache | +0.024 |
ppa | +0.024 |
babys | +0.023 |
sob | +0.022 |
throat | +0.022 |
Neg logit contributions | |
sorts | -0.021 |
Wow | -0.018 |
kinds | -0.018 |
Run | -0.017 |
hed | -0.017 |
Token | big |
Token ID | 1263 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
Her | +0.005 |
ppa | +0.005 |
dentist | +0.005 |
Neg logit contributions | |
sorts | -0.005 |
Wow | -0.005 |
OK | -0.005 |
Run | -0.005 |
about | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +8.52e-01 |
Pos logit contributions | |
ites | +0.100 |
akes | +0.098 |
Run | +0.097 |
OK | +0.096 |
ang | +0.096 |
Neg logit contributions | |
dentist | -0.067 |
sob | -0.066 |
doctor | -0.065 |
throat | -0.064 |
Nib | -0.064 |
Token | boun |
Token ID | 31283 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
ites | +0.017 |
akes | +0.017 |
atch | +0.016 |
Run | +0.016 |
cer | +0.016 |
Neg logit contributions | |
sob | -0.018 |
dentist | -0.017 |
Nib | -0.017 |
babys | -0.016 |
anywhere | -0.016 |
Token | cy |
Token ID | 948 |
Feature activation | -6.38e-02 |
Pos logit contributions | |
Run | +0.104 |
Pull | +0.102 |
OK | +0.090 |
AW | +0.089 |
blows | +0.087 |
Neg logit contributions | |
anywhere | -0.294 |
costume | -0.287 |
tooth | -0.284 |
doctor | -0.284 |
mask | -0.282 |
Token | mattress |
Token ID | 33388 |
Feature activation | +8.61e-01 |
Pos logit contributions | |
sob | +0.001 |
babys | +0.001 |
throat | +0.001 |
doctor | +0.001 |
dentist | +0.001 |
Neg logit contributions | |
ites | -0.002 |
atch | -0.002 |
akes | -0.002 |
OK | -0.002 |
ang | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -8.49e-01 |
Pos logit contributions | |
Wow | +0.022 |
ites | +0.022 |
akes | +0.022 |
OK | +0.021 |
Run | +0.021 |
Neg logit contributions | |
sob | -0.013 |
dentist | -0.012 |
anywhere | -0.012 |
Nib | -0.012 |
doctor | -0.012 |
Token | She |
Token ID | 1375 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
ache | +0.015 |
dentist | +0.015 |
ppa | +0.015 |
sob | +0.014 |
anywhere | +0.014 |
Neg logit contributions | |
Wow | -0.020 |
sorts | -0.020 |
Run | -0.019 |
ites | -0.019 |
ang | -0.019 |
Token | thought |
Token ID | 1807 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
akes | +0.026 |
Run | +0.025 |
ites | +0.025 |
Wow | +0.025 |
atch | +0.025 |
Neg logit contributions | |
sob | -0.020 |
Her | -0.018 |
Nib | -0.017 |
dentist | -0.017 |
throat | -0.017 |
Token | she |
Token ID | 673 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
sob | +0.010 |
Nib | +0.009 |
dentist | +0.009 |
babys | +0.009 |
anywhere | +0.008 |
Neg logit contributions | |
Run | -0.027 |
sorts | -0.027 |
OK | -0.026 |
Wow | -0.026 |
ites | -0.026 |
Token | smiled |
Token ID | 13541 |
Feature activation | -7.46e-02 |
Pos logit contributions | |
akes | +0.019 |
Wow | +0.019 |
atch | +0.019 |
ites | +0.019 |
cer | +0.019 |
Neg logit contributions | |
sob | -0.010 |
ache | -0.009 |
Her | -0.008 |
dentist | -0.008 |
throat | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
dentist | +0.002 |
Nib | +0.001 |
babys | +0.001 |
sob | +0.001 |
maid | +0.001 |
Neg logit contributions | |
ised | -0.001 |
cer | -0.001 |
sorts | -0.001 |
cy | -0.001 |
OK | -0.001 |
Token | gave |
Token ID | 2921 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
sob | +0.016 |
Nib | +0.016 |
dentist | +0.015 |
babys | +0.015 |
throat | +0.015 |
Neg logit contributions | |
Run | -0.028 |
ites | -0.028 |
sorts | -0.028 |
Wow | -0.028 |
atch | -0.028 |
Token | her |
Token ID | 607 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
sob | +0.006 |
ache | +0.006 |
Nib | +0.006 |
throat | +0.006 |
babys | +0.006 |
Neg logit contributions | |
sorts | -0.010 |
ee | -0.009 |
cy | -0.009 |
Wow | -0.009 |
OK | -0.009 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.63e+00 |
Pos logit contributions | |
sob | +0.110 |
Nib | +0.109 |
ache | +0.106 |
ppa | +0.104 |
dentist | +0.103 |
Neg logit contributions | |
sorts | -0.147 |
cy | -0.141 |
OK | -0.137 |
about | -0.135 |
ites | -0.135 |
Token | a |
Token ID | 257 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
dentist | +0.154 |
ache | +0.152 |
Nib | +0.152 |
sob | +0.151 |
anywhere | +0.146 |
Neg logit contributions | |
sorts | -0.198 |
cy | -0.183 |
ites | -0.178 |
able | -0.173 |
kinds | -0.172 |
Token | big |
Token ID | 1263 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
Nib | +0.037 |
sob | +0.037 |
dentist | +0.035 |
ppa | +0.035 |
anywhere | +0.035 |
Neg logit contributions | |
sorts | -0.044 |
OK | -0.042 |
Run | -0.042 |
about | -0.042 |
Wow | -0.042 |
Token | hug |
Token ID | 16225 |
Feature activation | -9.69e-01 |
Pos logit contributions | |
ites | +0.076 |
atch | +0.075 |
Wow | +0.075 |
akes | +0.075 |
cer | +0.075 |
Neg logit contributions | |
sob | -0.024 |
babys | -0.022 |
throat | -0.021 |
doctor | -0.021 |
dentist | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | -8.75e-01 |
Pos logit contributions | |
Nib | +0.019 |
sob | +0.019 |
dentist | +0.019 |
maid | +0.018 |
babys | +0.018 |
Neg logit contributions | |
mer | -0.019 |
OK | -0.019 |
sorts | -0.018 |
cer | -0.018 |
cy | -0.018 |
Token | |
Token ID | 220 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
sob | +0.010 |
Nib | +0.010 |
dentist | +0.010 |
babys | +0.009 |
Her | +0.009 |
Neg logit contributions | |
Run | -0.025 |
sorts | -0.024 |
ites | -0.024 |
Wow | -0.024 |
atch | -0.024 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
Run | +0.004 |
sorts | +0.004 |
ites | +0.004 |
Wow | +0.004 |
atch | +0.004 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
throat | -0.002 |
Token | that |
Token ID | 326 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
sorts | +0.040 |
Run | +0.040 |
ites | +0.040 |
Wow | +0.040 |
atch | +0.040 |
Neg logit contributions | |
sob | -0.023 |
Nib | -0.022 |
dentist | -0.022 |
babys | -0.021 |
ache | -0.021 |
Token | he |
Token ID | 339 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
sob | +0.004 |
ache | +0.004 |
ppa | +0.004 |
throat | +0.004 |
babys | +0.004 |
Neg logit contributions | |
sorts | -0.008 |
Wow | -0.008 |
cer | -0.007 |
Run | -0.007 |
OK | -0.007 |
Token | gave |
Token ID | 2921 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
akes | +0.022 |
about | +0.022 |
ites | +0.021 |
sorts | +0.021 |
Wow | +0.021 |
Neg logit contributions | |
sob | -0.015 |
Nib | -0.014 |
ache | -0.014 |
dentist | -0.014 |
ppa | -0.014 |
Token | his |
Token ID | 465 |
Feature activation | -5.78e+00 |
Pos logit contributions | |
sorts | +0.004 |
cy | +0.004 |
cer | +0.004 |
able | +0.003 |
Wow | +0.003 |
Neg logit contributions | |
ache | -0.003 |
sob | -0.003 |
babys | -0.003 |
gag | -0.003 |
throat | -0.003 |
Token | wife |
Token ID | 3656 |
Feature activation | -8.59e+00 |
Pos logit contributions | |
sob | +0.068 |
Nib | +0.068 |
Her | +0.058 |
dentist | +0.057 |
Rat | +0.056 |
Neg logit contributions | |
OK | -0.165 |
cer | -0.162 |
Run | -0.161 |
mer | -0.159 |
ites | -0.159 |
Token | a |
Token ID | 257 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
sob | +0.142 |
Nib | +0.132 |
babys | +0.130 |
dentist | +0.130 |
ache | +0.129 |
Neg logit contributions | |
sorts | -0.207 |
ites | -0.198 |
cy | -0.196 |
cer | -0.195 |
atch | -0.194 |
Token | big |
Token ID | 1263 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
sob | +0.051 |
Nib | +0.049 |
ppa | +0.048 |
anywhere | +0.047 |
dentist | +0.047 |
Neg logit contributions | |
sorts | -0.050 |
OK | -0.048 |
Run | -0.047 |
Wow | -0.046 |
cy | -0.046 |
Token | hug |
Token ID | 16225 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
ites | +0.059 |
Wow | +0.059 |
akes | +0.059 |
atch | +0.059 |
cer | +0.059 |
Neg logit contributions | |
sob | -0.018 |
dentist | -0.017 |
babys | -0.017 |
Nib | -0.017 |
throat | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
sob | +0.022 |
Nib | +0.022 |
maid | +0.021 |
ppa | +0.021 |
dentist | +0.021 |
Neg logit contributions | |
cer | -0.017 |
sorts | -0.017 |
mer | -0.016 |
about | -0.016 |
OK | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -9.08e-01 |
Pos logit contributions | |
sob | +0.033 |
Nib | +0.033 |
dentist | +0.032 |
babys | +0.031 |
anywhere | +0.031 |
Neg logit contributions | |
Run | -0.037 |
sorts | -0.037 |
Wow | -0.036 |
ites | -0.036 |
OK | -0.036 |
Token | she |
Token ID | 673 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
sob | +0.013 |
Nib | +0.012 |
dentist | +0.012 |
anywhere | +0.011 |
babys | +0.011 |
Neg logit contributions | |
sorts | -0.032 |
Run | -0.032 |
OK | -0.032 |
ites | -0.032 |
Wow | -0.032 |
Token | decided |
Token ID | 3066 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
Run | +0.031 |
ites | +0.031 |
sorts | +0.031 |
Wow | +0.031 |
about | +0.031 |
Neg logit contributions | |
sob | -0.026 |
Nib | -0.025 |
dentist | -0.025 |
babys | -0.024 |
ache | -0.024 |
Token | to |
Token ID | 284 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
Nib | +0.038 |
gag | +0.035 |
throat | +0.035 |
sob | +0.035 |
ocket | +0.035 |
Neg logit contributions | |
OK | -0.046 |
than | -0.044 |
Run | -0.043 |
atch | -0.043 |
sorts | -0.043 |
Token | give |
Token ID | 1577 |
Feature activation | -6.04e-01 |
Pos logit contributions | |
sob | +0.033 |
dentist | +0.032 |
Nib | +0.032 |
babys | +0.031 |
Her | +0.031 |
Neg logit contributions | |
Run | -0.049 |
ites | -0.049 |
ang | -0.049 |
Wow | -0.048 |
cer | -0.048 |
Token | her |
Token ID | 607 |
Feature activation | -5.84e+00 |
Pos logit contributions | |
ache | +0.010 |
sob | +0.010 |
throat | +0.009 |
dentist | +0.009 |
anywhere | +0.009 |
Neg logit contributions | |
cy | -0.014 |
Wow | -0.014 |
sorts | -0.014 |
Mine | -0.013 |
OK | -0.013 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.50e+00 |
Pos logit contributions | |
sob | +0.105 |
Nib | +0.102 |
ppa | +0.101 |
ache | +0.101 |
dentist | +0.093 |
Neg logit contributions | |
sorts | -0.130 |
cy | -0.122 |
ites | -0.119 |
about | -0.118 |
OK | -0.117 |
Token | a |
Token ID | 257 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
sob | +0.171 |
ache | +0.163 |
Nib | +0.161 |
dentist | +0.157 |
babys | +0.155 |
Neg logit contributions | |
sorts | -0.185 |
cy | -0.162 |
kinds | -0.162 |
pitch | -0.157 |
able | -0.156 |
Token | teaspoon |
Token ID | 22326 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
ppa | +0.040 |
Nib | +0.040 |
sob | +0.040 |
anywhere | +0.036 |
ache | +0.036 |
Neg logit contributions | |
sorts | -0.039 |
OK | -0.036 |
pitch | -0.035 |
ee | -0.035 |
cy | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
sob | +0.005 |
Nib | +0.004 |
dentist | +0.004 |
maid | +0.004 |
babys | +0.004 |
Neg logit contributions | |
sorts | -0.006 |
ang | -0.005 |
cy | -0.005 |
mer | -0.005 |
ites | -0.005 |
Token | The |
Token ID | 383 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
Run | +0.012 |
sorts | +0.012 |
ites | +0.012 |
Wow | +0.012 |
atch | +0.012 |
Neg logit contributions | |
sob | -0.008 |
Nib | -0.007 |
dentist | -0.007 |
babys | -0.007 |
throat | -0.007 |
Token | little |
Token ID | 1310 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
Nib | +0.002 |
anywhere | +0.002 |
sob | +0.002 |
ppa | +0.002 |
ache | +0.002 |
Neg logit contributions | |
OK | -0.005 |
Wow | -0.005 |
Quick | -0.005 |
Run | -0.005 |
cy | -0.005 |
Token | gentle |
Token ID | 10296 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
Nib | +0.037 |
throat | +0.036 |
sob | +0.036 |
dentist | +0.036 |
Her | +0.035 |
Neg logit contributions | |
sorts | -0.045 |
Run | -0.042 |
ab | -0.042 |
cer | -0.042 |
atch | -0.041 |
Token | and |
Token ID | 290 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
sorts | +0.043 |
cer | +0.042 |
Run | +0.041 |
about | +0.041 |
atch | +0.041 |
Neg logit contributions | |
sob | -0.059 |
Nib | -0.059 |
dentist | -0.058 |
babys | -0.057 |
ppa | -0.056 |
Token | he |
Token ID | 339 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
sob | +0.025 |
Nib | +0.024 |
dentist | +0.024 |
babys | +0.023 |
anywhere | +0.023 |
Neg logit contributions | |
sorts | -0.032 |
Run | -0.032 |
OK | -0.032 |
ites | -0.031 |
Wow | -0.031 |
Token | showed |
Token ID | 3751 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
sorts | +0.004 |
Run | +0.004 |
OK | +0.004 |
ites | +0.004 |
atch | +0.004 |
Neg logit contributions | |
sob | -0.004 |
Nib | -0.004 |
dentist | -0.004 |
babys | -0.004 |
anywhere | -0.004 |
Token | his |
Token ID | 465 |
Feature activation | -5.38e+00 |
Pos logit contributions | |
sob | +0.020 |
dentist | +0.019 |
babys | +0.019 |
throat | +0.019 |
ache | +0.018 |
Neg logit contributions | |
sorts | -0.030 |
ab | -0.029 |
cy | -0.028 |
able | -0.028 |
acked | -0.028 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.44e+00 |
Pos logit contributions | |
Nib | +0.099 |
sob | +0.094 |
ppa | +0.094 |
dentist | +0.092 |
Her | +0.089 |
Neg logit contributions | |
sorts | -0.119 |
OK | -0.111 |
Run | -0.108 |
about | -0.108 |
pitches | -0.108 |
Token | how |
Token ID | 703 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
sob | +0.150 |
dentist | +0.149 |
babys | +0.145 |
ache | +0.144 |
ppa | +0.144 |
Neg logit contributions | |
sorts | -0.197 |
about | -0.174 |
kinds | -0.173 |
wins | -0.171 |
cer | -0.170 |
Token | to |
Token ID | 284 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
sorts | +0.004 |
ites | +0.004 |
OK | +0.004 |
Run | +0.004 |
atch | +0.004 |
Neg logit contributions | |
sob | -0.002 |
dentist | -0.002 |
Nib | -0.002 |
babys | -0.002 |
maid | -0.002 |
Token | give |
Token ID | 1577 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
sob | +0.005 |
Nib | +0.005 |
dentist | +0.005 |
babys | +0.005 |
throat | +0.005 |
Neg logit contributions | |
Wow | -0.006 |
ites | -0.006 |
Run | -0.006 |
sorts | -0.006 |
about | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
sob | +0.005 |
dentist | +0.005 |
babys | +0.004 |
ache | +0.004 |
Nib | +0.004 |
Neg logit contributions | |
sorts | -0.006 |
cer | -0.006 |
cy | -0.006 |
OK | -0.006 |
ites | -0.006 |
Token | horse |
Token ID | 8223 |
Feature activation | -5.20e+00 |
Pos logit contributions | |
sob | +0.046 |
Nib | +0.044 |
dentist | +0.043 |
babys | +0.042 |
throat | +0.042 |
Neg logit contributions | |
Run | -0.050 |
sorts | -0.050 |
ites | -0.050 |
Wow | -0.049 |
OK | -0.049 |
Token | and |
Token ID | 290 |
Feature activation | -3.67e-01 |
Pos logit contributions | |
Run | +0.051 |
Wow | +0.051 |
ites | +0.050 |
atch | +0.050 |
about | +0.050 |
Neg logit contributions | |
sob | -0.044 |
Nib | -0.042 |
dentist | -0.041 |
anywhere | -0.041 |
babys | -0.041 |
Token | the |
Token ID | 262 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
sob | +0.006 |
dentist | +0.006 |
Nib | +0.006 |
ache | +0.006 |
babys | +0.006 |
Neg logit contributions | |
sorts | -0.008 |
OK | -0.008 |
Run | -0.008 |
ites | -0.008 |
Wow | -0.008 |
Token | mum |
Token ID | 25682 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
sob | +0.007 |
dentist | +0.006 |
Nib | +0.006 |
babys | +0.006 |
throat | +0.006 |
Neg logit contributions | |
ites | -0.012 |
sorts | -0.012 |
atch | -0.012 |
Run | -0.012 |
akes | -0.012 |
Token | gave |
Token ID | 2921 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
sob | +0.020 |
Nib | +0.020 |
dentist | +0.020 |
anywhere | +0.019 |
babys | +0.019 |
Neg logit contributions | |
sorts | -0.022 |
ites | -0.022 |
Run | -0.022 |
ang | -0.022 |
OK | -0.022 |
Token | her |
Token ID | 607 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
cy | +0.009 |
sorts | +0.009 |
OK | +0.008 |
Wow | +0.008 |
cer | +0.008 |
Neg logit contributions | |
dentist | -0.004 |
ache | -0.004 |
sob | -0.004 |
babys | -0.004 |
Nib | -0.004 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.37e+00 |
Pos logit contributions | |
sob | +0.098 |
Nib | +0.093 |
dentist | +0.092 |
ache | +0.090 |
babys | +0.088 |
Neg logit contributions | |
sorts | -0.148 |
cy | -0.141 |
OK | -0.141 |
Run | -0.139 |
ites | -0.139 |
Token | lots |
Token ID | 6041 |
Feature activation | +9.67e-01 |
Pos logit contributions | |
sob | +0.141 |
dentist | +0.140 |
Nib | +0.137 |
ache | +0.135 |
babys | +0.134 |
Neg logit contributions | |
sorts | -0.201 |
cy | -0.186 |
ites | -0.186 |
OK | -0.180 |
cer | -0.180 |
Token | of |
Token ID | 286 |
Feature activation | -5.44e-02 |
Pos logit contributions | |
Run | +0.018 |
Wow | +0.018 |
atch | +0.018 |
OK | +0.018 |
ites | +0.018 |
Neg logit contributions | |
sob | -0.020 |
Nib | -0.020 |
dentist | -0.019 |
babys | -0.019 |
ache | -0.019 |
Token | hugs |
Token ID | 40657 |
Feature activation | -9.73e-01 |
Pos logit contributions | |
sob | +0.001 |
Nib | +0.001 |
dentist | +0.001 |
ache | +0.001 |
anywhere | +0.001 |
Neg logit contributions | |
sorts | -0.001 |
Run | -0.001 |
ites | -0.001 |
OK | -0.001 |
Wow | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -6.72e-01 |
Pos logit contributions | |
sob | +0.019 |
dentist | +0.019 |
Nib | +0.018 |
babys | +0.018 |
maid | +0.018 |
Neg logit contributions | |
OK | -0.020 |
sorts | -0.020 |
Wow | -0.019 |
Run | -0.019 |
cer | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
sob | +0.008 |
Nib | +0.008 |
dentist | +0.008 |
babys | +0.008 |
ache | +0.008 |
Neg logit contributions | |
Run | -0.018 |
sorts | -0.018 |
ites | -0.018 |
Wow | -0.018 |
OK | -0.018 |
Token | felt |
Token ID | 2936 |
Feature activation | +6.09e-01 |
Pos logit contributions | |
dentist | +0.062 |
Nib | +0.061 |
sob | +0.060 |
babys | +0.060 |
maid | +0.059 |
Neg logit contributions | |
ab | -0.070 |
Run | -0.070 |
cy | -0.070 |
cer | -0.069 |
ang | -0.069 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
sorts | +0.014 |
Run | +0.013 |
ised | +0.013 |
OK | +0.013 |
mer | +0.013 |
Neg logit contributions | |
dentist | -0.010 |
ppa | -0.010 |
Nib | -0.010 |
maid | -0.010 |
sob | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
sorts | +0.000 |
cer | +0.000 |
OK | +0.000 |
than | +0.000 |
Wow | +0.000 |
Neg logit contributions | |
Nib | -0.000 |
ppa | -0.000 |
dentist | -0.000 |
sob | -0.000 |
babys | -0.000 |
Token | hugged |
Token ID | 41130 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
sob | +0.021 |
dentist | +0.021 |
Nib | +0.021 |
anywhere | +0.020 |
babys | +0.020 |
Neg logit contributions | |
sorts | -0.028 |
OK | -0.027 |
Run | -0.027 |
Wow | -0.027 |
ites | -0.027 |
Token | her |
Token ID | 607 |
Feature activation | -7.46e+00 |
Pos logit contributions | |
ache | +0.020 |
dentist | +0.020 |
sob | +0.019 |
anywhere | +0.019 |
throat | +0.018 |
Neg logit contributions | |
OK | -0.033 |
Wow | -0.032 |
cy | -0.032 |
Run | -0.031 |
sorts | -0.031 |
Token | granddaughter |
Token ID | 46458 |
Feature activation | -8.36e+00 |
Pos logit contributions | |
dentist | +0.111 |
ache | +0.108 |
anywhere | +0.103 |
ridge | +0.103 |
ppa | +0.102 |
Neg logit contributions | |
cy | -0.175 |
ang | -0.173 |
OK | -0.173 |
cer | -0.173 |
sorts | -0.172 |
Token | tightly |
Token ID | 17707 |
Feature activation | -2.48e-03 |
Pos logit contributions | |
dentist | +0.177 |
ache | +0.165 |
Nib | +0.162 |
babys | +0.162 |
Rat | +0.157 |
Neg logit contributions | |
sorts | -0.152 |
cy | -0.149 |
ites | -0.148 |
cer | -0.146 |
pitch | -0.141 |
Token | . |
Token ID | 13 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
dentist | +0.000 |
maid | +0.000 |
Nib | +0.000 |
babys | +0.000 |
doctor | +0.000 |
Neg logit contributions | |
ised | -0.000 |
cer | -0.000 |
sorts | -0.000 |
than | -0.000 |
mer | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
anywhere | +0.020 |
ache | +0.020 |
sob | +0.019 |
dentist | +0.019 |
Nib | +0.018 |
Neg logit contributions | |
Wow | -0.027 |
sorts | -0.026 |
OK | -0.025 |
Run | -0.025 |
ites | -0.025 |
Token |
|
Token ID | 198 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ache | +0.018 |
throat | +0.018 |
anywhere | +0.018 |
sob | +0.017 |
dentist | +0.017 |
Neg logit contributions | |
Wow | -0.026 |
sorts | -0.025 |
ang | -0.025 |
ites | -0.025 |
Run | -0.025 |
Token | Together |
Token ID | 41631 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
Her | +0.005 |
sob | +0.005 |
Nib | +0.005 |
dentist | +0.005 |
doctor | +0.005 |
Neg logit contributions | |
akes | -0.006 |
cer | -0.005 |
mer | -0.005 |
sorts | -0.005 |
about | -0.005 |
Token | her |
Token ID | 607 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
Mine | +0.031 |
Wow | +0.030 |
about | +0.030 |
pitch | +0.029 |
sorts | +0.029 |
Neg logit contributions | |
ache | -0.019 |
Nib | -0.018 |
sob | -0.018 |
dentist | -0.018 |
anywhere | -0.018 |
Token | face |
Token ID | 1986 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
Nib | +0.075 |
dentist | +0.071 |
sob | +0.068 |
anywhere | +0.067 |
maid | +0.065 |
Neg logit contributions | |
OK | -0.134 |
about | -0.132 |
ised | -0.130 |
cer | -0.130 |
ang | -0.130 |
Token | and |
Token ID | 290 |
Feature activation | -8.91e-01 |
Pos logit contributions | |
sob | +0.063 |
Nib | +0.063 |
dentist | +0.062 |
maid | +0.061 |
babys | +0.060 |
Neg logit contributions | |
about | -0.039 |
sorts | -0.038 |
ab | -0.038 |
ang | -0.037 |
cer | -0.037 |
Token | asked |
Token ID | 1965 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
sob | +0.015 |
Nib | +0.015 |
dentist | +0.015 |
ache | +0.014 |
anywhere | +0.014 |
Neg logit contributions | |
sorts | -0.020 |
Run | -0.020 |
OK | -0.020 |
Wow | -0.020 |
ites | -0.020 |
Token | her |
Token ID | 607 |
Feature activation | -6.12e+00 |
Pos logit contributions | |
ache | +0.081 |
sob | +0.077 |
gag | +0.076 |
throat | +0.076 |
ppa | +0.073 |
Neg logit contributions | |
sorts | -0.091 |
about | -0.089 |
OK | -0.087 |
Mine | -0.087 |
cy | -0.087 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.29e+00 |
Pos logit contributions | |
sob | +0.083 |
ache | +0.082 |
ppa | +0.080 |
gag | +0.077 |
Nib | +0.075 |
Neg logit contributions | |
sorts | -0.168 |
cy | -0.161 |
about | -0.157 |
OK | -0.155 |
kinds | -0.151 |
Token | , |
Token ID | 11 |
Feature activation | -2.65e+00 |
Pos logit contributions | |
sob | +0.183 |
ache | +0.178 |
ppa | +0.176 |
gag | +0.175 |
dentist | +0.169 |
Neg logit contributions | |
sorts | -0.162 |
wins | -0.154 |
cy | -0.154 |
about | -0.144 |
kinds | -0.136 |
Token | " |
Token ID | 366 |
Feature activation | +3.90e+00 |
Pos logit contributions | |
dentist | +0.050 |
ache | +0.050 |
sob | +0.049 |
anywhere | +0.048 |
throat | +0.048 |
Neg logit contributions | |
Wow | -0.053 |
OK | -0.053 |
Run | -0.052 |
ang | -0.052 |
sorts | -0.051 |
Token | Do |
Token ID | 5211 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
sorts | +0.070 |
ites | +0.070 |
Run | +0.069 |
akes | +0.069 |
ang | +0.068 |
Neg logit contributions | |
sob | -0.084 |
dentist | -0.083 |
Nib | -0.082 |
babys | -0.080 |
Her | -0.079 |
Token | you |
Token ID | 345 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
sob | +0.017 |
ache | +0.016 |
babys | +0.016 |
Nib | +0.016 |
dentist | +0.016 |
Neg logit contributions | |
OK | -0.009 |
atch | -0.009 |
Wow | -0.009 |
ites | -0.008 |
Run | -0.008 |
Token | want |
Token ID | 765 |
Feature activation | -7.33e-01 |
Pos logit contributions | |
ites | +0.008 |
Run | +0.008 |
Wow | +0.008 |
cer | +0.008 |
ang | +0.008 |
Neg logit contributions | |
sob | -0.011 |
Nib | -0.011 |
dentist | -0.011 |
throat | -0.011 |
anywhere | -0.011 |
Token | had |
Token ID | 550 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
sorts | +0.042 |
Run | +0.041 |
OK | +0.041 |
atch | +0.041 |
Wow | +0.040 |
Neg logit contributions | |
sob | -0.043 |
Nib | -0.042 |
dentist | -0.042 |
babys | -0.041 |
grandmother | -0.041 |
Token | time |
Token ID | 640 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
sob | +0.010 |
Nib | +0.009 |
ppa | +0.009 |
babys | +0.009 |
ache | +0.009 |
Neg logit contributions | |
sorts | -0.016 |
ites | -0.015 |
Run | -0.015 |
OK | -0.015 |
atch | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
Nib | +0.028 |
dentist | +0.027 |
sob | +0.026 |
ache | +0.025 |
ppa | +0.025 |
Neg logit contributions | |
ites | -0.046 |
sorts | -0.044 |
ab | -0.044 |
ang | -0.044 |
OK | -0.044 |
Token | take |
Token ID | 1011 |
Feature activation | +9.57e-01 |
Pos logit contributions | |
Run | +0.005 |
OK | +0.005 |
sorts | +0.005 |
about | +0.005 |
atch | +0.005 |
Neg logit contributions | |
sob | -0.005 |
Nib | -0.005 |
dentist | -0.005 |
ache | -0.005 |
throat | -0.005 |
Token | their |
Token ID | 511 |
Feature activation | -4.44e+00 |
Pos logit contributions | |
sorts | +0.021 |
Run | +0.021 |
ites | +0.021 |
Wow | +0.021 |
atch | +0.021 |
Neg logit contributions | |
sob | -0.017 |
dentist | -0.016 |
ache | -0.016 |
Nib | -0.016 |
ppa | -0.016 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.24e+00 |
Pos logit contributions | |
sob | +0.095 |
Nib | +0.094 |
dentist | +0.092 |
ppa | +0.090 |
ache | +0.090 |
Neg logit contributions | |
ites | -0.082 |
Run | -0.081 |
sorts | -0.081 |
OK | -0.080 |
atch | -0.080 |
Token | to |
Token ID | 284 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Nib | +0.155 |
sob | +0.152 |
dentist | +0.151 |
ppa | +0.145 |
maid | +0.144 |
Neg logit contributions | |
sorts | -0.172 |
cy | -0.170 |
pitch | -0.167 |
ites | -0.163 |
cer | -0.161 |
Token | explore |
Token ID | 7301 |
Feature activation | +2.38e-03 |
Pos logit contributions | |
ache | +0.023 |
sob | +0.022 |
ppa | +0.022 |
Nib | +0.021 |
throat | +0.021 |
Neg logit contributions | |
sorts | -0.025 |
Run | -0.024 |
OK | -0.023 |
about | -0.023 |
Wow | -0.023 |
Token | the |
Token ID | 262 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Run | +0.000 |
atch | +0.000 |
ites | +0.000 |
Wow | +0.000 |
OK | +0.000 |
Neg logit contributions | |
sob | -0.000 |
Nib | -0.000 |
dentist | -0.000 |
anywhere | -0.000 |
doctor | -0.000 |
Token | city |
Token ID | 1748 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
dentist | +0.032 |
doctor | +0.031 |
anywhere | +0.029 |
grandmother | +0.029 |
babys | +0.028 |
Neg logit contributions | |
ang | -0.026 |
Run | -0.026 |
acked | -0.026 |
cer | -0.025 |
Pull | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | -6.33e-01 |
Pos logit contributions | |
sob | +0.002 |
dentist | +0.002 |
anywhere | +0.002 |
Nib | +0.002 |
doctor | +0.002 |
Neg logit contributions | |
Run | -0.005 |
Wow | -0.005 |
OK | -0.005 |
ites | -0.005 |
atch | -0.005 |
Token | um |
Token ID | 388 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
anywhere | +0.006 |
sob | +0.005 |
ache | +0.005 |
Nib | +0.005 |
heal | +0.005 |
Neg logit contributions | |
ee | -0.004 |
ay | -0.004 |
ite | -0.003 |
cy | -0.003 |
atch | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
sob | +0.022 |
dentist | +0.022 |
Nib | +0.022 |
Her | +0.021 |
babys | +0.021 |
Neg logit contributions | |
Run | -0.028 |
OK | -0.028 |
Wow | -0.028 |
ites | -0.028 |
akes | -0.027 |
Token | Dad |
Token ID | 17415 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
akes | +0.001 |
atch | +0.001 |
ites | +0.001 |
mer | +0.001 |
ang | +0.001 |
Neg logit contributions | |
sob | -0.000 |
Nib | -0.000 |
Her | -0.000 |
babys | -0.000 |
dentist | -0.000 |
Token | took |
Token ID | 1718 |
Feature activation | +5.60e-01 |
Pos logit contributions | |
Her | +0.033 |
Nib | +0.032 |
sob | +0.032 |
babys | +0.032 |
dentist | +0.032 |
Neg logit contributions | |
Run | -0.051 |
Wow | -0.050 |
ised | -0.050 |
ites | -0.049 |
ang | -0.049 |
Token | their |
Token ID | 511 |
Feature activation | -4.99e+00 |
Pos logit contributions | |
sorts | +0.013 |
Run | +0.013 |
Wow | +0.013 |
ites | +0.013 |
cy | +0.013 |
Neg logit contributions | |
sob | -0.009 |
Nib | -0.009 |
dentist | -0.009 |
ache | -0.009 |
throat | -0.008 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.20e+00 |
Pos logit contributions | |
sob | +0.102 |
Nib | +0.102 |
ache | +0.100 |
ppa | +0.100 |
dentist | +0.096 |
Neg logit contributions | |
cy | -0.098 |
sorts | -0.095 |
Run | -0.095 |
ites | -0.092 |
atch | -0.092 |
Token | to |
Token ID | 284 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
sob | +0.145 |
ache | +0.142 |
dentist | +0.140 |
Nib | +0.137 |
ppa | +0.136 |
Neg logit contributions | |
sorts | -0.189 |
cy | -0.186 |
ites | -0.176 |
about | -0.172 |
atch | -0.172 |
Token | the |
Token ID | 262 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
sob | +0.041 |
ache | +0.039 |
Nib | +0.039 |
dentist | +0.038 |
ppa | +0.038 |
Neg logit contributions | |
sorts | -0.050 |
Run | -0.049 |
Wow | -0.049 |
atch | -0.048 |
OK | -0.048 |
Token | toys |
Token ID | 14958 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
sob | +0.064 |
ache | +0.062 |
ppa | +0.061 |
Nib | +0.061 |
throat | +0.061 |
Neg logit contributions | |
Wow | -0.031 |
sorts | -0.031 |
atch | -0.031 |
OK | -0.030 |
cy | -0.030 |
Token | hop |
Token ID | 8548 |
Feature activation | +7.26e-02 |
Pos logit contributions | |
sob | +0.024 |
Nib | +0.023 |
dentist | +0.023 |
anywhere | +0.022 |
babys | +0.022 |
Neg logit contributions | |
Run | -0.045 |
Wow | -0.045 |
ites | -0.044 |
sorts | -0.044 |
OK | -0.044 |
Token | . |
Token ID | 13 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
sorts | +0.002 |
ites | +0.002 |
about | +0.002 |
Run | +0.002 |
ang | +0.002 |
Neg logit contributions | |
sob | -0.001 |
Nib | -0.001 |
dentist | -0.001 |
throat | -0.001 |
babys | -0.001 |
Token | ummy |
Token ID | 13513 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
anywhere | +0.005 |
sob | +0.005 |
throat | +0.005 |
ache | +0.005 |
Nib | +0.005 |
Neg logit contributions | |
ee | -0.003 |
ay | -0.003 |
atch | -0.003 |
ites | -0.003 |
ang | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +9.01e-01 |
Pos logit contributions | |
Wow | +0.014 |
ites | +0.014 |
Run | +0.014 |
OK | +0.014 |
ang | +0.014 |
Neg logit contributions | |
sob | -0.011 |
dentist | -0.010 |
Nib | -0.010 |
doctor | -0.010 |
Her | -0.010 |
Token | Daddy |
Token ID | 26926 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
akes | +0.025 |
atch | +0.025 |
ites | +0.025 |
mer | +0.025 |
about | +0.024 |
Neg logit contributions | |
Nib | -0.011 |
sob | -0.011 |
Her | -0.011 |
Prince | -0.010 |
babys | -0.010 |
Token | took |
Token ID | 1718 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Nib | +0.020 |
sob | +0.018 |
Her | +0.018 |
dentist | +0.018 |
babys | +0.018 |
Neg logit contributions | |
ised | -0.030 |
Wow | -0.029 |
Uh | -0.029 |
Run | -0.029 |
ites | -0.029 |
Token | their |
Token ID | 511 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
sorts | +0.015 |
Run | +0.015 |
Wow | +0.015 |
ites | +0.015 |
atch | +0.014 |
Neg logit contributions | |
sob | -0.009 |
dentist | -0.008 |
Nib | -0.008 |
ache | -0.008 |
throat | -0.008 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
sob | +0.094 |
Nib | +0.093 |
ache | +0.092 |
ppa | +0.091 |
dentist | +0.090 |
Neg logit contributions | |
cy | -0.088 |
Run | -0.088 |
sorts | -0.087 |
Wow | -0.085 |
atch | -0.085 |
Token | to |
Token ID | 284 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
sob | +0.137 |
dentist | +0.133 |
ache | +0.133 |
Nib | +0.131 |
ppa | +0.128 |
Neg logit contributions | |
sorts | -0.193 |
cy | -0.187 |
ites | -0.184 |
atch | -0.181 |
about | -0.179 |
Token | the |
Token ID | 262 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
sob | +0.039 |
Nib | +0.038 |
ache | +0.038 |
dentist | +0.037 |
throat | +0.036 |
Neg logit contributions | |
sorts | -0.050 |
Run | -0.049 |
Wow | -0.049 |
atch | -0.049 |
OK | -0.048 |
Token | beach |
Token ID | 10481 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
sob | +0.050 |
Nib | +0.049 |
ache | +0.048 |
throat | +0.048 |
dentist | +0.047 |
Neg logit contributions | |
sorts | -0.029 |
Wow | -0.028 |
Run | -0.028 |
atch | -0.028 |
OK | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
sob | +0.020 |
Nib | +0.019 |
dentist | +0.018 |
babys | +0.018 |
anywhere | +0.018 |
Neg logit contributions | |
Run | -0.038 |
Wow | -0.038 |
OK | -0.038 |
ites | -0.038 |
atch | -0.037 |
Token | It |
Token ID | 632 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
atch | +0.029 |
ites | +0.029 |
cer | +0.029 |
Run | +0.029 |
OK | +0.029 |
Neg logit contributions | |
Her | -0.029 |
Nib | -0.028 |
babys | -0.027 |
sob | -0.027 |
Prince | -0.026 |
Token | was |
Token ID | 373 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Run | +0.007 |
Quick | +0.007 |
sorts | +0.007 |
blows | +0.007 |
cy | +0.006 |
Neg logit contributions | |
anywhere | -0.009 |
Nib | -0.009 |
dentist | -0.009 |
nightmares | -0.009 |
throat | -0.009 |
Token | angry |
Token ID | 7954 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Him | +0.032 |
Nib | +0.031 |
ridge | +0.030 |
urger | +0.030 |
Rat | +0.030 |
Neg logit contributions | |
ang | -0.024 |
ised | -0.023 |
sorts | -0.023 |
aking | -0.023 |
Uh | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
cer | +0.021 |
Run | +0.021 |
about | +0.021 |
sorts | +0.020 |
atch | +0.020 |
Neg logit contributions | |
Nib | -0.027 |
sob | -0.027 |
babys | -0.027 |
dentist | -0.027 |
ppa | -0.027 |
Token | asked |
Token ID | 1965 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
dentist | +0.029 |
Nib | +0.028 |
anywhere | +0.028 |
ocket | +0.028 |
maid | +0.028 |
Neg logit contributions | |
Run | -0.035 |
OK | -0.033 |
sorts | -0.033 |
Wow | -0.032 |
ang | -0.032 |
Token | her |
Token ID | 607 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
ache | +0.076 |
throat | +0.073 |
ridge | +0.073 |
gag | +0.072 |
dentist | +0.072 |
Neg logit contributions | |
Wow | -0.073 |
Run | -0.073 |
OK | -0.072 |
cy | -0.071 |
ised | -0.070 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.12e+00 |
Pos logit contributions | |
ridge | +0.123 |
gag | +0.116 |
gh | +0.115 |
lor | +0.112 |
ppa | +0.110 |
Neg logit contributions | |
sorts | -0.102 |
cy | -0.095 |
about | -0.089 |
pitches | -0.087 |
able | -0.087 |
Token | why |
Token ID | 1521 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
ppa | +0.188 |
ridge | +0.188 |
Tooth | +0.186 |
lor | +0.184 |
dentist | +0.180 |
Neg logit contributions | |
wins | -0.119 |
sorts | -0.116 |
cy | -0.113 |
atch | -0.103 |
at | -0.098 |
Token | she |
Token ID | 673 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
throat | +0.005 |
babys | +0.005 |
Neg logit contributions | |
Run | -0.015 |
sorts | -0.015 |
OK | -0.014 |
ites | -0.014 |
Wow | -0.014 |
Token | had |
Token ID | 550 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
sob | +0.023 |
Nib | +0.023 |
dentist | +0.022 |
babys | +0.022 |
throat | +0.021 |
Neg logit contributions | |
Run | -0.022 |
sorts | -0.022 |
atch | -0.022 |
OK | -0.022 |
Wow | -0.022 |
Token | done |
Token ID | 1760 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
sorts | +0.006 |
atch | +0.006 |
Run | +0.006 |
ites | +0.006 |
Wow | +0.006 |
Neg logit contributions | |
Nib | -0.006 |
sob | -0.006 |
Her | -0.005 |
dentist | -0.005 |
maid | -0.005 |
Token | something |
Token ID | 1223 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
Nib | +0.032 |
ppa | +0.031 |
maid | +0.031 |
throat | +0.030 |
ache | +0.030 |
Neg logit contributions | |
sorts | -0.032 |
about | -0.031 |
Mine | -0.031 |
pitch | -0.030 |
pitches | -0.030 |
Token | knowing |
Token ID | 6970 |
Feature activation | -8.84e-01 |
Pos logit contributions | |
sob | +0.044 |
Nib | +0.044 |
dentist | +0.043 |
anywhere | +0.042 |
babys | +0.042 |
Neg logit contributions | |
sorts | -0.065 |
Run | -0.064 |
Wow | -0.064 |
OK | -0.063 |
ites | -0.063 |
Token | he |
Token ID | 339 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
gag | +0.017 |
sob | +0.016 |
ppa | +0.016 |
throat | +0.016 |
ache | +0.016 |
Neg logit contributions | |
sorts | -0.019 |
Wow | -0.017 |
gol | -0.017 |
Run | -0.017 |
ised | -0.017 |
Token | had |
Token ID | 550 |
Feature activation | -6.35e-01 |
Pos logit contributions | |
Run | +0.007 |
ites | +0.007 |
about | +0.007 |
Wow | +0.007 |
akes | +0.007 |
Neg logit contributions | |
sob | -0.006 |
Nib | -0.006 |
dentist | -0.006 |
anywhere | -0.006 |
ache | -0.006 |
Token | given |
Token ID | 1813 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
Nib | +0.014 |
babys | +0.014 |
sob | +0.013 |
ache | +0.013 |
dentist | +0.013 |
Neg logit contributions | |
sorts | -0.012 |
OK | -0.011 |
atch | -0.011 |
cer | -0.011 |
Wow | -0.011 |
Token | his |
Token ID | 465 |
Feature activation | -4.87e+00 |
Pos logit contributions | |
ache | +0.008 |
sob | +0.008 |
throat | +0.008 |
gag | +0.008 |
ppa | +0.008 |
Neg logit contributions | |
sorts | -0.012 |
Wow | -0.011 |
kinds | -0.011 |
cy | -0.011 |
able | -0.011 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.08e+00 |
Pos logit contributions | |
Nib | +0.082 |
sob | +0.081 |
ppa | +0.075 |
dentist | +0.074 |
ache | +0.074 |
Neg logit contributions | |
sorts | -0.116 |
OK | -0.113 |
Run | -0.111 |
about | -0.110 |
ites | -0.110 |
Token | an |
Token ID | 281 |
Feature activation | +9.14e-01 |
Pos logit contributions | |
sob | +0.153 |
Nib | +0.152 |
babys | +0.146 |
dentist | +0.141 |
ache | +0.140 |
Neg logit contributions | |
sorts | -0.185 |
kinds | -0.160 |
ites | -0.159 |
cer | -0.159 |
cy | -0.158 |
Token | interesting |
Token ID | 3499 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
ites | +0.020 |
Run | +0.020 |
Wow | +0.020 |
akes | +0.020 |
cer | +0.019 |
Neg logit contributions | |
sob | -0.017 |
dentist | -0.016 |
grandmother | -0.016 |
Nib | -0.016 |
doctor | -0.016 |
Token | gift |
Token ID | 6979 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
Run | +0.035 |
ites | +0.035 |
ang | +0.035 |
Wow | +0.035 |
atch | +0.034 |
Neg logit contributions | |
sob | -0.026 |
dentist | -0.026 |
grandmother | -0.025 |
doctor | -0.025 |
babys | -0.025 |
Token | that |
Token ID | 326 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
gag | +0.072 |
sob | +0.071 |
Nib | +0.069 |
ppa | +0.068 |
throat | +0.064 |
Neg logit contributions | |
sorts | -0.063 |
than | -0.061 |
cer | -0.060 |
mer | -0.058 |
ab | -0.056 |
Token | would |
Token ID | 561 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
sorts | +0.003 |
Wow | +0.003 |
OK | +0.003 |
Run | +0.003 |
cer | +0.003 |
Neg logit contributions | |
sob | -0.002 |
Nib | -0.002 |
dentist | -0.002 |
ache | -0.002 |
ppa | -0.002 |
Token | um |
Token ID | 388 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
Run | +0.007 |
Wow | +0.007 |
sorts | +0.007 |
cer | +0.007 |
ites | +0.007 |
Neg logit contributions | |
sob | -0.007 |
Her | -0.007 |
dentist | -0.007 |
babys | -0.007 |
Nib | -0.007 |
Token | smiled |
Token ID | 13541 |
Feature activation | -6.88e-02 |
Pos logit contributions | |
Run | +0.005 |
sorts | +0.005 |
ites | +0.005 |
Wow | +0.005 |
atch | +0.005 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
ache | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | -4.96e-01 |
Pos logit contributions | |
dentist | +0.001 |
Nib | +0.001 |
anywhere | +0.001 |
sob | +0.001 |
babys | +0.001 |
Neg logit contributions | |
ised | -0.001 |
OK | -0.001 |
cy | -0.001 |
cer | -0.001 |
Wow | -0.001 |
Token | gave |
Token ID | 2921 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
sob | +0.007 |
Nib | +0.007 |
dentist | +0.007 |
Her | +0.006 |
babys | +0.006 |
Neg logit contributions | |
akes | -0.013 |
atch | -0.013 |
Run | -0.013 |
ites | -0.013 |
about | -0.013 |
Token | her |
Token ID | 607 |
Feature activation | -5.75e+00 |
Pos logit contributions | |
cy | +0.013 |
sorts | +0.012 |
Wow | +0.012 |
OK | +0.012 |
ee | +0.012 |
Neg logit contributions | |
ache | -0.006 |
dentist | -0.006 |
sob | -0.006 |
throat | -0.006 |
babys | -0.006 |
Token | daughter |
Token ID | 4957 |
Feature activation | -8.01e+00 |
Pos logit contributions | |
sob | +0.095 |
Nib | +0.092 |
dentist | +0.091 |
ache | +0.090 |
throat | +0.085 |
Neg logit contributions | |
sorts | -0.139 |
cy | -0.136 |
OK | -0.133 |
cer | -0.132 |
Run | -0.130 |
Token | another |
Token ID | 1194 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
dentist | +0.138 |
sob | +0.136 |
Nib | +0.134 |
ache | +0.134 |
babys | +0.132 |
Neg logit contributions | |
sorts | -0.189 |
cy | -0.176 |
ites | -0.173 |
OK | -0.169 |
cer | -0.169 |
Token | hug |
Token ID | 16225 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
sob | +0.021 |
Nib | +0.020 |
dentist | +0.020 |
anywhere | +0.019 |
ppa | +0.019 |
Neg logit contributions | |
sorts | -0.031 |
Run | -0.031 |
OK | -0.030 |
about | -0.030 |
Wow | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | -4.97e-02 |
Pos logit contributions | |
Nib | +0.007 |
sob | +0.007 |
dentist | +0.007 |
babys | +0.006 |
maid | +0.006 |
Neg logit contributions | |
OK | -0.009 |
sorts | -0.009 |
cer | -0.009 |
mer | -0.009 |
Run | -0.009 |
Token | ' |
Token ID | 705 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
Her | +0.001 |
sob | +0.001 |
Nib | +0.001 |
grandmother | +0.001 |
babys | +0.001 |
Neg logit contributions | |
ites | -0.001 |
atch | -0.001 |
Run | -0.001 |
akes | -0.001 |
sorts | -0.001 |
Token | That |
Token ID | 2504 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
akes | +0.068 |
pitch | +0.065 |
sorts | +0.064 |
pitches | +0.064 |
blows | +0.063 |
Neg logit contributions | |
yes | -0.093 |
ppa | -0.091 |
Her | -0.088 |
sob | -0.087 |
ache | -0.087 |
Token | Why |
Token ID | 5195 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
akes | +0.105 |
sorts | +0.099 |
ites | +0.099 |
mer | +0.098 |
slope | +0.094 |
Neg logit contributions | |
sob | -0.097 |
ppa | -0.092 |
babys | -0.089 |
Nib | -0.089 |
dentist | -0.087 |
Token | did |
Token ID | 750 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
ites | +0.049 |
Run | +0.049 |
Wow | +0.048 |
ang | +0.048 |
sorts | +0.048 |
Neg logit contributions | |
sob | -0.052 |
dentist | -0.050 |
Nib | -0.049 |
anywhere | -0.048 |
babys | -0.048 |
Token | you |
Token ID | 345 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
sob | +0.035 |
Nib | +0.033 |
babys | +0.033 |
ppa | +0.033 |
dentist | +0.033 |
Neg logit contributions | |
Run | -0.025 |
atch | -0.024 |
ites | -0.024 |
Wow | -0.024 |
sorts | -0.023 |
Token | give |
Token ID | 1577 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
sob | +0.009 |
Nib | +0.009 |
dentist | +0.008 |
babys | +0.008 |
anywhere | +0.008 |
Neg logit contributions | |
Run | -0.011 |
Wow | -0.011 |
ites | -0.011 |
sorts | -0.011 |
OK | -0.011 |
Token | your |
Token ID | 534 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
atch | +0.008 |
cy | +0.008 |
sorts | +0.008 |
ites | +0.007 |
ee | +0.007 |
Neg logit contributions | |
sob | -0.010 |
throat | -0.010 |
babys | -0.009 |
Her | -0.009 |
Nib | -0.009 |
Token | daughter |
Token ID | 4957 |
Feature activation | -7.99e+00 |
Pos logit contributions | |
sob | +0.087 |
Nib | +0.083 |
dentist | +0.081 |
ache | +0.081 |
ppa | +0.080 |
Neg logit contributions | |
sorts | -0.106 |
Run | -0.103 |
OK | -0.103 |
atch | -0.103 |
about | -0.102 |
Token | a |
Token ID | 257 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
sob | +0.142 |
Nib | +0.135 |
maid | +0.127 |
dentist | +0.125 |
ache | +0.125 |
Neg logit contributions | |
sorts | -0.179 |
atch | -0.173 |
cy | -0.171 |
ites | -0.170 |
cer | -0.166 |
Token | treat |
Token ID | 2190 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
sob | +0.031 |
Nib | +0.031 |
ppa | +0.030 |
Her | +0.029 |
dentist | +0.029 |
Neg logit contributions | |
sorts | -0.032 |
OK | -0.031 |
cy | -0.030 |
ab | -0.030 |
about | -0.030 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
sob | +0.044 |
Nib | +0.042 |
dentist | +0.041 |
throat | +0.040 |
babys | +0.040 |
Neg logit contributions | |
sorts | -0.041 |
about | -0.041 |
atch | -0.041 |
cer | -0.041 |
OK | -0.040 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
anywhere | +0.039 |
ocket | +0.037 |
ache | +0.037 |
ppa | +0.037 |
maid | +0.035 |
Neg logit contributions | |
Wow | -0.035 |
Run | -0.033 |
OK | -0.032 |
ang | -0.031 |
about | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
anywhere | +0.030 |
throat | +0.028 |
ache | +0.028 |
Nib | +0.027 |
dentist | +0.027 |
Neg logit contributions | |
Wow | -0.031 |
ang | -0.031 |
Run | -0.030 |
OK | -0.030 |
Quick | -0.030 |
Token | had |
Token ID | 550 |
Feature activation | +8.08e-01 |
Pos logit contributions | |
akes | +0.032 |
ites | +0.032 |
about | +0.032 |
Run | +0.031 |
ang | +0.031 |
Neg logit contributions | |
sob | -0.023 |
dentist | -0.023 |
anywhere | -0.022 |
Nib | -0.021 |
ache | -0.021 |
Token | achieved |
Token ID | 8793 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
Run | +0.021 |
ang | +0.021 |
Wow | +0.021 |
ites | +0.021 |
about | +0.021 |
Neg logit contributions | |
sob | -0.012 |
anywhere | -0.011 |
dentist | -0.011 |
Her | -0.011 |
not | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
sob | +0.023 |
Nib | +0.023 |
dentist | +0.022 |
anywhere | +0.022 |
babys | +0.022 |
Neg logit contributions | |
Run | -0.036 |
ites | -0.036 |
Wow | -0.036 |
sorts | -0.036 |
atch | -0.035 |
Token | thanked |
Token ID | 26280 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
sorts | +0.010 |
cer | +0.010 |
OK | +0.010 |
Run | +0.010 |
about | +0.010 |
Neg logit contributions | |
sob | -0.008 |
Nib | -0.008 |
dentist | -0.008 |
ache | -0.008 |
babys | -0.007 |
Token | his |
Token ID | 465 |
Feature activation | -5.17e+00 |
Pos logit contributions | |
ache | +0.079 |
sob | +0.071 |
ppa | +0.070 |
babys | +0.066 |
ocket | +0.066 |
Neg logit contributions | |
sorts | -0.069 |
cer | -0.061 |
Wow | -0.060 |
about | -0.060 |
ised | -0.060 |
Token | wife |
Token ID | 3656 |
Feature activation | -7.99e+00 |
Pos logit contributions | |
sob | +0.053 |
ppa | +0.052 |
Nib | +0.052 |
anywhere | +0.051 |
ache | +0.049 |
Neg logit contributions | |
OK | -0.151 |
sorts | -0.148 |
about | -0.145 |
ang | -0.144 |
cy | -0.144 |
Token | for |
Token ID | 329 |
Feature activation | -7.28e-02 |
Pos logit contributions | |
sob | +0.180 |
dentist | +0.171 |
babys | +0.170 |
ache | +0.169 |
ppa | +0.169 |
Neg logit contributions | |
sorts | -0.148 |
cer | -0.129 |
cy | -0.129 |
wins | -0.129 |
about | -0.128 |
Token | reminding |
Token ID | 30047 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
sob | +0.001 |
Nib | +0.001 |
ache | +0.001 |
dentist | +0.001 |
throat | +0.001 |
Neg logit contributions | |
sorts | -0.002 |
Run | -0.002 |
Wow | -0.002 |
OK | -0.002 |
atch | -0.002 |
Token | him |
Token ID | 683 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
sob | +0.014 |
ache | +0.014 |
throat | +0.014 |
Nib | +0.013 |
dentist | +0.013 |
Neg logit contributions | |
sorts | -0.027 |
cer | -0.026 |
ised | -0.026 |
atch | -0.026 |
Mine | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
sob | +0.082 |
Nib | +0.080 |
babys | +0.078 |
dentist | +0.078 |
ppa | +0.077 |
Neg logit contributions | |
sorts | -0.111 |
ites | -0.102 |
atch | -0.102 |
about | -0.101 |
akes | -0.100 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
sob | +0.022 |
ache | +0.022 |
anywhere | +0.021 |
dentist | +0.021 |
Nib | +0.021 |
Neg logit contributions | |
Wow | -0.033 |
sorts | -0.032 |
OK | -0.032 |
Run | -0.032 |
ang | -0.031 |
Token | asked |
Token ID | 1965 |
Feature activation | -4.29e+00 |
Pos logit contributions | |
Nib | +0.025 |
dentist | +0.025 |
sob | +0.025 |
anywhere | +0.024 |
ache | +0.024 |
Neg logit contributions | |
sorts | -0.036 |
Run | -0.035 |
OK | -0.035 |
Wow | -0.034 |
cer | -0.034 |
Token | if |
Token ID | 611 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
throat | +0.086 |
sob | +0.085 |
gag | +0.084 |
ache | +0.081 |
nightmares | +0.077 |
Neg logit contributions | |
sorts | -0.084 |
about | -0.079 |
OK | -0.078 |
ised | -0.077 |
cy | -0.076 |
Token | she |
Token ID | 673 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
sob | +0.027 |
throat | +0.026 |
gag | +0.026 |
ache | +0.026 |
urger | +0.025 |
Neg logit contributions | |
OK | -0.031 |
Run | -0.030 |
Wow | -0.029 |
sorts | -0.028 |
ised | -0.027 |
Token | could |
Token ID | 714 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
sob | +0.032 |
Nib | +0.032 |
babys | +0.031 |
dentist | +0.031 |
throat | +0.030 |
Neg logit contributions | |
OK | -0.031 |
cy | -0.029 |
sorts | -0.029 |
mer | -0.028 |
Run | -0.028 |
Token | lend |
Token ID | 22096 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
sob | +0.050 |
Nib | +0.047 |
dentist | +0.047 |
ache | +0.045 |
throat | +0.044 |
Neg logit contributions | |
atch | -0.068 |
OK | -0.068 |
sorts | -0.068 |
ites | -0.067 |
about | -0.066 |
Token | her |
Token ID | 607 |
Feature activation | -7.98e+00 |
Pos logit contributions | |
ache | +0.032 |
sob | +0.031 |
dentist | +0.029 |
throat | +0.029 |
gag | +0.029 |
Neg logit contributions | |
Mine | -0.035 |
sorts | -0.034 |
cy | -0.034 |
Wow | -0.034 |
atch | -0.032 |
Token | the |
Token ID | 262 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
sob | +0.142 |
Nib | +0.134 |
dentist | +0.133 |
ache | +0.131 |
throat | +0.128 |
Neg logit contributions | |
sorts | -0.179 |
ites | -0.177 |
OK | -0.174 |
about | -0.174 |
cy | -0.173 |
Token | money |
Token ID | 1637 |
Feature activation | -3.11e+00 |
Pos logit contributions | |
sob | +0.041 |
dentist | +0.040 |
Nib | +0.040 |
anywhere | +0.040 |
babys | +0.040 |
Neg logit contributions | |
Run | -0.065 |
ang | -0.065 |
ites | -0.065 |
akes | -0.064 |
sorts | -0.064 |
Token | for |
Token ID | 329 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
sob | +0.049 |
Nib | +0.046 |
dentist | +0.046 |
throat | +0.044 |
babys | +0.044 |
Neg logit contributions | |
sorts | -0.075 |
OK | -0.075 |
ites | -0.075 |
cer | -0.074 |
cy | -0.074 |
Token | something |
Token ID | 1223 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
ache | +0.016 |
sob | +0.015 |
dentist | +0.014 |
throat | +0.014 |
maid | +0.014 |
Neg logit contributions | |
ised | -0.018 |
Mine | -0.018 |
sorts | -0.018 |
OK | -0.018 |
atch | -0.018 |
Token | she |
Token ID | 673 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
dentist | +0.031 |
sob | +0.031 |
Nib | +0.029 |
throat | +0.029 |
babys | +0.029 |
Neg logit contributions | |
sorts | -0.044 |
OK | -0.043 |
atch | -0.042 |
mer | -0.042 |
ites | -0.042 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
sorts | +0.057 |
Run | +0.057 |
about | +0.056 |
cer | +0.056 |
Wow | +0.056 |
Neg logit contributions | |
sob | -0.056 |
Nib | -0.055 |
dentist | -0.054 |
babys | -0.053 |
Her | -0.052 |
Token | He |
Token ID | 679 |
Feature activation | +5.81e-01 |
Pos logit contributions | |
Run | +0.004 |
sorts | +0.004 |
ites | +0.004 |
Wow | +0.004 |
atch | +0.004 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
throat | -0.003 |
Token | then |
Token ID | 788 |
Feature activation | +6.62e-01 |
Pos logit contributions | |
Run | +0.012 |
sorts | +0.012 |
OK | +0.012 |
ites | +0.012 |
Wow | +0.012 |
Neg logit contributions | |
sob | -0.010 |
Nib | -0.010 |
dentist | -0.010 |
anywhere | -0.010 |
babys | -0.010 |
Token | gave |
Token ID | 2921 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
Run | +0.015 |
sorts | +0.014 |
OK | +0.014 |
ites | +0.014 |
Wow | +0.014 |
Neg logit contributions | |
sob | -0.012 |
Nib | -0.011 |
dentist | -0.011 |
anywhere | -0.011 |
babys | -0.011 |
Token | her |
Token ID | 607 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
cy | +0.003 |
sorts | +0.002 |
Wow | +0.002 |
cer | +0.002 |
Mine | +0.002 |
Neg logit contributions | |
ache | -0.002 |
sob | -0.002 |
dentist | -0.002 |
throat | -0.002 |
babys | -0.002 |
Token | daughter |
Token ID | 4957 |
Feature activation | -7.96e+00 |
Pos logit contributions | |
sob | +0.117 |
dentist | +0.111 |
Nib | +0.111 |
ache | +0.110 |
anywhere | +0.105 |
Neg logit contributions | |
sorts | -0.141 |
cy | -0.138 |
ee | -0.130 |
cer | -0.130 |
about | -0.129 |
Token | some |
Token ID | 617 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
sob | +0.142 |
dentist | +0.141 |
ache | +0.139 |
Nib | +0.136 |
babys | +0.135 |
Neg logit contributions | |
sorts | -0.177 |
cy | -0.165 |
about | -0.159 |
ee | -0.158 |
Mine | -0.157 |
Token | medicine |
Token ID | 9007 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
sob | +0.019 |
Nib | +0.018 |
dentist | +0.018 |
babys | +0.017 |
anywhere | +0.017 |
Neg logit contributions | |
Run | -0.025 |
sorts | -0.025 |
ites | -0.025 |
OK | -0.025 |
Wow | -0.025 |
Token | to |
Token ID | 284 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
sob | +0.020 |
Nib | +0.020 |
dentist | +0.020 |
babys | +0.019 |
maid | +0.019 |
Neg logit contributions | |
sorts | -0.025 |
Run | -0.025 |
ites | -0.025 |
OK | -0.025 |
akes | -0.025 |
Token | take |
Token ID | 1011 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
sorts | +0.007 |
OK | +0.007 |
Run | +0.007 |
cy | +0.007 |
atch | +0.007 |
Neg logit contributions | |
dentist | -0.007 |
sob | -0.007 |
anywhere | -0.007 |
ache | -0.007 |
maid | -0.007 |
Token | every |
Token ID | 790 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
sorts | +0.026 |
cy | +0.025 |
OK | +0.025 |
akes | +0.025 |
Run | +0.025 |
Neg logit contributions | |
sob | -0.018 |
dentist | -0.018 |
babys | -0.016 |
maid | -0.016 |
ache | -0.016 |
Token | you |
Token ID | 345 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
Run | +0.006 |
sorts | +0.006 |
ites | +0.006 |
Wow | +0.006 |
atch | +0.006 |
Neg logit contributions | |
sob | -0.005 |
Nib | -0.005 |
dentist | -0.005 |
babys | -0.005 |
throat | -0.005 |
Token | ." |
Token ID | 526 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
dentist | +0.036 |
sob | +0.036 |
Nib | +0.035 |
babys | +0.035 |
ache | +0.033 |
Neg logit contributions | |
sorts | -0.030 |
akes | -0.029 |
OK | -0.029 |
cer | -0.028 |
mer | -0.028 |
Token | She |
Token ID | 1375 |
Feature activation | +6.41e-01 |
Pos logit contributions | |
anywhere | +0.034 |
ache | +0.033 |
dentist | +0.029 |
ocket | +0.029 |
gag | +0.028 |
Neg logit contributions | |
Wow | -0.035 |
cy | -0.035 |
sorts | -0.034 |
OK | -0.033 |
ites | -0.033 |
Token | showed |
Token ID | 3751 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
Run | +0.014 |
sorts | +0.014 |
OK | +0.014 |
about | +0.014 |
ites | +0.014 |
Neg logit contributions | |
sob | -0.011 |
Nib | -0.011 |
dentist | -0.011 |
anywhere | -0.011 |
babys | -0.011 |
Token | her |
Token ID | 607 |
Feature activation | -6.62e+00 |
Pos logit contributions | |
ache | +0.042 |
gag | +0.038 |
throat | +0.038 |
sob | +0.037 |
ppa | +0.037 |
Neg logit contributions | |
sorts | -0.049 |
Mine | -0.047 |
ee | -0.046 |
cy | -0.045 |
turns | -0.045 |
Token | daughter |
Token ID | 4957 |
Feature activation | -7.95e+00 |
Pos logit contributions | |
Nib | +0.088 |
ache | +0.084 |
ppa | +0.081 |
dentist | +0.077 |
sob | +0.077 |
Neg logit contributions | |
sorts | -0.184 |
cy | -0.169 |
ised | -0.168 |
Mine | -0.168 |
kinds | -0.167 |
Token | how |
Token ID | 703 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ache | +0.167 |
dentist | +0.160 |
ppa | +0.157 |
babys | +0.152 |
Nib | +0.151 |
Neg logit contributions | |
sorts | -0.169 |
kinds | -0.143 |
about | -0.141 |
pitch | -0.140 |
pitches | -0.138 |
Token | she |
Token ID | 673 |
Feature activation | +7.05e-01 |
Pos logit contributions | |
sorts | +0.004 |
ites | +0.004 |
OK | +0.004 |
able | +0.004 |
atch | +0.003 |
Neg logit contributions | |
Nib | -0.002 |
dentist | -0.002 |
sob | -0.002 |
maid | -0.002 |
ppa | -0.002 |
Token | could |
Token ID | 714 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
akes | +0.016 |
Wow | +0.016 |
ites | +0.016 |
Run | +0.016 |
about | +0.016 |
Neg logit contributions | |
sob | -0.013 |
Nib | -0.012 |
dentist | -0.012 |
ache | -0.011 |
doctor | -0.011 |
Token | make |
Token ID | 787 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
sob | +0.020 |
Nib | +0.020 |
dentist | +0.020 |
babys | +0.019 |
ache | +0.019 |
Neg logit contributions | |
Run | -0.021 |
sorts | -0.021 |
ites | -0.020 |
atch | -0.020 |
Wow | -0.020 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
ache | +0.024 |
sob | +0.023 |
ppa | +0.023 |
throat | +0.023 |
babys | +0.023 |
Neg logit contributions | |
sorts | -0.030 |
about | -0.028 |
pitches | -0.028 |
ised | -0.027 |
ites | -0.027 |
Token | would |
Token ID | 561 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
sob | +0.005 |
dentist | +0.005 |
doctor | +0.004 |
Nib | +0.004 |
ache | +0.004 |
Neg logit contributions | |
Run | -0.007 |
Wow | -0.007 |
atch | -0.007 |
sorts | -0.007 |
Mine | -0.007 |
Token | try |
Token ID | 1949 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
ites | +0.003 |
Wow | +0.003 |
ang | +0.003 |
Run | +0.003 |
cer | +0.003 |
Neg logit contributions | |
sob | -0.002 |
dentist | -0.002 |
doctor | -0.002 |
Nib | -0.002 |
Her | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Nib | +0.025 |
sob | +0.025 |
ppa | +0.024 |
babys | +0.024 |
throat | +0.023 |
Neg logit contributions | |
sorts | -0.044 |
about | -0.043 |
atch | -0.041 |
ites | -0.041 |
blows | -0.041 |
Token | show |
Token ID | 905 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
sob | +0.018 |
dentist | +0.016 |
doctor | +0.016 |
anywhere | +0.016 |
Her | +0.016 |
Neg logit contributions | |
ang | -0.025 |
Wow | -0.025 |
Run | -0.024 |
ites | -0.024 |
acked | -0.024 |
Token | his |
Token ID | 465 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
sob | +0.024 |
ache | +0.024 |
ppa | +0.023 |
Nib | +0.023 |
dentist | +0.023 |
Neg logit contributions | |
sorts | -0.034 |
Wow | -0.032 |
Run | -0.032 |
cer | -0.032 |
about | -0.032 |
Token | daughter |
Token ID | 4957 |
Feature activation | -7.94e+00 |
Pos logit contributions | |
sob | +0.072 |
Nib | +0.072 |
dentist | +0.066 |
ppa | +0.066 |
ache | +0.065 |
Neg logit contributions | |
sorts | -0.129 |
about | -0.127 |
OK | -0.127 |
Run | -0.126 |
ites | -0.126 |
Token | how |
Token ID | 703 |
Feature activation | +7.94e-02 |
Pos logit contributions | |
sob | +0.154 |
ppa | +0.154 |
ache | +0.151 |
dentist | +0.148 |
Nib | +0.148 |
Neg logit contributions | |
sorts | -0.175 |
about | -0.159 |
wins | -0.155 |
kinds | -0.155 |
pitches | -0.151 |
Token | to |
Token ID | 284 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
Run | +0.002 |
sorts | +0.002 |
ites | +0.002 |
Wow | +0.002 |
atch | +0.002 |
Neg logit contributions | |
sob | -0.001 |
Nib | -0.001 |
dentist | -0.001 |
babys | -0.001 |
throat | -0.001 |
Token | do |
Token ID | 466 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
sob | +0.004 |
Her | +0.004 |
doctor | +0.004 |
dentist | +0.004 |
not | +0.004 |
Neg logit contributions | |
Wow | -0.005 |
Run | -0.005 |
ang | -0.005 |
cer | -0.005 |
mer | -0.005 |
Token | new |
Token ID | 649 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
sob | +0.040 |
Nib | +0.039 |
babys | +0.038 |
dentist | +0.038 |
ache | +0.037 |
Neg logit contributions | |
sorts | -0.052 |
about | -0.051 |
ites | -0.050 |
Run | -0.050 |
atch | -0.049 |
Token | things |
Token ID | 1243 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
Run | +0.009 |
Wow | +0.008 |
OK | +0.008 |
atch | +0.008 |
ites | +0.008 |
Neg logit contributions | |
sob | -0.010 |
dentist | -0.010 |
Nib | -0.010 |
babys | -0.010 |
doctor | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
sorts | +0.007 |
ites | +0.007 |
atch | +0.007 |
Wow | +0.007 |
Run | +0.007 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
Her | -0.003 |
babys | -0.003 |
dentist | -0.003 |
Token | Mom |
Token ID | 11254 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
sob | +0.003 |
Her | +0.003 |
Nib | +0.003 |
anywhere | +0.003 |
babys | +0.002 |
Neg logit contributions | |
ites | -0.010 |
sorts | -0.010 |
atch | -0.010 |
akes | -0.010 |
about | -0.010 |
Token | my |
Token ID | 1820 |
Feature activation | +9.80e-01 |
Pos logit contributions | |
dentist | +0.010 |
sob | +0.010 |
Her | +0.010 |
babys | +0.009 |
mom | +0.009 |
Neg logit contributions | |
ites | -0.033 |
mer | -0.032 |
Run | -0.032 |
ang | -0.032 |
ised | -0.032 |
Token | gave |
Token ID | 2921 |
Feature activation | -3.78e-01 |
Pos logit contributions | |
ites | +0.028 |
mer | +0.027 |
Wow | +0.027 |
ang | +0.027 |
Mine | +0.027 |
Neg logit contributions | |
sob | -0.013 |
crying | -0.013 |
Her | -0.012 |
babys | -0.012 |
dentist | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -5.36e+00 |
Pos logit contributions | |
sob | +0.005 |
Nib | +0.005 |
ache | +0.005 |
dentist | +0.005 |
throat | +0.005 |
Neg logit contributions | |
sorts | -0.010 |
Wow | -0.010 |
cy | -0.009 |
Run | -0.009 |
atch | -0.009 |
Token | daughter |
Token ID | 4957 |
Feature activation | -7.93e+00 |
Pos logit contributions | |
ache | +0.094 |
sob | +0.093 |
Nib | +0.092 |
ppa | +0.089 |
ocket | +0.087 |
Neg logit contributions | |
sorts | -0.122 |
cy | -0.117 |
about | -0.113 |
Wow | -0.112 |
Run | -0.111 |
Token | a |
Token ID | 257 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
sob | +0.147 |
ache | +0.147 |
Nib | +0.138 |
anywhere | +0.137 |
dentist | +0.137 |
Neg logit contributions | |
sorts | -0.180 |
cy | -0.166 |
about | -0.159 |
ee | -0.155 |
ites | -0.154 |
Token | new |
Token ID | 649 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
sob | +0.032 |
Nib | +0.032 |
ppa | +0.031 |
dentist | +0.030 |
ache | +0.030 |
Neg logit contributions | |
sorts | -0.036 |
OK | -0.035 |
Run | -0.035 |
Wow | -0.035 |
about | -0.035 |
Token | box |
Token ID | 3091 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
ites | +0.040 |
Run | +0.040 |
Wow | +0.040 |
atch | +0.040 |
ang | +0.039 |
Neg logit contributions | |
sob | -0.033 |
babys | -0.032 |
dentist | -0.032 |
Nib | -0.031 |
doctor | -0.031 |
Token | of |
Token ID | 286 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
sob | +0.019 |
Nib | +0.018 |
dentist | +0.018 |
babys | +0.018 |
throat | +0.018 |
Neg logit contributions | |
Run | -0.031 |
Wow | -0.031 |
ites | -0.031 |
sorts | -0.031 |
atch | -0.031 |
Token | cr |
Token ID | 1067 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
sorts | +0.025 |
Run | +0.025 |
ites | +0.025 |
Wow | +0.025 |
OK | +0.025 |
Neg logit contributions | |
sob | -0.026 |
Nib | -0.025 |
dentist | -0.025 |
ache | -0.025 |
babys | -0.024 |
Token | a |
Token ID | 257 |
Feature activation | +9.55e-01 |
Pos logit contributions | |
babys | +0.016 |
ache | +0.016 |
ppa | +0.016 |
Nib | +0.016 |
throat | +0.015 |
Neg logit contributions | |
Wow | -0.018 |
Run | -0.018 |
sorts | -0.018 |
OK | -0.017 |
Mine | -0.017 |
Token | time |
Token ID | 640 |
Feature activation | +5.15e-01 |
Pos logit contributions | |
ites | +0.020 |
Wow | +0.018 |
cer | +0.018 |
sorts | +0.018 |
about | +0.018 |
Neg logit contributions | |
sob | -0.020 |
dentist | -0.019 |
Her | -0.018 |
stomach | -0.018 |
Nib | -0.018 |
Token | there |
Token ID | 612 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Run | +0.012 |
Wow | +0.012 |
sorts | +0.012 |
ang | +0.012 |
atch | +0.012 |
Neg logit contributions | |
sob | -0.009 |
dentist | -0.008 |
ache | -0.008 |
Nib | -0.008 |
ppa | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
sorts | +0.028 |
Wow | +0.028 |
Run | +0.027 |
cy | +0.027 |
about | +0.027 |
Neg logit contributions | |
sob | -0.030 |
ache | -0.030 |
dentist | -0.030 |
ppa | -0.030 |
Nib | -0.030 |
Token | a |
Token ID | 257 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
sob | +0.022 |
Nib | +0.021 |
dentist | +0.020 |
ache | +0.020 |
babys | +0.020 |
Neg logit contributions | |
Run | -0.044 |
sorts | -0.044 |
Wow | -0.044 |
ites | -0.044 |
atch | -0.043 |
Token | nos |
Token ID | 43630 |
Feature activation | +6.18e+00 |
Pos logit contributions | |
ites | +0.035 |
akes | +0.035 |
sorts | +0.034 |
atch | +0.034 |
acked | +0.034 |
Neg logit contributions | |
sob | -0.028 |
dentist | -0.028 |
doctor | -0.028 |
Nib | -0.027 |
babys | -0.027 |
Token | y |
Token ID | 88 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
Run | +0.063 |
OK | +0.063 |
atch | +0.063 |
ites | +0.061 |
Wow | +0.060 |
Neg logit contributions | |
sob | -0.181 |
Nib | -0.179 |
dentist | -0.177 |
ache | -0.176 |
babys | -0.175 |
Token | girl |
Token ID | 2576 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
ites | +0.092 |
sorts | +0.091 |
atch | +0.090 |
Run | +0.090 |
akes | +0.089 |
Neg logit contributions | |
sob | -0.075 |
Nib | -0.073 |
dentist | -0.073 |
babys | -0.071 |
doctor | -0.070 |
Token | . |
Token ID | 13 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
sob | +0.021 |
dentist | +0.020 |
Nib | +0.020 |
ache | +0.020 |
anywhere | +0.020 |
Neg logit contributions | |
ang | -0.023 |
sorts | -0.023 |
cy | -0.023 |
ites | -0.022 |
cer | -0.022 |
Token | She |
Token ID | 1375 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
Wow | +0.032 |
sorts | +0.032 |
OK | +0.031 |
about | +0.031 |
Run | +0.031 |
Neg logit contributions | |
sob | -0.023 |
Nib | -0.023 |
ache | -0.023 |
ppa | -0.022 |
dentist | -0.022 |
Token | was |
Token ID | 373 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
OK | +0.034 |
sorts | +0.034 |
Wow | +0.034 |
Run | +0.034 |
atch | +0.033 |
Neg logit contributions | |
sob | -0.059 |
Nib | -0.058 |
dentist | -0.057 |
anywhere | -0.057 |
babys | -0.056 |
Token | time |
Token ID | 640 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
ites | +0.021 |
Run | +0.020 |
Wow | +0.020 |
sorts | +0.019 |
cer | +0.019 |
Neg logit contributions | |
sob | -0.023 |
dentist | -0.022 |
Her | -0.022 |
stomach | -0.021 |
Nib | -0.021 |
Token | , |
Token ID | 11 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
Run | +0.007 |
sorts | +0.006 |
ites | +0.006 |
atch | +0.006 |
Wow | +0.006 |
Neg logit contributions | |
sob | -0.004 |
dentist | -0.004 |
Nib | -0.004 |
ache | -0.004 |
throat | -0.004 |
Token | there |
Token ID | 612 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
sob | +0.019 |
Nib | +0.018 |
anywhere | +0.017 |
Her | +0.017 |
doctor | +0.016 |
Neg logit contributions | |
ites | -0.033 |
sorts | -0.033 |
about | -0.032 |
atch | -0.032 |
akes | -0.032 |
Token | was |
Token ID | 373 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
sorts | +0.021 |
Wow | +0.021 |
Run | +0.021 |
about | +0.021 |
OK | +0.021 |
Neg logit contributions | |
sob | -0.021 |
Nib | -0.021 |
dentist | -0.021 |
ache | -0.020 |
babys | -0.020 |
Token | a |
Token ID | 257 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
sob | +0.020 |
Nib | +0.019 |
dentist | +0.019 |
babys | +0.018 |
throat | +0.018 |
Neg logit contributions | |
Run | -0.045 |
ites | -0.045 |
sorts | -0.045 |
Wow | -0.045 |
atch | -0.045 |
Token | tall |
Token ID | 7331 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
ites | +0.036 |
akes | +0.035 |
atch | +0.035 |
sorts | +0.035 |
acked | +0.034 |
Neg logit contributions | |
sob | -0.028 |
dentist | -0.028 |
doctor | -0.028 |
Nib | -0.027 |
babys | -0.027 |
Token | gir |
Token ID | 37370 |
Feature activation | +4.10e+00 |
Pos logit contributions | |
akes | +0.159 |
Mine | +0.158 |
acked | +0.158 |
ites | +0.158 |
sorts | +0.158 |
Neg logit contributions | |
dentist | -0.102 |
doctor | -0.102 |
mom | -0.091 |
stomach | -0.091 |
Prince | -0.090 |
Token | affe |
Token ID | 21223 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
Run | +0.077 |
Wow | +0.076 |
OK | +0.075 |
sorts | +0.075 |
Mine | +0.074 |
Neg logit contributions | |
ache | -0.086 |
dentist | -0.086 |
sob | -0.085 |
Nib | -0.085 |
doctor | -0.082 |
Token | named |
Token ID | 3706 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
sob | +0.003 |
Nib | +0.003 |
babys | +0.003 |
dentist | +0.002 |
anywhere | +0.002 |
Neg logit contributions | |
ang | -0.003 |
sorts | -0.003 |
ites | -0.003 |
Run | -0.003 |
cer | -0.003 |
Token | Jerry |
Token ID | 13075 |
Feature activation | -6.59e-02 |
Pos logit contributions | |
sob | +0.037 |
dentist | +0.034 |
throat | +0.034 |
ache | +0.034 |
babys | +0.034 |
Neg logit contributions | |
Wow | -0.049 |
Run | -0.048 |
sorts | -0.048 |
atch | -0.048 |
ites | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
sob | +0.001 |
babys | +0.001 |
dentist | +0.001 |
throat | +0.001 |
grandmother | +0.001 |
Neg logit contributions | |
sorts | -0.001 |
cer | -0.001 |
ang | -0.001 |
atch | -0.001 |
cy | -0.001 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
sob | +0.001 |
dentist | +0.001 |
doctor | +0.001 |
grandmother | +0.001 |
Her | +0.001 |
Neg logit contributions | |
akes | -0.001 |
cy | -0.001 |
cer | -0.001 |
ites | -0.001 |
mer | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
Run | +0.062 |
sorts | +0.061 |
Wow | +0.060 |
about | +0.060 |
OK | +0.060 |
Neg logit contributions | |
sob | -0.040 |
Nib | -0.039 |
dentist | -0.038 |
ache | -0.038 |
ppa | -0.038 |
Token | a |
Token ID | 257 |
Feature activation | +2.17e+00 |
Pos logit contributions | |
Run | +0.029 |
sorts | +0.029 |
Wow | +0.029 |
ites | +0.029 |
OK | +0.029 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.015 |
dentist | -0.015 |
ache | -0.015 |
babys | -0.015 |
Token | big |
Token ID | 1263 |
Feature activation | +5.96e+00 |
Pos logit contributions | |
Run | +0.044 |
sorts | +0.043 |
Wow | +0.043 |
ites | +0.043 |
OK | +0.043 |
Neg logit contributions | |
sob | -0.042 |
Nib | -0.041 |
dentist | -0.040 |
babys | -0.039 |
anywhere | -0.039 |
Token | blue |
Token ID | 4171 |
Feature activation | +4.92e+00 |
Pos logit contributions | |
akes | +0.138 |
ites | +0.138 |
acked | +0.134 |
atch | +0.132 |
cer | +0.129 |
Neg logit contributions | |
sob | -0.112 |
doctor | -0.111 |
dentist | -0.110 |
babys | -0.105 |
crying | -0.104 |
Token | j |
Token ID | 474 |
Feature activation | +7.61e+00 |
Pos logit contributions | |
ites | +0.124 |
sorts | +0.122 |
atch | +0.121 |
akes | +0.119 |
iling | +0.119 |
Neg logit contributions | |
doctor | -0.080 |
dentist | -0.076 |
babys | -0.075 |
grandmother | -0.073 |
throat | -0.073 |
Token | ay |
Token ID | 323 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
Wow | +0.201 |
Run | +0.183 |
Mine | +0.179 |
OK | +0.178 |
Quick | +0.176 |
Neg logit contributions | |
doctor | -0.127 |
stomach | -0.121 |
babys | -0.121 |
dentist | -0.120 |
ache | -0.119 |
Token | landed |
Token ID | 11406 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
ites | +0.039 |
sorts | +0.039 |
OK | +0.039 |
akes | +0.039 |
atch | +0.039 |
Neg logit contributions | |
sob | -0.035 |
dentist | -0.033 |
doctor | -0.033 |
ache | -0.033 |
babys | -0.033 |
Token | on |
Token ID | 319 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
sorts | +0.110 |
akes | +0.105 |
Mine | +0.104 |
Wow | +0.104 |
OK | +0.104 |
Neg logit contributions | |
sob | -0.072 |
Nib | -0.067 |
doctor | -0.066 |
dentist | -0.066 |
anywhere | -0.065 |
Token | the |
Token ID | 262 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
sorts | +0.086 |
Wow | +0.086 |
Run | +0.085 |
about | +0.083 |
OK | +0.082 |
Neg logit contributions | |
sob | -0.071 |
Nib | -0.069 |
ache | -0.069 |
ppa | -0.067 |
dentist | -0.067 |
Token | post |
Token ID | 1281 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
sorts | +0.000 |
ites | +0.000 |
akes | +0.000 |
Run | +0.000 |
ang | +0.000 |
Neg logit contributions | |
sob | -0.000 |
dentist | -0.000 |
Nib | -0.000 |
babys | -0.000 |
anywhere | -0.000 |
Token | trouble |
Token ID | 5876 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
Run | +0.059 |
sorts | +0.059 |
Wow | +0.058 |
cer | +0.056 |
Mine | +0.056 |
Neg logit contributions | |
sob | -0.051 |
Nib | -0.049 |
ppa | -0.049 |
ache | -0.048 |
dentist | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
Run | +0.044 |
sorts | +0.043 |
ites | +0.043 |
atch | +0.043 |
about | +0.043 |
Neg logit contributions | |
sob | -0.026 |
Nib | -0.026 |
dentist | -0.025 |
babys | -0.024 |
throat | -0.024 |
Token | The |
Token ID | 383 |
Feature activation | +5.19e-01 |
Pos logit contributions | |
Wow | +0.017 |
Run | +0.016 |
sorts | +0.016 |
OK | +0.016 |
ised | +0.016 |
Neg logit contributions | |
dentist | -0.016 |
anywhere | -0.016 |
ache | -0.016 |
sob | -0.015 |
ppa | -0.015 |
Token | farmer |
Token ID | 18739 |
Feature activation | -9.48e-01 |
Pos logit contributions | |
Run | +0.011 |
sorts | +0.011 |
ites | +0.011 |
Wow | +0.011 |
atch | +0.011 |
Neg logit contributions | |
sob | -0.010 |
Nib | -0.009 |
dentist | -0.009 |
babys | -0.009 |
throat | -0.009 |
Token | gently |
Token ID | 15165 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
Nib | +0.018 |
dentist | +0.018 |
anywhere | +0.018 |
sob | +0.018 |
throat | +0.018 |
Neg logit contributions | |
Run | -0.019 |
ang | -0.018 |
sorts | -0.018 |
ites | -0.018 |
atch | -0.018 |
Token | unt |
Token ID | 1418 |
Feature activation | +6.69e+00 |
Pos logit contributions | |
Run | +0.025 |
sorts | +0.025 |
ites | +0.025 |
Wow | +0.025 |
atch | +0.025 |
Neg logit contributions | |
sob | -0.026 |
Nib | -0.025 |
dentist | -0.025 |
babys | -0.025 |
throat | -0.024 |
Token | angled |
Token ID | 22393 |
Feature activation | +7.00e-01 |
Pos logit contributions | |
Run | +0.134 |
OK | +0.131 |
Wow | +0.130 |
sorts | +0.130 |
about | +0.128 |
Neg logit contributions | |
Nib | -0.131 |
sob | -0.130 |
ppa | -0.126 |
anywhere | -0.124 |
Her | -0.123 |
Token | Benny |
Token ID | 44275 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
Run | +0.017 |
Wow | +0.017 |
atch | +0.017 |
ites | +0.016 |
cer | +0.016 |
Neg logit contributions | |
sob | -0.011 |
dentist | -0.011 |
ache | -0.010 |
babys | -0.010 |
throat | -0.010 |
Token | 's |
Token ID | 338 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
sob | +0.051 |
Nib | +0.049 |
dentist | +0.047 |
ache | +0.047 |
anywhere | +0.047 |
Neg logit contributions | |
Run | -0.070 |
Wow | -0.070 |
ites | -0.070 |
sorts | -0.069 |
OK | -0.069 |
Token | horns |
Token ID | 26771 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
sob | +0.079 |
Nib | +0.078 |
dentist | +0.077 |
babys | +0.074 |
anywhere | +0.073 |
Neg logit contributions | |
Run | -0.102 |
sorts | -0.101 |
ites | -0.101 |
OK | -0.101 |
atch | -0.100 |
Token | from |
Token ID | 422 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
sob | +0.022 |
Nib | +0.022 |
dentist | +0.021 |
babys | +0.021 |
ache | +0.021 |
Neg logit contributions | |
Run | -0.019 |
sorts | -0.019 |
ites | -0.019 |
Wow | -0.019 |
atch | -0.019 |
Token | away |
Token ID | 1497 |
Feature activation | +8.43e-01 |
Pos logit contributions | |
sorts | +0.046 |
Wow | +0.045 |
Run | +0.045 |
OK | +0.044 |
about | +0.044 |
Neg logit contributions | |
sob | -0.042 |
dentist | -0.041 |
ache | -0.041 |
babys | -0.040 |
throat | -0.040 |
Token | and |
Token ID | 290 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
sorts | +0.018 |
Run | +0.018 |
ites | +0.017 |
OK | +0.017 |
about | +0.017 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.015 |
dentist | -0.015 |
babys | -0.015 |
ache | -0.015 |
Token | landed |
Token ID | 11406 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
Run | +0.011 |
sorts | +0.011 |
Wow | +0.010 |
ites | +0.010 |
OK | +0.010 |
Neg logit contributions | |
sob | -0.011 |
Nib | -0.011 |
dentist | -0.011 |
babys | -0.010 |
ache | -0.010 |
Token | in |
Token ID | 287 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
ang | +0.039 |
Run | +0.039 |
ab | +0.039 |
mer | +0.038 |
cer | +0.038 |
Neg logit contributions | |
sob | -0.047 |
dentist | -0.045 |
babys | -0.045 |
grandmother | -0.045 |
ache | -0.044 |
Token | a |
Token ID | 257 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
sorts | +0.044 |
Run | +0.043 |
Wow | +0.043 |
OK | +0.043 |
about | +0.043 |
Neg logit contributions | |
sob | -0.024 |
Nib | -0.023 |
ache | -0.022 |
dentist | -0.022 |
babys | -0.022 |
Token | deep |
Token ID | 2769 |
Feature activation | +6.59e+00 |
Pos logit contributions | |
Run | +0.021 |
sorts | +0.021 |
Wow | +0.021 |
ites | +0.021 |
OK | +0.021 |
Neg logit contributions | |
sob | -0.024 |
Nib | -0.023 |
dentist | -0.023 |
babys | -0.022 |
Her | -0.022 |
Token | dark |
Token ID | 3223 |
Feature activation | +5.12e+00 |
Pos logit contributions | |
ites | +0.148 |
OK | +0.147 |
akes | +0.147 |
Run | +0.144 |
Wow | +0.144 |
Neg logit contributions | |
sob | -0.122 |
throat | -0.119 |
Nib | -0.118 |
stomach | -0.116 |
doctor | -0.113 |
Token | forest |
Token ID | 8222 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
ites | +0.110 |
OK | +0.108 |
atch | +0.107 |
Run | +0.107 |
Mine | +0.105 |
Neg logit contributions | |
sob | -0.099 |
dentist | -0.097 |
doctor | -0.095 |
throat | -0.095 |
Nib | -0.094 |
Token | , |
Token ID | 11 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
sorts | +0.045 |
Run | +0.045 |
ites | +0.045 |
atch | +0.045 |
about | +0.045 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
dentist | -0.026 |
babys | -0.025 |
Her | -0.025 |
Token | far |
Token ID | 1290 |
Feature activation | +6.23e+00 |
Pos logit contributions | |
sob | +0.003 |
Nib | +0.002 |
dentist | +0.002 |
anywhere | +0.002 |
throat | +0.002 |
Neg logit contributions | |
ites | -0.005 |
akes | -0.005 |
about | -0.005 |
atch | -0.005 |
Wow | -0.005 |
Token | away |
Token ID | 1497 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
akes | +0.175 |
ites | +0.175 |
sorts | +0.167 |
atch | +0.166 |
Run | +0.166 |
Neg logit contributions | |
anywhere | -0.080 |
Nib | -0.079 |
sob | -0.077 |
doctor | -0.074 |
ache | -0.072 |
Token | her |
Token ID | 607 |
Feature activation | -4.42e+00 |
Pos logit contributions | |
ache | +0.019 |
Nib | +0.016 |
ppa | +0.016 |
ridge | +0.016 |
sob | +0.015 |
Neg logit contributions | |
sorts | -0.024 |
Mine | -0.022 |
Wow | -0.022 |
kinds | -0.021 |
OK | -0.021 |
Token | mom |
Token ID | 1995 |
Feature activation | -4.71e+00 |
Pos logit contributions | |
ache | +0.064 |
ppa | +0.062 |
sob | +0.060 |
ridge | +0.058 |
gag | +0.054 |
Neg logit contributions | |
cy | -0.119 |
sorts | -0.117 |
Wow | -0.115 |
OK | -0.113 |
gol | -0.112 |
Token | . |
Token ID | 13 |
Feature activation | +9.19e-01 |
Pos logit contributions | |
sob | +0.093 |
Nib | +0.089 |
ache | +0.088 |
dentist | +0.087 |
throat | +0.085 |
Neg logit contributions | |
sorts | -0.100 |
cy | -0.100 |
atch | -0.096 |
ites | -0.094 |
cer | -0.093 |
Token | The |
Token ID | 383 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
Run | +0.017 |
ites | +0.017 |
atch | +0.017 |
sorts | +0.017 |
ang | +0.016 |
Neg logit contributions | |
sob | -0.020 |
Nib | -0.019 |
dentist | -0.019 |
Her | -0.019 |
babys | -0.019 |
Token | museum |
Token ID | 13257 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
ites | +0.009 |
Run | +0.009 |
akes | +0.009 |
ised | +0.009 |
cer | +0.009 |
Neg logit contributions | |
dentist | -0.011 |
Nib | -0.011 |
babys | -0.011 |
doctor | -0.011 |
maid | -0.011 |
Token | had |
Token ID | 550 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Run | +0.027 |
akes | +0.026 |
atch | +0.026 |
ites | +0.026 |
ang | +0.026 |
Neg logit contributions | |
sob | -0.019 |
dentist | -0.019 |
doctor | -0.018 |
babys | -0.018 |
Nib | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
sorts | +0.032 |
Wow | +0.032 |
Run | +0.031 |
OK | +0.031 |
ites | +0.031 |
Neg logit contributions | |
sob | -0.030 |
Nib | -0.029 |
ache | -0.028 |
ppa | -0.028 |
babys | -0.027 |
Token | big |
Token ID | 1263 |
Feature activation | +4.14e+00 |
Pos logit contributions | |
ites | +0.008 |
Run | +0.008 |
atch | +0.008 |
akes | +0.008 |
sorts | +0.008 |
Neg logit contributions | |
sob | -0.007 |
dentist | -0.007 |
Nib | -0.007 |
babys | -0.007 |
doctor | -0.006 |
Token | garden |
Token ID | 11376 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ites | +0.101 |
Run | +0.099 |
ang | +0.097 |
ised | +0.096 |
Quick | +0.096 |
Neg logit contributions | |
dentist | -0.074 |
stomach | -0.073 |
throat | -0.072 |
babys | -0.071 |
doctor | -0.071 |
Token | with |
Token ID | 351 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
Run | +0.010 |
Wow | +0.010 |
Quick | +0.010 |
ites | +0.010 |
Uh | +0.010 |
Neg logit contributions | |
sob | -0.006 |
dentist | -0.005 |
doctor | -0.005 |
throat | -0.005 |
Nib | -0.005 |
Token | many |
Token ID | 867 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
sob | +0.016 |
ache | +0.015 |
Nib | +0.015 |
ppa | +0.015 |
dentist | +0.015 |
Neg logit contributions | |
sorts | -0.014 |
Wow | -0.014 |
ites | -0.013 |
Run | -0.013 |
about | -0.013 |
Token | learn |
Token ID | 2193 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
sorts | +0.015 |
pitch | +0.014 |
atch | +0.013 |
OK | +0.013 |
about | +0.013 |
Neg logit contributions | |
ache | -0.021 |
ppa | -0.020 |
sob | -0.020 |
babys | -0.019 |
Nib | -0.019 |
Token | about |
Token ID | 546 |
Feature activation | -2.65e+00 |
Pos logit contributions | |
sob | +0.060 |
throat | +0.058 |
Nib | +0.058 |
babys | +0.057 |
ppa | +0.056 |
Neg logit contributions | |
sorts | -0.082 |
ites | -0.079 |
about | -0.078 |
atch | -0.076 |
cer | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
sob | +0.051 |
ache | +0.050 |
throat | +0.050 |
babys | +0.049 |
ppa | +0.049 |
Neg logit contributions | |
sorts | -0.056 |
ites | -0.053 |
atch | -0.052 |
about | -0.052 |
Wow | -0.051 |
Token |
|
Token ID | 198 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
ache | +0.022 |
sob | +0.021 |
ppa | +0.020 |
throat | +0.020 |
babys | +0.019 |
Neg logit contributions | |
sorts | -0.025 |
Wow | -0.025 |
cy | -0.024 |
akes | -0.024 |
OK | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
throat | +0.026 |
ache | +0.026 |
Nib | +0.024 |
sob | +0.024 |
ppa | +0.024 |
Neg logit contributions | |
sorts | -0.023 |
Wow | -0.022 |
ang | -0.021 |
ites | -0.021 |
ee | -0.021 |
Token | One |
Token ID | 3198 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
cer | +0.004 |
mer | +0.004 |
ites | +0.004 |
Run | +0.004 |
akes | +0.004 |
Neg logit contributions | |
sob | -0.003 |
Her | -0.003 |
dentist | -0.003 |
doctor | -0.003 |
Nib | -0.003 |
Token | day |
Token ID | 1110 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
ites | +0.032 |
Run | +0.031 |
atch | +0.031 |
about | +0.030 |
akes | +0.030 |
Neg logit contributions | |
sob | -0.057 |
dentist | -0.057 |
Nib | -0.056 |
Her | -0.056 |
doctor | -0.056 |
Token | , |
Token ID | 11 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
Run | +0.037 |
Wow | +0.036 |
sorts | +0.036 |
ites | +0.036 |
OK | +0.036 |
Neg logit contributions | |
sob | -0.024 |
dentist | -0.023 |
Nib | -0.023 |
ache | -0.022 |
babys | -0.022 |
Token | she |
Token ID | 673 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
Wow | +0.038 |
Run | +0.037 |
OK | +0.036 |
cy | +0.036 |
sorts | +0.035 |
Neg logit contributions | |
ache | -0.022 |
dentist | -0.021 |
sob | -0.021 |
ppa | -0.021 |
Nib | -0.020 |
Token | was |
Token ID | 373 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
akes | +0.050 |
ites | +0.050 |
ang | +0.050 |
Wow | +0.049 |
Run | +0.048 |
Neg logit contributions | |
sob | -0.036 |
dentist | -0.033 |
doctor | -0.032 |
Nib | -0.032 |
babys | -0.032 |
Token | playing |
Token ID | 2712 |
Feature activation | +7.68e-01 |
Pos logit contributions | |
Nib | +0.018 |
ache | +0.017 |
dentist | +0.017 |
sob | +0.017 |
ppa | +0.016 |
Neg logit contributions | |
sorts | -0.021 |
ang | -0.021 |
atch | -0.021 |
Run | -0.021 |
ites | -0.021 |
Token | |
Token ID | 220 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
ache | +0.010 |
sob | +0.010 |
ppa | +0.010 |
throat | +0.009 |
maid | +0.009 |
Neg logit contributions | |
Wow | -0.013 |
sorts | -0.013 |
OK | -0.013 |
Run | -0.013 |
ites | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
Wow | +0.001 |
ites | +0.001 |
ang | +0.001 |
sorts | +0.001 |
akes | +0.001 |
Neg logit contributions | |
throat | -0.001 |
ache | -0.001 |
sob | -0.001 |
dentist | -0.001 |
Nib | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
throat | +0.018 |
ache | +0.018 |
maid | +0.017 |
sob | +0.017 |
Nib | +0.017 |
Neg logit contributions | |
sorts | -0.017 |
Wow | -0.017 |
ang | -0.016 |
ites | -0.016 |
OK | -0.016 |
Token | One |
Token ID | 3198 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
cer | +0.014 |
cy | +0.014 |
akes | +0.014 |
mer | +0.014 |
sorts | +0.014 |
Neg logit contributions | |
dentist | -0.010 |
sob | -0.010 |
Her | -0.010 |
doctor | -0.010 |
anywhere | -0.009 |
Token | day |
Token ID | 1110 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
ites | +0.034 |
Mine | +0.033 |
atch | +0.032 |
akes | +0.032 |
cer | +0.032 |
Neg logit contributions | |
doctor | -0.047 |
dentist | -0.047 |
sob | -0.046 |
Her | -0.045 |
mom | -0.045 |
Token | , |
Token ID | 11 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
sorts | +0.042 |
ites | +0.042 |
Run | +0.041 |
about | +0.041 |
ang | +0.041 |
Neg logit contributions | |
sob | -0.019 |
Nib | -0.019 |
dentist | -0.018 |
anywhere | -0.018 |
Her | -0.018 |
Token | Max |
Token ID | 5436 |
Feature activation | +7.27e-01 |
Pos logit contributions | |
Run | +0.030 |
sorts | +0.030 |
Wow | +0.030 |
ites | +0.030 |
OK | +0.030 |
Neg logit contributions | |
sob | -0.015 |
Nib | -0.015 |
dentist | -0.014 |
babys | -0.014 |
ache | -0.014 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
Run | +0.015 |
sorts | +0.015 |
ites | +0.015 |
Wow | +0.015 |
atch | +0.015 |
Neg logit contributions | |
sob | -0.014 |
Nib | -0.013 |
dentist | -0.013 |
babys | -0.013 |
throat | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | +5.93e-01 |
Pos logit contributions | |
ppa | +0.021 |
ocket | +0.021 |
alo | +0.021 |
ache | +0.021 |
throat | +0.020 |
Neg logit contributions | |
Run | -0.019 |
Wow | -0.019 |
Pull | -0.019 |
sorts | -0.019 |
pitch | -0.018 |
Token | squirrel |
Token ID | 33039 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
ites | +0.012 |
sorts | +0.012 |
akes | +0.012 |
Run | +0.012 |
atch | +0.012 |
Neg logit contributions | |
sob | -0.011 |
dentist | -0.011 |
Nib | -0.011 |
babys | -0.011 |
doctor | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Wow | +0.022 |
Run | +0.022 |
sorts | +0.022 |
OK | +0.022 |
ites | +0.021 |
Neg logit contributions | |
sob | -0.018 |
Nib | -0.018 |
dentist | -0.017 |
anywhere | -0.017 |
babys | -0.017 |
Token | enough |
Token ID | 1576 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
sorts | +0.037 |
ites | +0.036 |
Run | +0.036 |
atch | +0.035 |
about | +0.035 |
Neg logit contributions | |
sob | -0.027 |
Nib | -0.026 |
babys | -0.026 |
throat | -0.025 |
dentist | -0.025 |
Token | , |
Token ID | 11 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
ites | +0.043 |
Run | +0.042 |
OK | +0.042 |
sorts | +0.042 |
atch | +0.041 |
Neg logit contributions | |
sob | -0.039 |
ache | -0.039 |
dentist | -0.039 |
ppa | -0.038 |
babys | -0.037 |
Token | the |
Token ID | 262 |
Feature activation | -4.65e-01 |
Pos logit contributions | |
Run | +0.004 |
sorts | +0.004 |
Wow | +0.004 |
ites | +0.004 |
OK | +0.004 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
ache | -0.003 |
Token | steam |
Token ID | 13324 |
Feature activation | +8.09e-01 |
Pos logit contributions | |
sob | +0.011 |
Nib | +0.010 |
dentist | +0.010 |
babys | +0.010 |
throat | +0.010 |
Neg logit contributions | |
Run | -0.008 |
sorts | -0.008 |
ites | -0.008 |
Wow | -0.008 |
atch | -0.008 |
Token | began |
Token ID | 2540 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
sorts | +0.016 |
ites | +0.016 |
Wow | +0.016 |
atch | +0.016 |
Run | +0.016 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.015 |
dentist | -0.015 |
throat | -0.015 |
babys | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
sorts | +0.023 |
ites | +0.022 |
atch | +0.022 |
Run | +0.022 |
mer | +0.022 |
Neg logit contributions | |
dentist | -0.012 |
ppa | -0.011 |
Nib | -0.011 |
sob | -0.011 |
maid | -0.011 |
Token | display |
Token ID | 3359 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
ites | +0.040 |
Wow | +0.039 |
Run | +0.039 |
ang | +0.039 |
atch | +0.039 |
Neg logit contributions | |
sob | -0.033 |
Nib | -0.032 |
dentist | -0.031 |
babys | -0.030 |
throat | -0.030 |
Token | in |
Token ID | 287 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
sorts | +0.006 |
ites | +0.006 |
Wow | +0.006 |
cer | +0.006 |
about | +0.006 |
Neg logit contributions | |
sob | -0.004 |
dentist | -0.004 |
babys | -0.004 |
Nib | -0.004 |
ppa | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
Run | +0.036 |
sorts | +0.036 |
ites | +0.036 |
Wow | +0.036 |
atch | +0.036 |
Neg logit contributions | |
sob | -0.025 |
Nib | -0.024 |
dentist | -0.024 |
babys | -0.023 |
ache | -0.023 |
Token | air |
Token ID | 1633 |
Feature activation | +5.60e-01 |
Pos logit contributions | |
ites | +0.019 |
cer | +0.019 |
sorts | +0.019 |
Run | +0.019 |
akes | +0.019 |
Neg logit contributions | |
sob | -0.028 |
Nib | -0.027 |
dentist | -0.027 |
babys | -0.026 |
doctor | -0.026 |
Token | like |
Token ID | 588 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
sorts | +0.014 |
ites | +0.013 |
Run | +0.013 |
about | +0.013 |
atch | +0.013 |
Neg logit contributions | |
sob | -0.009 |
Nib | -0.009 |
dentist | -0.008 |
babys | -0.008 |
ppa | -0.008 |
Token | 're |
Token ID | 821 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
Wow | +0.031 |
sorts | +0.031 |
Run | +0.031 |
OK | +0.031 |
akes | +0.030 |
Neg logit contributions | |
sob | -0.044 |
dentist | -0.043 |
Nib | -0.043 |
babys | -0.042 |
ache | -0.042 |
Token | welcome |
Token ID | 7062 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
ache | +0.035 |
sob | +0.034 |
babys | +0.034 |
throat | +0.033 |
dentist | +0.033 |
Neg logit contributions | |
Wow | -0.019 |
sorts | -0.018 |
OK | -0.018 |
atch | -0.018 |
cy | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | -3.88e-01 |
Pos logit contributions | |
ache | +0.042 |
ppa | +0.041 |
gag | +0.041 |
sob | +0.041 |
ocket | +0.041 |
Neg logit contributions | |
cy | -0.022 |
ay | -0.021 |
atch | -0.020 |
OK | -0.020 |
mer | -0.019 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
sob | +0.006 |
ache | +0.006 |
Nib | +0.006 |
anywhere | +0.006 |
ppa | +0.006 |
Neg logit contributions | |
Wow | -0.009 |
OK | -0.009 |
Run | -0.009 |
sorts | -0.009 |
about | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
sob | +0.000 |
Nib | +0.000 |
babys | +0.000 |
dentist | +0.000 |
anywhere | +0.000 |
Neg logit contributions | |
OK | -0.001 |
cer | -0.001 |
sorts | -0.001 |
cy | -0.001 |
ites | -0.001 |
Token | You |
Token ID | 921 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
about | +0.041 |
ised | +0.041 |
ites | +0.041 |
Run | +0.040 |
sorts | +0.040 |
Neg logit contributions | |
Nib | -0.047 |
Her | -0.045 |
throat | -0.044 |
sob | -0.044 |
dentist | -0.043 |
Token | are |
Token ID | 389 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
ang | +0.047 |
Run | +0.047 |
about | +0.046 |
ites | +0.046 |
sorts | +0.046 |
Neg logit contributions | |
sob | -0.052 |
Nib | -0.050 |
dentist | -0.049 |
anywhere | -0.048 |
throat | -0.048 |
Token | a |
Token ID | 257 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
ache | +0.034 |
sob | +0.034 |
babys | +0.033 |
dentist | +0.032 |
throat | +0.031 |
Neg logit contributions | |
sorts | -0.037 |
Wow | -0.036 |
cer | -0.035 |
OK | -0.035 |
atch | -0.035 |
Token | good |
Token ID | 922 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
ites | +0.018 |
Run | +0.018 |
sorts | +0.017 |
atch | +0.017 |
about | +0.017 |
Neg logit contributions | |
sob | -0.014 |
Nib | -0.014 |
dentist | -0.013 |
doctor | -0.013 |
babys | -0.013 |
Token | sister |
Token ID | 6621 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
Run | +0.100 |
sorts | +0.100 |
ites | +0.099 |
OK | +0.099 |
Wow | +0.099 |
Neg logit contributions | |
sob | -0.058 |
Nib | -0.056 |
dentist | -0.055 |
anywhere | -0.053 |
babys | -0.053 |
Token | ." |
Token ID | 526 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
sob | +0.051 |
Nib | +0.049 |
babys | +0.048 |
dentist | +0.047 |
Her | +0.047 |
Neg logit contributions | |
ites | -0.057 |
cer | -0.056 |
sorts | -0.056 |
OK | -0.056 |
Run | -0.056 |
Token | and |
Token ID | 290 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
Run | +0.014 |
Wow | +0.014 |
OK | +0.014 |
atch | +0.014 |
ites | +0.014 |
Neg logit contributions | |
sob | -0.012 |
Nib | -0.011 |
dentist | -0.011 |
throat | -0.011 |
ache | -0.011 |
Token | pans |
Token ID | 36209 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
sob | +0.007 |
Nib | +0.007 |
throat | +0.007 |
dentist | +0.007 |
babys | +0.007 |
Neg logit contributions | |
akes | -0.007 |
atch | -0.007 |
ang | -0.007 |
cer | -0.007 |
ites | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -9.14e-01 |
Pos logit contributions | |
Run | +0.011 |
Wow | +0.011 |
atch | +0.011 |
OK | +0.011 |
ites | +0.011 |
Neg logit contributions | |
sob | -0.010 |
Nib | -0.010 |
dentist | -0.010 |
babys | -0.010 |
throat | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
sob | +0.018 |
Nib | +0.017 |
dentist | +0.017 |
babys | +0.016 |
throat | +0.016 |
Neg logit contributions | |
Run | -0.019 |
ites | -0.019 |
atch | -0.019 |
Wow | -0.019 |
OK | -0.019 |
Token | started |
Token ID | 2067 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
sob | +0.004 |
Nib | +0.004 |
dentist | +0.004 |
babys | +0.004 |
throat | +0.004 |
Neg logit contributions | |
Run | -0.005 |
atch | -0.005 |
ites | -0.005 |
Wow | -0.005 |
ang | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
Nib | +0.001 |
sob | +0.001 |
dentist | +0.001 |
ppa | +0.001 |
ache | +0.001 |
Neg logit contributions | |
sorts | -0.003 |
Run | -0.003 |
atch | -0.003 |
ites | -0.003 |
akes | -0.003 |
Token | cook |
Token ID | 4255 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
ites | +0.016 |
ang | +0.016 |
Wow | +0.016 |
Run | +0.015 |
cer | +0.015 |
Neg logit contributions | |
sob | -0.013 |
Nib | -0.012 |
dentist | -0.012 |
throat | -0.012 |
babys | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
babys | +0.006 |
ache | +0.005 |
Neg logit contributions | |
sorts | -0.008 |
Run | -0.008 |
ites | -0.008 |
Wow | -0.008 |
about | -0.008 |
Token | Mia |
Token ID | 32189 |
Feature activation | +8.23e-01 |
Pos logit contributions | |
ache | +0.010 |
dentist | +0.010 |
sob | +0.010 |
anywhere | +0.009 |
ppa | +0.009 |
Neg logit contributions | |
Wow | -0.013 |
sorts | -0.013 |
Run | -0.013 |
ites | -0.012 |
OK | -0.012 |
Token | helped |
Token ID | 4193 |
Feature activation | -6.63e-01 |
Pos logit contributions | |
Wow | +0.019 |
Run | +0.019 |
ites | +0.019 |
atch | +0.019 |
OK | +0.018 |
Neg logit contributions | |
sob | -0.015 |
dentist | -0.013 |
throat | -0.013 |
Nib | -0.013 |
ache | -0.013 |
Token | by |
Token ID | 416 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
Nib | +0.009 |
ache | +0.009 |
sob | +0.009 |
dentist | +0.009 |
ppa | +0.009 |
Neg logit contributions | |
cy | -0.017 |
sorts | -0.017 |
about | -0.017 |
akes | -0.017 |
ee | -0.016 |
Token | " |
Token ID | 1 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
akes | +0.031 |
cer | +0.029 |
sorts | +0.029 |
cy | +0.029 |
about | +0.028 |
Neg logit contributions | |
sob | -0.024 |
Her | -0.024 |
dentist | -0.024 |
doctor | -0.023 |
Her | -0.023 |
Token | Can |
Token ID | 6090 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
sorts | +0.046 |
akes | +0.044 |
about | +0.044 |
atch | +0.043 |
cer | +0.042 |
Neg logit contributions | |
sob | -0.101 |
Nib | -0.099 |
dentist | -0.098 |
doctor | -0.097 |
Her | -0.097 |
Token | I |
Token ID | 314 |
Feature activation | -5.50e-02 |
Pos logit contributions | |
OK | +0.003 |
Run | +0.003 |
Wow | +0.003 |
ites | +0.003 |
atch | +0.003 |
Neg logit contributions | |
ache | -0.007 |
ppa | -0.007 |
sob | -0.007 |
dentist | -0.007 |
ocket | -0.007 |
Token | go |
Token ID | 467 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
sob | +0.001 |
Nib | +0.001 |
dentist | +0.001 |
anywhere | +0.001 |
Prince | +0.001 |
Neg logit contributions | |
OK | -0.001 |
cy | -0.001 |
ites | -0.001 |
atch | -0.001 |
akes | -0.001 |
Token | play |
Token ID | 711 |
Feature activation | -7.91e-01 |
Pos logit contributions | |
gag | +0.025 |
sob | +0.025 |
ache | +0.025 |
Prince | +0.025 |
throat | +0.024 |
Neg logit contributions | |
ites | -0.023 |
cy | -0.023 |
ite | -0.022 |
ang | -0.021 |
ab | -0.021 |
Token | with |
Token ID | 351 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
sob | +0.016 |
Nib | +0.016 |
ache | +0.015 |
throat | +0.015 |
dentist | +0.015 |
Neg logit contributions | |
Run | -0.015 |
ites | -0.015 |
OK | -0.015 |
atch | -0.015 |
about | -0.015 |
Token | Ben |
Token ID | 3932 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
Nib | +0.041 |
sob | +0.040 |
ache | +0.040 |
babys | +0.039 |
ppa | +0.039 |
Neg logit contributions | |
ites | -0.025 |
Run | -0.025 |
atch | -0.025 |
ee | -0.024 |
OK | -0.024 |
Token | now |
Token ID | 783 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
Nib | +0.085 |
sob | +0.082 |
babys | +0.082 |
maid | +0.080 |
Her | +0.080 |
Neg logit contributions | |
cy | -0.069 |
cer | -0.068 |
atch | -0.068 |
ites | -0.067 |
OK | -0.067 |
Token | ?" |
Token ID | 1701 |
Feature activation | -9.03e-01 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
babys | +0.006 |
ache | +0.006 |
Neg logit contributions | |
Run | -0.007 |
OK | -0.007 |
ites | -0.007 |
atch | -0.007 |
Wow | -0.007 |
Token | Lisa |
Token ID | 15378 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ache | +0.017 |
anywhere | +0.017 |
ppa | +0.017 |
Nib | +0.017 |
sob | +0.017 |
Neg logit contributions | |
Run | -0.019 |
OK | -0.019 |
sorts | -0.019 |
Wow | -0.019 |
ites | -0.018 |
Token | asks |
Token ID | 7893 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
Run | +0.006 |
blows | +0.006 |
about | +0.006 |
Wow | +0.006 |
OK | +0.006 |
Neg logit contributions | |
anywhere | -0.009 |
Nib | -0.009 |
throat | -0.009 |
ache | -0.009 |
babys | -0.009 |
Token | cheering |
Token ID | 29732 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
akes | +0.001 |
Run | +0.001 |
atch | +0.001 |
about | +0.001 |
ites | +0.001 |
Neg logit contributions | |
sob | -0.001 |
Nib | -0.001 |
Her | -0.001 |
anywhere | -0.001 |
babys | -0.001 |
Token | as |
Token ID | 355 |
Feature activation | -7.43e-01 |
Pos logit contributions | |
Run | +0.015 |
sorts | +0.015 |
ites | +0.015 |
Wow | +0.015 |
atch | +0.014 |
Neg logit contributions | |
sob | -0.010 |
Nib | -0.009 |
dentist | -0.009 |
babys | -0.009 |
anywhere | -0.009 |
Token | Lucy |
Token ID | 22162 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
sob | +0.011 |
Nib | +0.010 |
dentist | +0.010 |
throat | +0.010 |
ache | +0.010 |
Neg logit contributions | |
sorts | -0.019 |
Run | -0.019 |
Wow | -0.019 |
OK | -0.019 |
ites | -0.019 |
Token | laughed |
Token ID | 13818 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
Wow | +0.038 |
Run | +0.037 |
sorts | +0.037 |
akes | +0.037 |
atch | +0.036 |
Neg logit contributions | |
sob | -0.033 |
Nib | -0.031 |
ache | -0.030 |
dentist | -0.030 |
throat | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
Run | +0.010 |
sorts | +0.009 |
Wow | +0.009 |
about | +0.009 |
OK | +0.009 |
Neg logit contributions | |
sob | -0.006 |
Nib | -0.006 |
dentist | -0.006 |
babys | -0.006 |
throat | -0.006 |
Token | smiled |
Token ID | 13541 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
sob | +0.002 |
Nib | +0.002 |
Her | +0.002 |
throat | +0.002 |
babys | +0.002 |
Neg logit contributions | |
akes | -0.002 |
atch | -0.002 |
ites | -0.002 |
Run | -0.002 |
about | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -7.93e-01 |
Pos logit contributions | |
sorts | +0.005 |
cer | +0.005 |
OK | +0.005 |
Wow | +0.005 |
Run | +0.005 |
Neg logit contributions | |
sob | -0.004 |
dentist | -0.004 |
Nib | -0.004 |
babys | -0.004 |
ppa | -0.004 |
Token | It |
Token ID | 632 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
sob | +0.011 |
Her | +0.011 |
Nib | +0.011 |
dentist | +0.010 |
babys | +0.010 |
Neg logit contributions | |
Run | -0.021 |
atch | -0.020 |
ites | -0.020 |
cer | -0.020 |
sorts | -0.020 |
Token | was |
Token ID | 373 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
akes | +0.053 |
ites | +0.052 |
atch | +0.050 |
ang | +0.049 |
about | +0.049 |
Neg logit contributions | |
sob | -0.024 |
not | -0.020 |
doctor | -0.020 |
Her | -0.020 |
anywhere | -0.019 |
Token | the |
Token ID | 262 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Run | +0.005 |
ites | +0.005 |
sorts | +0.005 |
Wow | +0.005 |
atch | +0.005 |
Neg logit contributions | |
sob | -0.003 |
Nib | -0.003 |
dentist | -0.003 |
babys | -0.003 |
anywhere | -0.003 |
Token | perfect |
Token ID | 2818 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
Run | +0.032 |
ites | +0.032 |
ang | +0.031 |
sorts | +0.031 |
akes | +0.031 |
Neg logit contributions | |
sob | -0.021 |
dentist | -0.021 |
Nib | -0.020 |
anywhere | -0.020 |
doctor | -0.020 |
Token | for |
Token ID | 329 |
Feature activation | +9.23e-01 |
Pos logit contributions | |
Wow | +0.024 |
ites | +0.024 |
about | +0.024 |
Run | +0.024 |
ang | +0.024 |
Neg logit contributions | |
sob | -0.014 |
anywhere | -0.013 |
Nib | -0.013 |
ache | -0.012 |
throat | -0.012 |
Token | big |
Token ID | 1263 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
Wow | +0.020 |
about | +0.020 |
sorts | +0.020 |
Run | +0.020 |
ites | +0.020 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.016 |
dentist | -0.016 |
anywhere | -0.015 |
throat | -0.015 |
Token | birds |
Token ID | 10087 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Wow | +0.075 |
acked | +0.074 |
ang | +0.074 |
cy | +0.073 |
cer | +0.073 |
Neg logit contributions | |
sob | -0.056 |
throat | -0.053 |
anywhere | -0.053 |
ache | -0.052 |
doctor | -0.052 |
Token | , |
Token ID | 11 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
sob | +0.013 |
Nib | +0.012 |
dentist | +0.012 |
anywhere | +0.012 |
ache | +0.012 |
Neg logit contributions | |
Run | -0.018 |
Wow | -0.018 |
sorts | -0.018 |
OK | -0.017 |
about | -0.017 |
Token | like |
Token ID | 588 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
sob | +0.004 |
Nib | +0.004 |
dentist | +0.004 |
anywhere | +0.004 |
doctor | +0.004 |
Neg logit contributions | |
akes | -0.007 |
cer | -0.007 |
ites | -0.007 |
about | -0.007 |
acked | -0.007 |
Token | me |
Token ID | 502 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
Run | +0.003 |
sorts | +0.003 |
ites | +0.003 |
Wow | +0.003 |
about | +0.003 |
Neg logit contributions | |
sob | -0.002 |
Nib | -0.002 |
dentist | -0.002 |
anywhere | -0.002 |
babys | -0.002 |
Token | ," |
Token ID | 553 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
sob | +0.013 |
Nib | +0.013 |
dentist | +0.013 |
babys | +0.012 |
throat | +0.012 |
Neg logit contributions | |
Run | -0.016 |
sorts | -0.016 |
ites | -0.016 |
atch | -0.016 |
Wow | -0.016 |
Token | it |
Token ID | 340 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
anywhere | +0.008 |
dentist | +0.008 |
babys | +0.008 |
ache | +0.008 |
maid | +0.008 |
Neg logit contributions | |
Run | -0.010 |
Wow | -0.010 |
sorts | -0.010 |
OK | -0.010 |
ised | -0.010 |
Token | sne |
Token ID | 10505 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
Run | +0.038 |
OK | +0.037 |
ang | +0.036 |
Wow | +0.036 |
ab | +0.036 |
Neg logit contributions | |
dentist | -0.033 |
anywhere | -0.032 |
babys | -0.032 |
Nib | -0.032 |
maid | -0.030 |
Token | ered |
Token ID | 1068 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
Run | +0.072 |
sorts | +0.071 |
atch | +0.071 |
ites | +0.070 |
ang | +0.070 |
Neg logit contributions | |
sob | -0.074 |
dentist | -0.074 |
Nib | -0.073 |
babys | -0.072 |
anywhere | -0.071 |
Token | . |
Token ID | 13 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
akes | +0.043 |
OK | +0.043 |
ites | +0.043 |
atch | +0.043 |
Wow | +0.043 |
Neg logit contributions | |
sob | -0.037 |
Nib | -0.036 |
Her | -0.034 |
anywhere | -0.034 |
babys | -0.033 |
Token | a |
Token ID | 257 |
Feature activation | +7.84e-01 |
Pos logit contributions | |
ang | +0.036 |
Run | +0.035 |
akes | +0.035 |
Wow | +0.035 |
ites | +0.035 |
Neg logit contributions | |
sob | -0.019 |
Nib | -0.018 |
dentist | -0.018 |
anywhere | -0.017 |
Her | -0.017 |
Token | turn |
Token ID | 1210 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
sorts | +0.015 |
OK | +0.015 |
Run | +0.015 |
Wow | +0.015 |
atch | +0.014 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.016 |
dentist | -0.015 |
ppa | -0.015 |
Her | -0.015 |
Token | , |
Token ID | 11 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
Wow | +0.040 |
Run | +0.040 |
OK | +0.039 |
sorts | +0.039 |
ites | +0.039 |
Neg logit contributions | |
sob | -0.020 |
Nib | -0.019 |
anywhere | -0.019 |
dentist | -0.018 |
ache | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
akes | +0.013 |
ites | +0.013 |
ang | +0.013 |
atch | +0.013 |
about | +0.012 |
Neg logit contributions | |
sob | -0.006 |
Nib | -0.006 |
dentist | -0.006 |
anywhere | -0.006 |
doctor | -0.006 |
Token | naughty |
Token ID | 45128 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
sob | +0.003 |
Nib | +0.002 |
doctor | +0.002 |
dentist | +0.002 |
babys | +0.002 |
Neg logit contributions | |
ites | -0.003 |
ang | -0.003 |
Run | -0.003 |
akes | -0.003 |
sorts | -0.003 |
Token | monkey |
Token ID | 21657 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
ites | +0.086 |
ang | +0.082 |
akes | +0.078 |
acked | +0.077 |
Run | +0.077 |
Neg logit contributions | |
crying | -0.056 |
sob | -0.056 |
doctor | -0.056 |
grandmother | -0.054 |
mom | -0.053 |
Token | climbed |
Token ID | 19952 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
sob | +0.025 |
Nib | +0.025 |
dentist | +0.025 |
babys | +0.024 |
throat | +0.024 |
Neg logit contributions | |
Run | -0.025 |
sorts | -0.025 |
ites | -0.025 |
atch | -0.025 |
OK | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
Run | +0.076 |
sorts | +0.076 |
ites | +0.075 |
OK | +0.075 |
atch | +0.075 |
Neg logit contributions | |
sob | -0.059 |
Nib | -0.058 |
dentist | -0.056 |
anywhere | -0.056 |
babys | -0.055 |
Token | tree |
Token ID | 5509 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
sob | +0.010 |
Nib | +0.010 |
dentist | +0.010 |
anywhere | +0.010 |
doctor | +0.010 |
Neg logit contributions | |
Run | -0.008 |
ites | -0.008 |
ang | -0.008 |
akes | -0.007 |
cer | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +8.90e-01 |
Pos logit contributions | |
sob | +0.008 |
Nib | +0.007 |
dentist | +0.007 |
anywhere | +0.007 |
Her | +0.007 |
Neg logit contributions | |
Run | -0.012 |
Wow | -0.012 |
OK | -0.011 |
ites | -0.011 |
atch | -0.011 |
Token | managed |
Token ID | 5257 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
akes | +0.020 |
ites | +0.020 |
atch | +0.020 |
about | +0.020 |
sorts | +0.020 |
Neg logit contributions | |
sob | -0.016 |
Nib | -0.016 |
dentist | -0.015 |
anywhere | -0.015 |
doctor | -0.015 |
Token | her |
Token ID | 607 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
ache | +0.019 |
sob | +0.018 |
throat | +0.017 |
ppa | +0.017 |
Nib | +0.017 |
Neg logit contributions | |
sorts | -0.024 |
Wow | -0.024 |
Run | -0.024 |
cy | -0.024 |
OK | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
sob | +0.076 |
Nib | +0.075 |
dentist | +0.073 |
anywhere | +0.071 |
ache | +0.070 |
Neg logit contributions | |
ites | -0.086 |
sorts | -0.085 |
ang | -0.085 |
Run | -0.085 |
cer | -0.084 |
Token | looked |
Token ID | 3114 |
Feature activation | +6.35e-01 |
Pos logit contributions | |
sob | +0.003 |
Nib | +0.003 |
dentist | +0.003 |
babys | +0.003 |
throat | +0.003 |
Neg logit contributions | |
Run | -0.005 |
sorts | -0.005 |
ites | -0.005 |
Wow | -0.005 |
atch | -0.005 |
Token | up |
Token ID | 510 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
sorts | +0.013 |
Run | +0.013 |
ang | +0.013 |
Wow | +0.013 |
about | +0.013 |
Neg logit contributions | |
sob | -0.012 |
dentist | -0.012 |
Nib | -0.012 |
throat | -0.012 |
ache | -0.012 |
Token | at |
Token ID | 379 |
Feature activation | -8.35e-01 |
Pos logit contributions | |
akes | +0.034 |
Wow | +0.033 |
ites | +0.033 |
Run | +0.033 |
atch | +0.033 |
Neg logit contributions | |
sob | -0.030 |
Her | -0.029 |
Nib | -0.028 |
babys | -0.027 |
doctor | -0.027 |
Token | her |
Token ID | 607 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
ache | +0.014 |
sob | +0.013 |
throat | +0.012 |
Nib | +0.012 |
maid | +0.012 |
Neg logit contributions | |
sorts | -0.021 |
Wow | -0.021 |
cy | -0.020 |
Mine | -0.020 |
ites | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
Nib | +0.075 |
sob | +0.074 |
dentist | +0.072 |
anywhere | +0.070 |
ache | +0.068 |
Neg logit contributions | |
Run | -0.110 |
sorts | -0.109 |
ites | -0.109 |
ang | -0.109 |
OK | -0.109 |
Token | asked |
Token ID | 1965 |
Feature activation | -4.52e+00 |
Pos logit contributions | |
dentist | +0.010 |
Nib | +0.010 |
anywhere | +0.009 |
sob | +0.009 |
ache | +0.009 |
Neg logit contributions | |
Run | -0.011 |
Wow | -0.011 |
OK | -0.011 |
sorts | -0.011 |
cy | -0.011 |
Token | : |
Token ID | 25 |
Feature activation | -5.91e+00 |
Pos logit contributions | |
ache | +0.091 |
throat | +0.089 |
gag | +0.086 |
ppa | +0.085 |
ridge | +0.084 |
Neg logit contributions | |
sorts | -0.087 |
Wow | -0.086 |
OK | -0.084 |
Run | -0.083 |
about | -0.082 |
Token |
|
Token ID | 198 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
ache | +0.128 |
ppa | +0.127 |
dentist | +0.126 |
nightmares | +0.121 |
sob | +0.121 |
Neg logit contributions | |
Wow | -0.111 |
Run | -0.104 |
about | -0.103 |
OK | -0.102 |
ang | -0.100 |
Token |
|
Token ID | 198 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
throat | +0.043 |
anywhere | +0.042 |
Nib | +0.042 |
ache | +0.042 |
sob | +0.041 |
Neg logit contributions | |
Wow | -0.046 |
Run | -0.045 |
OK | -0.045 |
ites | -0.044 |
atch | -0.043 |
Token | sad |
Token ID | 6507 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
grandmother | +0.008 |
dentist | +0.008 |
ppa | +0.008 |
Nib | +0.008 |
maid | +0.008 |
Neg logit contributions | |
Run | -0.010 |
OK | -0.010 |
Wow | -0.009 |
blows | -0.009 |
ang | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +3.67e-03 |
Pos logit contributions | |
Run | +0.045 |
Wow | +0.044 |
OK | +0.043 |
than | +0.042 |
about | +0.042 |
Neg logit contributions | |
ppa | -0.046 |
babys | -0.043 |
grandmother | -0.043 |
Nib | -0.043 |
dentist | -0.043 |
Token | He |
Token ID | 679 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
Wow | +0.000 |
OK | +0.000 |
Run | +0.000 |
Mine | +0.000 |
acked | +0.000 |
Neg logit contributions | |
ppa | -0.000 |
ache | -0.000 |
anywhere | -0.000 |
ridge | -0.000 |
ocket | -0.000 |
Token | wished |
Token ID | 16555 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
Run | +0.021 |
OK | +0.021 |
Wow | +0.021 |
atch | +0.020 |
sorts | +0.019 |
Neg logit contributions | |
Nib | -0.022 |
anywhere | -0.022 |
dentist | -0.022 |
babys | -0.022 |
grandmother | -0.021 |
Token | he |
Token ID | 339 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
ppa | +0.005 |
urger | +0.005 |
ridge | +0.005 |
ache | +0.005 |
gag | +0.005 |
Neg logit contributions | |
Wow | -0.006 |
OK | -0.005 |
Run | -0.005 |
blows | -0.005 |
gol | -0.005 |
Token | did |
Token ID | 750 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
sob | +0.018 |
Nib | +0.018 |
dentist | +0.018 |
babys | +0.018 |
Her | +0.017 |
Neg logit contributions | |
Run | -0.017 |
OK | -0.017 |
Wow | -0.017 |
ites | -0.017 |
cer | -0.017 |
Token | not |
Token ID | 407 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
babys | +0.061 |
ppa | +0.059 |
Nib | +0.058 |
sob | +0.056 |
throat | +0.054 |
Neg logit contributions | |
OK | -0.115 |
turns | -0.112 |
wins | -0.109 |
Good | -0.108 |
pitch | -0.108 |
Token | push |
Token ID | 4574 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
sob | +0.008 |
Nib | +0.007 |
dentist | +0.007 |
ache | +0.007 |
anywhere | +0.007 |
Neg logit contributions | |
ites | -0.010 |
ang | -0.010 |
akes | -0.010 |
Run | -0.010 |
sorts | -0.010 |
Token | Lily |
Token ID | 20037 |
Feature activation | -3.93e+00 |
Pos logit contributions | |
Wow | +0.074 |
ites | +0.071 |
cy | +0.071 |
Run | +0.071 |
atch | +0.071 |
Neg logit contributions | |
sob | -0.047 |
dentist | -0.046 |
ache | -0.046 |
throat | -0.045 |
proposal | -0.045 |
Token | . |
Token ID | 13 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
dentist | +0.076 |
sob | +0.076 |
grandmother | +0.075 |
Nib | +0.075 |
babys | +0.075 |
Neg logit contributions | |
atch | -0.078 |
cer | -0.077 |
about | -0.075 |
ab | -0.075 |
wins | -0.075 |
Token | He |
Token ID | 679 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
ppa | +0.003 |
ache | +0.003 |
ridge | +0.003 |
anywhere | +0.003 |
ocket | +0.003 |
Neg logit contributions | |
Wow | -0.003 |
OK | -0.002 |
Run | -0.002 |
sorts | -0.002 |
Uh | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
cy | +0.029 |
Wow | +0.028 |
ites | +0.028 |
sorts | +0.027 |
atch | +0.027 |
Neg logit contributions | |
ache | -0.019 |
sob | -0.019 |
throat | -0.018 |
proposal | -0.017 |
dentist | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
sob | +0.063 |
babys | +0.060 |
dentist | +0.059 |
Nib | +0.059 |
ache | +0.059 |
Neg logit contributions | |
sorts | -0.092 |
ites | -0.092 |
cy | -0.090 |
atch | -0.088 |
OK | -0.088 |
Token | spoon |
Token ID | 24556 |
Feature activation | -6.92e-01 |
Pos logit contributions | |
sob | +0.035 |
Nib | +0.034 |
dentist | +0.034 |
anywhere | +0.033 |
babys | +0.033 |
Neg logit contributions | |
Run | -0.040 |
sorts | -0.040 |
Wow | -0.040 |
ites | -0.040 |
OK | -0.040 |
Token | and |
Token ID | 290 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
sob | +0.019 |
dentist | +0.018 |
babys | +0.018 |
anywhere | +0.018 |
Nib | +0.018 |
Neg logit contributions | |
sorts | -0.009 |
cy | -0.009 |
ang | -0.009 |
ites | -0.009 |
cer | -0.009 |
Token | lets |
Token ID | 8781 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
sob | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
Her | +0.006 |
throat | +0.006 |
Neg logit contributions | |
ites | -0.011 |
sorts | -0.011 |
Wow | -0.011 |
akes | -0.011 |
atch | -0.011 |
Token | her |
Token ID | 607 |
Feature activation | -4.51e+00 |
Pos logit contributions | |
about | +0.010 |
cy | +0.010 |
Run | +0.010 |
atch | +0.010 |
akes | +0.010 |
Neg logit contributions | |
sob | -0.010 |
ache | -0.009 |
throat | -0.009 |
dentist | -0.009 |
Nib | -0.009 |
Token | taste |
Token ID | 6938 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
sob | +0.090 |
Nib | +0.088 |
dentist | +0.087 |
babys | +0.085 |
ache | +0.084 |
Neg logit contributions | |
Run | -0.089 |
sorts | -0.089 |
ites | -0.088 |
OK | -0.088 |
atch | -0.088 |
Token | the |
Token ID | 262 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
sob | +0.005 |
babys | +0.005 |
grandmother | +0.005 |
ache | +0.005 |
ppa | +0.005 |
Neg logit contributions | |
sorts | -0.006 |
about | -0.005 |
Wow | -0.005 |
blows | -0.005 |
OK | -0.005 |
Token | frost |
Token ID | 21682 |
Feature activation | -9.91e-01 |
Pos logit contributions | |
sob | +0.024 |
dentist | +0.024 |
Nib | +0.023 |
babys | +0.023 |
throat | +0.023 |
Neg logit contributions | |
ites | -0.031 |
cer | -0.031 |
Run | -0.031 |
atch | -0.031 |
ang | -0.031 |
Token | ing |
Token ID | 278 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
sob | +0.025 |
Nib | +0.025 |
dentist | +0.024 |
babys | +0.024 |
throat | +0.024 |
Neg logit contributions | |
Run | -0.014 |
sorts | -0.014 |
ites | -0.014 |
Wow | -0.014 |
atch | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
Run | +0.054 |
sorts | +0.054 |
Wow | +0.054 |
about | +0.054 |
ites | +0.053 |
Neg logit contributions | |
sob | -0.038 |
dentist | -0.037 |
Nib | -0.036 |
babys | -0.036 |
ache | -0.035 |
Token | with |
Token ID | 351 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
sob | +0.023 |
Nib | +0.022 |
dentist | +0.022 |
babys | +0.021 |
throat | +0.021 |
Neg logit contributions | |
Run | -0.032 |
ites | -0.032 |
sorts | -0.032 |
Wow | -0.032 |
atch | -0.032 |
Token | a |
Token ID | 257 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
sorts | +0.004 |
Run | +0.004 |
Wow | +0.004 |
ised | +0.004 |
Mine | +0.004 |
Neg logit contributions | |
sob | -0.003 |
ache | -0.003 |
Nib | -0.002 |
ppa | -0.002 |
babys | -0.002 |
Token | big |
Token ID | 1263 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
sob | +0.005 |
Nib | +0.005 |
dentist | +0.005 |
babys | +0.004 |
ache | +0.004 |
Neg logit contributions | |
ites | -0.007 |
Run | -0.007 |
atch | -0.007 |
Wow | -0.007 |
akes | -0.007 |
Token | smile |
Token ID | 8212 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
ites | +0.116 |
akes | +0.115 |
Wow | +0.113 |
ang | +0.112 |
cer | +0.112 |
Neg logit contributions | |
sob | -0.032 |
stomach | -0.029 |
throat | -0.028 |
sorry | -0.027 |
babys | -0.026 |
Token | on |
Token ID | 319 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
Run | +0.003 |
sorts | +0.003 |
ites | +0.003 |
about | +0.003 |
Wow | +0.003 |
Neg logit contributions | |
sob | -0.002 |
Nib | -0.002 |
dentist | -0.002 |
babys | -0.002 |
anywhere | -0.002 |
Token | his |
Token ID | 465 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
Run | +0.038 |
sorts | +0.038 |
Wow | +0.037 |
about | +0.037 |
OK | +0.037 |
Neg logit contributions | |
sob | -0.015 |
Nib | -0.015 |
dentist | -0.015 |
ache | -0.014 |
anywhere | -0.013 |
Token | face |
Token ID | 1986 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
Nib | +0.052 |
dentist | +0.052 |
anywhere | +0.048 |
babys | +0.048 |
ppa | +0.048 |
Neg logit contributions | |
about | -0.096 |
OK | -0.095 |
Run | -0.094 |
pitch | -0.094 |
pitches | -0.094 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
dentist | +0.045 |
Nib | +0.043 |
sob | +0.042 |
maid | +0.042 |
anywhere | +0.041 |
Neg logit contributions | |
about | -0.050 |
ised | -0.049 |
ang | -0.049 |
sorts | -0.049 |
Run | -0.048 |
Token | he |
Token ID | 339 |
Feature activation | +6.10e-01 |
Pos logit contributions | |
sob | +0.016 |
Nib | +0.015 |
dentist | +0.015 |
Her | +0.014 |
throat | +0.014 |
Neg logit contributions | |
akes | -0.031 |
ites | -0.031 |
atch | -0.031 |
Run | -0.031 |
Wow | -0.031 |
Token | took |
Token ID | 1718 |
Feature activation | +8.73e-01 |
Pos logit contributions | |
akes | +0.014 |
Wow | +0.014 |
Run | +0.014 |
ites | +0.014 |
atch | +0.014 |
Neg logit contributions | |
sob | -0.011 |
Nib | -0.010 |
dentist | -0.010 |
ache | -0.010 |
throat | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
sorts | +0.023 |
Run | +0.022 |
Wow | +0.022 |
ites | +0.022 |
OK | +0.022 |
Neg logit contributions | |
sob | -0.012 |
Nib | -0.012 |
dentist | -0.012 |
babys | -0.011 |
ache | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -9.64e-01 |
Pos logit contributions | |
Run | +0.024 |
ites | +0.024 |
Wow | +0.024 |
akes | +0.024 |
ang | +0.024 |
Neg logit contributions | |
sob | -0.021 |
Nib | -0.020 |
dentist | -0.020 |
Her | -0.019 |
throat | -0.019 |
Token | so |
Token ID | 523 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
ache | +0.015 |
Nib | +0.015 |
babys | +0.015 |
dentist | +0.015 |
sob | +0.015 |
Neg logit contributions | |
sorts | -0.023 |
ang | -0.022 |
Run | -0.021 |
atch | -0.021 |
Wow | -0.021 |
Token | grateful |
Token ID | 14066 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
sob | +0.003 |
Her | +0.002 |
Nib | +0.002 |
not | +0.002 |
stomach | +0.002 |
Neg logit contributions | |
ites | -0.006 |
about | -0.006 |
Run | -0.006 |
akes | -0.006 |
cer | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
sorts | +0.011 |
OK | +0.011 |
Run | +0.011 |
atch | +0.011 |
cer | +0.011 |
Neg logit contributions | |
sob | -0.008 |
Nib | -0.008 |
dentist | -0.008 |
babys | -0.008 |
maid | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
ache | +0.068 |
sob | +0.062 |
dentist | +0.059 |
anywhere | +0.059 |
ppa | +0.059 |
Neg logit contributions | |
sorts | -0.050 |
pitch | -0.044 |
cy | -0.042 |
Mine | -0.042 |
gol | -0.042 |
Token | farmer |
Token ID | 18739 |
Feature activation | -4.28e+00 |
Pos logit contributions | |
sob | +0.037 |
Nib | +0.035 |
Her | +0.035 |
anywhere | +0.034 |
throat | +0.034 |
Neg logit contributions | |
OK | -0.038 |
Run | -0.038 |
sorts | -0.038 |
Wow | -0.037 |
about | -0.037 |
Token | for |
Token ID | 329 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
sob | +0.092 |
babys | +0.090 |
dentist | +0.088 |
gag | +0.086 |
maid | +0.086 |
Neg logit contributions | |
sorts | -0.081 |
cy | -0.077 |
cer | -0.075 |
able | -0.072 |
mer | -0.072 |
Token | helping |
Token ID | 5742 |
Feature activation | -4.50e-01 |
Pos logit contributions | |
ache | +0.019 |
sob | +0.019 |
dentist | +0.018 |
babys | +0.018 |
Nib | +0.018 |
Neg logit contributions | |
sorts | -0.026 |
Run | -0.026 |
atch | -0.025 |
OK | -0.025 |
Wow | -0.025 |
Token | him |
Token ID | 683 |
Feature activation | -5.02e+00 |
Pos logit contributions | |
sob | +0.007 |
ache | +0.006 |
Nib | +0.006 |
dentist | +0.006 |
babys | +0.006 |
Neg logit contributions | |
sorts | -0.011 |
cer | -0.011 |
atch | -0.011 |
cy | -0.010 |
mer | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
sob | +0.093 |
dentist | +0.092 |
babys | +0.091 |
Nib | +0.091 |
grandmother | +0.087 |
Neg logit contributions | |
sorts | -0.108 |
atch | -0.105 |
cer | -0.102 |
cy | -0.102 |
about | -0.101 |
Token | |
Token ID | 220 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
sob | +0.017 |
ache | +0.017 |
dentist | +0.017 |
anywhere | +0.016 |
Nib | +0.016 |
Neg logit contributions | |
Wow | -0.024 |
sorts | -0.024 |
Run | -0.023 |
ites | -0.023 |
OK | -0.023 |