Token | dad |
Token ID | 9955 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
ate | +0.008 |
things | +0.005 |
his | +0.005 |
." | +0.005 |
gear | +0.005 |
Neg logit contributions | |
hy | -0.012 |
gust | -0.012 |
ited | -0.012 |
years | -0.012 |
seventeen | -0.012 |
Token | were |
Token ID | 547 |
Feature activation | -5.88e-03 |
Pos logit contributions | |
ate | +0.020 |
his | +0.018 |
things | +0.017 |
other | +0.017 |
| +0.016 |
Neg logit contributions | |
seventeen | -0.023 |
gust | -0.022 |
years | -0.022 |
ited | -0.021 |
hy | -0.021 |
Token | ignorant |
Token ID | 20109 |
Feature activation | +4.48e-03 |
Pos logit contributions | |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
seventeen | +0.009 |
ited | +0.009 |
Neg logit contributions | |
ate | -0.011 |
his | -0.009 |
things | -0.009 |
gear | -0.009 |
| -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -8.73e-03 |
Pos logit contributions | |
things | +0.001 |
ate | +0.001 |
his | +0.001 |
." | +0.001 |
other | +0.000 |
Neg logit contributions | |
ited | -0.015 |
seventeen | -0.015 |
years | -0.015 |
gust | -0.014 |
hy | -0.014 |
Token | Ign |
Token ID | 16583 |
Feature activation | +9.46e-03 |
Pos logit contributions | |
gust | +0.018 |
seventeen | +0.017 |
hy | +0.017 |
years | +0.017 |
bell | +0.016 |
Neg logit contributions | |
ate | -0.013 |
his | -0.010 |
things | -0.010 |
gear | -0.009 |
other | -0.009 |
Token | or |
Token ID | 273 |
Feature activation | +6.03e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.013 |
things | +0.013 |
other | +0.012 |
." | +0.011 |
Neg logit contributions | |
seventeen | -0.018 |
ited | -0.018 |
hy | -0.018 |
gust | -0.018 |
years | -0.018 |
Token | ant |
Token ID | 415 |
Feature activation | +5.14e-02 |
Pos logit contributions | |
ate | +0.117 |
things | +0.096 |
place | +0.096 |
his | +0.093 |
| +0.092 |
Neg logit contributions | |
years | -0.092 |
ited | -0.090 |
hy | -0.089 |
ous | -0.088 |
seventeen | -0.084 |
Token | meant |
Token ID | 4001 |
Feature activation | +2.65e-02 |
Pos logit contributions | |
ate | +0.076 |
his | +0.052 |
things | +0.049 |
own | +0.045 |
| +0.044 |
Neg logit contributions | |
hy | -0.111 |
ited | -0.106 |
gust | -0.105 |
ous | -0.103 |
years | -0.102 |
Token | they |
Token ID | 484 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
ate | +0.033 |
his | +0.025 |
things | +0.025 |
other | +0.022 |
gear | +0.020 |
Neg logit contributions | |
seventeen | -0.061 |
ited | -0.061 |
hy | -0.061 |
years | -0.060 |
gust | -0.060 |
Token | did |
Token ID | 750 |
Feature activation | +1.46e-02 |
Pos logit contributions | |
ate | +0.024 |
his | +0.020 |
things | +0.020 |
other | +0.018 |
." | +0.017 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.023 |
hy | -0.023 |
years | -0.023 |
gust | -0.023 |
Token | not |
Token ID | 407 |
Feature activation | +7.02e-03 |
Pos logit contributions | |
ate | +0.023 |
his | +0.016 |
gear | +0.016 |
things | +0.016 |
| +0.015 |
Neg logit contributions | |
hy | -0.027 |
seventeen | -0.026 |
years | -0.026 |
ited | -0.026 |
gust | -0.026 |
Token | sign |
Token ID | 1051 |
Feature activation | +2.98e-03 |
Pos logit contributions | |
ate | +0.012 |
his | +0.010 |
things | +0.010 |
other | +0.009 |
gear | +0.008 |
Neg logit contributions | |
ited | -0.023 |
years | -0.023 |
hy | -0.022 |
seventeen | -0.022 |
gust | -0.022 |
Token | that |
Token ID | 326 |
Feature activation | +5.58e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.008 |
years | -0.008 |
gust | -0.008 |
seventeen | -0.008 |
aney | -0.008 |
Token | said |
Token ID | 531 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.007 |
his | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
hy | -0.011 |
seventeen | -0.011 |
ited | -0.011 |
gust | -0.011 |
years | -0.011 |
Token | " |
Token ID | 366 |
Feature activation | +6.32e-03 |
Pos logit contributions | |
seventeen | +0.007 |
hy | +0.007 |
ited | +0.007 |
years | +0.007 |
gust | +0.007 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.002 |
gear | -0.002 |
Token | Circ |
Token ID | 31560 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
ate | +0.010 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
gear | +0.007 |
Neg logit contributions | |
ited | -0.012 |
hy | -0.012 |
seventeen | -0.012 |
years | -0.012 |
gust | -0.012 |
Token | us |
Token ID | 385 |
Feature activation | +5.75e-02 |
Pos logit contributions | |
ate | +0.023 |
his | +0.019 |
things | +0.018 |
other | +0.017 |
| +0.016 |
Neg logit contributions | |
ited | -0.030 |
seventeen | -0.030 |
years | -0.030 |
hy | -0.029 |
gust | -0.028 |
Token | ". |
Token ID | 1911 |
Feature activation | +9.15e-03 |
Pos logit contributions | |
ate | +0.070 |
his | +0.053 |
things | +0.048 |
other | +0.047 |
gear | +0.045 |
Neg logit contributions | |
seventeen | -0.133 |
hy | -0.132 |
ous | -0.130 |
years | -0.125 |
ho | -0.122 |
Token | They |
Token ID | 1119 |
Feature activation | +9.60e-03 |
Pos logit contributions | |
ate | +0.013 |
things | +0.010 |
gear | +0.009 |
his | +0.009 |
toy | +0.008 |
Neg logit contributions | |
gust | -0.018 |
seventeen | -0.018 |
oled | -0.017 |
aney | -0.017 |
hy | -0.017 |
Token | ran |
Token ID | 4966 |
Feature activation | -3.81e-03 |
Pos logit contributions | |
ate | +0.018 |
his | +0.015 |
things | +0.015 |
other | +0.014 |
." | +0.013 |
Neg logit contributions | |
ited | -0.016 |
seventeen | -0.016 |
hy | -0.016 |
years | -0.016 |
gust | -0.016 |
Token | inside |
Token ID | 2641 |
Feature activation | +4.88e-03 |
Pos logit contributions | |
hy | +0.007 |
years | +0.007 |
ited | +0.007 |
seventeen | +0.007 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.007 |
things | -0.005 |
his | -0.005 |
other | -0.005 |
." | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
ate | +0.006 |
P | +0.004 |
things | +0.003 |
gear | +0.003 |
yourself | +0.003 |
Neg logit contributions | |
gust | -0.011 |
ited | -0.011 |
years | -0.011 |
stretched | -0.011 |
hy | -0.011 |
Token | others |
Token ID | 1854 |
Feature activation | +4.33e-03 |
Pos logit contributions | |
ate | +0.021 |
his | +0.016 |
things | +0.014 |
other | +0.014 |
gear | +0.013 |
Neg logit contributions | |
seventeen | -0.036 |
years | -0.035 |
hy | -0.035 |
ited | -0.035 |
gust | -0.034 |
Token | with |
Token ID | 351 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
ate | +0.005 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.011 |
seventeen | -0.011 |
hy | -0.011 |
years | -0.011 |
gust | -0.011 |
Token | respect |
Token ID | 2461 |
Feature activation | -5.55e-03 |
Pos logit contributions | |
ate | +0.014 |
his | +0.011 |
things | +0.011 |
other | +0.009 |
gear | +0.009 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.024 |
years | -0.024 |
hy | -0.024 |
gust | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +5.02e-03 |
Pos logit contributions | |
seventeen | +0.013 |
ited | +0.013 |
hy | +0.013 |
gust | +0.013 |
years | +0.013 |
Neg logit contributions | |
ate | -0.006 |
his | -0.004 |
things | -0.003 |
gear | -0.003 |
name | -0.003 |
Token | Ign |
Token ID | 16583 |
Feature activation | +9.10e-03 |
Pos logit contributions | |
ate | +0.006 |
things | +0.005 |
his | +0.005 |
gear | +0.005 |
toy | +0.005 |
Neg logit contributions | |
years | -0.010 |
seventeen | -0.010 |
hy | -0.010 |
ous | -0.010 |
istent | -0.010 |
Token | or |
Token ID | 273 |
Feature activation | +5.74e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.013 |
things | +0.012 |
other | +0.011 |
." | +0.011 |
Neg logit contributions | |
seventeen | -0.017 |
gust | -0.017 |
hy | -0.017 |
ited | -0.017 |
years | -0.016 |
Token | ance |
Token ID | 590 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
ate | +0.100 |
his | +0.083 |
things | +0.081 |
other | +0.076 |
| +0.074 |
Neg logit contributions | |
ited | -0.103 |
years | -0.102 |
seventeen | -0.101 |
hy | -0.100 |
gust | -0.096 |
Token | can |
Token ID | 460 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.012 |
things | +0.012 |
other | +0.010 |
." | +0.010 |
Neg logit contributions | |
ited | -0.033 |
seventeen | -0.033 |
years | -0.033 |
hy | -0.033 |
gust | -0.033 |
Token | lead |
Token ID | 1085 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
ate | +0.014 |
his | +0.012 |
things | +0.011 |
other | +0.011 |
| +0.010 |
Neg logit contributions | |
years | -0.029 |
ited | -0.028 |
seventeen | -0.028 |
gust | -0.027 |
hy | -0.027 |
Token | to |
Token ID | 284 |
Feature activation | -5.09e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.003 |
Neg logit contributions | |
hy | -0.008 |
ited | -0.008 |
years | -0.008 |
seventeen | -0.008 |
gust | -0.008 |
Token | misunderstanding |
Token ID | 29789 |
Feature activation | -5.96e-03 |
Pos logit contributions | |
ited | +0.012 |
seventeen | +0.012 |
hy | +0.012 |
years | +0.012 |
gust | +0.012 |
Neg logit contributions | |
ate | -0.006 |
his | -0.005 |
things | -0.005 |
other | -0.005 |
." | -0.004 |
Token | kind |
Token ID | 1611 |
Feature activation | +2.81e-03 |
Pos logit contributions | |
ate | +0.008 |
his | +0.007 |
things | +0.006 |
other | +0.006 |
." | +0.005 |
Neg logit contributions | |
ited | -0.013 |
seventeen | -0.013 |
hy | -0.013 |
years | -0.013 |
gust | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +8.10e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
hy | -0.007 |
years | -0.007 |
gust | -0.007 |
Token | thoughtful |
Token ID | 22677 |
Feature activation | +5.88e-03 |
Pos logit contributions | |
ate | +0.011 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
your | +0.008 |
Neg logit contributions | |
ited | -0.020 |
hy | -0.019 |
seventeen | -0.019 |
aney | -0.019 |
gust | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | -2.03e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.002 |
Neg logit contributions | |
ited | -0.016 |
seventeen | -0.016 |
hy | -0.016 |
years | -0.016 |
gust | -0.016 |
Token | Ign |
Token ID | 16583 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
seventeen | +0.004 |
years | +0.004 |
hy | +0.004 |
gust | +0.003 |
ous | +0.003 |
Neg logit contributions | |
ate | -0.003 |
things | -0.003 |
his | -0.003 |
gear | -0.003 |
other | -0.003 |
Token | or |
Token ID | 273 |
Feature activation | +5.68e-02 |
Pos logit contributions | |
ate | +0.012 |
things | +0.010 |
his | +0.010 |
." | +0.009 |
other | +0.009 |
Neg logit contributions | |
seventeen | -0.012 |
gust | -0.011 |
hy | -0.011 |
years | -0.011 |
ited | -0.011 |
Token | ance |
Token ID | 590 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
ate | +0.101 |
his | +0.085 |
things | +0.083 |
other | +0.077 |
." | +0.073 |
Neg logit contributions | |
ited | -0.102 |
seventeen | -0.101 |
hy | -0.100 |
years | -0.100 |
gust | -0.099 |
Token | never |
Token ID | 1239 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.012 |
things | +0.012 |
other | +0.010 |
." | +0.010 |
Neg logit contributions | |
ited | -0.035 |
seventeen | -0.035 |
years | -0.035 |
hy | -0.035 |
gust | -0.035 |
Token | leads |
Token ID | 5983 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
ate | +0.018 |
his | +0.018 |
things | +0.017 |
other | +0.016 |
." | +0.015 |
Neg logit contributions | |
years | -0.036 |
seventeen | -0.036 |
ited | -0.035 |
hy | -0.034 |
gust | -0.034 |
Token | to |
Token ID | 284 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
ate | +0.030 |
his | +0.024 |
things | +0.023 |
other | +0.020 |
." | +0.019 |
Neg logit contributions | |
ited | -0.062 |
seventeen | -0.062 |
hy | -0.061 |
years | -0.061 |
gust | -0.060 |
Token | kindness |
Token ID | 23887 |
Feature activation | -7.69e-03 |
Pos logit contributions | |
ited | +0.007 |
seventeen | +0.007 |
hy | +0.007 |
years | +0.007 |
gust | +0.007 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
." | -0.002 |
Token | away |
Token ID | 1497 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
ited | +0.022 |
seventeen | +0.022 |
hy | +0.022 |
years | +0.022 |
gust | +0.022 |
Neg logit contributions | |
ate | -0.011 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
gear | -0.006 |
Token | from |
Token ID | 422 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
ate | +0.031 |
his | +0.022 |
things | +0.021 |
other | +0.018 |
gear | +0.017 |
Neg logit contributions | |
ited | -0.066 |
seventeen | -0.066 |
hy | -0.066 |
years | -0.066 |
gust | -0.065 |
Token | home |
Token ID | 1363 |
Feature activation | +2.53e-02 |
Pos logit contributions | |
ate | +0.015 |
his | +0.012 |
things | +0.012 |
other | +0.010 |
." | +0.009 |
Neg logit contributions | |
ited | -0.029 |
seventeen | -0.029 |
hy | -0.029 |
years | -0.028 |
gust | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | +5.01e-03 |
Pos logit contributions | |
ate | +0.027 |
his | +0.019 |
things | +0.017 |
other | +0.015 |
gear | +0.015 |
Neg logit contributions | |
years | -0.062 |
hy | -0.061 |
ited | -0.061 |
seventeen | -0.061 |
gust | -0.060 |
Token | Ign |
Token ID | 16583 |
Feature activation | +7.58e-03 |
Pos logit contributions | |
ate | +0.008 |
things | +0.006 |
his | +0.006 |
gear | +0.005 |
other | +0.005 |
Neg logit contributions | |
seventeen | -0.010 |
hy | -0.010 |
years | -0.010 |
gust | -0.010 |
ous | -0.010 |
Token | or |
Token ID | 273 |
Feature activation | +5.62e-02 |
Pos logit contributions | |
ate | +0.015 |
his | +0.013 |
things | +0.013 |
other | +0.012 |
." | +0.012 |
Neg logit contributions | |
seventeen | -0.012 |
gust | -0.012 |
hy | -0.012 |
years | -0.011 |
ited | -0.011 |
Token | ance |
Token ID | 590 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
ate | +0.099 |
his | +0.083 |
things | +0.081 |
other | +0.075 |
| +0.072 |
Neg logit contributions | |
ited | -0.102 |
seventeen | -0.101 |
years | -0.100 |
hy | -0.100 |
gust | -0.098 |
Token | is |
Token ID | 318 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ate | +0.017 |
his | +0.014 |
things | +0.014 |
other | +0.012 |
." | +0.011 |
Neg logit contributions | |
ited | -0.033 |
seventeen | -0.033 |
years | -0.033 |
hy | -0.032 |
gust | -0.032 |
Token | not |
Token ID | 407 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ate | +0.018 |
his | +0.016 |
things | +0.016 |
other | +0.014 |
the | +0.013 |
Neg logit contributions | |
ited | -0.028 |
hy | -0.028 |
seventeen | -0.028 |
gust | -0.027 |
years | -0.027 |
Token | always |
Token ID | 1464 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
ate | +0.023 |
his | +0.019 |
things | +0.018 |
other | +0.017 |
." | +0.016 |
Neg logit contributions | |
ited | -0.032 |
seventeen | -0.031 |
years | -0.031 |
hy | -0.031 |
gust | -0.031 |
Token | bliss |
Token ID | 30533 |
Feature activation | -1.54e-03 |
Pos logit contributions | |
ate | +0.029 |
his | +0.023 |
things | +0.023 |
other | +0.021 |
." | +0.019 |
Neg logit contributions | |
ited | -0.041 |
seventeen | -0.041 |
hy | -0.041 |
years | -0.040 |
gust | -0.040 |
Token | sign |
Token ID | 1051 |
Feature activation | -3.55e-03 |
Pos logit contributions | |
hy | +0.011 |
seventeen | +0.011 |
gust | +0.011 |
ited | +0.011 |
years | +0.011 |
Neg logit contributions | |
ate | -0.007 |
his | -0.006 |
things | -0.005 |
gear | -0.005 |
." | -0.004 |
Token | says |
Token ID | 1139 |
Feature activation | +6.55e-04 |
Pos logit contributions | |
years | +0.011 |
ited | +0.011 |
seventeen | +0.010 |
gust | +0.010 |
hetically | +0.010 |
Neg logit contributions | |
ate | -0.003 |
things | -0.002 |
his | -0.002 |
other | -0.002 |
| -0.002 |
Token | : |
Token ID | 25 |
Feature activation | +2.81e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
| +0.001 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
years | -0.001 |
hy | -0.001 |
gust | -0.001 |
Token | " |
Token ID | 366 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.006 |
hy | -0.006 |
years | -0.006 |
gust | -0.006 |
ited | -0.006 |
Token | Circ |
Token ID | 31560 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
ate | +0.002 |
his | +0.002 |
things | +0.002 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.002 |
years | -0.002 |
hy | -0.002 |
gust | -0.002 |
Token | us |
Token ID | 385 |
Feature activation | +5.49e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.013 |
things | +0.013 |
other | +0.012 |
| +0.011 |
Neg logit contributions | |
ited | -0.021 |
years | -0.021 |
seventeen | -0.021 |
hy | -0.021 |
gust | -0.020 |
Token | is |
Token ID | 318 |
Feature activation | +9.41e-03 |
Pos logit contributions | |
ate | +0.071 |
his | +0.057 |
other | +0.052 |
things | +0.051 |
gear | +0.047 |
Neg logit contributions | |
hy | -0.121 |
seventeen | -0.118 |
ous | -0.117 |
years | -0.111 |
storm | -0.109 |
Token | here |
Token ID | 994 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
ate | +0.013 |
things | +0.009 |
his | +0.009 |
other | +0.008 |
gear | +0.008 |
Neg logit contributions | |
hy | -0.021 |
seventeen | -0.021 |
years | -0.020 |
ous | -0.020 |
gust | -0.019 |
Token | ! |
Token ID | 0 |
Feature activation | +8.13e-03 |
Pos logit contributions | |
ate | +0.015 |
his | +0.010 |
things | +0.010 |
other | +0.008 |
gear | +0.008 |
Neg logit contributions | |
hy | -0.036 |
seventeen | -0.036 |
ited | -0.035 |
years | -0.034 |
gust | -0.034 |
Token | Come |
Token ID | 7911 |
Feature activation | +2.09e-04 |
Pos logit contributions | |
ate | +0.014 |
things | +0.012 |
his | +0.011 |
other | +0.011 |
friends | +0.011 |
Neg logit contributions | |
hy | -0.015 |
seventeen | -0.015 |
years | -0.014 |
thirteen | -0.014 |
ous | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +2.28e-03 |
Pos logit contributions | |
ate | +0.000 |
other | +0.000 |
things | +0.000 |
his | +0.000 |
gear | +0.000 |
Neg logit contributions | |
hy | -0.000 |
bell | -0.000 |
seventeen | -0.000 |
ous | -0.000 |
years | -0.000 |
Token | " |
Token ID | 366 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
ited | +0.028 |
years | +0.027 |
seventeen | +0.026 |
hy | +0.026 |
gust | +0.026 |
Neg logit contributions | |
ate | -0.007 |
his | -0.007 |
| -0.005 |
things | -0.005 |
." | -0.005 |
Token | You |
Token ID | 1639 |
Feature activation | +2.72e-04 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.004 |
gear | +0.003 |
Neg logit contributions | |
ited | -0.006 |
seventeen | -0.006 |
years | -0.006 |
hy | -0.006 |
gust | -0.006 |
Token | are |
Token ID | 389 |
Feature activation | -5.18e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.000 |
things | +0.000 |
other | +0.000 |
gear | +0.000 |
Neg logit contributions | |
ited | -0.000 |
seventeen | -0.000 |
hy | -0.000 |
years | -0.000 |
gust | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | +4.55e-03 |
Pos logit contributions | |
hy | +0.012 |
seventeen | +0.012 |
years | +0.012 |
gust | +0.012 |
ited | +0.011 |
Neg logit contributions | |
ate | -0.007 |
things | -0.005 |
his | -0.005 |
gear | -0.004 |
other | -0.004 |
Token | good |
Token ID | 922 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
ate | +0.007 |
his | +0.005 |
things | +0.005 |
| +0.004 |
gear | +0.004 |
Neg logit contributions | |
seventeen | -0.010 |
gust | -0.010 |
hy | -0.010 |
ited | -0.009 |
years | -0.009 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.46e-02 |
Pos logit contributions | |
ate | +0.024 |
his | +0.017 |
things | +0.016 |
other | +0.014 |
| +0.013 |
Neg logit contributions | |
gust | -0.044 |
hy | -0.044 |
ited | -0.044 |
seventeen | -0.043 |
years | -0.043 |
Token | , |
Token ID | 11 |
Feature activation | +8.21e-03 |
Pos logit contributions | |
ate | +0.060 |
his | +0.045 |
things | +0.043 |
other | +0.037 |
." | +0.034 |
Neg logit contributions | |
ited | -0.136 |
seventeen | -0.135 |
years | -0.134 |
hy | -0.134 |
gust | -0.132 |
Token | Mia |
Token ID | 32189 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
ate | +0.013 |
his | +0.010 |
things | +0.010 |
other | +0.009 |
gear | +0.008 |
Neg logit contributions | |
seventeen | -0.017 |
ited | -0.017 |
gust | -0.017 |
hy | -0.017 |
years | -0.017 |
Token | ! |
Token ID | 0 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ate | +0.022 |
things | +0.015 |
his | +0.014 |
other | +0.013 |
gear | +0.012 |
Neg logit contributions | |
ited | -0.037 |
hy | -0.037 |
seventeen | -0.036 |
gust | -0.035 |
anne | -0.035 |
Token | That |
Token ID | 1320 |
Feature activation | -8.73e-03 |
Pos logit contributions | |
hy | +0.020 |
seventeen | +0.019 |
years | +0.019 |
gust | +0.018 |
ous | +0.018 |
Neg logit contributions | |
ate | -0.020 |
things | -0.016 |
his | -0.016 |
other | -0.015 |
gear | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
ited | +0.022 |
seventeen | +0.022 |
hy | +0.022 |
gust | +0.021 |
years | +0.021 |
Neg logit contributions | |
ate | -0.009 |
his | -0.007 |
things | -0.006 |
other | -0.005 |
." | -0.005 |
Token | ron |
Token ID | 1313 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ate | +0.031 |
things | +0.027 |
his | +0.027 |
." | +0.024 |
other | +0.023 |
Neg logit contributions | |
ited | -0.041 |
gust | -0.041 |
years | -0.041 |
seventeen | -0.040 |
hy | -0.039 |
Token | and |
Token ID | 290 |
Feature activation | +3.43e-03 |
Pos logit contributions | |
ate | +0.017 |
his | +0.013 |
things | +0.013 |
other | +0.011 |
." | +0.010 |
Neg logit contributions | |
seventeen | -0.043 |
ited | -0.043 |
gust | -0.043 |
years | -0.042 |
hy | -0.042 |
Token | vanilla |
Token ID | 16858 |
Feature activation | -2.58e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.004 |
things | +0.004 |
other | +0.004 |
friends | +0.003 |
Neg logit contributions | |
ited | -0.008 |
years | -0.008 |
hy | -0.008 |
seventeen | -0.008 |
gust | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
seventeen | +0.006 |
ited | +0.006 |
hy | +0.006 |
years | +0.006 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
other | -0.001 |
gear | -0.001 |
Token | lic |
Token ID | 3476 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
ate | +0.016 |
his | +0.014 |
things | +0.013 |
other | +0.012 |
." | +0.011 |
Neg logit contributions | |
ited | -0.028 |
years | -0.027 |
hy | -0.027 |
gust | -0.027 |
seventeen | -0.027 |
Token | or |
Token ID | 273 |
Feature activation | +5.46e-02 |
Pos logit contributions | |
ate | +0.012 |
his | +0.010 |
things | +0.010 |
other | +0.009 |
." | +0.008 |
Neg logit contributions | |
ited | -0.015 |
seventeen | -0.015 |
hy | -0.015 |
gust | -0.015 |
years | -0.015 |
Token | ice |
Token ID | 501 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
ate | +0.090 |
his | +0.074 |
things | +0.073 |
other | +0.067 |
gear | +0.063 |
Neg logit contributions | |
ited | -0.105 |
seventeen | -0.104 |
hy | -0.103 |
years | -0.103 |
gust | -0.101 |
Token | and |
Token ID | 290 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
ate | +0.031 |
his | +0.023 |
things | +0.022 |
other | +0.019 |
." | +0.017 |
Neg logit contributions | |
ited | -0.074 |
seventeen | -0.073 |
years | -0.073 |
hy | -0.073 |
gust | -0.072 |
Token | star |
Token ID | 3491 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
ate | +0.026 |
his | +0.023 |
things | +0.022 |
other | +0.020 |
." | +0.018 |
Neg logit contributions | |
ited | -0.043 |
years | -0.041 |
gust | -0.041 |
hy | -0.041 |
seventeen | -0.040 |
Token | an |
Token ID | 281 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
ate | +0.018 |
his | +0.015 |
things | +0.015 |
other | +0.013 |
." | +0.012 |
Neg logit contributions | |
ited | -0.031 |
seventeen | -0.030 |
gust | -0.030 |
years | -0.030 |
hy | -0.030 |
Token | ise |
Token ID | 786 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
ate | +0.023 |
his | +0.019 |
things | +0.019 |
other | +0.018 |
." | +0.018 |
Neg logit contributions | |
gust | -0.028 |
ited | -0.028 |
seventeen | -0.027 |
hy | -0.027 |
years | -0.027 |
Token | sign |
Token ID | 1051 |
Feature activation | +1.12e-03 |
Pos logit contributions | |
ate | +0.010 |
things | +0.008 |
his | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
ited | -0.018 |
years | -0.018 |
hy | -0.017 |
seventeen | -0.017 |
gust | -0.017 |
Token | that |
Token ID | 326 |
Feature activation | +2.86e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
." | +0.001 |
other | +0.001 |
Neg logit contributions | |
ited | -0.003 |
years | -0.003 |
gust | -0.003 |
seventeen | -0.003 |
hetically | -0.003 |
Token | says |
Token ID | 1139 |
Feature activation | -2.97e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.006 |
hy | -0.006 |
ited | -0.006 |
gust | -0.006 |
years | -0.006 |
Token | " |
Token ID | 366 |
Feature activation | +4.78e-03 |
Pos logit contributions | |
seventeen | +0.007 |
hy | +0.007 |
gust | +0.007 |
ited | +0.007 |
years | +0.007 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.002 |
gear | -0.002 |
Token | Circ |
Token ID | 31560 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ate | +0.008 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
ited | -0.009 |
seventeen | -0.009 |
hy | -0.009 |
years | -0.009 |
gust | -0.009 |
Token | us |
Token ID | 385 |
Feature activation | +5.45e-02 |
Pos logit contributions | |
ate | +0.021 |
his | +0.018 |
things | +0.017 |
other | +0.016 |
| +0.015 |
Neg logit contributions | |
ited | -0.024 |
years | -0.024 |
seventeen | -0.024 |
hy | -0.024 |
gust | -0.023 |
Token | ". |
Token ID | 1911 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
ate | +0.061 |
his | +0.048 |
things | +0.041 |
gear | +0.040 |
other | +0.040 |
Neg logit contributions | |
hy | -0.129 |
seventeen | -0.128 |
ous | -0.126 |
years | -0.123 |
ho | -0.119 |
Token | Lily |
Token ID | 20037 |
Feature activation | +7.54e-03 |
Pos logit contributions | |
ate | +0.019 |
things | +0.014 |
his | +0.013 |
gear | +0.013 |
other | +0.013 |
Neg logit contributions | |
gust | -0.022 |
hy | -0.022 |
seventeen | -0.021 |
aney | -0.021 |
oled | -0.020 |
Token | and |
Token ID | 290 |
Feature activation | -6.23e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
place | +0.007 |
Neg logit contributions | |
ited | -0.014 |
seventeen | -0.014 |
anne | -0.014 |
hy | -0.014 |
bell | -0.014 |
Token | Tom |
Token ID | 4186 |
Feature activation | -5.31e-03 |
Pos logit contributions | |
hy | +0.011 |
gust | +0.011 |
seventeen | +0.010 |
ited | +0.009 |
hetically | +0.009 |
Neg logit contributions | |
ate | -0.012 |
emo | -0.009 |
place | -0.009 |
." | -0.008 |
things | -0.008 |
Token | are |
Token ID | 389 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
years | +0.011 |
seventeen | +0.011 |
gust | +0.010 |
ited | +0.010 |
hy | +0.010 |
Neg logit contributions | |
ate | -0.008 |
his | -0.007 |
things | -0.007 |
other | -0.007 |
." | -0.006 |
Token | sign |
Token ID | 1051 |
Feature activation | +5.19e-03 |
Pos logit contributions | |
ate | +0.021 |
things | +0.017 |
his | +0.017 |
other | +0.015 |
gear | +0.014 |
Neg logit contributions | |
ited | -0.041 |
years | -0.041 |
seventeen | -0.039 |
hy | -0.039 |
gust | -0.038 |
Token | that |
Token ID | 326 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
ate | +0.005 |
things | +0.004 |
his | +0.004 |
| +0.004 |
other | +0.003 |
Neg logit contributions | |
ited | -0.015 |
years | -0.014 |
gust | -0.013 |
seventeen | -0.013 |
hetically | -0.013 |
Token | said |
Token ID | 531 |
Feature activation | -5.97e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.008 |
things | +0.007 |
other | +0.007 |
gear | +0.006 |
Neg logit contributions | |
hy | -0.011 |
seventeen | -0.011 |
ited | -0.011 |
gust | -0.011 |
years | -0.011 |
Token | " |
Token ID | 366 |
Feature activation | +3.85e-03 |
Pos logit contributions | |
ited | +0.014 |
seventeen | +0.014 |
hy | +0.014 |
years | +0.014 |
gust | +0.014 |
Neg logit contributions | |
ate | -0.007 |
his | -0.005 |
things | -0.005 |
other | -0.005 |
." | -0.004 |
Token | Circ |
Token ID | 31560 |
Feature activation | +9.83e-03 |
Pos logit contributions | |
ate | +0.007 |
his | +0.006 |
things | +0.005 |
other | +0.005 |
| +0.005 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
years | -0.007 |
hy | -0.007 |
gust | -0.007 |
Token | us |
Token ID | 385 |
Feature activation | +5.44e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.013 |
things | +0.012 |
other | +0.012 |
| +0.011 |
Neg logit contributions | |
ited | -0.019 |
years | -0.019 |
seventeen | -0.019 |
hy | -0.019 |
ous | -0.018 |
Token | ". |
Token ID | 1911 |
Feature activation | +9.24e-03 |
Pos logit contributions | |
ate | +0.063 |
his | +0.050 |
other | +0.045 |
things | +0.044 |
gear | +0.040 |
Neg logit contributions | |
ous | -0.126 |
hy | -0.125 |
seventeen | -0.125 |
years | -0.117 |
storm | -0.116 |
Token | Mom |
Token ID | 11254 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
ate | +0.013 |
things | +0.010 |
his | +0.009 |
gear | +0.009 |
other | +0.009 |
Neg logit contributions | |
seventeen | -0.019 |
hy | -0.019 |
gust | -0.019 |
aney | -0.019 |
ited | -0.019 |
Token | bought |
Token ID | 5839 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
ate | +0.019 |
his | +0.015 |
things | +0.014 |
| +0.013 |
other | +0.013 |
Neg logit contributions | |
ited | -0.029 |
gust | -0.029 |
seventeen | -0.029 |
hy | -0.029 |
years | -0.029 |
Token | tickets |
Token ID | 8587 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
ate | +0.012 |
his | +0.009 |
things | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
seventeen | -0.030 |
hy | -0.030 |
years | -0.029 |
ited | -0.029 |
gust | -0.029 |
Token | for |
Token ID | 329 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.008 |
seventeen | -0.008 |
years | -0.008 |
gust | -0.008 |
hy | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | +1.81e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.006 |
things | +0.006 |
other | +0.005 |
." | +0.004 |
Neg logit contributions | |
ited | -0.030 |
seventeen | -0.030 |
hy | -0.030 |
years | -0.030 |
gust | -0.030 |
Token | underneath |
Token ID | 14638 |
Feature activation | +6.31e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.002 |
things | +0.001 |
other | +0.001 |
the | +0.001 |
Neg logit contributions | |
seventeen | -0.005 |
gust | -0.005 |
years | -0.005 |
ited | -0.005 |
hy | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
| +0.002 |
Neg logit contributions | |
ited | -0.019 |
seventeen | -0.019 |
years | -0.018 |
hy | -0.018 |
gust | -0.018 |
Token | snow |
Token ID | 6729 |
Feature activation | +7.17e-03 |
Pos logit contributions | |
ate | +0.014 |
his | +0.012 |
things | +0.012 |
other | +0.011 |
gear | +0.010 |
Neg logit contributions | |
years | -0.029 |
ited | -0.029 |
seventeen | -0.028 |
hy | -0.028 |
gust | -0.027 |
Token | - |
Token ID | 12 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
ate | +0.009 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
ited | -0.016 |
seventeen | -0.016 |
years | -0.016 |
hy | -0.016 |
gust | -0.016 |
Token | covered |
Token ID | 32111 |
Feature activation | +5.44e-02 |
Pos logit contributions | |
ate | +0.040 |
his | +0.035 |
things | +0.035 |
other | +0.033 |
gear | +0.031 |
Neg logit contributions | |
ited | -0.021 |
seventeen | -0.021 |
hy | -0.021 |
years | -0.021 |
gust | -0.020 |
Token | bush |
Token ID | 24484 |
Feature activation | +2.78e-03 |
Pos logit contributions | |
ate | +0.071 |
his | +0.055 |
things | +0.054 |
other | +0.048 |
." | +0.044 |
Neg logit contributions | |
ited | -0.124 |
seventeen | -0.123 |
hy | -0.122 |
years | -0.122 |
gust | -0.121 |
Token | . |
Token ID | 13 |
Feature activation | +3.77e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
. | +0.000 |
and | +0.000 |
." | +0.000 |
Neg logit contributions | |
years | -0.009 |
seventeen | -0.009 |
ited | -0.009 |
gust | -0.009 |
hy | -0.009 |
Token | The |
Token ID | 383 |
Feature activation | -5.28e-03 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.005 |
other | +0.005 |
| +0.004 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
hy | -0.007 |
years | -0.007 |
gust | -0.007 |
Token | basket |
Token ID | 7988 |
Feature activation | -8.10e-03 |
Pos logit contributions | |
years | +0.014 |
ited | +0.014 |
seventeen | +0.014 |
hy | +0.014 |
gust | +0.014 |
Neg logit contributions | |
ate | -0.005 |
things | -0.004 |
his | -0.004 |
other | -0.003 |
gear | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | -4.76e-03 |
Pos logit contributions | |
years | +0.023 |
seventeen | +0.023 |
ited | +0.023 |
gust | +0.022 |
hy | +0.022 |
Neg logit contributions | |
ate | -0.006 |
his | -0.006 |
and | -0.005 |
other | -0.004 |
things | -0.004 |
Token | person |
Token ID | 1048 |
Feature activation | -4.81e-03 |
Pos logit contributions | |
years | +0.020 |
seventeen | +0.020 |
ited | +0.020 |
gust | +0.019 |
oled | +0.019 |
Neg logit contributions | |
ate | -0.010 |
things | -0.010 |
his | -0.009 |
other | -0.008 |
place | -0.008 |
Token | 's |
Token ID | 338 |
Feature activation | +4.80e-04 |
Pos logit contributions | |
seventeen | +0.012 |
gust | +0.011 |
ited | +0.011 |
years | +0.011 |
storm | +0.010 |
Neg logit contributions | |
ate | -0.006 |
his | -0.006 |
things | -0.005 |
other | -0.005 |
the | -0.005 |
Token | words |
Token ID | 2456 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
ate | +0.001 |
things | +0.001 |
his | +0.001 |
other | +0.001 |
friends | +0.000 |
Neg logit contributions | |
seventeen | -0.001 |
ited | -0.001 |
years | -0.001 |
gust | -0.001 |
storm | -0.001 |
Token | - |
Token ID | 532 |
Feature activation | -3.89e-03 |
Pos logit contributions | |
seventeen | +0.050 |
ited | +0.049 |
years | +0.049 |
gust | +0.048 |
hy | +0.046 |
Neg logit contributions | |
ate | -0.015 |
his | -0.014 |
things | -0.011 |
other | -0.010 |
the | -0.010 |
Token | " |
Token ID | 366 |
Feature activation | +7.79e-04 |
Pos logit contributions | |
ited | +0.009 |
seventeen | +0.009 |
years | +0.009 |
gust | +0.009 |
hy | +0.009 |
Neg logit contributions | |
ate | -0.005 |
his | -0.005 |
things | -0.004 |
other | -0.004 |
| -0.004 |
Token | im |
Token ID | 320 |
Feature activation | +5.40e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
| +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.002 |
hy | -0.002 |
gust | -0.002 |
years | -0.002 |
Token | agine |
Token ID | 12756 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
ate | +0.094 |
his | +0.078 |
things | +0.077 |
other | +0.071 |
." | +0.067 |
Neg logit contributions | |
ited | -0.100 |
seventeen | -0.099 |
hy | -0.098 |
years | -0.098 |
gust | -0.098 |
Token | ". |
Token ID | 1911 |
Feature activation | +8.85e-03 |
Pos logit contributions | |
ate | +0.024 |
his | +0.019 |
things | +0.019 |
other | +0.016 |
." | +0.016 |
Neg logit contributions | |
ited | -0.045 |
seventeen | -0.044 |
gust | -0.044 |
years | -0.044 |
hy | -0.043 |
Token | |
Token ID | 220 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
ate | +0.011 |
things | +0.008 |
his | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
hy | -0.021 |
years | -0.020 |
ited | -0.020 |
seventeen | -0.020 |
gust | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
hy | +0.050 |
seventeen | +0.049 |
ous | +0.048 |
aney | +0.048 |
anne | +0.048 |
Neg logit contributions | |
ate | -0.015 |
things | -0.013 |
his | -0.011 |
gear | -0.010 |
other | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +5.12e-03 |
Pos logit contributions | |
ate | +0.004 |
things | +0.003 |
his | +0.002 |
gear | +0.002 |
other | +0.002 |
Neg logit contributions | |
years | -0.015 |
seventeen | -0.015 |
hy | -0.015 |
ited | -0.015 |
gust | -0.015 |
Token | chooses |
Token ID | 19769 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.004 |
seventeen | -0.004 |
hy | -0.004 |
years | -0.004 |
gust | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | -4.05e-03 |
Pos logit contributions | |
hy | +0.027 |
seventeen | +0.027 |
years | +0.026 |
ited | +0.026 |
gust | +0.026 |
Neg logit contributions | |
ate | -0.010 |
things | -0.006 |
his | -0.005 |
." | -0.004 |
other | -0.004 |
Token | word |
Token ID | 1573 |
Feature activation | -8.12e-03 |
Pos logit contributions | |
seventeen | +0.009 |
ited | +0.009 |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
." | -0.003 |
Token | " |
Token ID | 366 |
Feature activation | -4.87e-04 |
Pos logit contributions | |
ited | +0.021 |
seventeen | +0.020 |
years | +0.020 |
gust | +0.020 |
hy | +0.020 |
Neg logit contributions | |
ate | -0.009 |
his | -0.007 |
things | -0.006 |
other | -0.006 |
." | -0.005 |
Token | ign |
Token ID | 570 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
ited | +0.001 |
seventeen | +0.001 |
years | +0.001 |
hy | +0.001 |
gust | +0.001 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | or |
Token ID | 273 |
Feature activation | +5.37e-02 |
Pos logit contributions | |
ate | +0.042 |
his | +0.035 |
things | +0.034 |
other | +0.031 |
gear | +0.030 |
Neg logit contributions | |
ited | -0.043 |
seventeen | -0.041 |
years | -0.041 |
hy | -0.041 |
gust | -0.040 |
Token | ant |
Token ID | 415 |
Feature activation | +4.68e-02 |
Pos logit contributions | |
ate | +0.085 |
his | +0.069 |
things | +0.067 |
gear | +0.065 |
place | +0.063 |
Neg logit contributions | |
seventeen | -0.101 |
hy | -0.101 |
years | -0.099 |
ous | -0.098 |
ited | -0.097 |
Token | " |
Token ID | 1 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
ate | +0.058 |
his | +0.042 |
things | +0.039 |
gear | +0.036 |
place | +0.033 |
Neg logit contributions | |
hy | -0.108 |
seventeen | -0.107 |
ited | -0.106 |
years | -0.105 |
ous | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
ate | +0.030 |
his | +0.023 |
things | +0.023 |
gear | +0.021 |
our | +0.020 |
Neg logit contributions | |
hy | -0.042 |
years | -0.041 |
ited | -0.041 |
seventeen | -0.040 |
gust | -0.040 |
Token | the |
Token ID | 262 |
Feature activation | +1.58e-02 |
Pos logit contributions | |
ate | +0.031 |
his | +0.025 |
things | +0.025 |
other | +0.022 |
." | +0.021 |
Neg logit contributions | |
ited | -0.050 |
years | -0.049 |
seventeen | -0.049 |
hy | -0.049 |
gust | -0.048 |
Token | number |
Token ID | 1271 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
ate | +0.020 |
his | +0.015 |
things | +0.015 |
other | +0.013 |
." | +0.012 |
Neg logit contributions | |
ited | -0.037 |
seventeen | -0.037 |
years | -0.037 |
hy | -0.037 |
gust | -0.036 |
Token | " |
Token ID | 1 |
Feature activation | +1.55e-03 |
Pos logit contributions | |
ate | +0.001 |
things | +0.000 |
his | +0.000 |
other | +0.000 |
gear | +0.000 |
Neg logit contributions | |
seventeen | -0.001 |
ited | -0.001 |
years | -0.001 |
hy | -0.001 |
gust | -0.001 |
Token | You |
Token ID | 1639 |
Feature activation | -1.18e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.003 |
seventeen | -0.003 |
hy | -0.003 |
years | -0.003 |
gust | -0.003 |
Token | are |
Token ID | 389 |
Feature activation | -8.38e-03 |
Pos logit contributions | |
ited | +0.002 |
hy | +0.002 |
seventeen | +0.002 |
years | +0.002 |
gust | +0.002 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
gear | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +2.03e-03 |
Pos logit contributions | |
hy | +0.017 |
years | +0.017 |
seventeen | +0.017 |
gust | +0.017 |
thirteen | +0.016 |
Neg logit contributions | |
ate | -0.013 |
things | -0.009 |
gear | -0.009 |
his | -0.009 |
other | -0.008 |
Token | good |
Token ID | 922 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
himself | +0.002 |
gear | +0.002 |
Neg logit contributions | |
gust | -0.004 |
seventeen | -0.004 |
hy | -0.004 |
years | -0.004 |
ited | -0.004 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.37e-02 |
Pos logit contributions | |
ate | +0.022 |
his | +0.017 |
things | +0.015 |
other | +0.013 |
| +0.013 |
Neg logit contributions | |
gust | -0.042 |
hy | -0.041 |
ited | -0.040 |
seventeen | -0.040 |
ous | -0.039 |
Token | , |
Token ID | 11 |
Feature activation | +7.64e-03 |
Pos logit contributions | |
ate | +0.042 |
his | +0.033 |
things | +0.032 |
." | +0.029 |
other | +0.024 |
Neg logit contributions | |
years | -0.149 |
ited | -0.149 |
seventeen | -0.147 |
hy | -0.144 |
gust | -0.142 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.81e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.007 |
Neg logit contributions | |
ited | -0.017 |
seventeen | -0.017 |
years | -0.017 |
hy | -0.017 |
gust | -0.017 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.15e-03 |
Pos logit contributions | |
ate | +0.008 |
his | +0.006 |
things | +0.006 |
other | +0.006 |
gear | +0.005 |
Neg logit contributions | |
ited | -0.012 |
hy | -0.012 |
seventeen | -0.012 |
gust | -0.012 |
years | -0.011 |
Token | she |
Token ID | 673 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
| +0.003 |
other | +0.003 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.004 |
years | -0.004 |
hy | -0.004 |
ous | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
ited | +0.024 |
hy | +0.024 |
seventeen | +0.024 |
gust | +0.024 |
years | +0.023 |
Neg logit contributions | |
ate | -0.020 |
things | -0.016 |
his | -0.016 |
other | -0.014 |
gear | -0.013 |
Token | put |
Token ID | 1234 |
Feature activation | +8.26e-03 |
Pos logit contributions | |
hy | +0.001 |
ited | +0.001 |
seventeen | +0.001 |
gust | +0.001 |
years | +0.001 |
Neg logit contributions | |
ate | -0.001 |
things | -0.001 |
his | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
ate | +0.010 |
his | +0.006 |
emo | +0.006 |
other | +0.006 |
| +0.006 |
Neg logit contributions | |
seventeen | -0.018 |
years | -0.017 |
gust | -0.017 |
hy | -0.017 |
ited | -0.017 |
Token | down |
Token ID | 866 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
seventeen | +0.058 |
ited | +0.058 |
gust | +0.057 |
hy | +0.057 |
years | +0.057 |
Neg logit contributions | |
ate | -0.031 |
his | -0.026 |
things | -0.025 |
other | -0.022 |
." | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | -3.73e-04 |
Pos logit contributions | |
ited | +0.030 |
seventeen | +0.030 |
years | +0.030 |
hy | +0.030 |
gust | +0.029 |
Neg logit contributions | |
ate | -0.012 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
gear | -0.006 |
Token | Ign |
Token ID | 16583 |
Feature activation | +5.66e-03 |
Pos logit contributions | |
years | +0.001 |
seventeen | +0.001 |
hy | +0.001 |
gust | +0.001 |
thirteen | +0.001 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.000 |
gear | -0.000 |
Token | or |
Token ID | 273 |
Feature activation | +5.26e-02 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.007 |
Neg logit contributions | |
seventeen | -0.011 |
hy | -0.010 |
gust | -0.010 |
ited | -0.010 |
years | -0.010 |
Token | ant |
Token ID | 415 |
Feature activation | +3.94e-02 |
Pos logit contributions | |
ate | +0.091 |
his | +0.076 |
things | +0.074 |
other | +0.069 |
place | +0.067 |
Neg logit contributions | |
years | -0.093 |
ited | -0.093 |
hy | -0.092 |
seventeen | -0.091 |
ous | -0.089 |
Token | children |
Token ID | 1751 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
ate | +0.053 |
his | +0.040 |
things | +0.036 |
gear | +0.032 |
other | +0.032 |
Neg logit contributions | |
hy | -0.088 |
ited | -0.086 |
seventeen | -0.085 |
years | -0.085 |
gust | -0.084 |
Token | like |
Token ID | 588 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
ate | +0.029 |
things | +0.024 |
his | +0.024 |
." | +0.022 |
other | +0.022 |
Neg logit contributions | |
seventeen | -0.055 |
gust | -0.054 |
ited | -0.053 |
years | -0.053 |
hy | -0.052 |
Token | you |
Token ID | 345 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
ited | +0.013 |
seventeen | +0.013 |
hy | +0.013 |
years | +0.013 |
gust | +0.013 |
Neg logit contributions | |
ate | -0.007 |
his | -0.005 |
things | -0.005 |
other | -0.005 |
gear | -0.004 |
Token | don |
Token ID | 836 |
Feature activation | -2.84e-03 |
Pos logit contributions | |
seventeen | +0.044 |
ited | +0.044 |
years | +0.043 |
gust | +0.043 |
hy | +0.043 |
Neg logit contributions | |
ate | -0.022 |
his | -0.017 |
things | -0.017 |
other | -0.015 |
." | -0.014 |
Token | " |
Token ID | 366 |
Feature activation | +8.55e-04 |
Pos logit contributions | |
ited | +0.019 |
seventeen | +0.018 |
hy | +0.018 |
years | +0.018 |
gust | +0.018 |
Neg logit contributions | |
ate | -0.008 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
| -0.005 |
Token | You |
Token ID | 1639 |
Feature activation | +3.53e-04 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.002 |
years | -0.002 |
hy | -0.002 |
gust | -0.002 |
Token | are |
Token ID | 389 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.000 |
gear | +0.000 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | very |
Token ID | 845 |
Feature activation | -1.47e-03 |
Pos logit contributions | |
seventeen | +0.015 |
hy | +0.015 |
years | +0.015 |
thirteen | +0.014 |
gust | +0.014 |
Neg logit contributions | |
ate | -0.011 |
things | -0.008 |
gear | -0.008 |
his | -0.008 |
emo | -0.007 |
Token | good |
Token ID | 922 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
ited | +0.003 |
seventeen | +0.003 |
years | +0.003 |
hy | +0.003 |
gust | +0.003 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.001 |
gear | -0.001 |
Token | chefs |
Token ID | 36236 |
Feature activation | +5.21e-02 |
Pos logit contributions | |
ate | +0.029 |
his | +0.022 |
things | +0.021 |
other | +0.019 |
gear | +0.018 |
Neg logit contributions | |
ited | -0.051 |
years | -0.051 |
hy | -0.050 |
seventeen | -0.050 |
gust | -0.050 |
Token | indeed |
Token ID | 5600 |
Feature activation | +9.85e-03 |
Pos logit contributions | |
ate | +0.060 |
his | +0.042 |
things | +0.040 |
other | +0.036 |
gear | +0.034 |
Neg logit contributions | |
hy | -0.124 |
ited | -0.121 |
seventeen | -0.121 |
years | -0.121 |
ous | -0.118 |
Token | . |
Token ID | 13 |
Feature activation | -7.47e-03 |
Pos logit contributions | |
ate | +0.012 |
his | +0.009 |
other | +0.008 |
gear | +0.008 |
things | +0.008 |
Neg logit contributions | |
seventeen | -0.022 |
ous | -0.021 |
hy | -0.021 |
ited | -0.021 |
years | -0.021 |
Token | And |
Token ID | 843 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
hy | +0.013 |
seventeen | +0.013 |
years | +0.013 |
thirteen | +0.012 |
ago | +0.012 |
Neg logit contributions | |
ate | -0.013 |
things | -0.011 |
his | -0.011 |
gear | -0.010 |
other | -0.010 |
Token | very |
Token ID | 845 |
Feature activation | +6.39e-03 |
Pos logit contributions | |
ited | +0.025 |
seventeen | +0.024 |
hy | +0.024 |
gust | +0.024 |
years | +0.024 |
Neg logit contributions | |
ate | -0.013 |
his | -0.010 |
things | -0.010 |
other | -0.009 |
." | -0.008 |
Token | good |
Token ID | 922 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
ate | +0.008 |
things | +0.006 |
his | +0.006 |
other | +0.005 |
." | +0.005 |
Neg logit contributions | |
ited | -0.016 |
hy | -0.015 |
gust | -0.015 |
storm | -0.015 |
seventeen | -0.015 |
Token | He |
Token ID | 679 |
Feature activation | +5.52e-03 |
Pos logit contributions | |
ate | +0.014 |
things | +0.010 |
his | +0.010 |
other | +0.009 |
gear | +0.008 |
Neg logit contributions | |
seventeen | -0.025 |
ited | -0.025 |
hy | -0.025 |
gust | -0.025 |
years | -0.025 |
Token | says |
Token ID | 1139 |
Feature activation | -3.01e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
seventeen | -0.011 |
ited | -0.011 |
hy | -0.011 |
years | -0.011 |
gust | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -4.60e-03 |
Pos logit contributions | |
ited | +0.008 |
years | +0.008 |
seventeen | +0.008 |
gust | +0.008 |
hy | +0.008 |
Neg logit contributions | |
ate | -0.003 |
his | -0.003 |
things | -0.002 |
other | -0.002 |
." | -0.002 |
Token | " |
Token ID | 366 |
Feature activation | +7.53e-04 |
Pos logit contributions | |
ited | +0.012 |
years | +0.012 |
hy | +0.012 |
seventeen | +0.011 |
gust | +0.011 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.003 |
other | -0.003 |
| -0.003 |
Token | Ign |
Token ID | 32916 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.001 |
years | -0.001 |
hy | -0.001 |
gust | -0.001 |
Token | or |
Token ID | 273 |
Feature activation | +5.19e-02 |
Pos logit contributions | |
ate | +0.019 |
his | +0.016 |
things | +0.015 |
other | +0.014 |
gear | +0.013 |
Neg logit contributions | |
ited | -0.019 |
seventeen | -0.019 |
years | -0.019 |
hy | -0.019 |
gust | -0.018 |
Token | ant |
Token ID | 415 |
Feature activation | +4.71e-02 |
Pos logit contributions | |
ate | +0.079 |
his | +0.063 |
things | +0.060 |
gear | +0.058 |
place | +0.058 |
Neg logit contributions | |
seventeen | -0.100 |
years | -0.099 |
ited | -0.099 |
hy | -0.098 |
ous | -0.096 |
Token | , |
Token ID | 11 |
Feature activation | +7.65e-03 |
Pos logit contributions | |
ate | +0.061 |
his | +0.045 |
gear | +0.040 |
things | +0.040 |
place | +0.037 |
Neg logit contributions | |
seventeen | -0.103 |
hy | -0.103 |
ited | -0.102 |
years | -0.101 |
ous | -0.101 |
Token | zero |
Token ID | 6632 |
Feature activation | +4.87e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.007 |
Neg logit contributions | |
ited | -0.018 |
years | -0.017 |
seventeen | -0.017 |
hy | -0.017 |
gust | -0.017 |
Token | ". |
Token ID | 1911 |
Feature activation | +7.00e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
gear | +0.003 |
Neg logit contributions | |
ited | -0.012 |
seventeen | -0.012 |
hy | -0.012 |
years | -0.012 |
gust | -0.012 |
Token | The |
Token ID | 383 |
Feature activation | -5.82e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.007 |
his | +0.007 |
gear | +0.006 |
other | +0.006 |
Neg logit contributions | |
seventeen | -0.016 |
gust | -0.015 |
ited | -0.015 |
hy | -0.015 |
years | -0.015 |
Token | singing |
Token ID | 13777 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
his | +0.003 |
things | +0.003 |
the | +0.003 |
ate | +0.002 |
friends | +0.002 |
Neg logit contributions | |
ited | -0.014 |
seventeen | -0.014 |
years | -0.013 |
hy | -0.013 |
gust | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +5.77e-03 |
Pos logit contributions | |
ited | +0.053 |
seventeen | +0.052 |
years | +0.052 |
hy | +0.050 |
gust | +0.049 |
Neg logit contributions | |
ate | -0.012 |
his | -0.011 |
things | -0.009 |
other | -0.007 |
the | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | -5.08e-04 |
Pos logit contributions | |
his | +0.009 |
the | +0.009 |
things | +0.008 |
other | +0.008 |
friends | +0.007 |
Neg logit contributions | |
ited | -0.013 |
seventeen | -0.012 |
aney | -0.012 |
hy | -0.012 |
years | -0.012 |
Token | flag |
Token ID | 6056 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
years | +0.001 |
ited | +0.001 |
seventeen | +0.001 |
hy | +0.001 |
oled | +0.001 |
Neg logit contributions | |
ate | -0.001 |
things | -0.000 |
other | -0.000 |
his | -0.000 |
friends | -0.000 |
Token | unf |
Token ID | 3684 |
Feature activation | +1.63e-03 |
Pos logit contributions | |
years | +0.030 |
seventeen | +0.028 |
ited | +0.027 |
gary | +0.026 |
gust | +0.025 |
Neg logit contributions | |
his | -0.015 |
ate | -0.015 |
other | -0.013 |
things | -0.013 |
the | -0.012 |
Token | ro |
Token ID | 305 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
." | +0.003 |
| +0.003 |
Neg logit contributions | |
ited | -0.003 |
years | -0.003 |
gust | -0.002 |
seventeen | -0.002 |
hy | -0.002 |
Token | ze |
Token ID | 2736 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
ate | +0.086 |
his | +0.072 |
things | +0.070 |
other | +0.065 |
." | +0.061 |
Neg logit contributions | |
ited | -0.099 |
seventeen | -0.098 |
years | -0.097 |
hy | -0.097 |
gust | -0.096 |
Token | . |
Token ID | 13 |
Feature activation | +6.83e-03 |
Pos logit contributions | |
ate | +0.016 |
his | +0.016 |
things | +0.015 |
other | +0.013 |
." | +0.012 |
Neg logit contributions | |
years | -0.059 |
ited | -0.059 |
seventeen | -0.057 |
hy | -0.054 |
gust | -0.054 |
Token |
|
Token ID | 198 |
Feature activation | +7.00e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.007 |
his | +0.007 |
other | +0.006 |
gear | +0.006 |
Neg logit contributions | |
gust | -0.015 |
seventeen | -0.015 |
hy | -0.015 |
years | -0.015 |
ited | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
ate | +0.005 |
things | +0.003 |
his | +0.003 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.020 |
years | -0.020 |
ited | -0.020 |
hy | -0.020 |
gust | -0.020 |
Token | The |
Token ID | 464 |
Feature activation | -3.06e-03 |
Pos logit contributions | |
ate | +0.007 |
his | +0.006 |
things | +0.005 |
other | +0.005 |
| +0.005 |
Neg logit contributions | |
ited | -0.013 |
hy | -0.013 |
seventeen | -0.013 |
gust | -0.013 |
years | -0.013 |
Token | " |
Token ID | 366 |
Feature activation | -2.81e-03 |
Pos logit contributions | |
seventeen | +0.013 |
gust | +0.013 |
hy | +0.013 |
years | +0.012 |
stretched | +0.012 |
Neg logit contributions | |
ate | -0.009 |
things | -0.007 |
his | -0.006 |
other | -0.006 |
gear | -0.006 |
Token | You |
Token ID | 1639 |
Feature activation | -2.60e-03 |
Pos logit contributions | |
seventeen | +0.006 |
ited | +0.006 |
hy | +0.005 |
years | +0.005 |
gust | +0.005 |
Neg logit contributions | |
ate | -0.004 |
things | -0.004 |
his | -0.004 |
other | -0.003 |
friends | -0.003 |
Token | are |
Token ID | 389 |
Feature activation | -8.42e-03 |
Pos logit contributions | |
ited | +0.005 |
seventeen | +0.005 |
hy | +0.005 |
years | +0.005 |
gust | +0.005 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
gear | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +8.43e-04 |
Pos logit contributions | |
years | +0.017 |
seventeen | +0.017 |
hy | +0.017 |
thirteen | +0.016 |
gust | +0.016 |
Neg logit contributions | |
ate | -0.013 |
things | -0.010 |
gear | -0.009 |
his | -0.009 |
other | -0.008 |
Token | good |
Token ID | 922 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
seventeen | -0.002 |
gust | -0.002 |
hy | -0.002 |
ited | -0.002 |
years | -0.002 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
ate | +0.020 |
his | +0.015 |
things | +0.013 |
other | +0.012 |
yourself | +0.011 |
Neg logit contributions | |
hy | -0.037 |
gust | -0.037 |
ited | -0.036 |
seventeen | -0.036 |
ous | -0.035 |
Token | and |
Token ID | 290 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ate | +0.046 |
his | +0.034 |
things | +0.032 |
other | +0.026 |
." | +0.025 |
Neg logit contributions | |
ited | -0.138 |
seventeen | -0.137 |
years | -0.137 |
hy | -0.136 |
gust | -0.134 |
Token | a |
Token ID | 257 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
ate | +0.013 |
his | +0.011 |
things | +0.010 |
other | +0.009 |
." | +0.008 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.024 |
hy | -0.023 |
gust | -0.023 |
years | -0.023 |
Token | good |
Token ID | 922 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
ate | +0.016 |
his | +0.012 |
things | +0.012 |
other | +0.010 |
." | +0.009 |
Neg logit contributions | |
ited | -0.034 |
seventeen | -0.034 |
hy | -0.033 |
years | -0.033 |
gust | -0.033 |
Token | sister |
Token ID | 6621 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
ate | +0.020 |
his | +0.014 |
things | +0.013 |
other | +0.012 |
| +0.011 |
Neg logit contributions | |
gust | -0.035 |
hy | -0.035 |
ited | -0.035 |
seventeen | -0.034 |
ous | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
ate | +0.022 |
his | +0.015 |
things | +0.014 |
other | +0.011 |
." | +0.011 |
Neg logit contributions | |
ited | -0.069 |
seventeen | -0.068 |
years | -0.068 |
gust | -0.068 |
hy | -0.067 |
Token | " |
Token ID | 366 |
Feature activation | -4.25e-03 |
Pos logit contributions | |
ited | +0.026 |
years | +0.025 |
seventeen | +0.025 |
hy | +0.025 |
gust | +0.025 |
Neg logit contributions | |
ate | -0.011 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
| -0.006 |
Token | You |
Token ID | 1639 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
ited | +0.007 |
seventeen | +0.007 |
hy | +0.007 |
years | +0.007 |
gust | +0.007 |
Neg logit contributions | |
ate | -0.008 |
things | -0.007 |
his | -0.007 |
other | -0.006 |
gear | -0.006 |
Token | are |
Token ID | 389 |
Feature activation | -8.23e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
| +0.001 |
Neg logit contributions | |
ited | -0.001 |
hy | -0.001 |
seventeen | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | -7.71e-04 |
Pos logit contributions | |
seventeen | +0.018 |
hy | +0.018 |
years | +0.018 |
gust | +0.017 |
ited | +0.017 |
Neg logit contributions | |
ate | -0.012 |
things | -0.009 |
his | -0.008 |
gear | -0.008 |
other | -0.007 |
Token | good |
Token ID | 922 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
seventeen | +0.002 |
gust | +0.002 |
hy | +0.002 |
ited | +0.002 |
years | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
| -0.001 |
other | -0.001 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.16e-02 |
Pos logit contributions | |
ate | +0.021 |
his | +0.015 |
things | +0.014 |
other | +0.013 |
| +0.013 |
Neg logit contributions | |
hy | -0.035 |
gust | -0.035 |
ited | -0.034 |
seventeen | -0.034 |
years | -0.033 |
Token | , |
Token ID | 11 |
Feature activation | +6.26e-03 |
Pos logit contributions | |
ate | +0.051 |
his | +0.038 |
things | +0.036 |
other | +0.030 |
." | +0.028 |
Neg logit contributions | |
ited | -0.134 |
seventeen | -0.133 |
years | -0.132 |
hy | -0.131 |
gust | -0.130 |
Token | Anna |
Token ID | 11735 |
Feature activation | +9.25e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.006 |
things | +0.006 |
other | +0.006 |
." | +0.005 |
Neg logit contributions | |
hy | -0.014 |
seventeen | -0.014 |
gust | -0.014 |
ited | -0.014 |
years | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
ate | +0.012 |
things | +0.008 |
his | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
hy | -0.020 |
ited | -0.020 |
anne | -0.019 |
seventeen | -0.019 |
ous | -0.019 |
Token | But |
Token ID | 887 |
Feature activation | -5.00e-03 |
Pos logit contributions | |
hy | +0.023 |
years | +0.021 |
seventeen | +0.021 |
gust | +0.020 |
ous | +0.020 |
Neg logit contributions | |
ate | -0.022 |
things | -0.018 |
his | -0.017 |
other | -0.017 |
gear | -0.015 |
Token | I |
Token ID | 314 |
Feature activation | -9.46e-03 |
Pos logit contributions | |
ited | +0.013 |
seventeen | +0.013 |
hy | +0.013 |
years | +0.013 |
gust | +0.013 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
your | -0.003 |
Token | often |
Token ID | 1690 |
Feature activation | +6.07e-04 |
Pos logit contributions | |
ate | +0.000 |
his | +0.000 |
things | +0.000 |
other | +0.000 |
." | +0.000 |
Neg logit contributions | |
seventeen | -0.000 |
years | -0.000 |
ited | -0.000 |
gust | -0.000 |
hy | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +2.63e-04 |
Pos logit contributions | |
ate | +0.000 |
his | +0.000 |
things | +0.000 |
." | +0.000 |
other | +0.000 |
Neg logit contributions | |
years | -0.002 |
seventeen | -0.002 |
ited | -0.002 |
gust | -0.002 |
hy | -0.002 |
Token | He |
Token ID | 679 |
Feature activation | +2.04e-03 |
Pos logit contributions | |
ate | +0.000 |
things | +0.000 |
his | +0.000 |
other | +0.000 |
P | +0.000 |
Neg logit contributions | |
hy | -0.001 |
seventeen | -0.001 |
years | -0.001 |
gust | -0.000 |
ous | -0.000 |
Token | held |
Token ID | 2714 |
Feature activation | +2.08e-05 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.004 |
hy | -0.004 |
gust | -0.004 |
ited | -0.004 |
years | -0.004 |
Token | his |
Token ID | 465 |
Feature activation | +6.57e-04 |
Pos logit contributions | |
ate | +0.000 |
." | +0.000 |
things | +0.000 |
place | +0.000 |
gear | +0.000 |
Neg logit contributions | |
years | -0.000 |
gust | -0.000 |
ited | -0.000 |
hy | -0.000 |
seventeen | -0.000 |
Token | gust |
Token ID | 35253 |
Feature activation | -7.77e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
." | +0.001 |
other | +0.001 |
Neg logit contributions | |
hy | -0.001 |
gust | -0.001 |
seventeen | -0.001 |
ited | -0.001 |
years | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | +6.15e-04 |
Pos logit contributions | |
seventeen | +0.152 |
gust | +0.148 |
ited | +0.142 |
storm | +0.138 |
hy | +0.134 |
Neg logit contributions | |
ate | -0.129 |
his | -0.125 |
things | -0.113 |
and | -0.107 |
| -0.106 |
Token | kept |
Token ID | 4030 |
Feature activation | +2.42e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
the | +0.001 |
Neg logit contributions | |
hy | -0.001 |
seventeen | -0.001 |
ited | -0.001 |
ous | -0.001 |
gust | -0.001 |
Token | checking |
Token ID | 10627 |
Feature activation | +3.32e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.002 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.005 |
hy | -0.005 |
years | -0.005 |
gust | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +3.34e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.002 |
Neg logit contributions | |
hy | -0.008 |
years | -0.008 |
ited | -0.008 |
seventeen | -0.008 |
gust | -0.008 |
Token | mailbox |
Token ID | 37282 |
Feature activation | -2.07e-02 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.008 |
seventeen | -0.008 |
years | -0.008 |
hy | -0.007 |
gust | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +1.45e-03 |
Pos logit contributions | |
seventeen | +0.011 |
ited | +0.011 |
gust | +0.011 |
years | +0.010 |
hy | +0.010 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.001 |
." | -0.001 |
other | -0.001 |
Token | He |
Token ID | 679 |
Feature activation | -2.45e-03 |
Pos logit contributions | |
ate | +0.002 |
things | +0.002 |
his | +0.002 |
other | +0.002 |
P | +0.002 |
Neg logit contributions | |
seventeen | -0.003 |
hy | -0.003 |
gust | -0.003 |
ited | -0.003 |
years | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | -9.14e-03 |
Pos logit contributions | |
seventeen | +0.005 |
ited | +0.005 |
gust | +0.005 |
hy | +0.005 |
years | +0.005 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.003 |
gear | -0.003 |
Token | wearing |
Token ID | 5762 |
Feature activation | +9.35e-03 |
Pos logit contributions | |
ited | +0.019 |
seventeen | +0.018 |
hy | +0.018 |
gust | +0.018 |
years | +0.018 |
Neg logit contributions | |
ate | -0.014 |
his | -0.013 |
things | -0.012 |
other | -0.011 |
." | -0.010 |
Token | his |
Token ID | 465 |
Feature activation | -3.00e-04 |
Pos logit contributions | |
ate | +0.008 |
things | +0.004 |
." | +0.004 |
other | +0.003 |
| +0.003 |
Neg logit contributions | |
hy | -0.025 |
gust | -0.024 |
seventeen | -0.024 |
years | -0.024 |
ited | -0.024 |
Token | brand |
Token ID | 4508 |
Feature activation | -7.43e-02 |
Pos logit contributions | |
hy | +0.001 |
ited | +0.001 |
years | +0.001 |
gust | +0.001 |
seventeen | +0.001 |
Neg logit contributions | |
ate | -0.000 |
his | -0.000 |
things | -0.000 |
other | -0.000 |
." | -0.000 |
Token | new |
Token ID | 649 |
Feature activation | -2.06e-02 |
Pos logit contributions | |
ited | +0.170 |
gust | +0.167 |
hy | +0.166 |
ous | +0.164 |
bell | +0.163 |
Neg logit contributions | |
ate | -0.078 |
his | -0.052 |
other | -0.047 |
yourself | -0.046 |
things | -0.046 |
Token | icy |
Token ID | 30284 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
hy | +0.045 |
ited | +0.045 |
years | +0.044 |
gust | +0.044 |
seventeen | +0.043 |
Neg logit contributions | |
ate | -0.028 |
his | -0.020 |
things | -0.019 |
other | -0.018 |
| -0.017 |
Token | blue |
Token ID | 4171 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
ited | +0.027 |
hy | +0.027 |
seventeen | +0.027 |
years | +0.027 |
gust | +0.027 |
Neg logit contributions | |
ate | -0.014 |
his | -0.010 |
things | -0.010 |
other | -0.009 |
| -0.008 |
Token | jacket |
Token ID | 15224 |
Feature activation | -9.56e-03 |
Pos logit contributions | |
hy | +0.024 |
ited | +0.023 |
gust | +0.023 |
years | +0.023 |
seventeen | +0.023 |
Neg logit contributions | |
ate | -0.013 |
his | -0.009 |
things | -0.009 |
other | -0.008 |
| -0.007 |
Token | as |
Token ID | 355 |
Feature activation | +4.78e-04 |
Pos logit contributions | |
ited | +0.025 |
hy | +0.024 |
seventeen | +0.024 |
years | +0.024 |
gust | +0.024 |
Neg logit contributions | |
ate | -0.010 |
his | -0.007 |
things | -0.006 |
other | -0.005 |
." | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +3.96e-03 |
Pos logit contributions | |
ate | +0.004 |
things | +0.004 |
gear | +0.003 |
his | +0.002 |
stuff | +0.002 |
Neg logit contributions | |
seventeen | -0.011 |
hy | -0.011 |
years | -0.011 |
gust | -0.010 |
aney | -0.010 |
Token | S |
Token ID | 50 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
ate | +0.006 |
things | +0.005 |
his | +0.004 |
gear | +0.004 |
name | +0.004 |
Neg logit contributions | |
seventeen | -0.009 |
ited | -0.008 |
hy | -0.008 |
years | -0.008 |
thirteen | -0.008 |
Token | ara |
Token ID | 3301 |
Feature activation | +1.79e-03 |
Pos logit contributions | |
ate | +0.020 |
his | +0.017 |
things | +0.016 |
other | +0.014 |
gear | +0.014 |
Neg logit contributions | |
ited | -0.031 |
seventeen | -0.030 |
hy | -0.030 |
gust | -0.029 |
years | -0.029 |
Token | felt |
Token ID | 2936 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.003 |
hy | -0.003 |
seventeen | -0.003 |
years | -0.003 |
gust | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | -8.84e-03 |
Pos logit contributions | |
ited | +0.019 |
seventeen | +0.018 |
years | +0.018 |
hy | +0.017 |
ous | +0.017 |
Neg logit contributions | |
ate | -0.019 |
his | -0.018 |
things | -0.017 |
other | -0.016 |
| -0.015 |
Token | gust |
Token ID | 35253 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
gust | +0.019 |
ited | +0.019 |
seventeen | +0.019 |
hy | +0.019 |
years | +0.018 |
Neg logit contributions | |
ate | -0.013 |
his | -0.010 |
things | -0.010 |
other | -0.008 |
." | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | -3.48e-02 |
Pos logit contributions | |
seventeen | +0.136 |
ited | +0.129 |
gust | +0.125 |
hy | +0.124 |
anne | +0.124 |
Neg logit contributions | |
ate | -0.113 |
his | -0.110 |
things | -0.100 |
| -0.099 |
other | -0.097 |
Token | wind |
Token ID | 2344 |
Feature activation | -2.36e-02 |
Pos logit contributions | |
seventeen | +0.070 |
ous | +0.070 |
years | +0.070 |
ited | +0.069 |
hy | +0.069 |
Neg logit contributions | |
ate | -0.053 |
his | -0.051 |
things | -0.048 |
other | -0.046 |
gear | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
seventeen | +0.064 |
years | +0.062 |
aney | +0.060 |
ited | +0.060 |
anne | +0.059 |
Neg logit contributions | |
his | -0.023 |
ate | -0.019 |
and | -0.019 |
. | -0.018 |
the | -0.018 |
Token | She |
Token ID | 1375 |
Feature activation | +4.34e-03 |
Pos logit contributions | |
hy | +0.018 |
gust | +0.018 |
seventeen | +0.018 |
years | +0.017 |
ited | +0.017 |
Neg logit contributions | |
ate | -0.026 |
things | -0.022 |
his | -0.022 |
other | -0.021 |
gear | -0.020 |
Token | saw |
Token ID | 2497 |
Feature activation | +5.53e-03 |
Pos logit contributions | |
ate | +0.008 |
things | +0.007 |
his | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
ited | -0.008 |
hy | -0.008 |
years | -0.007 |
gust | -0.007 |
seventeen | -0.007 |
Token | sparks |
Token ID | 38306 |
Feature activation | +1.97e-02 |
Pos logit contributions | |
his | +0.008 |
things | +0.008 |
ate | +0.007 |
other | +0.007 |
the | +0.006 |
Neg logit contributions | |
ited | -0.015 |
years | -0.014 |
aney | -0.014 |
hy | -0.013 |
istent | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -6.61e-03 |
Pos logit contributions | |
ate | +0.015 |
his | +0.012 |
things | +0.012 |
." | +0.010 |
other | +0.009 |
Neg logit contributions | |
years | -0.059 |
ited | -0.057 |
hy | -0.054 |
seventeen | -0.054 |
gust | -0.053 |
Token | They |
Token ID | 1119 |
Feature activation | +7.72e-03 |
Pos logit contributions | |
seventeen | +0.012 |
hy | +0.011 |
gust | +0.011 |
bell | +0.011 |
sing | +0.010 |
Neg logit contributions | |
ate | -0.011 |
his | -0.009 |
things | -0.009 |
gear | -0.008 |
your | -0.008 |
Token | feel |
Token ID | 1254 |
Feature activation | -7.63e-03 |
Pos logit contributions | |
ate | +0.012 |
his | +0.010 |
things | +0.010 |
other | +0.009 |
." | +0.009 |
Neg logit contributions | |
ited | -0.017 |
years | -0.016 |
seventeen | -0.016 |
hy | -0.016 |
gust | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | -8.41e-03 |
Pos logit contributions | |
ited | +0.017 |
seventeen | +0.017 |
years | +0.017 |
hy | +0.017 |
gust | +0.017 |
Neg logit contributions | |
ate | -0.010 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
| -0.007 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.69e-02 |
Pos logit contributions | |
years | +0.019 |
ited | +0.019 |
seventeen | +0.018 |
hy | +0.018 |
gust | +0.017 |
Neg logit contributions | |
ate | -0.011 |
his | -0.010 |
things | -0.009 |
other | -0.009 |
| -0.008 |
Token | of |
Token ID | 286 |
Feature activation | -3.48e-02 |
Pos logit contributions | |
seventeen | +0.113 |
ited | +0.113 |
hy | +0.108 |
gust | +0.108 |
years | +0.108 |
Neg logit contributions | |
ate | -0.125 |
his | -0.112 |
things | -0.109 |
other | -0.103 |
| -0.102 |
Token | wind |
Token ID | 2344 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
years | +0.073 |
ited | +0.073 |
seventeen | +0.072 |
ous | +0.072 |
hy | +0.072 |
Neg logit contributions | |
ate | -0.050 |
his | -0.049 |
things | -0.046 |
other | -0.043 |
the | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | -8.24e-03 |
Pos logit contributions | |
years | +0.054 |
ited | +0.052 |
seventeen | +0.051 |
gust | +0.051 |
hy | +0.050 |
Neg logit contributions | |
ate | -0.025 |
his | -0.021 |
things | -0.020 |
." | -0.019 |
and | -0.017 |
Token | They |
Token ID | 1119 |
Feature activation | +6.83e-03 |
Pos logit contributions | |
seventeen | +0.015 |
hy | +0.015 |
gust | +0.015 |
aney | +0.014 |
anne | +0.014 |
Neg logit contributions | |
ate | -0.014 |
things | -0.010 |
his | -0.010 |
gear | -0.010 |
other | -0.009 |
Token | smell |
Token ID | 8508 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ate | +0.010 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
." | +0.008 |
Neg logit contributions | |
years | -0.014 |
ited | -0.014 |
seventeen | -0.014 |
hy | -0.013 |
gust | -0.013 |
Token | Suddenly |
Token ID | 24975 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
ate | +0.001 |
things | +0.001 |
other | +0.001 |
his | +0.001 |
friends | +0.001 |
Neg logit contributions | |
seventeen | -0.002 |
hy | -0.002 |
gust | -0.002 |
years | -0.002 |
ous | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +3.52e-03 |
Pos logit contributions | |
ited | +0.036 |
seventeen | +0.035 |
years | +0.035 |
hy | +0.035 |
gust | +0.034 |
Neg logit contributions | |
ate | -0.017 |
his | -0.014 |
things | -0.013 |
other | -0.011 |
| -0.010 |
Token | he |
Token ID | 339 |
Feature activation | +6.51e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.008 |
seventeen | -0.008 |
hy | -0.008 |
years | -0.008 |
gust | -0.008 |
Token | felt |
Token ID | 2936 |
Feature activation | -1.83e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.010 |
other | +0.009 |
things | +0.009 |
| +0.008 |
Neg logit contributions | |
hy | -0.013 |
ited | -0.012 |
seventeen | -0.012 |
years | -0.012 |
ous | -0.012 |
Token | a |
Token ID | 257 |
Feature activation | -9.06e-03 |
Pos logit contributions | |
ited | +0.005 |
seventeen | +0.005 |
hy | +0.005 |
ous | +0.005 |
years | +0.005 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.001 |
other | -0.001 |
the | -0.001 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.64e-02 |
Pos logit contributions | |
years | +0.021 |
seventeen | +0.019 |
hy | +0.019 |
anne | +0.019 |
ited | +0.019 |
Neg logit contributions | |
his | -0.011 |
ate | -0.010 |
things | -0.010 |
other | -0.010 |
water | -0.009 |
Token | of |
Token ID | 286 |
Feature activation | -2.91e-02 |
Pos logit contributions | |
seventeen | +0.126 |
ited | +0.122 |
gust | +0.119 |
anne | +0.116 |
hy | +0.116 |
Neg logit contributions | |
ate | -0.105 |
his | -0.099 |
| -0.091 |
things | -0.090 |
other | -0.087 |
Token | wind |
Token ID | 2344 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
ous | +0.069 |
hy | +0.068 |
years | +0.065 |
seventeen | +0.064 |
storm | +0.064 |
Neg logit contributions | |
his | -0.040 |
ate | -0.036 |
things | -0.035 |
other | -0.034 |
water | -0.032 |
Token | ! |
Token ID | 0 |
Feature activation | +1.26e-03 |
Pos logit contributions | |
years | +0.050 |
seventeen | +0.048 |
ited | +0.045 |
aney | +0.044 |
hy | +0.043 |
Neg logit contributions | |
his | -0.030 |
and | -0.028 |
ate | -0.028 |
. | -0.027 |
the | -0.026 |
Token | He |
Token ID | 679 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
ate | +0.002 |
things | +0.002 |
other | +0.001 |
his | +0.001 |
gear | +0.001 |
Neg logit contributions | |
gust | -0.003 |
hy | -0.003 |
seventeen | -0.003 |
years | -0.002 |
ous | -0.002 |
Token | was |
Token ID | 373 |
Feature activation | -4.05e-03 |
Pos logit contributions | |
ate | +0.008 |
his | +0.007 |
things | +0.007 |
other | +0.007 |
| +0.006 |
Neg logit contributions | |
hy | -0.011 |
seventeen | -0.011 |
years | -0.011 |
ited | -0.011 |
gust | -0.011 |
Token | diary |
Token ID | 26339 |
Feature activation | -3.76e-02 |
Pos logit contributions | |
ate | +0.019 |
his | +0.013 |
things | +0.013 |
." | +0.013 |
| +0.012 |
Neg logit contributions | |
years | -0.026 |
hy | -0.026 |
gust | -0.026 |
ited | -0.026 |
seventeen | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | +1.33e-03 |
Pos logit contributions | |
ited | +0.098 |
seventeen | +0.098 |
years | +0.097 |
hy | +0.096 |
gust | +0.095 |
Neg logit contributions | |
ate | -0.037 |
his | -0.028 |
things | -0.027 |
other | -0.023 |
." | -0.020 |
Token | George |
Token ID | 4502 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
ate | +0.002 |
things | +0.002 |
his | +0.002 |
other | +0.001 |
yourself | +0.001 |
Neg logit contributions | |
seventeen | -0.003 |
hy | -0.003 |
gust | -0.002 |
ited | -0.002 |
years | -0.002 |
Token | kept |
Token ID | 4030 |
Feature activation | -6.50e-03 |
Pos logit contributions | |
seventeen | +0.024 |
ited | +0.024 |
gust | +0.024 |
hy | +0.024 |
years | +0.023 |
Neg logit contributions | |
ate | -0.019 |
his | -0.016 |
things | -0.015 |
other | -0.014 |
| -0.014 |
Token | his |
Token ID | 465 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
years | +0.013 |
ited | +0.013 |
seventeen | +0.013 |
gust | +0.013 |
hy | +0.012 |
Neg logit contributions | |
ate | -0.010 |
things | -0.008 |
his | -0.008 |
other | -0.007 |
." | -0.007 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.40e-02 |
Pos logit contributions | |
ited | +0.021 |
seventeen | +0.021 |
years | +0.021 |
hy | +0.021 |
gust | +0.021 |
Neg logit contributions | |
ate | -0.015 |
his | -0.013 |
things | -0.012 |
other | -0.011 |
." | -0.010 |
Token | in |
Token ID | 287 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
seventeen | +0.160 |
ited | +0.155 |
years | +0.154 |
gust | +0.151 |
hy | +0.149 |
Neg logit contributions | |
ate | -0.077 |
his | -0.068 |
things | -0.064 |
other | -0.053 |
gear | -0.050 |
Token | a |
Token ID | 257 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
ited | +0.018 |
years | +0.018 |
hy | +0.018 |
gust | +0.018 |
seventeen | +0.018 |
Neg logit contributions | |
ate | -0.008 |
things | -0.004 |
his | -0.004 |
other | -0.004 |
." | -0.004 |
Token | special |
Token ID | 2041 |
Feature activation | -1.72e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
toy | +0.002 |
Neg logit contributions | |
seventeen | -0.004 |
years | -0.004 |
ited | -0.004 |
hy | -0.004 |
ous | -0.004 |
Token | box |
Token ID | 3091 |
Feature activation | +3.58e-03 |
Pos logit contributions | |
ited | +0.005 |
seventeen | +0.005 |
years | +0.005 |
hy | +0.005 |
gust | +0.005 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.000 |
." | -0.000 |
Token | , |
Token ID | 11 |
Feature activation | -8.49e-04 |
Pos logit contributions | |
his | +0.003 |
ate | +0.003 |
and | +0.002 |
things | +0.002 |
. | +0.002 |
Neg logit contributions | |
seventeen | -0.010 |
years | -0.010 |
gust | -0.010 |
ited | -0.010 |
aney | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +4.19e-03 |
Pos logit contributions | |
ate | +0.004 |
things | +0.003 |
his | +0.002 |
gear | +0.002 |
toy | +0.002 |
Neg logit contributions | |
years | -0.015 |
hy | -0.014 |
ited | -0.014 |
seventeen | -0.014 |
gust | -0.014 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.005 |
other | +0.005 |
| +0.005 |
Neg logit contributions | |
ited | -0.009 |
seventeen | -0.009 |
hy | -0.009 |
gust | -0.009 |
years | -0.008 |
Token | she |
Token ID | 673 |
Feature activation | +3.53e-03 |
Pos logit contributions | |
ited | +0.033 |
seventeen | +0.032 |
years | +0.032 |
hy | +0.031 |
aney | +0.030 |
Neg logit contributions | |
ate | -0.010 |
his | -0.009 |
things | -0.009 |
other | -0.007 |
the | -0.007 |
Token | felt |
Token ID | 2936 |
Feature activation | -2.65e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.005 |
other | +0.005 |
things | +0.004 |
| +0.004 |
Neg logit contributions | |
seventeen | -0.007 |
hy | -0.007 |
years | -0.007 |
ited | -0.007 |
ous | -0.007 |
Token | a |
Token ID | 257 |
Feature activation | -9.02e-03 |
Pos logit contributions | |
seventeen | +0.008 |
ited | +0.007 |
hy | +0.007 |
ous | +0.007 |
anne | +0.007 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.001 |
the | -0.001 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.29e-02 |
Pos logit contributions | |
years | +0.020 |
seventeen | +0.020 |
ited | +0.019 |
hy | +0.019 |
aney | +0.019 |
Neg logit contributions | |
his | -0.011 |
ate | -0.011 |
things | -0.010 |
other | -0.010 |
| -0.009 |
Token | of |
Token ID | 286 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
seventeen | +0.134 |
ited | +0.126 |
anne | +0.124 |
sing | +0.121 |
gust | +0.119 |
Neg logit contributions | |
his | -0.086 |
ate | -0.083 |
| -0.078 |
and | -0.077 |
things | -0.074 |
Token | wind |
Token ID | 2344 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
ous | +0.060 |
years | +0.059 |
seventeen | +0.059 |
hy | +0.059 |
ited | +0.058 |
Neg logit contributions | |
his | -0.037 |
ate | -0.036 |
things | -0.034 |
other | -0.033 |
the | -0.030 |
Token | , |
Token ID | 11 |
Feature activation | +1.73e-03 |
Pos logit contributions | |
seventeen | +0.046 |
years | +0.046 |
aney | +0.044 |
ited | +0.043 |
gary | +0.042 |
Neg logit contributions | |
his | -0.025 |
and | -0.023 |
ate | -0.022 |
. | -0.021 |
the | -0.021 |
Token | and |
Token ID | 290 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
| +0.001 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.005 |
years | -0.005 |
hy | -0.005 |
gust | -0.004 |
Token | she |
Token ID | 673 |
Feature activation | +6.53e-03 |
Pos logit contributions | |
his | +0.001 |
the | +0.001 |
things | +0.000 |
other | +0.000 |
ate | +0.000 |
Neg logit contributions | |
seventeen | -0.003 |
hy | -0.003 |
ited | -0.003 |
aney | -0.003 |
years | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -4.60e-03 |
Pos logit contributions | |
ate | +0.013 |
his | +0.010 |
things | +0.010 |
other | +0.009 |
| +0.008 |
Neg logit contributions | |
ited | -0.027 |
seventeen | -0.027 |
years | -0.026 |
hy | -0.026 |
gust | -0.026 |
Token | she |
Token ID | 673 |
Feature activation | +4.23e-04 |
Pos logit contributions | |
seventeen | +0.010 |
ited | +0.010 |
hy | +0.010 |
years | +0.010 |
gust | +0.010 |
Neg logit contributions | |
ate | -0.007 |
his | -0.006 |
things | -0.005 |
other | -0.005 |
| -0.005 |
Token | always |
Token ID | 1464 |
Feature activation | -2.35e-03 |
Pos logit contributions | |
ate | +0.001 |
things | +0.001 |
his | +0.001 |
stuff | +0.001 |
gear | +0.001 |
Neg logit contributions | |
years | -0.001 |
ited | -0.001 |
ous | -0.001 |
wil | -0.001 |
storm | -0.001 |
Token | kept |
Token ID | 4030 |
Feature activation | -1.35e-03 |
Pos logit contributions | |
ited | +0.004 |
seventeen | +0.004 |
years | +0.004 |
hy | +0.004 |
gust | +0.004 |
Neg logit contributions | |
ate | -0.004 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
." | -0.003 |
Token | her |
Token ID | 607 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
years | +0.003 |
gust | +0.003 |
ited | +0.003 |
hy | +0.002 |
seventeen | +0.002 |
Neg logit contributions | |
ate | -0.002 |
." | -0.001 |
gear | -0.001 |
things | -0.001 |
other | -0.001 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.23e-02 |
Pos logit contributions | |
ited | +0.021 |
hy | +0.021 |
years | +0.021 |
seventeen | +0.021 |
gust | +0.021 |
Neg logit contributions | |
ate | -0.022 |
his | -0.018 |
things | -0.018 |
other | -0.017 |
." | -0.016 |
Token | close |
Token ID | 1969 |
Feature activation | -4.01e-03 |
Pos logit contributions | |
seventeen | +0.149 |
ited | +0.146 |
years | +0.145 |
gust | +0.142 |
hy | +0.142 |
Neg logit contributions | |
ate | -0.081 |
his | -0.066 |
things | -0.066 |
other | -0.056 |
." | -0.052 |
Token | by |
Token ID | 416 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
seventeen | +0.010 |
ited | +0.010 |
gust | +0.010 |
hy | +0.010 |
years | +0.010 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.003 |
." | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -4.36e-03 |
Pos logit contributions | |
ate | +0.026 |
his | +0.023 |
things | +0.023 |
other | +0.021 |
the | +0.019 |
Neg logit contributions | |
ited | -0.042 |
seventeen | -0.041 |
hy | -0.040 |
years | -0.039 |
gust | -0.039 |
Token | just |
Token ID | 655 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
seventeen | +0.009 |
ited | +0.009 |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
Neg logit contributions | |
ate | -0.006 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
the | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | +6.56e-03 |
Pos logit contributions | |
his | +0.025 |
ate | +0.023 |
things | +0.023 |
the | +0.021 |
other | +0.020 |
Neg logit contributions | |
seventeen | -0.052 |
ited | -0.052 |
aney | -0.051 |
years | -0.050 |
anne | -0.049 |
Token | the |
Token ID | 262 |
Feature activation | +5.76e-03 |
Pos logit contributions | |
ited | +0.026 |
seventeen | +0.026 |
years | +0.026 |
hy | +0.025 |
gust | +0.024 |
Neg logit contributions | |
ate | -0.010 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
the | -0.006 |
Token | angel |
Token ID | 18304 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
things | +0.009 |
other | +0.009 |
ate | +0.009 |
friends | +0.008 |
his | +0.008 |
Neg logit contributions | |
seventeen | -0.012 |
ited | -0.011 |
years | -0.011 |
hy | -0.011 |
oled | -0.011 |
Token | felt |
Token ID | 2936 |
Feature activation | +4.44e-04 |
Pos logit contributions | |
seventeen | +0.043 |
years | +0.042 |
hy | +0.040 |
ited | +0.039 |
aney | +0.038 |
Neg logit contributions | |
ate | -0.025 |
his | -0.024 |
other | -0.023 |
things | -0.022 |
friends | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | -8.50e-03 |
Pos logit contributions | |
his | +0.000 |
ate | +0.000 |
things | +0.000 |
the | +0.000 |
other | +0.000 |
Neg logit contributions | |
seventeen | -0.001 |
ited | -0.001 |
ous | -0.001 |
storm | -0.001 |
hy | -0.001 |
Token | great |
Token ID | 1049 |
Feature activation | -3.44e-03 |
Pos logit contributions | |
years | +0.019 |
seventeen | +0.018 |
hy | +0.017 |
aney | +0.017 |
anne | +0.017 |
Neg logit contributions | |
his | -0.011 |
other | -0.010 |
things | -0.010 |
ate | -0.010 |
water | -0.010 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.23e-02 |
Pos logit contributions | |
years | +0.008 |
seventeen | +0.008 |
hy | +0.007 |
ited | +0.007 |
hetically | +0.007 |
Neg logit contributions | |
ate | -0.005 |
his | -0.005 |
things | -0.004 |
place | -0.004 |
other | -0.004 |
Token | of |
Token ID | 286 |
Feature activation | -2.08e-02 |
Pos logit contributions | |
seventeen | +0.130 |
ited | +0.122 |
sing | +0.117 |
gust | +0.117 |
hy | +0.116 |
Neg logit contributions | |
ate | -0.089 |
his | -0.087 |
| -0.080 |
things | -0.078 |
and | -0.076 |
Token | wind |
Token ID | 2344 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
seventeen | +0.050 |
ous | +0.049 |
years | +0.049 |
aney | +0.048 |
hy | +0.047 |
Neg logit contributions | |
his | -0.027 |
things | -0.024 |
other | -0.024 |
water | -0.023 |
ate | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
years | +0.043 |
seventeen | +0.043 |
ited | +0.040 |
aney | +0.039 |
gary | +0.039 |
Neg logit contributions | |
his | -0.022 |
ate | -0.022 |
and | -0.021 |
. | -0.020 |
the | -0.019 |
Token | her |
Token ID | 607 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
his | +0.007 |
ate | +0.006 |
the | +0.006 |
things | +0.006 |
other | +0.005 |
Neg logit contributions | |
seventeen | -0.020 |
ited | -0.020 |
years | -0.019 |
aney | -0.019 |
hy | -0.019 |
Token | wings |
Token ID | 12098 |
Feature activation | -1.98e-02 |
Pos logit contributions | |
ate | +0.014 |
things | +0.013 |
his | +0.012 |
other | +0.012 |
friends | +0.011 |
Neg logit contributions | |
ited | -0.023 |
seventeen | -0.023 |
years | -0.023 |
hy | -0.021 |
ivated | -0.021 |
Token | secrets |
Token ID | 13141 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
ate | +0.014 |
his | +0.010 |
things | +0.009 |
other | +0.008 |
| +0.008 |
Neg logit contributions | |
hy | -0.026 |
ited | -0.025 |
gust | -0.025 |
seventeen | -0.025 |
years | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | +1.56e-03 |
Pos logit contributions | |
seventeen | +0.061 |
years | +0.060 |
ited | +0.060 |
gust | +0.058 |
hy | +0.056 |
Neg logit contributions | |
ate | -0.008 |
his | -0.006 |
things | -0.006 |
." | -0.004 |
other | -0.003 |
Token | She |
Token ID | 1375 |
Feature activation | +1.54e-03 |
Pos logit contributions | |
ate | +0.003 |
things | +0.002 |
his | +0.002 |
gear | +0.002 |
other | +0.002 |
Neg logit contributions | |
years | -0.003 |
hy | -0.003 |
gust | -0.003 |
seventeen | -0.003 |
ited | -0.003 |
Token | kept |
Token ID | 4030 |
Feature activation | -1.61e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
| +0.002 |
Neg logit contributions | |
seventeen | -0.003 |
ited | -0.003 |
gust | -0.003 |
years | -0.003 |
hy | -0.003 |
Token | her |
Token ID | 607 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
ited | +0.003 |
seventeen | +0.003 |
hy | +0.003 |
gust | +0.003 |
years | +0.003 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
| -0.002 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.17e-02 |
Pos logit contributions | |
seventeen | +0.035 |
ited | +0.034 |
years | +0.034 |
hy | +0.033 |
gust | +0.033 |
Neg logit contributions | |
ate | -0.020 |
things | -0.017 |
his | -0.016 |
other | -0.015 |
friends | -0.013 |
Token | under |
Token ID | 739 |
Feature activation | -4.35e-03 |
Pos logit contributions | |
seventeen | +0.168 |
years | +0.161 |
ited | +0.160 |
gust | +0.156 |
thirteen | +0.151 |
Neg logit contributions | |
ate | -0.066 |
his | -0.056 |
things | -0.055 |
other | -0.043 |
and | -0.043 |
Token | her |
Token ID | 607 |
Feature activation | +8.56e-03 |
Pos logit contributions | |
ited | +0.011 |
seventeen | +0.011 |
hy | +0.011 |
years | +0.011 |
gust | +0.010 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
." | -0.003 |
Token | pillow |
Token ID | 28774 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
ate | +0.009 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
toy | +0.006 |
Neg logit contributions | |
ited | -0.022 |
seventeen | -0.022 |
years | -0.021 |
hy | -0.020 |
gust | -0.020 |
Token | and |
Token ID | 290 |
Feature activation | +3.70e-04 |
Pos logit contributions | |
seventeen | +0.076 |
ited | +0.076 |
years | +0.075 |
gust | +0.072 |
hy | +0.071 |
Neg logit contributions | |
ate | -0.020 |
his | -0.017 |
things | -0.014 |
other | -0.012 |
." | -0.012 |
Token | never |
Token ID | 1239 |
Feature activation | +6.76e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.000 |
other | +0.000 |
the | +0.000 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
years | -0.001 |
gust | -0.001 |
aney | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.74e-04 |
Pos logit contributions | |
seventeen | +0.009 |
ited | +0.009 |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.004 |
." | -0.003 |
Token | trees |
Token ID | 7150 |
Feature activation | -9.75e-04 |
Pos logit contributions | |
ate | +0.000 |
things | +0.000 |
his | +0.000 |
other | +0.000 |
friends | +0.000 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | waved |
Token ID | 26834 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
seventeen | +0.002 |
years | +0.002 |
hy | +0.002 |
ited | +0.002 |
aney | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
the | -0.001 |
Token | in |
Token ID | 287 |
Feature activation | +2.54e-03 |
Pos logit contributions | |
ited | +0.031 |
seventeen | +0.031 |
years | +0.031 |
hy | +0.030 |
gust | +0.029 |
Neg logit contributions | |
ate | -0.013 |
his | -0.011 |
things | -0.011 |
other | -0.009 |
." | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +2.31e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
gust | -0.007 |
hy | -0.007 |
years | -0.007 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
ate | +0.003 |
things | +0.003 |
other | +0.003 |
his | +0.003 |
friends | +0.003 |
Neg logit contributions | |
years | -0.005 |
seventeen | -0.005 |
ited | -0.005 |
hy | -0.005 |
aney | -0.005 |
Token | s |
Token ID | 82 |
Feature activation | +8.87e-03 |
Pos logit contributions | |
seventeen | +0.120 |
ited | +0.119 |
gust | +0.114 |
hy | +0.111 |
years | +0.109 |
Neg logit contributions | |
ate | -0.102 |
his | -0.095 |
things | -0.092 |
other | -0.087 |
| -0.087 |
Token | of |
Token ID | 286 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
ate | +0.011 |
things | +0.010 |
his | +0.009 |
other | +0.009 |
." | +0.008 |
Neg logit contributions | |
ited | -0.022 |
years | -0.021 |
seventeen | -0.021 |
hy | -0.020 |
gust | -0.019 |
Token | wind |
Token ID | 2344 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
ited | +0.034 |
seventeen | +0.033 |
years | +0.033 |
hy | +0.033 |
ous | +0.032 |
Neg logit contributions | |
ate | -0.032 |
his | -0.028 |
things | -0.027 |
other | -0.025 |
gear | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +8.74e-03 |
Pos logit contributions | |
years | +0.056 |
seventeen | +0.055 |
ited | +0.055 |
gust | +0.053 |
aney | +0.052 |
Neg logit contributions | |
ate | -0.006 |
his | -0.004 |
things | -0.003 |
." | -0.003 |
. | -0.001 |
Token | The |
Token ID | 383 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.006 |
Neg logit contributions | |
ited | -0.021 |
seventeen | -0.021 |
years | -0.021 |
hy | -0.021 |
gust | -0.020 |
Token | the |
Token ID | 262 |
Feature activation | +3.74e-04 |
Pos logit contributions | |
seventeen | +0.009 |
ited | +0.009 |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.004 |
." | -0.003 |
Token | trees |
Token ID | 7150 |
Feature activation | -9.75e-04 |
Pos logit contributions | |
ate | +0.000 |
things | +0.000 |
his | +0.000 |
other | +0.000 |
friends | +0.000 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | waved |
Token ID | 26834 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
seventeen | +0.002 |
years | +0.002 |
hy | +0.002 |
ited | +0.002 |
aney | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
the | -0.001 |
Token | in |
Token ID | 287 |
Feature activation | +2.54e-03 |
Pos logit contributions | |
ited | +0.031 |
seventeen | +0.031 |
years | +0.031 |
hy | +0.030 |
gust | +0.029 |
Neg logit contributions | |
ate | -0.013 |
his | -0.011 |
things | -0.011 |
other | -0.009 |
." | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +2.31e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
gust | -0.007 |
hy | -0.007 |
years | -0.007 |
Token | gust |
Token ID | 35253 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
ate | +0.003 |
things | +0.003 |
other | +0.003 |
his | +0.003 |
friends | +0.003 |
Neg logit contributions | |
years | -0.005 |
seventeen | -0.005 |
ited | -0.005 |
hy | -0.005 |
aney | -0.005 |
Token | s |
Token ID | 82 |
Feature activation | +8.87e-03 |
Pos logit contributions | |
seventeen | +0.120 |
ited | +0.119 |
gust | +0.114 |
hy | +0.111 |
years | +0.109 |
Neg logit contributions | |
ate | -0.102 |
his | -0.095 |
things | -0.092 |
other | -0.087 |
| -0.087 |
Token | of |
Token ID | 286 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
ate | +0.011 |
things | +0.010 |
his | +0.009 |
other | +0.009 |
." | +0.008 |
Neg logit contributions | |
ited | -0.022 |
years | -0.021 |
seventeen | -0.021 |
hy | -0.020 |
gust | -0.019 |
Token | wind |
Token ID | 2344 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
ited | +0.034 |
seventeen | +0.033 |
years | +0.033 |
hy | +0.033 |
ous | +0.032 |
Neg logit contributions | |
ate | -0.032 |
his | -0.028 |
things | -0.027 |
other | -0.025 |
gear | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +8.74e-03 |
Pos logit contributions | |
years | +0.056 |
seventeen | +0.055 |
ited | +0.055 |
gust | +0.053 |
aney | +0.052 |
Neg logit contributions | |
ate | -0.006 |
his | -0.004 |
things | -0.003 |
." | -0.003 |
. | -0.001 |
Token | The |
Token ID | 383 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.006 |
Neg logit contributions | |
ited | -0.021 |
seventeen | -0.021 |
years | -0.021 |
hy | -0.021 |
gust | -0.020 |
Token | on |
Token ID | 319 |
Feature activation | +9.34e-03 |
Pos logit contributions | |
ate | +0.015 |
things | +0.011 |
his | +0.010 |
gear | +0.009 |
other | +0.009 |
Neg logit contributions | |
gust | -0.020 |
hy | -0.020 |
years | -0.020 |
ited | -0.019 |
seventeen | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -4.07e-03 |
Pos logit contributions | |
ate | +0.012 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
gear | +0.008 |
Neg logit contributions | |
ited | -0.021 |
seventeen | -0.021 |
hy | -0.021 |
gust | -0.021 |
years | -0.021 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.21e-03 |
Pos logit contributions | |
ited | +0.009 |
hy | +0.009 |
gust | +0.009 |
years | +0.009 |
seventeen | +0.009 |
Neg logit contributions | |
ate | -0.006 |
things | -0.004 |
his | -0.004 |
gear | -0.004 |
other | -0.004 |
Token | kept |
Token ID | 4030 |
Feature activation | -5.74e-03 |
Pos logit contributions | |
ited | +0.004 |
years | +0.004 |
hy | +0.004 |
seventeen | +0.004 |
gust | +0.004 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.003 |
other | -0.003 |
gear | -0.003 |
Token | her |
Token ID | 607 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
years | +0.009 |
ited | +0.009 |
seventeen | +0.009 |
gust | +0.009 |
hy | +0.009 |
Neg logit contributions | |
ate | -0.011 |
things | -0.009 |
his | -0.009 |
other | -0.009 |
." | -0.008 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.10e-02 |
Pos logit contributions | |
seventeen | +0.040 |
ited | +0.040 |
years | +0.040 |
hy | +0.039 |
gust | +0.039 |
Neg logit contributions | |
ate | -0.024 |
things | -0.020 |
his | -0.019 |
other | -0.017 |
gear | -0.016 |
Token | in |
Token ID | 287 |
Feature activation | -8.44e-03 |
Pos logit contributions | |
seventeen | +0.160 |
ited | +0.154 |
years | +0.153 |
gust | +0.151 |
hy | +0.147 |
Neg logit contributions | |
ate | -0.068 |
his | -0.057 |
things | -0.055 |
other | -0.046 |
friends | -0.043 |
Token | a |
Token ID | 257 |
Feature activation | -2.81e-03 |
Pos logit contributions | |
years | +0.019 |
ited | +0.019 |
hy | +0.019 |
gust | +0.019 |
seventeen | +0.019 |
Neg logit contributions | |
ate | -0.011 |
things | -0.007 |
his | -0.007 |
." | -0.006 |
other | -0.006 |
Token | safe |
Token ID | 3338 |
Feature activation | +3.44e-03 |
Pos logit contributions | |
seventeen | +0.007 |
ous | +0.007 |
years | +0.007 |
ited | +0.007 |
hy | +0.006 |
Neg logit contributions | |
his | -0.003 |
ate | -0.003 |
things | -0.003 |
other | -0.003 |
toy | -0.003 |
Token | place |
Token ID | 1295 |
Feature activation | +9.72e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
place | +0.001 |
Neg logit contributions | |
years | -0.011 |
seventeen | -0.011 |
ited | -0.010 |
gust | -0.010 |
hy | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +4.55e-03 |
Pos logit contributions | |
ate | +0.006 |
his | +0.006 |
things | +0.005 |
and | +0.004 |
." | +0.004 |
Neg logit contributions | |
seventeen | -0.030 |
gust | -0.029 |
ited | -0.029 |
years | -0.028 |
plet | -0.027 |
Token | you |
Token ID | 345 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
years | +0.034 |
seventeen | +0.033 |
hy | +0.033 |
gust | +0.033 |
ited | +0.033 |
Neg logit contributions | |
ate | -0.017 |
his | -0.012 |
things | -0.011 |
other | -0.010 |
gear | -0.010 |
Token | ." |
Token ID | 526 |
Feature activation | -2.00e-03 |
Pos logit contributions | |
hy | +0.059 |
seventeen | +0.059 |
years | +0.059 |
ited | +0.058 |
gust | +0.058 |
Neg logit contributions | |
ate | -0.032 |
his | -0.022 |
things | -0.021 |
gear | -0.019 |
other | -0.017 |
Token | They |
Token ID | 1119 |
Feature activation | +5.03e-04 |
Pos logit contributions | |
seventeen | +0.004 |
gust | +0.004 |
hy | +0.004 |
years | +0.004 |
ited | +0.004 |
Neg logit contributions | |
ate | -0.003 |
things | -0.002 |
his | -0.002 |
gear | -0.002 |
other | -0.002 |
Token | take |
Token ID | 1011 |
Feature activation | +1.48e-04 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | their |
Token ID | 511 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ate | +0.000 |
things | +0.000 |
gear | +0.000 |
his | +0.000 |
." | +0.000 |
Neg logit contributions | |
gust | -0.000 |
seventeen | -0.000 |
years | -0.000 |
hy | -0.000 |
ited | -0.000 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.08e-02 |
Pos logit contributions | |
ited | +0.011 |
years | +0.011 |
gust | +0.011 |
hy | +0.010 |
seventeen | +0.010 |
Neg logit contributions | |
ate | -0.010 |
his | -0.007 |
." | -0.006 |
things | -0.006 |
| -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -1.61e-03 |
Pos logit contributions | |
ited | +0.155 |
hy | +0.154 |
seventeen | +0.153 |
gust | +0.152 |
years | +0.152 |
Neg logit contributions | |
ate | -0.061 |
his | -0.043 |
things | -0.041 |
other | -0.035 |
." | -0.030 |
Token | show |
Token ID | 905 |
Feature activation | +6.40e-03 |
Pos logit contributions | |
hy | +0.003 |
ited | +0.003 |
seventeen | +0.003 |
gust | +0.003 |
years | +0.003 |
Neg logit contributions | |
ate | -0.003 |
things | -0.002 |
his | -0.002 |
other | -0.002 |
." | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | -4.66e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.006 |
gear | +0.006 |
his | +0.005 |
| +0.005 |
Neg logit contributions | |
gust | -0.014 |
hy | -0.013 |
years | -0.013 |
seventeen | -0.013 |
ited | -0.013 |
Token | to |
Token ID | 284 |
Feature activation | -3.34e-03 |
Pos logit contributions | |
ited | +0.011 |
seventeen | +0.011 |
years | +0.011 |
hy | +0.011 |
gust | +0.011 |
Neg logit contributions | |
ate | -0.006 |
his | -0.005 |
things | -0.005 |
other | -0.004 |
." | -0.004 |
Token | mom |
Token ID | 1995 |
Feature activation | +7.88e-03 |
Pos logit contributions | |
gust | +0.008 |
years | +0.008 |
seventeen | +0.008 |
hy | +0.008 |
ited | +0.008 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.002 |
gear | -0.002 |
other | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.002 |
Neg logit contributions | |
ited | -0.010 |
seventeen | -0.010 |
years | -0.010 |
hy | -0.010 |
gust | -0.009 |
Token | h |
Token ID | 289 |
Feature activation | -1.43e-03 |
Pos logit contributions | |
ited | +0.011 |
seventeen | +0.011 |
years | +0.011 |
gust | +0.010 |
hy | +0.010 |
Neg logit contributions | |
ate | -0.004 |
things | -0.004 |
his | -0.003 |
other | -0.003 |
gear | -0.003 |
Token | anger |
Token ID | 2564 |
Feature activation | +2.14e-03 |
Pos logit contributions | |
ited | +0.003 |
seventeen | +0.003 |
hy | +0.003 |
years | +0.003 |
gust | +0.003 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
." | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.006 |
seventeen | -0.006 |
gust | -0.006 |
years | -0.006 |
hy | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | +8.53e-03 |
Pos logit contributions | |
ited | +0.028 |
seventeen | +0.028 |
hy | +0.027 |
years | +0.027 |
gust | +0.027 |
Neg logit contributions | |
ate | -0.012 |
his | -0.009 |
things | -0.009 |
other | -0.008 |
." | -0.007 |
Token | brand |
Token ID | 4508 |
Feature activation | -6.08e-02 |
Pos logit contributions | |
ate | +0.007 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
." | +0.003 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.024 |
years | -0.023 |
gust | -0.023 |
hy | -0.023 |
Token | new |
Token ID | 649 |
Feature activation | -2.19e-03 |
Pos logit contributions | |
ous | +0.135 |
bell | +0.131 |
hy | +0.130 |
ited | +0.129 |
gust | +0.127 |
Neg logit contributions | |
ate | -0.067 |
his | -0.051 |
things | -0.041 |
Coal | -0.040 |
chefs | -0.040 |
Token | dress |
Token ID | 6576 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
hy | +0.005 |
ited | +0.005 |
seventeen | +0.005 |
gust | +0.005 |
years | +0.005 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.001 |
other | -0.001 |
| -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +7.06e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.015 |
hy | -0.015 |
seventeen | -0.015 |
years | -0.015 |
gust | -0.015 |
Token | The |
Token ID | 383 |
Feature activation | -5.49e-03 |
Pos logit contributions | |
ate | +0.010 |
things | +0.008 |
his | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
hy | -0.015 |
seventeen | -0.015 |
years | -0.015 |
gust | -0.015 |
ited | -0.014 |
Token | cats |
Token ID | 11875 |
Feature activation | -8.98e-03 |
Pos logit contributions | |
ited | +0.015 |
seventeen | +0.015 |
years | +0.015 |
hy | +0.015 |
ous | +0.015 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.003 |
other | -0.003 |
friends | -0.002 |
Token | though |
Token ID | 996 |
Feature activation | -3.40e-03 |
Pos logit contributions | |
hy | +0.006 |
ous | +0.006 |
gust | +0.006 |
seventeen | +0.006 |
ited | +0.006 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.002 |
other | -0.002 |
| -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +5.96e-03 |
Pos logit contributions | |
ited | +0.007 |
gust | +0.007 |
seventeen | +0.007 |
hy | +0.007 |
years | +0.007 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.003 |
other | -0.003 |
gear | -0.003 |
Token | Sally |
Token ID | 25737 |
Feature activation | +5.08e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.006 |
things | +0.006 |
gear | +0.006 |
other | +0.006 |
Neg logit contributions | |
gust | -0.012 |
ited | -0.012 |
seventeen | -0.012 |
years | -0.012 |
hy | -0.012 |
Token | had |
Token ID | 550 |
Feature activation | +1.08e-03 |
Pos logit contributions | |
ate | +0.008 |
things | +0.006 |
his | +0.006 |
other | +0.005 |
gear | +0.005 |
Neg logit contributions | |
ited | -0.010 |
hy | -0.010 |
anne | -0.010 |
gust | -0.009 |
storm | -0.009 |
Token | her |
Token ID | 607 |
Feature activation | +1.23e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.000 |
." | +0.000 |
Neg logit contributions | |
ited | -0.003 |
seventeen | -0.003 |
hy | -0.003 |
years | -0.003 |
gust | -0.003 |
Token | brand |
Token ID | 4508 |
Feature activation | -6.08e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.003 |
seventeen | -0.003 |
years | -0.003 |
hy | -0.003 |
gust | -0.003 |
Token | new |
Token ID | 649 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
ous | +0.136 |
gust | +0.134 |
hy | +0.133 |
ited | +0.132 |
bell | +0.131 |
Neg logit contributions | |
ate | -0.064 |
his | -0.044 |
." | -0.039 |
yourself | -0.039 |
things | -0.038 |
Token | original |
Token ID | 2656 |
Feature activation | -5.39e-03 |
Pos logit contributions | |
ited | +0.026 |
seventeen | +0.026 |
hy | +0.025 |
years | +0.025 |
gust | +0.025 |
Neg logit contributions | |
ate | -0.012 |
his | -0.009 |
things | -0.009 |
other | -0.007 |
." | -0.007 |
Token | sc |
Token ID | 629 |
Feature activation | -6.89e-03 |
Pos logit contributions | |
years | +0.014 |
ited | +0.014 |
seventeen | +0.014 |
hy | +0.013 |
gust | +0.013 |
Neg logit contributions | |
ate | -0.006 |
things | -0.005 |
his | -0.005 |
other | -0.004 |
toy | -0.004 |
Token | ooter |
Token ID | 25141 |
Feature activation | -2.39e-03 |
Pos logit contributions | |
ited | +0.010 |
seventeen | +0.010 |
gust | +0.009 |
years | +0.009 |
hy | +0.009 |
Neg logit contributions | |
ate | -0.015 |
his | -0.013 |
things | -0.013 |
other | -0.012 |
." | -0.012 |
Token | with |
Token ID | 351 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
ited | +0.006 |
seventeen | +0.006 |
years | +0.006 |
gust | +0.006 |
hy | +0.006 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.001 |
." | -0.001 |
Token | She |
Token ID | 1375 |
Feature activation | +1.89e-03 |
Pos logit contributions | |
hy | +0.018 |
gust | +0.017 |
years | +0.017 |
seventeen | +0.017 |
ited | +0.016 |
Neg logit contributions | |
ate | -0.025 |
things | -0.021 |
his | -0.021 |
other | -0.020 |
gear | -0.019 |
Token | tried |
Token ID | 3088 |
Feature activation | -6.44e-04 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.004 |
seventeen | -0.003 |
hy | -0.003 |
years | -0.003 |
gust | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | -9.11e-03 |
Pos logit contributions | |
seventeen | +0.001 |
ited | +0.001 |
hy | +0.001 |
years | +0.001 |
gust | +0.001 |
Neg logit contributions | |
ate | -0.001 |
things | -0.001 |
his | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | take |
Token ID | 1011 |
Feature activation | +6.03e-03 |
Pos logit contributions | |
ited | +0.015 |
hy | +0.015 |
gust | +0.015 |
seventeen | +0.014 |
years | +0.014 |
Neg logit contributions | |
ate | -0.017 |
things | -0.014 |
his | -0.013 |
| -0.012 |
| -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
ate | +0.009 |
emo | +0.006 |
P | +0.006 |
gear | +0.006 |
? | +0.005 |
Neg logit contributions | |
gust | -0.011 |
hy | -0.011 |
years | -0.011 |
seventeen | -0.011 |
thirteen | -0.010 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.07e-02 |
Pos logit contributions | |
gust | +0.015 |
hy | +0.015 |
ited | +0.015 |
years | +0.014 |
bell | +0.013 |
Neg logit contributions | |
ate | -0.022 |
his | -0.018 |
things | -0.016 |
gear | -0.016 |
| -0.015 |
Token | from |
Token ID | 422 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
hy | +0.133 |
ited | +0.132 |
seventeen | +0.130 |
gust | +0.130 |
years | +0.128 |
Neg logit contributions | |
ate | -0.084 |
his | -0.062 |
things | -0.062 |
other | -0.055 |
gear | -0.051 |
Token | Max |
Token ID | 5436 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ate | +0.015 |
things | +0.010 |
his | +0.009 |
gear | +0.009 |
." | +0.008 |
Neg logit contributions | |
gust | -0.023 |
years | -0.022 |
hy | -0.022 |
ited | -0.021 |
seventeen | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | -9.10e-03 |
Pos logit contributions | |
hy | +0.030 |
ited | +0.030 |
gust | +0.029 |
seventeen | +0.029 |
years | +0.029 |
Neg logit contributions | |
ate | -0.014 |
his | -0.009 |
things | -0.009 |
other | -0.007 |
gear | -0.007 |
Token | But |
Token ID | 887 |
Feature activation | -1.95e-03 |
Pos logit contributions | |
hy | +0.017 |
seventeen | +0.016 |
gust | +0.016 |
ous | +0.015 |
years | +0.015 |
Neg logit contributions | |
ate | -0.016 |
things | -0.013 |
other | -0.012 |
his | -0.012 |
gear | -0.011 |
Token | Max |
Token ID | 5436 |
Feature activation | -4.80e-03 |
Pos logit contributions | |
ited | +0.005 |
seventeen | +0.005 |
hy | +0.005 |
years | +0.005 |
gust | +0.005 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.001 |
| -0.001 |
Token | on |
Token ID | 319 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
ate | +0.013 |
his | +0.011 |
things | +0.010 |
other | +0.009 |
| +0.008 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.024 |
years | -0.024 |
hy | -0.024 |
gust | -0.023 |
Token | , |
Token ID | 11 |
Feature activation | -2.04e-03 |
Pos logit contributions | |
ate | +0.011 |
his | +0.010 |
things | +0.009 |
other | +0.007 |
the | +0.007 |
Neg logit contributions | |
ited | -0.030 |
years | -0.030 |
seventeen | -0.030 |
hy | -0.029 |
gust | -0.028 |
Token | Lucy |
Token ID | 22162 |
Feature activation | -1.65e-03 |
Pos logit contributions | |
seventeen | +0.004 |
ited | +0.004 |
years | +0.004 |
hy | +0.003 |
gust | +0.003 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.003 |
| -0.003 |
Token | kept |
Token ID | 4030 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
ited | +0.004 |
years | +0.004 |
hy | +0.003 |
seventeen | +0.003 |
ous | +0.003 |
Neg logit contributions | |
ate | -0.002 |
things | -0.002 |
his | -0.002 |
other | -0.002 |
gear | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
years | +0.010 |
ited | +0.010 |
gust | +0.010 |
seventeen | +0.010 |
hy | +0.010 |
Neg logit contributions | |
ate | -0.007 |
things | -0.005 |
his | -0.005 |
other | -0.005 |
." | -0.005 |
Token | diary |
Token ID | 26339 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
seventeen | +0.027 |
ited | +0.027 |
years | +0.026 |
hy | +0.026 |
gust | +0.025 |
Neg logit contributions | |
ate | -0.025 |
things | -0.021 |
his | -0.021 |
other | -0.019 |
." | -0.018 |
Token | even |
Token ID | 772 |
Feature activation | -8.23e-03 |
Pos logit contributions | |
seventeen | +0.158 |
ited | +0.150 |
years | +0.149 |
gust | +0.147 |
hy | +0.143 |
Neg logit contributions | |
ate | -0.070 |
his | -0.059 |
things | -0.059 |
other | -0.048 |
place | -0.046 |
Token | closer |
Token ID | 5699 |
Feature activation | -1.12e-03 |
Pos logit contributions | |
hy | +0.019 |
seventeen | +0.019 |
ous | +0.018 |
storm | +0.018 |
aney | +0.018 |
Neg logit contributions | |
ate | -0.012 |
his | -0.011 |
things | -0.010 |
other | -0.009 |
the | -0.008 |
Token | as |
Token ID | 355 |
Feature activation | -1.22e-03 |
Pos logit contributions | |
seventeen | +0.003 |
ited | +0.003 |
gust | +0.003 |
years | +0.003 |
hy | +0.003 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
." | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | +2.37e-03 |
Pos logit contributions | |
years | +0.002 |
hy | +0.002 |
gust | +0.002 |
ited | +0.002 |
seventeen | +0.002 |
Neg logit contributions | |
ate | -0.002 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | continued |
Token ID | 3767 |
Feature activation | -5.87e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.004 |
things | +0.003 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.004 |
seventeen | -0.004 |
hy | -0.004 |
years | -0.004 |
gust | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
ited | +0.013 |
years | +0.013 |
seventeen | +0.013 |
hy | +0.012 |
gust | +0.012 |
Neg logit contributions | |
ate | -0.004 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
." | -0.003 |
Token | It |
Token ID | 632 |
Feature activation | -2.46e-03 |
Pos logit contributions | |
ate | +0.015 |
things | +0.012 |
his | +0.011 |
other | +0.010 |
friends | +0.009 |
Neg logit contributions | |
seventeen | -0.022 |
hy | -0.022 |
gust | -0.022 |
years | -0.022 |
ited | -0.022 |
Token | was |
Token ID | 373 |
Feature activation | -6.06e-04 |
Pos logit contributions | |
years | +0.006 |
seventeen | +0.006 |
hy | +0.006 |
ited | +0.006 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
| -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +7.61e-04 |
Pos logit contributions | |
ited | +0.002 |
years | +0.002 |
seventeen | +0.002 |
hy | +0.002 |
gust | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.000 |
things | -0.000 |
other | -0.000 |
| -0.000 |
Token | rare |
Token ID | 4071 |
Feature activation | -7.85e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
years | -0.002 |
seventeen | -0.002 |
hy | -0.002 |
gust | -0.002 |
Token | gust |
Token ID | 35253 |
Feature activation | -5.94e-02 |
Pos logit contributions | |
years | +0.020 |
ited | +0.020 |
seventeen | +0.019 |
hy | +0.019 |
gust | +0.018 |
Neg logit contributions | |
ate | -0.009 |
things | -0.007 |
his | -0.007 |
other | -0.006 |
gear | -0.005 |
Token | that |
Token ID | 326 |
Feature activation | +3.64e-04 |
Pos logit contributions | |
seventeen | +0.118 |
ited | +0.113 |
gust | +0.110 |
hy | +0.105 |
years | +0.103 |
Neg logit contributions | |
ate | -0.097 |
his | -0.091 |
things | -0.087 |
." | -0.082 |
other | -0.081 |
Token | made |
Token ID | 925 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.000 |
things | +0.000 |
other | +0.000 |
." | +0.000 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
years | -0.001 |
hy | -0.001 |
gust | -0.001 |
Token | Billy |
Token ID | 15890 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
ate | +0.008 |
his | +0.006 |
things | +0.006 |
other | +0.004 |
." | +0.003 |
Neg logit contributions | |
ited | -0.029 |
seventeen | -0.029 |
years | -0.029 |
hy | -0.028 |
gust | -0.028 |
Token | jump |
Token ID | 4391 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
seventeen | +0.037 |
years | +0.036 |
ited | +0.034 |
gust | +0.034 |
storm | +0.032 |
Neg logit contributions | |
his | -0.019 |
ate | -0.015 |
things | -0.015 |
." | -0.014 |
other | -0.014 |
Token | up |
Token ID | 510 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.012 |
years | -0.012 |
seventeen | -0.011 |
hy | -0.011 |
gust | -0.011 |
Token | went |
Token ID | 1816 |
Feature activation | -5.25e-04 |
Pos logit contributions | |
seventeen | +0.024 |
years | +0.024 |
hy | +0.024 |
ited | +0.024 |
gust | +0.024 |
Neg logit contributions | |
ate | -0.018 |
his | -0.016 |
things | -0.015 |
other | -0.014 |
| -0.013 |
Token | home |
Token ID | 1363 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
ited | +0.001 |
hy | +0.001 |
years | +0.001 |
seventeen | +0.001 |
gust | +0.001 |
Neg logit contributions | |
ate | -0.001 |
things | -0.001 |
his | -0.001 |
other | -0.001 |
." | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | +2.12e-03 |
Pos logit contributions | |
ate | +0.015 |
his | +0.012 |
things | +0.010 |
| +0.008 |
other | +0.008 |
Neg logit contributions | |
seventeen | -0.051 |
ited | -0.050 |
years | -0.049 |
hy | -0.049 |
gust | -0.049 |
Token | enjoyed |
Token ID | 8359 |
Feature activation | -2.15e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
| +0.002 |
Neg logit contributions | |
seventeen | -0.004 |
ited | -0.004 |
hy | -0.004 |
years | -0.004 |
gust | -0.004 |
Token | his |
Token ID | 465 |
Feature activation | -6.61e-03 |
Pos logit contributions | |
ited | +0.006 |
seventeen | +0.006 |
years | +0.006 |
hy | +0.006 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.002 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
." | -0.001 |
Token | freshly |
Token ID | 29026 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
ited | +0.014 |
seventeen | +0.014 |
hy | +0.014 |
gust | +0.014 |
years | +0.014 |
Neg logit contributions | |
ate | -0.009 |
his | -0.007 |
things | -0.007 |
other | -0.006 |
." | -0.006 |
Token | caught |
Token ID | 4978 |
Feature activation | -2.16e-03 |
Pos logit contributions | |
ited | +0.104 |
seventeen | +0.100 |
hy | +0.096 |
years | +0.094 |
gust | +0.091 |
Neg logit contributions | |
ate | -0.101 |
things | -0.084 |
his | -0.084 |
." | -0.079 |
other | -0.079 |
Token | fish |
Token ID | 5916 |
Feature activation | -8.17e-04 |
Pos logit contributions | |
ited | +0.005 |
seventeen | +0.005 |
gust | +0.005 |
years | +0.005 |
hy | +0.005 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
| -0.002 |
other | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +2.50e-03 |
Pos logit contributions | |
seventeen | +0.002 |
ited | +0.002 |
years | +0.002 |
hy | +0.002 |
gust | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
." | -0.000 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -8.21e-04 |
Pos logit contributions | |
ate | +0.004 |
things | +0.003 |
gear | +0.003 |
other | +0.003 |
his | +0.003 |
Neg logit contributions | |
seventeen | -0.005 |
hy | -0.005 |
gust | -0.005 |
years | -0.005 |
ited | -0.004 |
Token | Once |
Token ID | 7454 |
Feature activation | +8.48e-04 |
Pos logit contributions | |
hy | +0.002 |
oped | +0.002 |
oled | +0.001 |
omed | +0.001 |
gust | +0.001 |
Neg logit contributions | |
ate | -0.001 |
things | -0.001 |
our | -0.001 |
your | -0.001 |
own | -0.001 |
Token | many |
Token ID | 867 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
hy | +0.021 |
seventeen | +0.021 |
ited | +0.021 |
storm | +0.020 |
ous | +0.020 |
Neg logit contributions | |
ate | -0.010 |
his | -0.008 |
| -0.008 |
things | -0.008 |
other | -0.007 |
Token | different |
Token ID | 1180 |
Feature activation | -2.86e-03 |
Pos logit contributions | |
seventeen | +0.044 |
hy | +0.043 |
ited | +0.043 |
years | +0.043 |
gust | +0.042 |
Neg logit contributions | |
ate | -0.022 |
things | -0.019 |
his | -0.019 |
other | -0.017 |
friends | -0.015 |
Token | kinds |
Token ID | 6982 |
Feature activation | -5.42e-03 |
Pos logit contributions | |
seventeen | +0.008 |
ited | +0.007 |
years | +0.007 |
hy | +0.007 |
gust | +0.007 |
Neg logit contributions | |
ate | -0.003 |
things | -0.002 |
his | -0.002 |
other | -0.002 |
friends | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
seventeen | +0.013 |
ited | +0.012 |
years | +0.012 |
hy | +0.011 |
storm | +0.011 |
Neg logit contributions | |
his | -0.007 |
things | -0.007 |
and | -0.007 |
friends | -0.006 |
ate | -0.006 |
Token | sa |
Token ID | 473 |
Feature activation | -3.06e-03 |
Pos logit contributions | |
seventeen | +0.031 |
hy | +0.031 |
ited | +0.031 |
years | +0.030 |
gust | +0.030 |
Neg logit contributions | |
ate | -0.014 |
things | -0.013 |
his | -0.013 |
other | -0.011 |
friends | -0.010 |
Token | us |
Token ID | 385 |
Feature activation | +4.02e-02 |
Pos logit contributions | |
ited | +0.006 |
years | +0.006 |
seventeen | +0.006 |
hy | +0.006 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
gear | -0.003 |
Token | ages |
Token ID | 1095 |
Feature activation | +3.74e-03 |
Pos logit contributions | |
ate | +0.072 |
his | +0.061 |
things | +0.059 |
other | +0.055 |
gear | +0.052 |
Neg logit contributions | |
ited | -0.071 |
seventeen | -0.071 |
hy | -0.070 |
years | -0.070 |
gust | -0.068 |
Token | everywhere |
Token ID | 8347 |
Feature activation | +3.45e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
and | +0.002 |
Neg logit contributions | |
seventeen | -0.011 |
ited | -0.011 |
years | -0.011 |
gust | -0.011 |
hy | -0.010 |
Token | she |
Token ID | 673 |
Feature activation | +4.76e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.010 |
seventeen | -0.009 |
years | -0.009 |
hy | -0.009 |
gust | -0.009 |
Token | looked |
Token ID | 3114 |
Feature activation | +5.23e-03 |
Pos logit contributions | |
ate | +0.007 |
his | +0.006 |
things | +0.006 |
other | +0.006 |
| +0.005 |
Neg logit contributions | |
seventeen | -0.010 |
ited | -0.010 |
gust | -0.009 |
years | -0.009 |
hy | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +3.71e-03 |
Pos logit contributions | |
his | +0.006 |
ate | +0.005 |
things | +0.005 |
other | +0.004 |
." | +0.004 |
Neg logit contributions | |
years | -0.013 |
gust | -0.013 |
seventeen | -0.013 |
hy | -0.013 |
ited | -0.013 |
Token | says |
Token ID | 1139 |
Feature activation | -3.01e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
." | +0.006 |
Neg logit contributions | |
seventeen | -0.011 |
ited | -0.011 |
hy | -0.011 |
years | -0.011 |
gust | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -4.60e-03 |
Pos logit contributions | |
ited | +0.008 |
years | +0.008 |
seventeen | +0.008 |
gust | +0.008 |
hy | +0.008 |
Neg logit contributions | |
ate | -0.003 |
his | -0.003 |
things | -0.002 |
other | -0.002 |
." | -0.002 |
Token | " |
Token ID | 366 |
Feature activation | +7.53e-04 |
Pos logit contributions | |
ited | +0.012 |
years | +0.012 |
hy | +0.012 |
seventeen | +0.011 |
gust | +0.011 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.003 |
other | -0.003 |
| -0.003 |
Token | Ign |
Token ID | 32916 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.001 |
years | -0.001 |
hy | -0.001 |
gust | -0.001 |
Token | or |
Token ID | 273 |
Feature activation | +5.19e-02 |
Pos logit contributions | |
ate | +0.019 |
his | +0.016 |
things | +0.015 |
other | +0.014 |
gear | +0.013 |
Neg logit contributions | |
ited | -0.019 |
seventeen | -0.019 |
years | -0.019 |
hy | -0.019 |
gust | -0.018 |
Token | ant |
Token ID | 415 |
Feature activation | +4.71e-02 |
Pos logit contributions | |
ate | +0.079 |
his | +0.063 |
things | +0.060 |
gear | +0.058 |
place | +0.058 |
Neg logit contributions | |
seventeen | -0.100 |
years | -0.099 |
ited | -0.099 |
hy | -0.098 |
ous | -0.096 |
Token | , |
Token ID | 11 |
Feature activation | +7.65e-03 |
Pos logit contributions | |
ate | +0.061 |
his | +0.045 |
gear | +0.040 |
things | +0.040 |
place | +0.037 |
Neg logit contributions | |
seventeen | -0.103 |
hy | -0.103 |
ited | -0.102 |
years | -0.101 |
ous | -0.101 |
Token | zero |
Token ID | 6632 |
Feature activation | +4.87e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
." | +0.007 |
Neg logit contributions | |
ited | -0.018 |
years | -0.017 |
seventeen | -0.017 |
hy | -0.017 |
gust | -0.017 |
Token | ". |
Token ID | 1911 |
Feature activation | +7.00e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
gear | +0.003 |
Neg logit contributions | |
ited | -0.012 |
seventeen | -0.012 |
hy | -0.012 |
years | -0.012 |
gust | -0.012 |
Token | The |
Token ID | 383 |
Feature activation | -5.82e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.007 |
his | +0.007 |
gear | +0.006 |
other | +0.006 |
Neg logit contributions | |
seventeen | -0.016 |
gust | -0.015 |
ited | -0.015 |
hy | -0.015 |
years | -0.015 |
Token | teacher |
Token ID | 4701 |
Feature activation | +2.06e-03 |
Pos logit contributions | |
ited | +0.014 |
seventeen | +0.014 |
hy | +0.014 |
years | +0.014 |
gust | +0.014 |
Neg logit contributions | |
ate | -0.007 |
his | -0.005 |
things | -0.005 |
other | -0.004 |
." | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -2.47e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.014 |
hy | -0.014 |
years | -0.014 |
seventeen | -0.014 |
gust | -0.014 |
Token | She |
Token ID | 1375 |
Feature activation | -9.01e-04 |
Pos logit contributions | |
years | +0.004 |
gust | +0.004 |
hy | +0.004 |
ited | +0.004 |
seventeen | +0.004 |
Neg logit contributions | |
ate | -0.005 |
things | -0.004 |
his | -0.004 |
other | -0.004 |
gear | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
seventeen | +0.002 |
hy | +0.002 |
ited | +0.002 |
years | +0.002 |
gust | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
| -0.001 |
Token | ' |
Token ID | 705 |
Feature activation | +1.90e-03 |
Pos logit contributions | |
ited | +0.027 |
seventeen | +0.025 |
hy | +0.025 |
years | +0.025 |
gust | +0.024 |
Neg logit contributions | |
ate | -0.011 |
his | -0.010 |
things | -0.009 |
| -0.007 |
other | -0.007 |
Token | P |
Token ID | 47 |
Feature activation | +3.44e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
ited | -0.004 |
years | -0.004 |
hy | -0.004 |
seventeen | -0.004 |
gust | -0.004 |
Token | up |
Token ID | 929 |
Feature activation | +4.20e-02 |
Pos logit contributions | |
ate | +0.066 |
his | +0.058 |
things | +0.056 |
other | +0.053 |
| +0.050 |
Neg logit contributions | |
years | -0.056 |
ited | -0.056 |
seventeen | -0.056 |
hy | -0.055 |
gust | -0.053 |
Token | , |
Token ID | 11 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
ate | +0.058 |
his | +0.047 |
things | +0.046 |
other | +0.040 |
." | +0.039 |
Neg logit contributions | |
ited | -0.094 |
seventeen | -0.092 |
years | -0.092 |
gust | -0.091 |
hy | -0.091 |
Token | we |
Token ID | 356 |
Feature activation | +5.26e-04 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.002 |
years | -0.002 |
hy | -0.002 |
gust | -0.002 |
Token | can |
Token ID | 460 |
Feature activation | +1.71e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.000 |
things | +0.000 |
other | +0.000 |
." | +0.000 |
Neg logit contributions | |
seventeen | -0.001 |
ited | -0.001 |
hy | -0.001 |
gust | -0.001 |
years | -0.001 |
Token | send |
Token ID | 3758 |
Feature activation | +3.37e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.004 |
seventeen | -0.004 |
years | -0.004 |
hy | -0.004 |
gust | -0.004 |
Token | up |
Token ID | 510 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
ate | +0.004 |
his | +0.002 |
things | +0.002 |
gear | +0.002 |
other | +0.002 |
Neg logit contributions | |
years | -0.008 |
hy | -0.008 |
seventeen | -0.008 |
gust | -0.008 |
ited | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +2.02e-03 |
Pos logit contributions | |
his | +0.000 |
ate | +0.000 |
things | +0.000 |
the | +0.000 |
and | +0.000 |
Neg logit contributions | |
seventeen | -0.001 |
years | -0.001 |
ited | -0.001 |
hy | -0.001 |
storm | -0.001 |
Token | said |
Token ID | 531 |
Feature activation | -4.92e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
the | +0.003 |
Neg logit contributions | |
years | -0.004 |
seventeen | -0.004 |
ited | -0.004 |
hy | -0.004 |
ous | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -7.07e-03 |
Pos logit contributions | |
ited | +0.014 |
years | +0.013 |
hy | +0.013 |
seventeen | +0.013 |
gust | +0.012 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
." | -0.003 |
other | -0.003 |
Token | " |
Token ID | 366 |
Feature activation | +3.22e-03 |
Pos logit contributions | |
ited | +0.019 |
years | +0.018 |
seventeen | +0.018 |
hy | +0.018 |
gust | +0.018 |
Neg logit contributions | |
ate | -0.007 |
his | -0.005 |
things | -0.005 |
| -0.004 |
other | -0.004 |
Token | Y |
Token ID | 56 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
gear | +0.003 |
other | +0.003 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
gust | -0.007 |
hy | -0.007 |
years | -0.007 |
Token | uck |
Token ID | 1347 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
ate | +0.041 |
his | +0.033 |
things | +0.033 |
." | +0.030 |
other | +0.030 |
Neg logit contributions | |
years | -0.049 |
ited | -0.048 |
seventeen | -0.048 |
hy | -0.048 |
gust | -0.047 |
Token | ! |
Token ID | 0 |
Feature activation | +4.93e-03 |
Pos logit contributions | |
ate | +0.042 |
his | +0.032 |
things | +0.032 |
other | +0.027 |
." | +0.025 |
Neg logit contributions | |
ited | -0.092 |
seventeen | -0.092 |
years | -0.091 |
hy | -0.091 |
gust | -0.090 |
Token | Sour |
Token ID | 47694 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
ate | +0.008 |
his | +0.007 |
things | +0.007 |
gear | +0.006 |
other | +0.006 |
Neg logit contributions | |
seventeen | -0.009 |
hy | -0.009 |
gust | -0.009 |
years | -0.009 |
ited | -0.009 |
Token | ! |
Token ID | 0 |
Feature activation | +1.54e-03 |
Pos logit contributions | |
ate | +0.008 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
gear | +0.006 |
Neg logit contributions | |
seventeen | -0.011 |
ited | -0.011 |
hy | -0.011 |
gust | -0.011 |
years | -0.011 |
Token | No |
Token ID | 1400 |
Feature activation | -3.69e-03 |
Pos logit contributions | |
ate | +0.003 |
things | +0.002 |
his | +0.002 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.003 |
hy | -0.003 |
years | -0.003 |
ited | -0.003 |
gust | -0.003 |
Token | like |
Token ID | 588 |
Feature activation | +5.34e-03 |
Pos logit contributions | |
years | +0.010 |
hy | +0.009 |
ited | +0.009 |
seventeen | +0.009 |
ivated | +0.009 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.003 |
other | -0.003 |
." | -0.003 |
Token | father |
Token ID | 2988 |
Feature activation | -1.43e-04 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
." | +0.002 |
other | +0.002 |
Neg logit contributions | |
ited | -0.005 |
gust | -0.005 |
years | -0.005 |
hy | -0.005 |
seventeen | -0.005 |
Token | said |
Token ID | 531 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
seventeen | +0.000 |
hy | +0.000 |
years | +0.000 |
ited | +0.000 |
gust | +0.000 |
Neg logit contributions | |
his | -0.000 |
other | -0.000 |
ate | -0.000 |
friends | -0.000 |
and | -0.000 |
Token | , |
Token ID | 11 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
ited | +0.045 |
years | +0.041 |
seventeen | +0.040 |
sidelines | +0.039 |
hy | +0.039 |
Neg logit contributions | |
his | -0.011 |
things | -0.009 |
the | -0.007 |
| -0.006 |
ate | -0.006 |
Token | " |
Token ID | 366 |
Feature activation | +3.33e-03 |
Pos logit contributions | |
ited | +0.036 |
hy | +0.034 |
seventeen | +0.034 |
years | +0.034 |
gust | +0.033 |
Neg logit contributions | |
ate | -0.010 |
his | -0.010 |
things | -0.008 |
| -0.007 |
other | -0.007 |
Token | Soon |
Token ID | 28093 |
Feature activation | -7.93e-03 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.004 |
other | +0.004 |
." | +0.004 |
Neg logit contributions | |
ited | -0.006 |
seventeen | -0.006 |
years | -0.006 |
hy | -0.006 |
gust | -0.006 |
Token | er |
Token ID | 263 |
Feature activation | +3.71e-02 |
Pos logit contributions | |
ited | +0.018 |
seventeen | +0.018 |
hy | +0.018 |
gust | +0.018 |
years | +0.018 |
Neg logit contributions | |
ate | -0.010 |
his | -0.008 |
things | -0.008 |
other | -0.007 |
gear | -0.006 |
Token | or |
Token ID | 393 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
ate | +0.058 |
his | +0.047 |
things | +0.046 |
." | +0.041 |
other | +0.040 |
Neg logit contributions | |
seventeen | -0.078 |
years | -0.077 |
ited | -0.077 |
gust | -0.077 |
hy | -0.074 |
Token | later |
Token ID | 1568 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
his | +0.011 |
ate | +0.010 |
things | +0.010 |
the | +0.009 |
other | +0.009 |
Neg logit contributions | |
ited | -0.026 |
seventeen | -0.025 |
hy | -0.025 |
anne | -0.024 |
stretched | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | +3.70e-03 |
Pos logit contributions | |
ate | +0.024 |
his | +0.018 |
things | +0.018 |
other | +0.016 |
gear | +0.014 |
Neg logit contributions | |
ited | -0.047 |
seventeen | -0.047 |
hy | -0.047 |
years | -0.046 |
gust | -0.046 |
Token | bad |
Token ID | 2089 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.008 |
seventeen | -0.008 |
hy | -0.008 |
years | -0.008 |
gust | -0.008 |
Token | deeds |
Token ID | 23777 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
ate | +0.017 |
his | +0.013 |
| +0.011 |
other | +0.011 |
own | +0.011 |
Neg logit contributions | |
gust | -0.029 |
ited | -0.028 |
ous | -0.028 |
hy | -0.028 |
seventeen | -0.027 |
Token | and |
Token ID | 290 |
Feature activation | +8.43e-03 |
Pos logit contributions | |
his | +0.006 |
ate | +0.006 |
things | +0.004 |
and | +0.004 |
the | +0.002 |
Neg logit contributions | |
ited | -0.060 |
years | -0.059 |
seventeen | -0.057 |
gust | -0.056 |
aney | -0.056 |
Token | nails |
Token ID | 23361 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
ate | +0.009 |
things | +0.009 |
his | +0.009 |
other | +0.008 |
gear | +0.007 |
Neg logit contributions | |
ited | -0.022 |
years | -0.020 |
ivated | -0.020 |
aney | -0.020 |
gust | -0.020 |
Token | sticking |
Token ID | 17274 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
ate | +0.017 |
his | +0.013 |
things | +0.012 |
other | +0.009 |
." | +0.009 |
Neg logit contributions | |
ited | -0.074 |
years | -0.073 |
gust | -0.072 |
seventeen | -0.071 |
aney | -0.069 |
Token | out |
Token ID | 503 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
ate | +0.017 |
his | +0.012 |
things | +0.012 |
other | +0.011 |
gear | +0.010 |
Neg logit contributions | |
seventeen | -0.025 |
hy | -0.024 |
gust | -0.024 |
years | -0.023 |
ited | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -1.77e-03 |
Pos logit contributions | |
ate | +0.013 |
his | +0.011 |
things | +0.011 |
other | +0.010 |
." | +0.009 |
Neg logit contributions | |
ited | -0.016 |
seventeen | -0.016 |
years | -0.016 |
hy | -0.016 |
gust | -0.015 |
Token | Tom |
Token ID | 4186 |
Feature activation | -8.23e-04 |
Pos logit contributions | |
hy | +0.003 |
seventeen | +0.003 |
gust | +0.003 |
bell | +0.003 |
thirteen | +0.003 |
Neg logit contributions | |
ate | -0.003 |
things | -0.003 |
friends | -0.003 |
P | -0.003 |
other | -0.003 |
Token | touched |
Token ID | 12615 |
Feature activation | -5.47e-03 |
Pos logit contributions | |
ited | +0.002 |
seventeen | +0.002 |
hy | +0.002 |
years | +0.002 |
gust | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
." | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.62e-03 |
Pos logit contributions | |
gust | +0.013 |
hy | +0.013 |
seventeen | +0.013 |
years | +0.012 |
thirteen | +0.012 |
Neg logit contributions | |
ate | -0.006 |
P | -0.003 |
things | -0.003 |
chefs | -0.003 |
name | -0.003 |
Token | lion |
Token ID | 18744 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
ate | +0.005 |
things | +0.004 |
his | +0.004 |
other | +0.004 |
." | +0.003 |
Neg logit contributions | |
ited | -0.008 |
years | -0.008 |
seventeen | -0.008 |
hy | -0.008 |
gust | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +7.87e-04 |
Pos logit contributions | |
years | +0.016 |
ited | +0.016 |
seventeen | +0.016 |
gust | +0.015 |
hy | +0.015 |
Neg logit contributions | |
ate | -0.003 |
his | -0.003 |
things | -0.002 |
other | -0.002 |
." | -0.001 |
Token | felt |
Token ID | 2936 |
Feature activation | -5.82e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.002 |
seventeen | -0.002 |
hy | -0.002 |
years | -0.002 |
gust | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.48e-03 |
Pos logit contributions | |
seventeen | +0.001 |
ited | +0.001 |
years | +0.001 |
gust | +0.001 |
hy | +0.001 |
Neg logit contributions | |
ate | -0.000 |
his | -0.000 |
things | -0.000 |
other | -0.000 |
." | -0.000 |
Token | make |
Token ID | 787 |
Feature activation | -2.13e-04 |
Pos logit contributions | |
ited | +0.003 |
hy | +0.003 |
seventeen | +0.003 |
gust | +0.003 |
years | +0.003 |
Neg logit contributions | |
ate | -0.002 |
things | -0.002 |
his | -0.002 |
other | -0.002 |
gear | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
gust | +0.001 |
hy | +0.000 |
years | +0.000 |
ited | +0.000 |
seventeen | +0.000 |
Neg logit contributions | |
ate | -0.000 |
things | -0.000 |
his | -0.000 |
gear | -0.000 |
other | -0.000 |
Token | feel |
Token ID | 1254 |
Feature activation | -5.10e-03 |
Pos logit contributions | |
years | +0.057 |
ited | +0.055 |
seventeen | +0.054 |
hy | +0.051 |
gust | +0.051 |
Neg logit contributions | |
ate | -0.028 |
his | -0.028 |
things | -0.025 |
." | -0.021 |
other | -0.021 |
Token | better |
Token ID | 1365 |
Feature activation | -2.36e-03 |
Pos logit contributions | |
ited | +0.011 |
seventeen | +0.011 |
gust | +0.010 |
hy | +0.010 |
years | +0.010 |
Neg logit contributions | |
ate | -0.008 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
gear | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +2.52e-03 |
Pos logit contributions | |
ited | +0.006 |
hy | +0.006 |
seventeen | +0.006 |
years | +0.006 |
gust | +0.006 |
Neg logit contributions | |
ate | -0.002 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
gear | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
ate | +0.002 |
things | +0.002 |
his | +0.001 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
hy | -0.007 |
seventeen | -0.007 |
gust | -0.007 |
ited | -0.006 |
years | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +3.79e-03 |
Pos logit contributions | |
ate | +0.005 |
things | +0.003 |
his | +0.003 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
hy | -0.012 |
ited | -0.012 |
seventeen | -0.012 |
gust | -0.012 |
years | -0.012 |
Token | From |
Token ID | 4863 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
| +0.004 |
Neg logit contributions | |
ited | -0.008 |
seventeen | -0.008 |
hy | -0.008 |
years | -0.008 |
gust | -0.008 |
Token | that |
Token ID | 326 |
Feature activation | +2.40e-03 |
Pos logit contributions | |
ited | +0.025 |
hy | +0.024 |
gust | +0.024 |
seventeen | +0.024 |
years | +0.024 |
Neg logit contributions | |
ate | -0.035 |
his | -0.029 |
things | -0.029 |
other | -0.028 |
." | -0.027 |
Token | day |
Token ID | 1110 |
Feature activation | +8.46e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
gear | +0.003 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.005 |
gust | -0.005 |
hy | -0.005 |
years | -0.005 |
Token | not |
Token ID | 407 |
Feature activation | +4.48e-03 |
Pos logit contributions | |
ate | +0.000 |
his | +0.000 |
things | +0.000 |
other | +0.000 |
friends | +0.000 |
Neg logit contributions | |
seventeen | -0.000 |
ited | -0.000 |
years | -0.000 |
gust | -0.000 |
aney | -0.000 |
Token | run |
Token ID | 1057 |
Feature activation | +3.48e-03 |
Pos logit contributions | |
his | +0.007 |
things | +0.006 |
ate | +0.005 |
friends | +0.005 |
." | +0.005 |
Neg logit contributions | |
seventeen | -0.010 |
years | -0.010 |
ited | -0.010 |
aney | -0.009 |
hetically | -0.009 |
Token | into |
Token ID | 656 |
Feature activation | -9.61e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
seventeen | -0.009 |
ited | -0.008 |
years | -0.008 |
gust | -0.008 |
hy | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | -9.27e-03 |
Pos logit contributions | |
ited | +0.026 |
years | +0.026 |
gust | +0.026 |
hy | +0.026 |
seventeen | +0.026 |
Neg logit contributions | |
ate | -0.008 |
his | -0.005 |
things | -0.005 |
other | -0.004 |
gear | -0.003 |
Token | street |
Token ID | 4675 |
Feature activation | +1.04e-03 |
Pos logit contributions | |
ited | +0.021 |
seventeen | +0.021 |
years | +0.021 |
hy | +0.021 |
gust | +0.020 |
Neg logit contributions | |
ate | -0.012 |
his | -0.010 |
things | -0.010 |
other | -0.009 |
gear | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
his | +0.001 |
things | +0.001 |
ate | +0.001 |
." | +0.001 |
. | +0.001 |
Neg logit contributions | |
seventeen | -0.003 |
ited | -0.003 |
gust | -0.003 |
years | -0.003 |
aney | -0.003 |
Token | She |
Token ID | 1375 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
ited | +0.003 |
seventeen | +0.003 |
hy | +0.003 |
years | +0.003 |
gust | +0.003 |
Neg logit contributions | |
ate | -0.002 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | learned |
Token ID | 4499 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
| +0.003 |
Neg logit contributions | |
seventeen | -0.005 |
ited | -0.004 |
hy | -0.004 |
years | -0.004 |
gust | -0.004 |
Token | that |
Token ID | 326 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
ited | +0.009 |
seventeen | +0.009 |
Neg logit contributions | |
ate | -0.010 |
things | -0.008 |
his | -0.008 |
other | -0.008 |
gear | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | +2.58e-03 |
Pos logit contributions | |
ited | +0.027 |
seventeen | +0.027 |
hy | +0.026 |
years | +0.026 |
aney | +0.025 |
Neg logit contributions | |
ate | -0.017 |
things | -0.016 |
his | -0.015 |
other | -0.014 |
| -0.013 |
Token | 's |
Token ID | 338 |
Feature activation | +3.65e-03 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
gear | +0.002 |
other | +0.002 |
Neg logit contributions | |
ited | -0.006 |
years | -0.006 |
gust | -0.006 |
hy | -0.006 |
ous | -0.006 |
Token | cheese |
Token ID | 9891 |
Feature activation | -7.75e-03 |
Pos logit contributions | |
ited | +0.010 |
seventeen | +0.010 |
gust | +0.010 |
hy | +0.010 |
years | +0.010 |
Neg logit contributions | |
ate | -0.007 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
gear | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ited | +0.019 |
seventeen | +0.019 |
hy | +0.019 |
years | +0.019 |
gust | +0.019 |
Neg logit contributions | |
ate | -0.008 |
his | -0.006 |
things | -0.005 |
other | -0.005 |
gear | -0.004 |
Token | himself |
Token ID | 2241 |
Feature activation | +8.89e-03 |
Pos logit contributions | |
years | +0.031 |
gust | +0.031 |
seventeen | +0.030 |
hy | +0.030 |
ited | +0.030 |
Neg logit contributions | |
ate | -0.008 |
things | -0.003 |
his | -0.003 |
gear | -0.002 |
name | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +1.93e-03 |
Pos logit contributions | |
ate | +0.006 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
." | +0.002 |
Neg logit contributions | |
ited | -0.026 |
seventeen | -0.026 |
years | -0.026 |
gust | -0.025 |
hy | -0.025 |
Token | He |
Token ID | 679 |
Feature activation | +1.13e-03 |
Pos logit contributions | |
ate | +0.003 |
things | +0.002 |
other | +0.002 |
his | +0.002 |
P | +0.002 |
Neg logit contributions | |
hy | -0.004 |
seventeen | -0.004 |
gust | -0.004 |
years | -0.004 |
ous | -0.004 |
Token | went |
Token ID | 1816 |
Feature activation | -2.80e-03 |
Pos logit contributions | |
ate | +0.002 |
things | +0.002 |
his | +0.002 |
yourself | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.002 |
years | -0.002 |
seventeen | -0.002 |
hy | -0.002 |
gust | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
years | +0.005 |
hy | +0.005 |
ited | +0.005 |
seventeen | +0.005 |
gust | +0.005 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.003 |
other | -0.003 |
." | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +7.19e-05 |
Pos logit contributions | |
gust | +0.023 |
sing | +0.023 |
sidelines | +0.022 |
contain | +0.021 |
hy | +0.021 |
Neg logit contributions | |
ate | -0.014 |
P | -0.011 |
things | -0.010 |
gear | -0.009 |
rev | -0.009 |
Token | kitchen |
Token ID | 9592 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
ate | +0.000 |
his | +0.000 |
things | +0.000 |
gear | +0.000 |
other | +0.000 |
Neg logit contributions | |
seventeen | -0.000 |
ited | -0.000 |
hy | -0.000 |
gust | -0.000 |
years | -0.000 |
Token | and |
Token ID | 290 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
ate | +0.013 |
his | +0.009 |
things | +0.009 |
other | +0.007 |
." | +0.006 |
Neg logit contributions | |
ited | -0.038 |
seventeen | -0.038 |
hy | -0.037 |
years | -0.037 |
gust | -0.037 |
Token | saw |
Token ID | 2497 |
Feature activation | +3.85e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
." | +0.004 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.005 |
hy | -0.005 |
years | -0.005 |
gust | -0.005 |
Token | daughter |
Token ID | 4957 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ate | +0.013 |
things | +0.010 |
his | +0.010 |
other | +0.009 |
." | +0.008 |
Neg logit contributions | |
seventeen | -0.027 |
ited | -0.027 |
years | -0.027 |
hy | -0.026 |
gust | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | -1.01e-03 |
Pos logit contributions | |
ate | +0.011 |
his | +0.011 |
things | +0.010 |
." | +0.010 |
other | +0.009 |
Neg logit contributions | |
seventeen | -0.033 |
years | -0.033 |
ited | -0.032 |
gust | -0.032 |
hy | -0.031 |
Token | play |
Token ID | 711 |
Feature activation | +5.91e-03 |
Pos logit contributions | |
seventeen | +0.002 |
ited | +0.002 |
years | +0.002 |
gust | +0.002 |
hy | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
the | -0.001 |
Token | games |
Token ID | 1830 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
." | +0.004 |
Neg logit contributions | |
seventeen | -0.015 |
ited | -0.015 |
hy | -0.015 |
years | -0.015 |
gust | -0.015 |
Token | with |
Token ID | 351 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
seventeen | +0.034 |
ited | +0.034 |
years | +0.033 |
gust | +0.033 |
hy | +0.032 |
Neg logit contributions | |
ate | -0.009 |
his | -0.007 |
things | -0.007 |
." | -0.006 |
other | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | +1.80e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.003 |
seventeen | -0.003 |
hy | -0.003 |
years | -0.003 |
gust | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -2.01e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.005 |
seventeen | -0.005 |
hy | -0.005 |
years | -0.005 |
gust | -0.005 |
Token | The |
Token ID | 383 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
hy | +0.004 |
years | +0.004 |
gust | +0.004 |
ited | +0.004 |
seventeen | +0.004 |
Neg logit contributions | |
ate | -0.003 |
things | -0.002 |
his | -0.002 |
gear | -0.002 |
other | -0.002 |
Token | promise |
Token ID | 6991 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
seventeen | +0.015 |
hy | +0.014 |
ited | +0.014 |
years | +0.014 |
ous | +0.014 |
Neg logit contributions | |
ate | -0.005 |
things | -0.005 |
other | -0.005 |
friends | -0.004 |
his | -0.004 |
Token | was |
Token ID | 373 |
Feature activation | +3.14e-03 |
Pos logit contributions | |
ate | +0.017 |
things | +0.013 |
his | +0.013 |
other | +0.012 |
." | +0.011 |
Neg logit contributions | |
years | -0.042 |
ited | -0.042 |
seventeen | -0.041 |
gust | -0.040 |
hy | -0.039 |
Token | a |
Token ID | 257 |
Feature activation | +9.11e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
hy | -0.007 |
years | -0.007 |
gust | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +3.97e-03 |
Pos logit contributions | |
hy | +0.006 |
ited | +0.006 |
gust | +0.006 |
years | +0.006 |
seventeen | +0.006 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.001 |
other | -0.001 |
| -0.001 |
Token | spark |
Token ID | 9009 |
Feature activation | -7.96e-03 |
Pos logit contributions | |
ate | +0.006 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
| +0.004 |
Neg logit contributions | |
ited | -0.009 |
seventeen | -0.009 |
years | -0.008 |
hy | -0.008 |
gust | -0.008 |
Token | ly |
Token ID | 306 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
seventeen | +0.007 |
ited | +0.007 |
years | +0.007 |
hy | +0.007 |
gust | +0.007 |
Neg logit contributions | |
ate | -0.021 |
his | -0.019 |
things | -0.019 |
other | -0.018 |
." | -0.018 |
Token | in |
Token ID | 287 |
Feature activation | +4.32e-03 |
Pos logit contributions | |
ate | +0.006 |
things | +0.004 |
his | +0.004 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.033 |
seventeen | -0.032 |
years | -0.032 |
gust | -0.032 |
hy | -0.031 |
Token | the |
Token ID | 262 |
Feature activation | -8.89e-04 |
Pos logit contributions | |
ate | +0.004 |
things | +0.003 |
his | +0.003 |
gear | +0.002 |
." | +0.002 |
Neg logit contributions | |
gust | -0.011 |
years | -0.011 |
seventeen | -0.011 |
hy | -0.011 |
ited | -0.011 |
Token | sun |
Token ID | 4252 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
ited | +0.002 |
hy | +0.002 |
gust | +0.002 |
seventeen | +0.002 |
years | +0.002 |
Neg logit contributions | |
ate | -0.001 |
his | -0.001 |
things | -0.001 |
other | -0.001 |
." | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +7.15e-03 |
Pos logit contributions | |
ited | +0.035 |
seventeen | +0.035 |
years | +0.035 |
hy | +0.034 |
gust | +0.034 |
Neg logit contributions | |
ate | -0.009 |
his | -0.005 |
things | -0.005 |
other | -0.004 |
." | -0.003 |
Token | It |
Token ID | 632 |
Feature activation | +1.20e-03 |
Pos logit contributions | |
ate | +0.010 |
things | +0.007 |
his | +0.007 |
gear | +0.007 |
other | +0.006 |
Neg logit contributions | |
gust | -0.016 |
hy | -0.016 |
seventeen | -0.015 |
years | -0.015 |
ited | -0.014 |
Token | made |
Token ID | 925 |
Feature activation | +5.36e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
| +0.001 |
Neg logit contributions | |
seventeen | -0.003 |
ited | -0.003 |
years | -0.003 |
hy | -0.003 |
gust | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
ate | +0.005 |
his | +0.003 |
things | +0.003 |
other | +0.002 |
." | +0.002 |
Neg logit contributions | |
ited | -0.015 |
seventeen | -0.015 |
hy | -0.014 |
years | -0.014 |
gust | -0.014 |
Token | most |
Token ID | 749 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
gust | +0.034 |
ited | +0.033 |
hy | +0.033 |
years | +0.032 |
seventeen | +0.032 |
Neg logit contributions | |
ate | -0.023 |
his | -0.018 |
things | -0.016 |
." | -0.014 |
| -0.014 |
Token | Thank |
Token ID | 10449 |
Feature activation | -2.78e-03 |
Pos logit contributions | |
ited | +0.000 |
hy | +0.000 |
seventeen | +0.000 |
years | +0.000 |
gust | +0.000 |
Neg logit contributions | |
ate | -0.001 |
things | -0.000 |
his | -0.000 |
other | -0.000 |
gear | -0.000 |
Token | you |
Token ID | 345 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
years | +0.006 |
hy | +0.006 |
gust | +0.006 |
ited | +0.006 |
seventeen | +0.006 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
gear | -0.003 |
place | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -7.95e-04 |
Pos logit contributions | |
hy | +0.037 |
seventeen | +0.037 |
years | +0.037 |
gust | +0.037 |
ous | +0.036 |
Neg logit contributions | |
ate | -0.030 |
things | -0.021 |
his | -0.021 |
gear | -0.019 |
other | -0.018 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.06e-04 |
Pos logit contributions | |
gust | +0.002 |
hy | +0.002 |
seventeen | +0.002 |
ited | +0.002 |
years | +0.002 |
Neg logit contributions | |
ate | -0.001 |
things | -0.001 |
his | -0.001 |
other | -0.001 |
gear | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -7.13e-03 |
Pos logit contributions | |
hy | +0.000 |
ited | +0.000 |
seventeen | +0.000 |
ous | +0.000 |
gust | +0.000 |
Neg logit contributions | |
ate | -0.000 |
things | -0.000 |
gear | -0.000 |
other | -0.000 |
his | -0.000 |
Token | You |
Token ID | 921 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
hy | +0.014 |
seventeen | +0.013 |
years | +0.013 |
gust | +0.013 |
ous | +0.012 |
Neg logit contributions | |
ate | -0.012 |
things | -0.010 |
his | -0.010 |
other | -0.010 |
gear | -0.009 |
Token | are |
Token ID | 389 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
ited | +0.030 |
hy | +0.029 |
seventeen | +0.029 |
years | +0.029 |
gust | +0.029 |
Neg logit contributions | |
ate | -0.031 |
his | -0.026 |
things | -0.026 |
other | -0.023 |
gear | -0.023 |
Token | a |
Token ID | 257 |
Feature activation | -1.73e-03 |
Pos logit contributions | |
years | +0.026 |
hy | +0.026 |
seventeen | +0.025 |
gust | +0.024 |
thirteen | +0.023 |
Neg logit contributions | |
ate | -0.014 |
gear | -0.010 |
things | -0.010 |
his | -0.009 |
suits | -0.009 |
Token | good |
Token ID | 922 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
gust | +0.003 |
years | +0.003 |
hy | +0.003 |
seventeen | +0.003 |
ited | +0.003 |
Neg logit contributions | |
ate | -0.003 |
his | -0.002 |
things | -0.002 |
gear | -0.002 |
himself | -0.002 |
Token | brother |
Token ID | 3956 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
ate | +0.020 |
his | +0.016 |
things | +0.014 |
himself | +0.012 |
yourself | +0.012 |
Neg logit contributions | |
gust | -0.031 |
hy | -0.030 |
ited | -0.029 |
ous | -0.029 |
years | -0.028 |
Token | ." |
Token ID | 526 |
Feature activation | -4.52e-03 |
Pos logit contributions | |
ate | +0.015 |
things | +0.009 |
his | +0.009 |
gear | +0.008 |
other | +0.007 |
Neg logit contributions | |
hy | -0.033 |
ited | -0.032 |
years | -0.032 |
seventeen | -0.032 |
gust | -0.031 |
Token | open |
Token ID | 1280 |
Feature activation | -7.07e-03 |
Pos logit contributions | |
ited | +0.019 |
hy | +0.019 |
gust | +0.019 |
seventeen | +0.019 |
years | +0.019 |
Neg logit contributions | |
ate | -0.015 |
his | -0.013 |
things | -0.012 |
other | -0.011 |
gear | -0.010 |
Token | it |
Token ID | 340 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
years | +0.015 |
gust | +0.015 |
ited | +0.014 |
seventeen | +0.014 |
bell | +0.014 |
Neg logit contributions | |
ate | -0.009 |
his | -0.006 |
emo | -0.006 |
name | -0.006 |
P | -0.005 |
Token | up |
Token ID | 510 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
bell | +0.019 |
ous | +0.018 |
ited | +0.018 |
seventeen | +0.018 |
years | +0.018 |
Neg logit contributions | |
ate | -0.016 |
his | -0.014 |
things | -0.013 |
gear | -0.012 |
other | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +2.99e-03 |
Pos logit contributions | |
ate | +0.011 |
his | +0.008 |
things | +0.008 |
gear | +0.007 |
name | +0.007 |
Neg logit contributions | |
years | -0.018 |
ited | -0.018 |
seventeen | -0.018 |
gust | -0.017 |
bell | -0.017 |
Token | try |
Token ID | 1949 |
Feature activation | +2.08e-04 |
Pos logit contributions | |
ate | +0.004 |
his | +0.003 |
things | +0.003 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
years | -0.007 |
hy | -0.007 |
gust | -0.006 |
Token | again |
Token ID | 757 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
ate | +0.000 |
his | +0.000 |
things | +0.000 |
gear | +0.000 |
P | +0.000 |
Neg logit contributions | |
ous | -0.000 |
seventeen | -0.000 |
years | -0.000 |
gust | -0.000 |
bell | -0.000 |
Token | ." |
Token ID | 526 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
seventeen | +0.033 |
gust | +0.032 |
years | +0.032 |
ited | +0.032 |
ous | +0.032 |
Neg logit contributions | |
ate | -0.014 |
his | -0.011 |
things | -0.009 |
gear | -0.008 |
other | -0.007 |
Token | They |
Token ID | 1119 |
Feature activation | -3.62e-04 |
Pos logit contributions | |
ate | +0.006 |
his | +0.004 |
things | +0.004 |
other | +0.004 |
gear | +0.004 |
Neg logit contributions | |
gust | -0.009 |
ited | -0.009 |
hy | -0.009 |
seventeen | -0.009 |
years | -0.009 |
Token | opened |
Token ID | 4721 |
Feature activation | -3.54e-03 |
Pos logit contributions | |
seventeen | +0.001 |
hy | +0.001 |
ited | +0.001 |
gust | +0.001 |
storm | +0.001 |
Neg logit contributions | |
ate | -0.001 |
his | -0.000 |
things | -0.000 |
other | -0.000 |
the | -0.000 |
Token | up |
Token ID | 510 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
gust | +0.008 |
seventeen | +0.008 |
ited | +0.008 |
bell | +0.008 |
years | +0.008 |
Neg logit contributions | |
ate | -0.004 |
P | -0.002 |
emo | -0.002 |
his | -0.002 |
yourself | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +4.82e-03 |
Pos logit contributions | |
ate | +0.009 |
his | +0.005 |
things | +0.005 |
other | +0.004 |
." | +0.003 |
Neg logit contributions | |
ited | -0.033 |
gust | -0.033 |
hy | -0.033 |
seventeen | -0.033 |
years | -0.033 |
Token | and |
Token ID | 290 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
years | +0.011 |
seventeen | +0.011 |
ited | +0.011 |
hy | +0.010 |
gust | +0.010 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
." | -0.002 |
Token | its |
Token ID | 663 |
Feature activation | +9.57e-03 |
Pos logit contributions | |
ate | +0.015 |
his | +0.015 |
things | +0.013 |
other | +0.013 |
the | +0.012 |
Neg logit contributions | |
ited | -0.028 |
years | -0.027 |
seventeen | -0.027 |
hy | -0.026 |
aney | -0.026 |
Token | rabbit |
Token ID | 22746 |
Feature activation | -1.57e-03 |
Pos logit contributions | |
ate | +0.011 |
things | +0.009 |
his | +0.009 |
other | +0.008 |
friends | +0.008 |
Neg logit contributions | |
ited | -0.024 |
seventeen | -0.024 |
years | -0.024 |
hy | -0.023 |
gust | -0.023 |
Token | friend |
Token ID | 1545 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
years | +0.004 |
seventeen | +0.004 |
ited | +0.004 |
gust | +0.004 |
hy | +0.004 |
Neg logit contributions | |
ate | -0.002 |
his | -0.002 |
things | -0.002 |
other | -0.002 |
friends | -0.001 |
Token | dancing |
Token ID | 15360 |
Feature activation | -6.81e-03 |
Pos logit contributions | |
ate | +0.013 |
his | +0.012 |
things | +0.011 |
other | +0.010 |
." | +0.010 |
Neg logit contributions | |
ited | -0.028 |
seventeen | -0.028 |
years | -0.028 |
gust | -0.028 |
hy | -0.026 |
Token | together |
Token ID | 1978 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ited | +0.017 |
seventeen | +0.017 |
years | +0.017 |
gust | +0.017 |
hy | +0.017 |
Neg logit contributions | |
ate | -0.007 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
." | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -1.38e-03 |
Pos logit contributions | |
seventeen | +0.035 |
ited | +0.035 |
years | +0.035 |
hy | +0.034 |
gust | +0.034 |
Neg logit contributions | |
ate | -0.005 |
his | -0.005 |
things | -0.004 |
other | -0.003 |
." | -0.002 |
Token | They |
Token ID | 1119 |
Feature activation | +2.65e-03 |
Pos logit contributions | |
seventeen | +0.003 |
years | +0.003 |
gust | +0.003 |
hy | +0.003 |
ous | +0.003 |
Neg logit contributions | |
ate | -0.002 |
things | -0.001 |
his | -0.001 |
gear | -0.001 |
stuff | -0.001 |
Token | thought |
Token ID | 1807 |
Feature activation | +7.77e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.004 |
other | +0.004 |
the | +0.003 |
things | +0.003 |
Neg logit contributions | |
seventeen | -0.006 |
hy | -0.005 |
ited | -0.005 |
years | -0.005 |
gust | -0.005 |
Token | it |
Token ID | 340 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
ate | +0.007 |
his | +0.007 |
things | +0.007 |
other | +0.006 |
the | +0.006 |
Neg logit contributions | |
ited | -0.021 |
seventeen | -0.020 |
years | -0.020 |
hy | -0.020 |
gust | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ate | +0.020 |
his | +0.016 |
things | +0.015 |
other | +0.013 |
| +0.012 |
Neg logit contributions | |
seventeen | -0.049 |
ited | -0.048 |
hy | -0.048 |
years | -0.048 |
gust | -0.048 |
Token | named |
Token ID | 3706 |
Feature activation | -7.75e-03 |
Pos logit contributions | |
ate | +0.020 |
his | +0.017 |
things | +0.016 |
." | +0.015 |
other | +0.015 |
Neg logit contributions | |
seventeen | -0.038 |
ited | -0.038 |
hy | -0.037 |
years | -0.037 |
gust | -0.036 |
Token | Tweet |
Token ID | 18752 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
hy | +0.016 |
years | +0.016 |
gust | +0.016 |
seventeen | +0.016 |
ited | +0.016 |
Neg logit contributions | |
ate | -0.012 |
things | -0.009 |
his | -0.009 |
other | -0.008 |
gear | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
seventeen | +0.017 |
gust | +0.016 |
ited | +0.016 |
hy | +0.016 |
years | +0.016 |
Neg logit contributions | |
ate | -0.024 |
his | -0.022 |
things | -0.021 |
other | -0.021 |
." | -0.020 |
Token | Tweet |
Token ID | 18752 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ate | +0.003 |
things | +0.002 |
his | +0.002 |
other | +0.002 |
gear | +0.002 |
Neg logit contributions | |
seventeen | -0.004 |
hy | -0.004 |
years | -0.003 |
gust | -0.003 |
ited | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | -6.75e-03 |
Pos logit contributions | |
seventeen | +0.026 |
hy | +0.025 |
years | +0.024 |
gust | +0.024 |
ited | +0.024 |
Neg logit contributions | |
ate | -0.033 |
his | -0.029 |
things | -0.029 |
other | -0.027 |
| -0.026 |
Token | very |
Token ID | 845 |
Feature activation | -4.46e-03 |
Pos logit contributions | |
ited | +0.016 |
seventeen | +0.015 |
hy | +0.015 |
years | +0.015 |
gust | +0.015 |
Neg logit contributions | |
ate | -0.009 |
his | -0.008 |
things | -0.007 |
other | -0.007 |
| -0.007 |
Token | happy |
Token ID | 3772 |
Feature activation | -5.36e-03 |
Pos logit contributions | |
ited | +0.009 |
seventeen | +0.009 |
hy | +0.009 |
years | +0.009 |
gust | +0.009 |
Neg logit contributions | |
ate | -0.007 |
his | -0.006 |
things | -0.005 |
other | -0.005 |
| -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -6.86e-03 |
Pos logit contributions | |
seventeen | +0.014 |
ited | +0.014 |
hy | +0.014 |
years | +0.014 |
gust | +0.013 |
Neg logit contributions | |
ate | -0.005 |
his | -0.004 |
things | -0.004 |
other | -0.003 |
." | -0.003 |
Token | loved |
Token ID | 6151 |
Feature activation | -5.87e-03 |
Pos logit contributions | |
hy | +0.012 |
gust | +0.011 |
years | +0.011 |
ited | +0.011 |
seventeen | +0.011 |
Neg logit contributions | |
ate | -0.013 |
things | -0.011 |
his | -0.010 |
other | -0.010 |
gear | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -8.48e-03 |
Pos logit contributions | |
years | +0.012 |
hy | +0.012 |
gust | +0.012 |
seventeen | +0.012 |
ited | +0.012 |
Neg logit contributions | |
ate | -0.009 |
his | -0.006 |
things | -0.006 |
other | -0.006 |
gear | -0.005 |
Token | fly |
Token ID | 6129 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
hy | +0.017 |
seventeen | +0.016 |
ited | +0.016 |
gust | +0.016 |
years | +0.016 |
Neg logit contributions | |
ate | -0.013 |
things | -0.011 |
his | -0.010 |
other | -0.010 |
gear | -0.009 |
Token | Lisa |
Token ID | 15378 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
ited | +0.028 |
seventeen | +0.028 |
hy | +0.028 |
years | +0.027 |
gust | +0.027 |
Neg logit contributions | |
ate | -0.010 |
his | -0.008 |
things | -0.007 |
other | -0.007 |
." | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -2.19e-03 |
Pos logit contributions | |
ited | +0.028 |
hy | +0.027 |
years | +0.027 |
seventeen | +0.027 |
gust | +0.027 |
Neg logit contributions | |
ate | -0.009 |
things | -0.006 |
his | -0.006 |
other | -0.005 |
gear | -0.004 |
Token | Lisa |
Token ID | 15378 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
ited | +0.004 |
seventeen | +0.004 |
hy | +0.004 |
years | +0.004 |
gust | +0.004 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.003 |
." | -0.003 |
Token | spent |
Token ID | 3377 |
Feature activation | -8.71e-03 |
Pos logit contributions | |
ited | +0.036 |
hy | +0.036 |
years | +0.035 |
seventeen | +0.035 |
gust | +0.035 |
Neg logit contributions | |
ate | -0.034 |
his | -0.029 |
things | -0.028 |
other | -0.026 |
gear | -0.025 |
Token | a |
Token ID | 257 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
ited | +0.022 |
years | +0.022 |
gust | +0.022 |
seventeen | +0.022 |
hy | +0.022 |
Neg logit contributions | |
ate | -0.009 |
things | -0.006 |
his | -0.006 |
other | -0.005 |
." | -0.005 |
Token | lot |
Token ID | 1256 |
Feature activation | -5.57e-02 |
Pos logit contributions | |
ited | +0.053 |
seventeen | +0.053 |
years | +0.052 |
hy | +0.052 |
gust | +0.051 |
Neg logit contributions | |
ate | -0.040 |
his | -0.033 |
things | -0.033 |
other | -0.030 |
| -0.028 |
Token | of |
Token ID | 286 |
Feature activation | -3.25e-02 |
Pos logit contributions | |
ited | +0.084 |
seventeen | +0.084 |
hy | +0.082 |
gust | +0.082 |
years | +0.081 |
Neg logit contributions | |
ate | -0.117 |
his | -0.102 |
things | -0.100 |
other | -0.095 |
| -0.091 |
Token | time |
Token ID | 640 |
Feature activation | -8.46e-03 |
Pos logit contributions | |
ited | +0.069 |
gust | +0.068 |
years | +0.068 |
hy | +0.068 |
seventeen | +0.068 |
Neg logit contributions | |
ate | -0.047 |
his | -0.035 |
things | -0.034 |
other | -0.030 |
." | -0.030 |
Token | outside |
Token ID | 2354 |
Feature activation | -1.11e-03 |
Pos logit contributions | |
ited | +0.021 |
seventeen | +0.020 |
aney | +0.020 |
hy | +0.020 |
anne | +0.019 |
Neg logit contributions | |
ate | -0.011 |
his | -0.011 |
things | -0.010 |
and | -0.009 |
friends | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
seventeen | +0.003 |
ited | +0.003 |
hy | +0.003 |
aney | +0.003 |
anne | +0.003 |
Neg logit contributions | |
his | -0.001 |
things | -0.001 |
ate | -0.001 |
the | -0.001 |
and | -0.001 |
Token | playing |
Token ID | 2712 |
Feature activation | +6.80e-03 |
Pos logit contributions | |
seventeen | +0.031 |
ited | +0.030 |
hy | +0.028 |
years | +0.028 |
gust | +0.028 |
Neg logit contributions | |
his | -0.020 |
ate | -0.019 |
things | -0.018 |
the | -0.017 |
other | -0.016 |
Token | to |
Token ID | 284 |
Feature activation | -2.21e-03 |
Pos logit contributions | |
ited | +0.012 |
seventeen | +0.012 |
hy | +0.012 |
years | +0.012 |
gust | +0.012 |
Neg logit contributions | |
ate | -0.006 |
his | -0.005 |
things | -0.005 |
other | -0.004 |
gear | -0.004 |
Token | try |
Token ID | 1949 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
seventeen | +0.005 |
hy | +0.004 |
ited | +0.004 |
gust | +0.004 |
years | +0.004 |
Neg logit contributions | |
ate | -0.003 |
things | -0.003 |
his | -0.003 |
other | -0.002 |
gear | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +8.99e-03 |
Pos logit contributions | |
ate | +0.004 |
his | +0.002 |
P | +0.002 |
gear | +0.002 |
things | +0.002 |
Neg logit contributions | |
seventeen | -0.007 |
gust | -0.007 |
years | -0.007 |
ous | -0.007 |
stretched | -0.006 |
Token | put |
Token ID | 1234 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
ate | +0.011 |
his | +0.009 |
things | +0.009 |
other | +0.008 |
own | +0.007 |
Neg logit contributions | |
ited | -0.023 |
hy | -0.022 |
years | -0.022 |
seventeen | -0.022 |
aney | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
ate | +0.018 |
emo | +0.013 |
urse | +0.011 |
ano | +0.011 |
rev | +0.011 |
Neg logit contributions | |
gust | -0.030 |
seventeen | -0.030 |
years | -0.029 |
ited | -0.029 |
thirteen | -0.029 |
Token | puzzle |
Token ID | 15027 |
Feature activation | -4.86e-02 |
Pos logit contributions | |
ited | +0.023 |
seventeen | +0.023 |
years | +0.023 |
hy | +0.023 |
gust | +0.022 |
Neg logit contributions | |
ate | -0.013 |
things | -0.011 |
his | -0.011 |
other | -0.010 |
." | -0.009 |
Token | together |
Token ID | 1978 |
Feature activation | -6.20e-03 |
Pos logit contributions | |
ited | +0.112 |
seventeen | +0.111 |
years | +0.110 |
hy | +0.110 |
gust | +0.109 |
Neg logit contributions | |
ate | -0.063 |
his | -0.050 |
things | -0.049 |
other | -0.043 |
." | -0.040 |
Token | . |
Token ID | 13 |
Feature activation | +5.61e-03 |
Pos logit contributions | |
ited | +0.016 |
seventeen | +0.016 |
hy | +0.016 |
years | +0.016 |
gust | +0.016 |
Neg logit contributions | |
ate | -0.006 |
things | -0.004 |
his | -0.004 |
other | -0.003 |
gear | -0.003 |
Token | He |
Token ID | 679 |
Feature activation | +3.47e-03 |
Pos logit contributions | |
ate | +0.008 |
things | +0.007 |
his | +0.006 |
toy | +0.006 |
other | +0.006 |
Neg logit contributions | |
gust | -0.011 |
hy | -0.011 |
seventeen | -0.011 |
oled | -0.010 |
years | -0.010 |
Token | worked |
Token ID | 3111 |
Feature activation | +4.94e-03 |
Pos logit contributions | |
ate | +0.005 |
things | +0.005 |
his | +0.004 |
other | +0.004 |
." | +0.004 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
years | -0.007 |
hy | -0.006 |
gust | -0.006 |
Token | so |
Token ID | 523 |
Feature activation | -4.35e-03 |
Pos logit contributions | |
ate | +0.009 |
things | +0.008 |
his | +0.007 |
other | +0.007 |
name | +0.007 |
Neg logit contributions | |
seventeen | -0.008 |
ited | -0.008 |
years | -0.008 |
gust | -0.008 |
hy | -0.007 |
Token | The |
Token ID | 464 |
Feature activation | -5.09e-03 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.007 |
other | +0.007 |
| +0.007 |
Neg logit contributions | |
seventeen | -0.016 |
ited | -0.016 |
hy | -0.016 |
gust | -0.016 |
years | -0.016 |
Token | little |
Token ID | 1310 |
Feature activation | +3.74e-03 |
Pos logit contributions | |
seventeen | +0.014 |
ited | +0.014 |
years | +0.014 |
hy | +0.014 |
gust | +0.013 |
Neg logit contributions | |
ate | -0.004 |
things | -0.003 |
his | -0.003 |
other | -0.003 |
friends | -0.002 |
Token | girl |
Token ID | 2576 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
ate | +0.005 |
his | +0.004 |
things | +0.004 |
other | +0.003 |
." | +0.003 |
Neg logit contributions | |
ited | -0.009 |
seventeen | -0.009 |
hy | -0.009 |
years | -0.009 |
gust | -0.008 |
Token | put |
Token ID | 1234 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
seventeen | +0.006 |
ited | +0.006 |
hy | +0.006 |
gust | +0.006 |
years | +0.006 |
Neg logit contributions | |
ate | -0.004 |
his | -0.003 |
things | -0.003 |
other | -0.003 |
| -0.003 |
Token | the |
Token ID | 262 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
." | +0.002 |
gear | +0.002 |
Neg logit contributions | |
years | -0.006 |
gust | -0.006 |
hy | -0.005 |
ited | -0.005 |
seventeen | -0.005 |
Token | bracelet |
Token ID | 42893 |
Feature activation | -4.93e-02 |
Pos logit contributions | |
seventeen | +0.032 |
ited | +0.032 |
years | +0.032 |
hy | +0.031 |
ous | +0.031 |
Neg logit contributions | |
ate | -0.026 |
things | -0.022 |
his | -0.021 |
other | -0.021 |
toy | -0.019 |
Token | on |
Token ID | 319 |
Feature activation | -3.57e-03 |
Pos logit contributions | |
seventeen | +0.139 |
ited | +0.135 |
years | +0.132 |
gust | +0.131 |
hy | +0.130 |
Neg logit contributions | |
ate | -0.046 |
his | -0.038 |
things | -0.037 |
other | -0.029 |
toy | -0.027 |
Token | her |
Token ID | 607 |
Feature activation | +5.88e-03 |
Pos logit contributions | |
gust | +0.008 |
hy | +0.008 |
years | +0.008 |
seventeen | +0.007 |
ited | +0.007 |
Neg logit contributions | |
ate | -0.004 |
gear | -0.003 |
things | -0.003 |
emo | -0.003 |
his | -0.003 |
Token | wrist |
Token ID | 15980 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
ate | +0.010 |
his | +0.008 |
things | +0.008 |
other | +0.007 |
gear | +0.007 |
Neg logit contributions | |
hy | -0.011 |
gust | -0.011 |
seventeen | -0.011 |
ited | -0.011 |
years | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +6.18e-04 |
Pos logit contributions | |
seventeen | +0.069 |
ited | +0.069 |
years | +0.068 |
gust | +0.067 |
hy | +0.067 |
Neg logit contributions | |
ate | -0.016 |
his | -0.011 |
things | -0.009 |
other | -0.007 |
." | -0.006 |
Token | rushed |
Token ID | 13999 |
Feature activation | -6.78e-03 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | of |
Token ID | 286 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
his | +0.006 |
ate | +0.006 |
things | +0.005 |
other | +0.005 |
the | +0.005 |
Neg logit contributions | |
seventeen | -0.028 |
years | -0.027 |
hy | -0.027 |
ited | -0.026 |
sing | -0.026 |
Token | a |
Token ID | 257 |
Feature activation | -4.07e-03 |
Pos logit contributions | |
ited | +0.035 |
seventeen | +0.035 |
hy | +0.035 |
years | +0.034 |
gust | +0.034 |
Neg logit contributions | |
ate | -0.009 |
his | -0.006 |
things | -0.006 |
other | -0.005 |
| -0.003 |
Token | sudden |
Token ID | 4802 |
Feature activation | +8.49e-03 |
Pos logit contributions | |
hy | +0.007 |
seventeen | +0.007 |
years | +0.007 |
ited | +0.007 |
ous | +0.007 |
Neg logit contributions | |
other | -0.007 |
things | -0.007 |
friends | -0.007 |
ate | -0.006 |
his | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +2.45e-03 |
Pos logit contributions | |
ate | +0.008 |
things | +0.007 |
his | +0.007 |
other | +0.006 |
the | +0.005 |
Neg logit contributions | |
ited | -0.022 |
seventeen | -0.022 |
years | -0.022 |
hy | -0.022 |
ous | -0.021 |
Token | a |
Token ID | 257 |
Feature activation | +6.76e-03 |
Pos logit contributions | |
ate | +0.002 |
his | +0.002 |
things | +0.002 |
other | +0.001 |
gear | +0.001 |
Neg logit contributions | |
ited | -0.006 |
seventeen | -0.006 |
gust | -0.006 |
hy | -0.006 |
years | -0.006 |
Token | gust |
Token ID | 35253 |
Feature activation | -4.91e-02 |
Pos logit contributions | |
things | +0.007 |
other | +0.006 |
his | +0.006 |
ate | +0.006 |
toy | +0.006 |
Neg logit contributions | |
years | -0.017 |
ited | -0.017 |
aney | -0.016 |
seventeen | -0.016 |
hetically | -0.016 |
Token | of |
Token ID | 286 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
seventeen | +0.099 |
ited | +0.094 |
hy | +0.093 |
sing | +0.092 |
years | +0.092 |
Neg logit contributions | |
ate | -0.073 |
his | -0.070 |
| -0.064 |
things | -0.063 |
other | -0.061 |
Token | wind |
Token ID | 2344 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
ous | +0.027 |
hy | +0.027 |
years | +0.027 |
seventeen | +0.027 |
aney | +0.026 |
Neg logit contributions | |
his | -0.016 |
ate | -0.016 |
things | -0.016 |
other | -0.015 |
water | -0.013 |
Token | blew |
Token ID | 17948 |
Feature activation | +2.66e-03 |
Pos logit contributions | |
years | +0.030 |
seventeen | +0.029 |
hy | +0.028 |
aney | +0.027 |
ited | +0.027 |
Neg logit contributions | |
ate | -0.018 |
his | -0.017 |
things | -0.015 |
and | -0.014 |
the | -0.014 |
Token | by |
Token ID | 416 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
ate | +0.003 |
his | +0.002 |
things | +0.002 |
other | +0.002 |
| +0.002 |
Neg logit contributions | |
ited | -0.007 |
seventeen | -0.007 |
years | -0.007 |
hy | -0.007 |
gust | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +6.44e-03 |
Pos logit contributions | |
ate | +0.016 |
his | +0.011 |
things | +0.011 |
other | +0.008 |
." | +0.007 |
Neg logit contributions | |
ited | -0.067 |
seventeen | -0.066 |
years | -0.066 |
hy | -0.066 |
gust | -0.065 |
Token | : |
Token ID | 25 |
Feature activation | -8.11e-03 |
Pos logit contributions | |
ited | +0.027 |
years | +0.025 |
seventeen | +0.025 |
gust | +0.024 |
hy | +0.024 |
Neg logit contributions | |
his | -0.007 |
ate | -0.007 |
things | -0.006 |
| -0.005 |
the | -0.004 |
Token | " |
Token ID | 366 |
Feature activation | +5.64e-04 |
Pos logit contributions | |
seventeen | +0.017 |
hy | +0.016 |
gust | +0.016 |
ous | +0.016 |
years | +0.016 |
Neg logit contributions | |
ate | -0.012 |
things | -0.010 |
his | -0.009 |
other | -0.009 |
gear | -0.009 |
Token | Jack |
Token ID | 14295 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ate | +0.001 |
his | +0.001 |
things | +0.001 |
other | +0.001 |
." | +0.001 |
Neg logit contributions | |
ited | -0.001 |
seventeen | -0.001 |
hy | -0.001 |
years | -0.001 |
gust | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -1.79e-04 |
Pos logit contributions | |
ate | +0.025 |
his | +0.019 |
things | +0.019 |
other | +0.018 |
gear | +0.016 |
Neg logit contributions | |
hy | -0.034 |
ited | -0.034 |
seventeen | -0.033 |
gust | -0.033 |
ous | -0.032 |
Token | do |
Token ID | 466 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
ited | +0.000 |
seventeen | +0.000 |
years | +0.000 |
hy | +0.000 |
gust | +0.000 |
Neg logit contributions | |
ate | -0.000 |
his | -0.000 |
things | -0.000 |
other | -0.000 |
gear | -0.000 |
Token | you |
Token ID | 345 |
Feature activation | -4.13e-02 |
Pos logit contributions | |
ate | +0.026 |
his | +0.019 |
toy | +0.018 |
emo | +0.018 |
other | +0.017 |
Neg logit contributions | |
hy | -0.028 |
years | -0.026 |
gust | -0.025 |
ous | -0.024 |
seventeen | -0.024 |
Token | want |
Token ID | 765 |
Feature activation | +7.40e-03 |
Pos logit contributions | |
seventeen | +0.077 |
years | +0.075 |
gust | +0.074 |
ous | +0.072 |
ited | +0.072 |
Neg logit contributions | |
ate | -0.073 |
his | -0.063 |
things | -0.061 |
." | -0.058 |
other | -0.058 |
Token | to |
Token ID | 284 |
Feature activation | -9.24e-03 |
Pos logit contributions | |
ate | +0.011 |
things | +0.008 |
his | +0.008 |
other | +0.007 |
name | +0.007 |
Neg logit contributions | |
years | -0.014 |
seventeen | -0.014 |
hy | -0.014 |
gust | -0.014 |
ited | -0.014 |
Token | lift |
Token ID | 10303 |
Feature activation | +1.71e-03 |
Pos logit contributions | |
hy | +0.016 |
ited | +0.016 |
seventeen | +0.016 |
gust | +0.015 |
bell | +0.015 |
Neg logit contributions | |
ate | -0.015 |
things | -0.013 |
his | -0.012 |
other | -0.011 |
gear | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ate | +0.002 |
emo | +0.001 |
place | +0.001 |
urse | +0.001 |
name | +0.001 |
Neg logit contributions | |
years | -0.003 |
seventeen | -0.003 |
gust | -0.003 |
thirteen | -0.003 |
ited | -0.003 |
Token | up |
Token ID | 510 |
Feature activation | +4.49e-03 |
Pos logit contributions | |
bell | +0.042 |
storm | +0.040 |
gust | +0.040 |
ous | +0.040 |
ited | +0.038 |
Neg logit contributions | |
ate | -0.031 |
things | -0.024 |
other | -0.024 |
friends | -0.023 |
P | -0.022 |