Token | was |
Token ID | 373 |
Feature activation | +5.60e-03 |
Pos logit contributions | |
yourself | +0.039 |
aj | +0.039 |
ich | +0.037 |
majesty | +0.037 |
yourselves | +0.037 |
Neg logit contributions | |
le | -0.041 |
inn | -0.041 |
eb | -0.039 |
him | -0.038 |
dog | -0.038 |
Token | very |
Token ID | 845 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
inn | +0.010 |
aster | +0.009 |
him | +0.009 |
eb | +0.009 |
ah | +0.009 |
Neg logit contributions | |
aj | -0.008 |
yourself | -0.008 |
majesty | -0.008 |
yourselves | -0.008 |
endant | -0.008 |
Token | happy |
Token ID | 3772 |
Feature activation | -7.39e-03 |
Pos logit contributions | |
yourself | +0.031 |
yourselves | +0.029 |
aj | +0.028 |
blo | +0.028 |
ich | +0.028 |
Neg logit contributions | |
inn | -0.044 |
aster | -0.040 |
le | -0.039 |
dog | -0.039 |
ny | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
yourself | +0.015 |
aj | +0.014 |
majesty | +0.014 |
endant | +0.014 |
ich | +0.014 |
Neg logit contributions | |
him | -0.009 |
dog | -0.008 |
inn | -0.008 |
le | -0.008 |
eb | -0.008 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
yourself | +0.030 |
blo | +0.029 |
aj | +0.028 |
yourselves | +0.028 |
majesty | +0.028 |
Neg logit contributions | |
inn | -0.024 |
eb | -0.022 |
aster | -0.022 |
dog | -0.021 |
le | -0.021 |
Token | Far |
Token ID | 21428 |
Feature activation | +8.66e-02 |
Pos logit contributions | |
yourself | +0.007 |
blo | +0.007 |
aj | +0.006 |
yourselves | +0.006 |
window | +0.006 |
Neg logit contributions | |
inn | -0.013 |
aster | -0.012 |
le | -0.012 |
eb | -0.012 |
dog | -0.012 |
Token | away |
Token ID | 1497 |
Feature activation | -2.81e-02 |
Pos logit contributions | |
inn | +0.105 |
aster | +0.103 |
hot | +0.094 |
Jim | +0.087 |
war | +0.086 |
Neg logit contributions | |
yourself | -0.171 |
blo | -0.159 |
yourselves | -0.158 |
ich | -0.156 |
aj | -0.152 |
Token | in |
Token ID | 287 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
yourself | +0.058 |
yourselves | +0.056 |
blo | +0.056 |
aj | +0.056 |
precious | +0.054 |
Neg logit contributions | |
inn | -0.029 |
eb | -0.028 |
Bob | -0.026 |
ny | -0.025 |
him | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
yourself | +0.026 |
blo | +0.024 |
yourselves | +0.023 |
window | +0.023 |
aj | +0.022 |
Neg logit contributions | |
inn | -0.021 |
eb | -0.019 |
le | -0.019 |
war | -0.019 |
dog | -0.018 |
Token | sky |
Token ID | 6766 |
Feature activation | +4.20e-03 |
Pos logit contributions | |
yourself | +0.023 |
aj | +0.021 |
blo | +0.021 |
yourselves | +0.021 |
majesty | +0.021 |
Neg logit contributions | |
inn | -0.032 |
aster | -0.031 |
eb | -0.030 |
dog | -0.030 |
le | -0.029 |
Token | was |
Token ID | 373 |
Feature activation | +6.92e-03 |
Pos logit contributions | |
inn | +0.005 |
le | +0.005 |
eb | +0.005 |
dog | +0.005 |
aster | +0.005 |
Neg logit contributions | |
yourself | -0.008 |
majesty | -0.008 |
yourselves | -0.008 |
aj | -0.008 |
ich | -0.008 |
Token | scared |
Token ID | 12008 |
Feature activation | +8.62e-03 |
Pos logit contributions | |
eb | +0.041 |
aster | +0.041 |
inn | +0.040 |
war | +0.038 |
dog | +0.038 |
Neg logit contributions | |
blo | -0.016 |
precious | -0.016 |
yourself | -0.016 |
window | -0.014 |
aj | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | +5.52e-03 |
Pos logit contributions | |
inn | +0.019 |
aster | +0.018 |
war | +0.018 |
ah | +0.017 |
eb | +0.017 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.009 |
living | -0.008 |
window | -0.008 |
precious | -0.008 |
Token | |
Token ID | 220 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
inn | +0.008 |
le | +0.007 |
aster | +0.007 |
eb | +0.007 |
dog | +0.007 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.010 |
aj | -0.010 |
yourselves | -0.010 |
majesty | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +8.38e-03 |
Pos logit contributions | |
yourself | +0.033 |
blo | +0.032 |
yourselves | +0.031 |
majesty | +0.030 |
aj | +0.030 |
Neg logit contributions | |
inn | -0.032 |
eb | -0.029 |
aster | -0.029 |
dog | -0.028 |
war | -0.028 |
Token |
|
Token ID | 198 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
inn | +0.015 |
le | +0.014 |
eb | +0.014 |
aster | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.011 |
aj | -0.011 |
yourselves | -0.011 |
majesty | -0.011 |
Token | Far |
Token ID | 21428 |
Feature activation | +8.03e-02 |
Pos logit contributions | |
inn | +0.006 |
eb | +0.005 |
le | +0.005 |
aster | +0.005 |
dog | +0.005 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
aj | -0.004 |
ich | -0.004 |
Token | mer |
Token ID | 647 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
aster | +0.107 |
inn | +0.101 |
Jim | +0.089 |
Finn | +0.087 |
omp | +0.087 |
Neg logit contributions | |
yourself | -0.152 |
blo | -0.143 |
ich | -0.141 |
yourselves | -0.140 |
receiver | -0.136 |
Token | Brown |
Token ID | 4373 |
Feature activation | +7.81e-03 |
Pos logit contributions | |
inn | +0.024 |
war | +0.023 |
aster | +0.023 |
le | +0.022 |
eb | +0.021 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.020 |
ich | -0.019 |
window | -0.019 |
yourselves | -0.018 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
inn | +0.014 |
aster | +0.013 |
war | +0.013 |
eb | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.011 |
aj | -0.010 |
ich | -0.010 |
majesty | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
yourself | +0.028 |
blo | +0.026 |
aj | +0.026 |
yourselves | +0.025 |
majesty | +0.025 |
Neg logit contributions | |
inn | -0.026 |
aster | -0.025 |
eb | -0.024 |
le | -0.023 |
dog | -0.023 |
Token | said |
Token ID | 531 |
Feature activation | -1.35e-03 |
Pos logit contributions | |
inn | +0.020 |
eb | +0.019 |
aster | +0.019 |
le | +0.018 |
dog | +0.018 |
Neg logit contributions | |
yourself | -0.017 |
blo | -0.017 |
aj | -0.016 |
yourselves | -0.016 |
majesty | -0.016 |
Token | wall |
Token ID | 3355 |
Feature activation | +1.52e-03 |
Pos logit contributions | |
yourself | +0.021 |
aj | +0.020 |
blo | +0.020 |
majesty | +0.019 |
yourselves | +0.019 |
Neg logit contributions | |
inn | -0.020 |
dog | -0.019 |
aster | -0.019 |
le | -0.018 |
eb | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +4.35e-03 |
Pos logit contributions | |
inn | +0.002 |
aster | +0.002 |
le | +0.002 |
eb | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
yourselves | -0.003 |
aj | -0.003 |
majesty | -0.003 |
Token | |
Token ID | 220 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
inn | +0.006 |
eb | +0.006 |
aster | +0.006 |
dog | +0.006 |
le | +0.006 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.008 |
aj | -0.007 |
yourselves | -0.007 |
majesty | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
yourself | +0.032 |
blo | +0.032 |
yourselves | +0.030 |
majesty | +0.030 |
aj | +0.030 |
Neg logit contributions | |
inn | -0.031 |
eb | -0.028 |
aster | -0.027 |
him | -0.026 |
dog | -0.026 |
Token |
|
Token ID | 198 |
Feature activation | +7.05e-03 |
Pos logit contributions | |
inn | +0.022 |
eb | +0.021 |
aster | +0.020 |
le | +0.020 |
dog | +0.020 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.020 |
aj | -0.019 |
yourselves | -0.019 |
majesty | -0.019 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.80e-02 |
Pos logit contributions | |
inn | +0.011 |
eb | +0.011 |
aster | +0.010 |
le | +0.010 |
dog | +0.010 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.011 |
aj | -0.011 |
yourselves | -0.011 |
majesty | -0.011 |
Token | ley |
Token ID | 1636 |
Feature activation | +9.19e-03 |
Pos logit contributions | |
aster | +0.106 |
inn | +0.098 |
Jim | +0.092 |
war | +0.084 |
dog | +0.083 |
Neg logit contributions | |
yourself | -0.152 |
blo | -0.141 |
yourselves | -0.140 |
ich | -0.138 |
precious | -0.134 |
Token | watched |
Token ID | 7342 |
Feature activation | -4.00e-04 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
le | +0.014 |
dog | +0.014 |
aster | +0.014 |
Neg logit contributions | |
yourself | -0.015 |
yourselves | -0.014 |
blo | -0.014 |
aj | -0.013 |
majesty | -0.013 |
Token | as |
Token ID | 355 |
Feature activation | +3.56e-02 |
Pos logit contributions | |
yourself | +0.001 |
window | +0.001 |
blo | +0.001 |
sending | +0.001 |
hugging | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
war | -0.001 |
ah | -0.001 |
ny | -0.001 |
Token | his |
Token ID | 465 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
inn | +0.052 |
eb | +0.047 |
le | +0.046 |
war | +0.045 |
dog | +0.045 |
Neg logit contributions | |
yourself | -0.067 |
blo | -0.063 |
yourselves | -0.061 |
majesty | -0.059 |
window | -0.059 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
inn | +0.029 |
aster | +0.027 |
dog | +0.027 |
eb | +0.026 |
le | +0.025 |
Neg logit contributions | |
yourself | -0.029 |
blo | -0.028 |
yourselves | -0.027 |
majesty | -0.024 |
aj | -0.024 |
Token | with |
Token ID | 351 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
inn | +0.070 |
ah | +0.066 |
aster | +0.065 |
eb | +0.064 |
war | +0.064 |
Neg logit contributions | |
yourself | -0.058 |
blo | -0.057 |
yourselves | -0.052 |
most | -0.048 |
precious | -0.047 |
Token | new |
Token ID | 649 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
yourself | +0.017 |
aj | +0.016 |
yourselves | +0.015 |
blo | +0.015 |
majesty | +0.015 |
Neg logit contributions | |
inn | -0.020 |
eb | -0.019 |
aster | -0.019 |
le | -0.019 |
dog | -0.018 |
Token | life |
Token ID | 1204 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
ich | +0.014 |
yourself | +0.014 |
yourselves | +0.013 |
aj | +0.013 |
majesty | +0.012 |
Neg logit contributions | |
le | -0.018 |
him | -0.017 |
inn | -0.017 |
dog | -0.017 |
ny | -0.016 |
Token | ! |
Token ID | 0 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
yourself | +0.018 |
blo | +0.017 |
aj | +0.017 |
yourselves | +0.016 |
majesty | +0.016 |
Neg logit contributions | |
inn | -0.016 |
eb | -0.015 |
aster | -0.015 |
le | -0.014 |
dog | -0.014 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.77e-03 |
Pos logit contributions | |
inn | +0.021 |
eb | +0.019 |
aster | +0.019 |
dog | +0.018 |
war | +0.018 |
Neg logit contributions | |
yourself | -0.025 |
blo | -0.024 |
yourselves | -0.023 |
majesty | -0.023 |
aj | -0.023 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.65e-02 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
aj | +0.002 |
yourselves | +0.002 |
window | +0.002 |
Neg logit contributions | |
inn | -0.004 |
aster | -0.004 |
eb | -0.004 |
le | -0.004 |
dog | -0.004 |
Token | mer |
Token ID | 647 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
aster | +0.105 |
inn | +0.096 |
hot | +0.092 |
omp | +0.090 |
Noah | +0.089 |
Neg logit contributions | |
yourself | -0.125 |
blo | -0.121 |
ich | -0.119 |
aj | -0.118 |
receiver | -0.114 |
Token | Fred |
Token ID | 8559 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
inn | +0.023 |
aster | +0.022 |
eb | +0.021 |
le | +0.021 |
war | +0.021 |
Neg logit contributions | |
yourself | -0.025 |
blo | -0.024 |
aj | -0.024 |
yourselves | -0.023 |
majesty | -0.023 |
Token | was |
Token ID | 373 |
Feature activation | +8.17e-03 |
Pos logit contributions | |
inn | +0.006 |
eb | +0.006 |
le | +0.005 |
dog | +0.005 |
ny | +0.005 |
Neg logit contributions | |
yourself | -0.008 |
yourselves | -0.007 |
aj | -0.007 |
majesty | -0.007 |
ich | -0.007 |
Token | very |
Token ID | 845 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
inn | +0.014 |
aster | +0.013 |
eb | +0.012 |
dog | +0.012 |
him | +0.012 |
Neg logit contributions | |
yourself | -0.013 |
majesty | -0.012 |
yourselves | -0.012 |
aj | -0.012 |
blo | -0.012 |
Token | cheerful |
Token ID | 37999 |
Feature activation | -6.88e-03 |
Pos logit contributions | |
yourself | +0.029 |
yourselves | +0.027 |
aj | +0.027 |
blo | +0.027 |
majesty | +0.026 |
Neg logit contributions | |
inn | -0.031 |
aster | -0.028 |
dog | -0.027 |
eb | -0.027 |
him | -0.026 |
Token | books |
Token ID | 3835 |
Feature activation | +2.49e-03 |
Pos logit contributions | |
le | +0.023 |
inn | +0.023 |
him | +0.023 |
dog | +0.022 |
aster | +0.022 |
Neg logit contributions | |
yourself | -0.018 |
ich | -0.018 |
aj | -0.017 |
yourselves | -0.017 |
blo | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +2.23e-04 |
Pos logit contributions | |
inn | +0.004 |
eb | +0.004 |
aster | +0.004 |
le | +0.004 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
majesty | -0.004 |
Token | |
Token ID | 220 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
inn | +0.000 |
le | +0.000 |
eb | +0.000 |
aster | +0.000 |
ah | +0.000 |
Neg logit contributions | |
yourself | -0.000 |
yourselves | -0.000 |
aj | -0.000 |
blo | -0.000 |
majesty | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +7.14e-03 |
Pos logit contributions | |
yourself | +0.035 |
blo | +0.035 |
yourselves | +0.033 |
aj | +0.033 |
majesty | +0.032 |
Neg logit contributions | |
inn | -0.035 |
eb | -0.032 |
aster | -0.032 |
dog | -0.031 |
war | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | +2.30e-03 |
Pos logit contributions | |
le | +0.014 |
inn | +0.014 |
eb | +0.013 |
ah | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.009 |
aj | -0.008 |
blo | -0.008 |
yourselves | -0.008 |
ich | -0.007 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.63e-02 |
Pos logit contributions | |
inn | +0.004 |
le | +0.004 |
eb | +0.004 |
dog | +0.004 |
war | +0.004 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
ich | -0.003 |
yourselves | -0.003 |
aj | -0.003 |
Token | mer |
Token ID | 647 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
aster | +0.099 |
inn | +0.096 |
Finn | +0.086 |
omp | +0.084 |
Jim | +0.081 |
Neg logit contributions | |
yourself | -0.146 |
yourselves | -0.135 |
ich | -0.132 |
receiver | -0.131 |
blo | -0.130 |
Token | David |
Token ID | 3271 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
inn | +0.018 |
war | +0.016 |
aster | +0.016 |
le | +0.016 |
eb | +0.015 |
Neg logit contributions | |
yourself | -0.020 |
blo | -0.018 |
ich | -0.018 |
yourselves | -0.018 |
window | -0.018 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
inn | +0.026 |
eb | +0.026 |
dog | +0.025 |
le | +0.025 |
ah | +0.025 |
Neg logit contributions | |
yourself | -0.026 |
yourselves | -0.025 |
blo | -0.024 |
aj | -0.024 |
majesty | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +6.60e-03 |
Pos logit contributions | |
yourself | +0.028 |
blo | +0.027 |
yourselves | +0.026 |
aj | +0.026 |
majesty | +0.026 |
Neg logit contributions | |
inn | -0.024 |
eb | -0.022 |
le | -0.021 |
aster | -0.021 |
dog | -0.021 |
Token | He |
Token ID | 679 |
Feature activation | +4.50e-03 |
Pos logit contributions | |
inn | +0.007 |
eb | +0.006 |
aster | +0.006 |
dog | +0.006 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.014 |
aj | -0.014 |
yourselves | -0.014 |
majesty | -0.014 |
Token | harvested |
Token ID | 34262 |
Feature activation | +8.64e-03 |
Pos logit contributions | |
yourself | +0.002 |
yourselves | +0.002 |
aj | +0.002 |
majesty | +0.002 |
ich | +0.002 |
Neg logit contributions | |
inn | -0.002 |
aster | -0.002 |
le | -0.002 |
eb | -0.002 |
dog | -0.002 |
Token | ! |
Token ID | 0 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
inn | +0.015 |
aster | +0.013 |
eb | +0.013 |
war | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
yourselves | -0.013 |
aj | -0.012 |
window | -0.012 |
Token | |
Token ID | 220 |
Feature activation | -1.98e-02 |
Pos logit contributions | |
inn | +0.008 |
le | +0.008 |
eb | +0.008 |
aster | +0.008 |
ah | +0.008 |
Neg logit contributions | |
yourself | -0.007 |
aj | -0.007 |
yourselves | -0.007 |
blo | -0.007 |
majesty | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +3.06e-03 |
Pos logit contributions | |
yourself | +0.030 |
blo | +0.028 |
aj | +0.027 |
yourselves | +0.027 |
majesty | +0.026 |
Neg logit contributions | |
inn | -0.035 |
eb | -0.033 |
aster | -0.032 |
le | -0.032 |
dog | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
inn | +0.006 |
le | +0.006 |
eb | +0.005 |
aster | +0.005 |
dog | +0.005 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
majesty | -0.004 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.61e-02 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
yourselves | +0.004 |
aj | +0.004 |
majesty | +0.004 |
Neg logit contributions | |
inn | -0.005 |
eb | -0.005 |
le | -0.004 |
aster | -0.004 |
dog | -0.004 |
Token | mer |
Token ID | 647 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
aster | +0.100 |
inn | +0.095 |
omp | +0.081 |
Jim | +0.079 |
him | +0.078 |
Neg logit contributions | |
yourself | -0.148 |
blo | -0.139 |
ich | -0.136 |
yourselves | -0.135 |
precious | -0.132 |
Token | Joe |
Token ID | 5689 |
Feature activation | +9.66e-03 |
Pos logit contributions | |
inn | +0.021 |
aster | +0.020 |
war | +0.020 |
eb | +0.019 |
dog | +0.019 |
Neg logit contributions | |
yourself | -0.017 |
blo | -0.016 |
yourselves | -0.015 |
ich | -0.015 |
majesty | -0.015 |
Token | went |
Token ID | 1816 |
Feature activation | -4.82e-04 |
Pos logit contributions | |
inn | +0.017 |
eb | +0.016 |
aster | +0.016 |
le | +0.016 |
dog | +0.016 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
aj | -0.013 |
yourselves | -0.013 |
majesty | -0.013 |
Token | to |
Token ID | 284 |
Feature activation | -6.79e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
aj | +0.001 |
window | +0.001 |
yourselves | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
aster | -0.001 |
le | -0.001 |
dog | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -6.87e-03 |
Pos logit contributions | |
yourself | +0.014 |
blo | +0.013 |
yourselves | +0.013 |
majesty | +0.013 |
aj | +0.013 |
Neg logit contributions | |
inn | -0.009 |
eb | -0.008 |
le | -0.008 |
aster | -0.007 |
dog | -0.007 |
Token | cool |
Token ID | 3608 |
Feature activation | +1.60e-03 |
Pos logit contributions | |
inn | +0.005 |
aster | +0.004 |
eb | +0.004 |
dog | +0.004 |
le | +0.004 |
Neg logit contributions | |
yourself | -0.003 |
yourselves | -0.003 |
aj | -0.003 |
ich | -0.003 |
blo | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +2.08e-03 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.003 |
eb | +0.003 |
war | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
aj | -0.002 |
window | -0.002 |
Token | |
Token ID | 220 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
inn | +0.002 |
eb | +0.002 |
him | +0.002 |
dog | +0.002 |
aster | +0.002 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
aj | -0.004 |
majesty | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
blo | +0.033 |
yourself | +0.032 |
majesty | +0.031 |
yourselves | +0.031 |
aj | +0.030 |
Neg logit contributions | |
inn | -0.028 |
eb | -0.025 |
him | -0.024 |
aster | -0.024 |
war | -0.023 |
Token |
|
Token ID | 198 |
Feature activation | +2.63e-03 |
Pos logit contributions | |
inn | +0.016 |
eb | +0.015 |
aster | +0.014 |
him | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.019 |
yourselves | -0.018 |
aj | -0.018 |
majesty | -0.018 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.54e-02 |
Pos logit contributions | |
inn | +0.004 |
eb | +0.004 |
aster | +0.004 |
le | +0.004 |
dog | +0.004 |
Neg logit contributions | |
yourself | -0.004 |
aj | -0.004 |
blo | -0.004 |
majesty | -0.004 |
yourselves | -0.004 |
Token | ley |
Token ID | 1636 |
Feature activation | +4.92e-03 |
Pos logit contributions | |
aster | +0.099 |
inn | +0.092 |
Jim | +0.089 |
war | +0.081 |
dog | +0.080 |
Neg logit contributions | |
yourself | -0.148 |
blo | -0.139 |
yourselves | -0.136 |
ich | -0.134 |
precious | -0.133 |
Token | was |
Token ID | 373 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
eb | +0.007 |
inn | +0.007 |
le | +0.007 |
dog | +0.007 |
ah | +0.007 |
Neg logit contributions | |
yourself | -0.009 |
yourselves | -0.008 |
blo | -0.008 |
aj | -0.007 |
ich | -0.007 |
Token | so |
Token ID | 523 |
Feature activation | -2.16e-03 |
Pos logit contributions | |
inn | +0.017 |
aster | +0.017 |
eb | +0.016 |
Jim | +0.016 |
him | +0.016 |
Neg logit contributions | |
yourself | -0.016 |
aj | -0.016 |
yourselves | -0.016 |
majesty | -0.015 |
ich | -0.015 |
Token | happy |
Token ID | 3772 |
Feature activation | +5.35e-03 |
Pos logit contributions | |
yourself | +0.003 |
aj | +0.003 |
yourselves | +0.003 |
majesty | +0.003 |
ich | +0.003 |
Neg logit contributions | |
inn | -0.004 |
aster | -0.004 |
Jim | -0.003 |
eb | -0.003 |
him | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | +8.55e-03 |
Pos logit contributions | |
inn | +0.007 |
eb | +0.006 |
him | +0.006 |
dog | +0.006 |
aster | +0.006 |
Neg logit contributions | |
yourself | -0.010 |
aj | -0.010 |
blo | -0.010 |
majesty | -0.010 |
yourselves | -0.010 |
Token | their |
Token ID | 511 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
yourself | +0.028 |
yourselves | +0.026 |
blo | +0.025 |
aj | +0.025 |
window | +0.024 |
Neg logit contributions | |
inn | -0.027 |
eb | -0.025 |
aster | -0.025 |
ah | -0.024 |
war | -0.024 |
Token | food |
Token ID | 2057 |
Feature activation | -2.56e-02 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.016 |
ich | +0.015 |
reetings | +0.015 |
yourselves | +0.015 |
Neg logit contributions | |
inn | -0.016 |
aster | -0.016 |
dog | -0.016 |
le | -0.016 |
him | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
yourself | +0.044 |
blo | +0.042 |
aj | +0.041 |
yourselves | +0.041 |
majesty | +0.041 |
Neg logit contributions | |
inn | -0.039 |
eb | -0.036 |
aster | -0.036 |
le | -0.035 |
dog | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | -8.63e-03 |
Pos logit contributions | |
blo | +0.027 |
yourself | +0.027 |
ich | +0.026 |
majesty | +0.025 |
yourselves | +0.025 |
Neg logit contributions | |
inn | -0.017 |
aster | -0.014 |
eb | -0.014 |
dog | -0.014 |
him | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
yourself | +0.014 |
blo | +0.013 |
aj | +0.013 |
yourselves | +0.013 |
majesty | +0.013 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.013 |
eb | -0.013 |
dog | -0.013 |
le | -0.013 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.42e-02 |
Pos logit contributions | |
yourself | +0.026 |
blo | +0.025 |
aj | +0.024 |
majesty | +0.024 |
yourselves | +0.023 |
Neg logit contributions | |
inn | -0.030 |
aster | -0.028 |
eb | -0.027 |
dog | -0.026 |
war | -0.026 |
Token | mer |
Token ID | 647 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
inn | +0.096 |
aster | +0.089 |
Jim | +0.077 |
hot | +0.077 |
omp | +0.077 |
Neg logit contributions | |
yourself | -0.150 |
yourselves | -0.138 |
ich | -0.135 |
blo | -0.134 |
receiver | -0.127 |
Token | Bob |
Token ID | 5811 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
inn | +0.021 |
aster | +0.019 |
war | +0.019 |
eb | +0.019 |
le | +0.018 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.018 |
yourselves | -0.017 |
majesty | -0.017 |
aj | -0.017 |
Token | always |
Token ID | 1464 |
Feature activation | -6.69e-03 |
Pos logit contributions | |
inn | +0.007 |
aster | +0.007 |
eb | +0.007 |
le | +0.006 |
war | +0.006 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.005 |
aj | -0.005 |
yourselves | -0.005 |
majesty | -0.005 |
Token | made |
Token ID | 925 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
yourself | +0.011 |
ich | +0.011 |
blo | +0.011 |
aj | +0.011 |
yourselves | +0.011 |
Neg logit contributions | |
inn | -0.010 |
aster | -0.010 |
le | -0.009 |
dog | -0.009 |
eb | -0.009 |
Token | sure |
Token ID | 1654 |
Feature activation | +2.58e-03 |
Pos logit contributions | |
inn | +0.023 |
eb | +0.021 |
ah | +0.021 |
hot | +0.021 |
war | +0.020 |
Neg logit contributions | |
yourself | -0.019 |
yourselves | -0.017 |
majesty | -0.016 |
blo | -0.015 |
precious | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | -6.40e-03 |
Pos logit contributions | |
inn | +0.036 |
eb | +0.034 |
le | +0.033 |
aster | +0.033 |
war | +0.032 |
Neg logit contributions | |
yourself | -0.034 |
blo | -0.033 |
window | -0.031 |
aj | -0.030 |
yourselves | -0.030 |
Token | her |
Token ID | 607 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
yourself | +0.013 |
blo | +0.012 |
yourselves | +0.012 |
window | +0.012 |
majesty | +0.012 |
Neg logit contributions | |
inn | -0.009 |
eb | -0.008 |
le | -0.007 |
war | -0.007 |
aster | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -5.56e-03 |
Pos logit contributions | |
dog | +0.018 |
aster | +0.018 |
inn | +0.018 |
him | +0.018 |
le | +0.018 |
Neg logit contributions | |
yourself | -0.023 |
yourselves | -0.023 |
blo | -0.021 |
majesty | -0.020 |
aj | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +1.58e-03 |
Pos logit contributions | |
yourself | +0.011 |
blo | +0.011 |
yourselves | +0.010 |
aj | +0.010 |
majesty | +0.010 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.007 |
aster | -0.006 |
dog | -0.006 |
le | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
inn | +0.003 |
eb | +0.003 |
aster | +0.003 |
le | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.002 |
blo | -0.002 |
aj | -0.002 |
yourselves | -0.002 |
majesty | -0.002 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.34e-02 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.005 |
aj | +0.005 |
yourselves | +0.005 |
majesty | +0.005 |
Neg logit contributions | |
inn | -0.006 |
eb | -0.005 |
aster | -0.005 |
le | -0.005 |
dog | -0.005 |
Token | ah |
Token ID | 993 |
Feature activation | +6.44e-03 |
Pos logit contributions | |
aster | +0.095 |
inn | +0.092 |
omp | +0.078 |
Jim | +0.078 |
Finn | +0.075 |
Neg logit contributions | |
yourself | -0.144 |
blo | -0.132 |
ich | -0.129 |
yourselves | -0.129 |
receiver | -0.126 |
Token | and |
Token ID | 290 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
inn | +0.011 |
eb | +0.011 |
aster | +0.010 |
le | +0.010 |
dog | +0.010 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.009 |
yourselves | -0.009 |
aj | -0.009 |
majesty | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
inn | +0.029 |
le | +0.026 |
aster | +0.025 |
eb | +0.025 |
war | +0.024 |
Neg logit contributions | |
yourself | -0.040 |
blo | -0.038 |
yourselves | -0.036 |
majesty | -0.036 |
aj | -0.036 |
Token | bunny |
Token ID | 44915 |
Feature activation | -4.20e-03 |
Pos logit contributions | |
yourself | +0.018 |
aj | +0.017 |
yourselves | +0.017 |
blo | +0.017 |
majesty | +0.016 |
Neg logit contributions | |
inn | -0.018 |
aster | -0.018 |
dog | -0.018 |
ah | -0.018 |
eb | -0.018 |
Token | became |
Token ID | 2627 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
yourself | +0.006 |
blo | +0.006 |
aj | +0.006 |
majesty | +0.006 |
yourselves | +0.006 |
Neg logit contributions | |
inn | -0.007 |
aster | -0.007 |
eb | -0.007 |
le | -0.006 |
war | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
him | +0.015 |
inn | +0.015 |
le | +0.015 |
Bob | +0.015 |
dog | +0.015 |
Neg logit contributions | |
yourself | -0.018 |
yourselves | -0.017 |
aj | -0.017 |
ich | -0.017 |
majesty | -0.016 |
Token | eat |
Token ID | 4483 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
inn | +0.020 |
aster | +0.019 |
eb | +0.018 |
dog | +0.018 |
le | +0.018 |
Neg logit contributions | |
yourself | -0.037 |
blo | -0.036 |
aj | -0.035 |
yourselves | -0.035 |
majesty | -0.034 |
Token | ." |
Token ID | 526 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
inn | +0.023 |
eb | +0.021 |
aster | +0.021 |
le | +0.021 |
dog | +0.021 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.011 |
yourselves | -0.011 |
aj | -0.011 |
majesty | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +7.93e-03 |
Pos logit contributions | |
inn | +0.029 |
le | +0.028 |
ah | +0.026 |
eb | +0.026 |
aster | +0.025 |
Neg logit contributions | |
yourself | -0.026 |
yourselves | -0.024 |
aj | -0.024 |
window | -0.024 |
blo | -0.023 |
Token |
|
Token ID | 198 |
Feature activation | +1.00e-03 |
Pos logit contributions | |
inn | +0.016 |
le | +0.015 |
eb | +0.015 |
ah | +0.014 |
aster | +0.014 |
Neg logit contributions | |
yourself | -0.010 |
aj | -0.009 |
yourselves | -0.009 |
blo | -0.009 |
ich | -0.009 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
inn | +0.002 |
le | +0.002 |
eb | +0.002 |
aster | +0.002 |
ah | +0.002 |
Neg logit contributions | |
yourself | -0.001 |
yourselves | -0.001 |
blo | -0.001 |
aj | -0.001 |
ich | -0.001 |
Token | mer |
Token ID | 647 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
aster | +0.096 |
inn | +0.093 |
omp | +0.083 |
Finn | +0.078 |
Jim | +0.077 |
Neg logit contributions | |
yourself | -0.139 |
yourselves | -0.128 |
blo | -0.127 |
receiver | -0.127 |
ich | -0.126 |
Token | Joe |
Token ID | 5689 |
Feature activation | +7.81e-03 |
Pos logit contributions | |
inn | +0.025 |
aster | +0.024 |
war | +0.023 |
le | +0.022 |
eb | +0.021 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.021 |
ich | -0.021 |
window | -0.021 |
yourselves | -0.020 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
inn | +0.015 |
aster | +0.014 |
war | +0.014 |
eb | +0.014 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.010 |
aj | -0.009 |
majesty | -0.009 |
window | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
yourself | +0.025 |
blo | +0.024 |
aj | +0.023 |
yourselves | +0.023 |
window | +0.022 |
Neg logit contributions | |
inn | -0.025 |
aster | -0.024 |
eb | -0.023 |
war | -0.023 |
dog | -0.023 |
Token | said |
Token ID | 531 |
Feature activation | +1.55e-03 |
Pos logit contributions | |
inn | +0.025 |
eb | +0.024 |
aster | +0.023 |
le | +0.023 |
dog | +0.023 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.021 |
aj | -0.020 |
yourselves | -0.020 |
majesty | -0.019 |
Token | twenty |
Token ID | 8208 |
Feature activation | +4.06e-02 |
Pos logit contributions | |
inn | +0.022 |
eb | +0.020 |
aster | +0.020 |
le | +0.020 |
dog | +0.020 |
Neg logit contributions | |
yourself | -0.024 |
blo | -0.023 |
yourselves | -0.023 |
aj | -0.023 |
majesty | -0.022 |
Token | - |
Token ID | 12 |
Feature activation | +7.17e-02 |
Pos logit contributions | |
inn | +0.074 |
eb | +0.071 |
aster | +0.070 |
war | +0.070 |
hot | +0.069 |
Neg logit contributions | |
yourself | -0.057 |
blo | -0.054 |
yourselves | -0.051 |
aj | -0.050 |
precious | -0.049 |
Token | eight |
Token ID | 26022 |
Feature activation | +8.73e-03 |
Pos logit contributions | |
inn | +0.100 |
eb | +0.097 |
aster | +0.091 |
le | +0.091 |
dog | +0.090 |
Neg logit contributions | |
yourself | -0.128 |
blo | -0.120 |
yourselves | -0.115 |
precious | -0.111 |
majesty | -0.110 |
Token | , |
Token ID | 11 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
inn | +0.014 |
aster | +0.013 |
eb | +0.013 |
le | +0.012 |
dog | +0.012 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.014 |
aj | -0.014 |
yourselves | -0.014 |
majesty | -0.013 |
Token | twenty |
Token ID | 8208 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.014 |
le | +0.013 |
war | +0.013 |
Neg logit contributions | |
yourself | -0.018 |
blo | -0.017 |
yourselves | -0.017 |
aj | -0.016 |
majesty | -0.016 |
Token | - |
Token ID | 12 |
Feature activation | +7.22e-02 |
Pos logit contributions | |
inn | +0.070 |
eb | +0.067 |
aster | +0.066 |
war | +0.066 |
hot | +0.065 |
Neg logit contributions | |
yourself | -0.063 |
blo | -0.061 |
aj | -0.057 |
yourselves | -0.057 |
majesty | -0.056 |
Token | nine |
Token ID | 30888 |
Feature activation | +5.50e-02 |
Pos logit contributions | |
inn | +0.102 |
eb | +0.100 |
le | +0.095 |
aster | +0.093 |
dog | +0.092 |
Neg logit contributions | |
yourself | -0.126 |
blo | -0.119 |
yourselves | -0.113 |
precious | -0.108 |
aj | -0.108 |
Token | , |
Token ID | 11 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
inn | +0.095 |
aster | +0.090 |
war | +0.085 |
eb | +0.085 |
le | +0.082 |
Neg logit contributions | |
yourself | -0.082 |
blo | -0.079 |
aj | -0.075 |
majesty | -0.073 |
yourselves | -0.071 |
Token | thirty |
Token ID | 12277 |
Feature activation | +3.84e-02 |
Pos logit contributions | |
inn | +0.012 |
eb | +0.011 |
le | +0.011 |
aster | +0.011 |
war | +0.011 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.013 |
yourselves | -0.012 |
aj | -0.012 |
majesty | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
inn | +0.060 |
hot | +0.057 |
war | +0.057 |
aster | +0.056 |
eb | +0.056 |
Neg logit contributions | |
yourself | -0.062 |
blo | -0.059 |
aj | -0.057 |
majesty | -0.056 |
precious | -0.054 |
Token | thirty |
Token ID | 12277 |
Feature activation | +3.58e-02 |
Pos logit contributions | |
inn | +0.009 |
eb | +0.008 |
aster | +0.008 |
le | +0.008 |
war | +0.008 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.010 |
yourselves | -0.009 |
aj | -0.009 |
majesty | -0.009 |
Token | carrot |
Token ID | 40562 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
inn | +0.049 |
eb | +0.047 |
aster | +0.046 |
le | +0.045 |
dog | +0.045 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.020 |
aj | -0.019 |
yourselves | -0.019 |
majesty | -0.018 |
Token | each |
Token ID | 1123 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
inn | +0.032 |
eb | +0.031 |
dog | +0.030 |
le | +0.030 |
aster | +0.030 |
Neg logit contributions | |
yourself | -0.028 |
blo | -0.027 |
yourselves | -0.026 |
majesty | -0.025 |
aj | -0.025 |
Token | ?" |
Token ID | 1701 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
inn | +0.083 |
aster | +0.081 |
dog | +0.081 |
le | +0.080 |
eb | +0.080 |
Neg logit contributions | |
yourself | -0.051 |
blo | -0.049 |
aj | -0.049 |
yourselves | -0.048 |
majesty | -0.047 |
Token |
|
Token ID | 198 |
Feature activation | +6.68e-03 |
Pos logit contributions | |
inn | +0.041 |
le | +0.038 |
war | +0.037 |
eb | +0.037 |
ah | +0.036 |
Neg logit contributions | |
yourself | -0.025 |
blo | -0.023 |
yourselves | -0.022 |
ich | -0.021 |
window | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -2.45e-03 |
Pos logit contributions | |
inn | +0.014 |
le | +0.013 |
eb | +0.013 |
ah | +0.013 |
war | +0.013 |
Neg logit contributions | |
yourself | -0.008 |
yourselves | -0.007 |
blo | -0.007 |
ich | -0.007 |
aj | -0.007 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.21e-02 |
Pos logit contributions | |
yourself | +0.004 |
yourselves | +0.004 |
blo | +0.004 |
ich | +0.004 |
majesty | +0.004 |
Neg logit contributions | |
inn | -0.004 |
le | -0.004 |
eb | -0.003 |
ah | -0.003 |
war | -0.003 |
Token | mer |
Token ID | 647 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
aster | +0.098 |
inn | +0.096 |
omp | +0.084 |
eb | +0.079 |
war | +0.078 |
Neg logit contributions | |
yourself | -0.132 |
blo | -0.126 |
yourselves | -0.123 |
ich | -0.123 |
receiver | -0.120 |
Token | Joe |
Token ID | 5689 |
Feature activation | +7.49e-03 |
Pos logit contributions | |
inn | +0.018 |
aster | +0.018 |
war | +0.017 |
eb | +0.016 |
le | +0.016 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.015 |
window | -0.015 |
yourselves | -0.015 |
receiver | -0.014 |
Token | looks |
Token ID | 3073 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
inn | +0.013 |
aster | +0.012 |
eb | +0.012 |
war | +0.012 |
le | +0.011 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.011 |
aj | -0.011 |
yourselves | -0.010 |
majesty | -0.010 |
Token | at |
Token ID | 379 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
inn | +0.016 |
aster | +0.016 |
eb | +0.016 |
dog | +0.015 |
ah | +0.015 |
Neg logit contributions | |
yourself | -0.017 |
blo | -0.017 |
aj | -0.016 |
precious | -0.016 |
window | -0.016 |
Token | them |
Token ID | 606 |
Feature activation | +1.26e-03 |
Pos logit contributions | |
war | +0.021 |
inn | +0.021 |
eb | +0.019 |
ar | +0.018 |
hot | +0.018 |
Neg logit contributions | |
yourself | -0.019 |
yourselves | -0.018 |
window | -0.017 |
blo | -0.017 |
most | -0.016 |
Token | flavors |
Token ID | 17361 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
yourself | +0.019 |
majesty | +0.018 |
blo | +0.018 |
aj | +0.018 |
yourselves | +0.018 |
Neg logit contributions | |
inn | -0.014 |
eb | -0.014 |
dog | -0.014 |
le | -0.013 |
aster | -0.013 |
Token | they |
Token ID | 484 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
inn | +0.003 |
eb | +0.003 |
aster | +0.003 |
le | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
aj | -0.003 |
yourselves | -0.003 |
majesty | -0.003 |
Token | liked |
Token ID | 8288 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
inn | +0.030 |
aster | +0.028 |
le | +0.028 |
eb | +0.028 |
dog | +0.028 |
Neg logit contributions | |
yourself | -0.032 |
aj | -0.030 |
yourselves | -0.030 |
blo | -0.030 |
ich | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +1.33e-04 |
Pos logit contributions | |
inn | +0.027 |
eb | +0.025 |
aster | +0.025 |
dog | +0.024 |
le | +0.024 |
Neg logit contributions | |
yourself | -0.033 |
blo | -0.031 |
aj | -0.031 |
yourselves | -0.030 |
majesty | -0.030 |
Token | what |
Token ID | 644 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
inn | +0.000 |
aster | +0.000 |
dog | +0.000 |
eb | +0.000 |
le | +0.000 |
Neg logit contributions | |
yourself | -0.000 |
blo | -0.000 |
aj | -0.000 |
yourselves | -0.000 |
ich | -0.000 |
Token | topp |
Token ID | 23126 |
Feature activation | +7.14e-02 |
Pos logit contributions | |
inn | +0.030 |
eb | +0.028 |
aster | +0.027 |
le | +0.027 |
dog | +0.026 |
Neg logit contributions | |
yourself | -0.034 |
blo | -0.033 |
yourselves | -0.031 |
aj | -0.031 |
majesty | -0.031 |
Token | ings |
Token ID | 654 |
Feature activation | +3.12e-02 |
Pos logit contributions | |
inn | +0.124 |
aster | +0.119 |
dog | +0.112 |
war | +0.111 |
hot | +0.111 |
Neg logit contributions | |
yourself | -0.110 |
yourselves | -0.101 |
blo | -0.097 |
aj | -0.096 |
majesty | -0.094 |
Token | would |
Token ID | 561 |
Feature activation | -4.88e-03 |
Pos logit contributions | |
inn | +0.043 |
eb | +0.040 |
aster | +0.040 |
le | +0.039 |
dog | +0.039 |
Neg logit contributions | |
yourself | -0.058 |
blo | -0.055 |
aj | -0.055 |
yourselves | -0.054 |
majesty | -0.054 |
Token | go |
Token ID | 467 |
Feature activation | +9.92e-03 |
Pos logit contributions | |
yourself | +0.008 |
aj | +0.008 |
blo | +0.008 |
majesty | +0.008 |
ich | +0.008 |
Neg logit contributions | |
inn | -0.008 |
aster | -0.007 |
eb | -0.007 |
dog | -0.007 |
le | -0.007 |
Token | best |
Token ID | 1266 |
Feature activation | -8.44e-04 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.013 |
le | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.018 |
blo | -0.017 |
aj | -0.017 |
majesty | -0.016 |
yourselves | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -8.41e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
aj | +0.001 |
yourselves | +0.001 |
ich | +0.001 |
Neg logit contributions | |
inn | -0.001 |
aster | -0.001 |
eb | -0.001 |
dog | -0.001 |
le | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e-03 |
Pos logit contributions | |
yourself | +0.010 |
blo | +0.010 |
aj | +0.009 |
yourselves | +0.009 |
window | +0.009 |
Neg logit contributions | |
inn | -0.011 |
aster | -0.010 |
eb | -0.010 |
le | -0.010 |
dog | -0.009 |
Token | relax |
Token ID | 8960 |
Feature activation | -7.29e-03 |
Pos logit contributions | |
yourself | +0.003 |
aj | +0.003 |
blo | +0.003 |
ich | +0.003 |
yourselves | +0.003 |
Neg logit contributions | |
aster | -0.002 |
inn | -0.002 |
dog | -0.002 |
him | -0.002 |
eb | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -4.71e-03 |
Pos logit contributions | |
yourself | +0.011 |
blo | +0.011 |
yourselves | +0.010 |
aj | +0.010 |
window | +0.010 |
Neg logit contributions | |
inn | -0.013 |
aster | -0.012 |
eb | -0.012 |
war | -0.012 |
ah | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | +1.42e-03 |
Pos logit contributions | |
yourself | +0.008 |
aj | +0.007 |
blo | +0.007 |
yourselves | +0.007 |
majesty | +0.007 |
Neg logit contributions | |
inn | -0.007 |
le | -0.007 |
aster | -0.007 |
eb | -0.007 |
dog | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
inn | +0.003 |
le | +0.003 |
eb | +0.003 |
aster | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.002 |
aj | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
ich | -0.001 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.09e-02 |
Pos logit contributions | |
yourself | +0.007 |
blo | +0.007 |
yourselves | +0.007 |
aj | +0.006 |
majesty | +0.006 |
Neg logit contributions | |
inn | -0.010 |
eb | -0.009 |
le | -0.009 |
aster | -0.009 |
dog | -0.009 |
Token | mer |
Token ID | 647 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
aster | +0.096 |
inn | +0.092 |
omp | +0.078 |
olt | +0.076 |
Jim | +0.075 |
Neg logit contributions | |
yourself | -0.134 |
ich | -0.123 |
blo | -0.122 |
yourselves | -0.122 |
receiver | -0.119 |
Token | Joe |
Token ID | 5689 |
Feature activation | +6.69e-03 |
Pos logit contributions | |
inn | +0.018 |
aster | +0.017 |
war | +0.016 |
eb | +0.016 |
le | +0.015 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.015 |
yourselves | -0.015 |
ich | -0.015 |
window | -0.014 |
Token | smiled |
Token ID | 13541 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
inn | +0.012 |
aster | +0.011 |
eb | +0.011 |
war | +0.011 |
dog | +0.011 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.009 |
aj | -0.009 |
yourselves | -0.008 |
majesty | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
yourself | +0.037 |
blo | +0.035 |
yourselves | +0.035 |
aj | +0.035 |
majesty | +0.034 |
Neg logit contributions | |
inn | -0.029 |
eb | -0.027 |
le | -0.026 |
dog | -0.026 |
aster | -0.026 |
Token | said |
Token ID | 531 |
Feature activation | +2.24e-04 |
Pos logit contributions | |
inn | +0.021 |
eb | +0.020 |
aster | +0.019 |
dog | +0.019 |
le | +0.019 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.020 |
yourselves | -0.020 |
aj | -0.020 |
majesty | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
yourself | +0.003 |
yourselves | +0.003 |
aj | +0.003 |
majesty | +0.003 |
ich | +0.003 |
Neg logit contributions | |
inn | -0.002 |
eb | -0.002 |
him | -0.002 |
aster | -0.002 |
dog | -0.002 |
Token | grow |
Token ID | 1663 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
aster | +0.013 |
le | +0.013 |
inn | +0.012 |
dog | +0.012 |
him | +0.012 |
Neg logit contributions | |
aj | -0.013 |
yourself | -0.013 |
yourselves | -0.013 |
ich | -0.012 |
majesty | -0.012 |
Token | ! |
Token ID | 0 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
inn | +0.004 |
le | +0.004 |
eb | +0.004 |
aster | +0.004 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
majesty | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +1.53e-03 |
Pos logit contributions | |
inn | +0.017 |
le | +0.016 |
eb | +0.016 |
ah | +0.015 |
aster | +0.015 |
Neg logit contributions | |
yourself | -0.017 |
yourselves | -0.015 |
aj | -0.015 |
blo | -0.015 |
window | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -3.67e-03 |
Pos logit contributions | |
inn | +0.003 |
le | +0.003 |
eb | +0.003 |
ah | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.002 |
aj | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
window | -0.002 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.08e-02 |
Pos logit contributions | |
yourself | +0.005 |
yourselves | +0.004 |
blo | +0.004 |
aj | +0.004 |
ich | +0.004 |
Neg logit contributions | |
inn | -0.007 |
le | -0.007 |
eb | -0.007 |
ah | -0.007 |
dog | -0.006 |
Token | mer |
Token ID | 647 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
inn | +0.093 |
aster | +0.092 |
omp | +0.082 |
Finn | +0.080 |
Jim | +0.075 |
Neg logit contributions | |
yourself | -0.134 |
yourselves | -0.125 |
ich | -0.121 |
receiver | -0.121 |
blo | -0.119 |
Token | John |
Token ID | 1757 |
Feature activation | +4.30e-03 |
Pos logit contributions | |
inn | +0.020 |
war | +0.018 |
aster | +0.018 |
le | +0.017 |
eb | +0.016 |
Neg logit contributions | |
yourself | -0.019 |
window | -0.017 |
blo | -0.017 |
ich | -0.017 |
yourselves | -0.017 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
inn | +0.008 |
eb | +0.007 |
aster | +0.007 |
le | +0.007 |
dog | +0.007 |
Neg logit contributions | |
yourself | -0.006 |
blo | -0.006 |
yourselves | -0.006 |
aj | -0.006 |
majesty | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +9.38e-03 |
Pos logit contributions | |
yourself | +0.026 |
blo | +0.025 |
aj | +0.024 |
yourselves | +0.024 |
majesty | +0.024 |
Neg logit contributions | |
inn | -0.024 |
aster | -0.022 |
eb | -0.022 |
le | -0.022 |
dog | -0.022 |
Token | He |
Token ID | 679 |
Feature activation | +5.92e-03 |
Pos logit contributions | |
inn | +0.009 |
eb | +0.008 |
aster | +0.008 |
dog | +0.008 |
le | +0.008 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.021 |
aj | -0.020 |
yourselves | -0.020 |
majesty | -0.020 |
Token | tasty |
Token ID | 25103 |
Feature activation | +2.86e-02 |
Pos logit contributions | |
inn | +0.031 |
eb | +0.029 |
aster | +0.028 |
le | +0.028 |
dog | +0.027 |
Neg logit contributions | |
yourself | -0.028 |
blo | -0.028 |
aj | -0.027 |
majesty | -0.026 |
window | -0.026 |
Token | snack |
Token ID | 26906 |
Feature activation | +3.24e-03 |
Pos logit contributions | |
inn | +0.050 |
eb | +0.045 |
hot | +0.044 |
war | +0.044 |
le | +0.043 |
Neg logit contributions | |
blo | -0.045 |
window | -0.042 |
yourself | -0.041 |
majesty | -0.040 |
precious | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | +3.76e-03 |
Pos logit contributions | |
inn | +0.006 |
aster | +0.006 |
eb | +0.005 |
le | +0.005 |
war | +0.005 |
Neg logit contributions | |
blo | -0.004 |
yourself | -0.004 |
window | -0.004 |
aj | -0.004 |
ich | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
inn | +0.007 |
le | +0.006 |
aster | +0.006 |
eb | +0.006 |
dog | +0.006 |
Neg logit contributions | |
yourself | -0.006 |
blo | -0.005 |
aj | -0.005 |
yourselves | -0.005 |
majesty | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +1.59e-04 |
Pos logit contributions | |
inn | +0.010 |
le | +0.009 |
eb | +0.009 |
aster | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.009 |
blo | -0.008 |
aj | -0.008 |
yourselves | -0.008 |
majesty | -0.008 |
Token | Far |
Token ID | 21428 |
Feature activation | +7.02e-02 |
Pos logit contributions | |
inn | +0.000 |
eb | +0.000 |
aster | +0.000 |
le | +0.000 |
dog | +0.000 |
Neg logit contributions | |
yourself | -0.000 |
blo | -0.000 |
aj | -0.000 |
yourselves | -0.000 |
majesty | -0.000 |
Token | ah |
Token ID | 993 |
Feature activation | +5.13e-03 |
Pos logit contributions | |
aster | +0.091 |
inn | +0.087 |
Jim | +0.076 |
hot | +0.074 |
Freddy | +0.072 |
Neg logit contributions | |
yourself | -0.138 |
blo | -0.128 |
ich | -0.127 |
yourselves | -0.127 |
precious | -0.119 |
Token | and |
Token ID | 290 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
inn | +0.009 |
eb | +0.009 |
le | +0.008 |
aster | +0.008 |
dog | +0.008 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.007 |
yourselves | -0.007 |
aj | -0.007 |
majesty | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
inn | +0.040 |
le | +0.036 |
aster | +0.035 |
war | +0.034 |
eb | +0.033 |
Neg logit contributions | |
yourself | -0.044 |
blo | -0.043 |
majesty | -0.040 |
yourselves | -0.039 |
ich | -0.039 |
Token | bunny |
Token ID | 44915 |
Feature activation | -5.65e-03 |
Pos logit contributions | |
yourself | +0.019 |
aj | +0.019 |
yourselves | +0.018 |
blo | +0.018 |
majesty | +0.018 |
Neg logit contributions | |
inn | -0.018 |
dog | -0.017 |
aster | -0.017 |
le | -0.017 |
eb | -0.017 |
Token | were |
Token ID | 547 |
Feature activation | +3.86e-03 |
Pos logit contributions | |
yourself | +0.009 |
blo | +0.008 |
aj | +0.008 |
yourselves | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
inn | -0.010 |
eb | -0.009 |
aster | -0.009 |
le | -0.009 |
dog | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +5.39e-03 |
Pos logit contributions | |
inn | +0.021 |
le | +0.020 |
aster | +0.020 |
dog | +0.019 |
ah | +0.019 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.013 |
yourselves | -0.013 |
aj | -0.013 |
ich | -0.013 |
Token | Exc |
Token ID | 40127 |
Feature activation | +4.08e-02 |
Pos logit contributions | |
inn | +0.009 |
le | +0.009 |
aster | +0.009 |
eb | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.007 |
yourselves | -0.007 |
aj | -0.007 |
ich | -0.007 |
Token | ited |
Token ID | 863 |
Feature activation | +5.34e-03 |
Pos logit contributions | |
inn | +0.050 |
Finn | +0.049 |
Jim | +0.048 |
Noah | +0.045 |
Bob | +0.044 |
Neg logit contributions | |
yourself | -0.078 |
blo | -0.074 |
yourselves | -0.070 |
precious | -0.067 |
Dear | -0.067 |
Token | ly |
Token ID | 306 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
inn | +0.007 |
aster | +0.006 |
war | +0.006 |
dog | +0.006 |
hot | +0.006 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.010 |
aj | -0.010 |
yourselves | -0.010 |
window | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
inn | +0.031 |
aster | +0.028 |
war | +0.028 |
le | +0.028 |
eb | +0.028 |
Neg logit contributions | |
yourself | -0.031 |
blo | -0.030 |
aj | -0.028 |
majesty | -0.028 |
yourselves | -0.028 |
Token | Ark |
Token ID | 9128 |
Feature activation | +6.92e-02 |
Pos logit contributions | |
inn | +0.010 |
war | +0.009 |
le | +0.009 |
aster | +0.009 |
dog | +0.008 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.013 |
yourselves | -0.012 |
window | -0.012 |
ich | -0.012 |
Token | ie |
Token ID | 494 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
inn | +0.091 |
aster | +0.084 |
dog | +0.081 |
eb | +0.080 |
hot | +0.079 |
Neg logit contributions | |
yourself | -0.133 |
blo | -0.124 |
yourselves | -0.121 |
aj | -0.120 |
majesty | -0.119 |
Token | grabbed |
Token ID | 13176 |
Feature activation | +3.08e-03 |
Pos logit contributions | |
yourself | +0.027 |
blo | +0.025 |
aj | +0.025 |
yourselves | +0.025 |
majesty | +0.024 |
Neg logit contributions | |
inn | -0.028 |
eb | -0.026 |
aster | -0.026 |
le | -0.025 |
dog | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | -3.10e-03 |
Pos logit contributions | |
eb | +0.005 |
war | +0.005 |
ah | +0.005 |
ny | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.004 |
most | -0.004 |
blo | -0.003 |
precious | -0.003 |
window | -0.003 |
Token | equipment |
Token ID | 5112 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.004 |
aj | +0.004 |
yourselves | +0.004 |
majesty | +0.004 |
Neg logit contributions | |
inn | -0.005 |
eb | -0.005 |
aster | -0.005 |
le | -0.005 |
dog | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +8.44e-03 |
Pos logit contributions | |
yourself | +0.017 |
blo | +0.017 |
window | +0.016 |
aj | +0.015 |
yourselves | +0.015 |
Neg logit contributions | |
inn | -0.020 |
aster | -0.019 |
eb | -0.019 |
le | -0.019 |
war | -0.019 |
Token | bit |
Token ID | 1643 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
inn | +0.005 |
le | +0.005 |
dog | +0.005 |
aster | +0.005 |
ny | +0.005 |
Neg logit contributions | |
yourself | -0.007 |
aj | -0.007 |
yourselves | -0.007 |
ich | -0.007 |
blo | -0.006 |
Token | of |
Token ID | 286 |
Feature activation | -8.08e-03 |
Pos logit contributions | |
inn | +0.010 |
le | +0.010 |
aster | +0.009 |
eb | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.014 |
aj | -0.014 |
blo | -0.013 |
ich | -0.013 |
majesty | -0.013 |
Token | magic |
Token ID | 5536 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
aj | +0.014 |
ich | +0.013 |
majesty | +0.012 |
yourself | +0.012 |
blo | +0.012 |
Neg logit contributions | |
him | -0.012 |
aster | -0.012 |
le | -0.012 |
dog | -0.011 |
inn | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | -2.94e-03 |
Pos logit contributions | |
yourself | +0.028 |
aj | +0.027 |
yourselves | +0.027 |
ich | +0.027 |
blo | +0.026 |
Neg logit contributions | |
le | -0.022 |
inn | -0.022 |
eb | -0.020 |
aster | -0.020 |
dog | -0.020 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +4.45e-03 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
yourselves | +0.004 |
aj | +0.004 |
majesty | +0.004 |
Neg logit contributions | |
inn | -0.005 |
le | -0.005 |
aster | -0.005 |
eb | -0.005 |
dog | -0.005 |
Token | Isa |
Token ID | 39443 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
inn | +0.010 |
aster | +0.010 |
le | +0.009 |
eb | +0.009 |
war | +0.009 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.004 |
yourselves | -0.004 |
aj | -0.004 |
window | -0.004 |
Token | ac |
Token ID | 330 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
inn | +0.124 |
dog | +0.120 |
hot | +0.117 |
aster | +0.115 |
eb | +0.115 |
Neg logit contributions | |
yourself | -0.092 |
blo | -0.086 |
aj | -0.084 |
majesty | -0.082 |
yourselves | -0.080 |
Token | was |
Token ID | 373 |
Feature activation | +3.39e-03 |
Pos logit contributions | |
inn | +0.019 |
aster | +0.018 |
dog | +0.017 |
eb | +0.017 |
war | +0.017 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.021 |
yourselves | -0.020 |
aj | -0.020 |
majesty | -0.020 |
Token | preparing |
Token ID | 10629 |
Feature activation | -4.55e-03 |
Pos logit contributions | |
inn | +0.006 |
aster | +0.005 |
him | +0.005 |
dog | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.006 |
yourselves | -0.005 |
majesty | -0.005 |
aj | -0.005 |
endant | -0.005 |
Token | breakfast |
Token ID | 12607 |
Feature activation | -3.91e-03 |
Pos logit contributions | |
yourself | +0.009 |
majesty | +0.008 |
aj | +0.008 |
ich | +0.008 |
blo | +0.008 |
Neg logit contributions | |
inn | -0.006 |
aster | -0.006 |
him | -0.006 |
dog | -0.005 |
eb | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
yourself | +0.006 |
blo | +0.006 |
aj | +0.006 |
yourselves | +0.006 |
window | +0.005 |
Neg logit contributions | |
inn | -0.007 |
aster | -0.006 |
eb | -0.006 |
war | -0.006 |
le | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | +6.61e-03 |
Pos logit contributions | |
inn | +0.000 |
eb | +0.000 |
aster | +0.000 |
le | +0.000 |
dog | +0.000 |
Neg logit contributions | |
yourself | -0.000 |
blo | -0.000 |
aj | -0.000 |
yourselves | -0.000 |
majesty | -0.000 |
Token | watched |
Token ID | 7342 |
Feature activation | -4.42e-04 |
Pos logit contributions | |
inn | +0.013 |
aster | +0.011 |
eb | +0.011 |
le | +0.011 |
war | +0.011 |
Neg logit contributions | |
blo | -0.009 |
yourself | -0.009 |
yourselves | -0.008 |
aj | -0.008 |
majesty | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | -5.06e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
sending | +0.001 |
window | +0.001 |
hugging | +0.001 |
Neg logit contributions | |
inn | -0.001 |
ah | -0.001 |
ny | -0.001 |
eb | -0.001 |
war | -0.001 |
Token | for |
Token ID | 329 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
yourself | +0.009 |
blo | +0.008 |
aj | +0.008 |
yourselves | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
inn | -0.008 |
eb | -0.007 |
aster | -0.007 |
le | -0.007 |
dog | -0.007 |
Token | as |
Token ID | 355 |
Feature activation | +4.99e-02 |
Pos logit contributions | |
inn | +0.036 |
eb | +0.034 |
ny | +0.033 |
ah | +0.033 |
war | +0.033 |
Neg logit contributions | |
yourself | -0.023 |
blo | -0.021 |
yourselves | -0.020 |
sending | -0.019 |
precious | -0.019 |
Token | long |
Token ID | 890 |
Feature activation | +6.82e-02 |
Pos logit contributions | |
inn | +0.065 |
aster | +0.061 |
eb | +0.059 |
dog | +0.058 |
him | +0.057 |
Neg logit contributions | |
yourself | -0.096 |
aj | -0.092 |
blo | -0.092 |
yourselves | -0.090 |
majesty | -0.089 |
Token | as |
Token ID | 355 |
Feature activation | +5.19e-02 |
Pos logit contributions | |
inn | +0.110 |
war | +0.105 |
eb | +0.103 |
le | +0.102 |
ah | +0.100 |
Neg logit contributions | |
blo | -0.103 |
yourself | -0.101 |
aj | -0.095 |
window | -0.094 |
sending | -0.092 |
Token | they |
Token ID | 484 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
inn | +0.068 |
aster | +0.063 |
eb | +0.062 |
le | +0.060 |
dog | +0.060 |
Neg logit contributions | |
yourself | -0.100 |
blo | -0.096 |
aj | -0.096 |
yourselves | -0.094 |
majesty | -0.093 |
Token | could |
Token ID | 714 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
inn | +0.030 |
aster | +0.028 |
eb | +0.028 |
le | +0.027 |
dog | +0.027 |
Neg logit contributions | |
blo | -0.025 |
yourself | -0.024 |
aj | -0.023 |
window | -0.022 |
precious | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +7.67e-03 |
Pos logit contributions | |
inn | +0.013 |
eb | +0.012 |
aster | +0.012 |
le | +0.012 |
dog | +0.012 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
aj | -0.013 |
yourselves | -0.013 |
majesty | -0.012 |
Token | They |
Token ID | 1119 |
Feature activation | -4.72e-03 |
Pos logit contributions | |
inn | +0.010 |
eb | +0.010 |
aster | +0.009 |
le | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.014 |
aj | -0.014 |
yourselves | -0.014 |
majesty | -0.014 |
Token | friend |
Token ID | 1545 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
inn | +0.009 |
dog | +0.008 |
eb | +0.008 |
le | +0.008 |
aster | +0.008 |
Neg logit contributions | |
yourself | -0.006 |
yourselves | -0.006 |
blo | -0.005 |
aj | -0.005 |
ich | -0.005 |
Token | will |
Token ID | 481 |
Feature activation | -9.21e-04 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.016 |
aj | +0.015 |
yourselves | +0.015 |
majesty | +0.015 |
Neg logit contributions | |
inn | -0.019 |
eb | -0.018 |
aster | -0.018 |
le | -0.017 |
dog | -0.017 |
Token | always |
Token ID | 1464 |
Feature activation | -1.71e-03 |
Pos logit contributions | |
yourself | +0.001 |
aj | +0.001 |
yourselves | +0.001 |
blo | +0.001 |
majesty | +0.001 |
Neg logit contributions | |
inn | -0.002 |
eb | -0.002 |
aster | -0.002 |
le | -0.002 |
dog | -0.001 |
Token | know |
Token ID | 760 |
Feature activation | -8.42e-03 |
Pos logit contributions | |
aj | +0.003 |
ich | +0.003 |
yourselves | +0.003 |
majesty | +0.003 |
endant | +0.003 |
Neg logit contributions | |
le | -0.003 |
aster | -0.002 |
him | -0.002 |
inn | -0.002 |
dog | -0.002 |
Token | how |
Token ID | 703 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
aj | +0.015 |
yourself | +0.015 |
majesty | +0.015 |
ich | +0.015 |
blo | +0.014 |
Neg logit contributions | |
him | -0.011 |
inn | -0.011 |
le | -0.011 |
aster | -0.010 |
eb | -0.010 |
Token | depend |
Token ID | 4745 |
Feature activation | +6.81e-02 |
Pos logit contributions | |
him | +0.035 |
inn | +0.035 |
aster | +0.034 |
le | +0.034 |
dog | +0.032 |
Neg logit contributions | |
aj | -0.034 |
yourself | -0.034 |
ich | -0.033 |
majesty | -0.033 |
yourselves | -0.033 |
Token | able |
Token ID | 540 |
Feature activation | +2.97e-02 |
Pos logit contributions | |
inn | +0.093 |
aster | +0.082 |
omp | +0.081 |
Jim | +0.081 |
eb | +0.079 |
Neg logit contributions | |
yourself | -0.131 |
blo | -0.118 |
yourselves | -0.117 |
precious | -0.107 |
aj | -0.106 |
Token | and |
Token ID | 290 |
Feature activation | +9.46e-03 |
Pos logit contributions | |
inn | +0.048 |
eb | +0.045 |
aster | +0.045 |
le | +0.044 |
dog | +0.044 |
Neg logit contributions | |
yourself | -0.048 |
blo | -0.046 |
aj | -0.045 |
yourselves | -0.044 |
majesty | -0.044 |
Token | special |
Token ID | 2041 |
Feature activation | +2.74e-03 |
Pos logit contributions | |
him | +0.016 |
aster | +0.015 |
inn | +0.015 |
le | +0.015 |
dog | +0.015 |
Neg logit contributions | |
aj | -0.014 |
ich | -0.013 |
yourself | -0.013 |
majesty | -0.013 |
yourselves | -0.013 |
Token | of |
Token ID | 286 |
Feature activation | -3.05e-03 |
Pos logit contributions | |
le | +0.004 |
him | +0.004 |
dog | +0.004 |
inn | +0.004 |
eb | +0.004 |
Neg logit contributions | |
aj | -0.005 |
ich | -0.005 |
yourself | -0.005 |
majesty | -0.004 |
yourselves | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | -8.24e-03 |
Pos logit contributions | |
yourself | +0.005 |
aj | +0.005 |
blo | +0.005 |
majesty | +0.005 |
yourselves | +0.005 |
Neg logit contributions | |
inn | -0.004 |
aster | -0.004 |
eb | -0.004 |
le | -0.004 |
dog | -0.004 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
inn | +0.026 |
eb | +0.024 |
aster | +0.024 |
le | +0.024 |
dog | +0.024 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.018 |
aj | -0.018 |
yourselves | -0.017 |
majesty | -0.017 |
Token | sad |
Token ID | 6507 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.014 |
aj | +0.014 |
yourselves | +0.014 |
majesty | +0.014 |
Neg logit contributions | |
inn | -0.034 |
aster | -0.032 |
eb | -0.031 |
dog | -0.031 |
le | -0.031 |
Token | we |
Token ID | 356 |
Feature activation | +4.56e-04 |
Pos logit contributions | |
yourself | +0.043 |
blo | +0.042 |
aj | +0.042 |
majesty | +0.041 |
ich | +0.041 |
Neg logit contributions | |
inn | -0.032 |
le | -0.030 |
dog | -0.029 |
aster | -0.029 |
him | -0.029 |
Token | lost |
Token ID | 2626 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
inn | +0.001 |
le | +0.001 |
ny | +0.001 |
dog | +0.001 |
him | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
yourselves | -0.001 |
aj | -0.001 |
blo | -0.001 |
majesty | -0.001 |
Token | our |
Token ID | 674 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
yourself | +0.023 |
blo | +0.023 |
aj | +0.023 |
majesty | +0.023 |
ich | +0.022 |
Neg logit contributions | |
inn | -0.028 |
eb | -0.026 |
aster | -0.026 |
le | -0.026 |
dog | -0.026 |
Token | p |
Token ID | 279 |
Feature activation | -8.07e-02 |
Pos logit contributions | |
yourself | +0.027 |
yourselves | +0.025 |
aj | +0.024 |
ich | +0.024 |
receiver | +0.023 |
Neg logit contributions | |
inn | -0.024 |
him | -0.023 |
dog | -0.023 |
Bob | -0.022 |
eb | -0.022 |
Token | ears |
Token ID | 4127 |
Feature activation | -4.52e-02 |
Pos logit contributions | |
yourself | +0.135 |
sending | +0.127 |
blo | +0.125 |
yourselves | +0.124 |
Love | +0.120 |
Neg logit contributions | |
inn | -0.129 |
eb | -0.118 |
ah | -0.114 |
dog | -0.111 |
ny | -0.107 |
Token | ." |
Token ID | 526 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
yourself | +0.073 |
blo | +0.070 |
aj | +0.068 |
yourselves | +0.068 |
majesty | +0.068 |
Neg logit contributions | |
inn | -0.073 |
eb | -0.068 |
aster | -0.068 |
le | -0.067 |
dog | -0.066 |
Token | Mia |
Token ID | 32189 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
inn | +0.017 |
eb | +0.016 |
le | +0.016 |
hot | +0.015 |
war | +0.015 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.021 |
yourselves | -0.021 |
majesty | -0.021 |
window | -0.021 |
Token | said |
Token ID | 531 |
Feature activation | -1.68e-03 |
Pos logit contributions | |
yourself | +0.015 |
blo | +0.014 |
aj | +0.014 |
window | +0.013 |
yourselves | +0.013 |
Neg logit contributions | |
inn | -0.024 |
aster | -0.023 |
eb | -0.022 |
war | -0.022 |
le | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
hugging | +0.002 |
yourself | +0.002 |
blo | +0.002 |
window | +0.002 |
aj | +0.002 |
Neg logit contributions | |
inn | -0.004 |
aster | -0.003 |
ah | -0.003 |
eb | -0.003 |
war | -0.003 |
Token | some |
Token ID | 617 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
aster | +0.031 |
inn | +0.030 |
eb | +0.028 |
ah | +0.028 |
dog | +0.028 |
Neg logit contributions | |
yourself | -0.025 |
yourselves | -0.020 |
blo | -0.019 |
most | -0.019 |
myself | -0.019 |
Token | water |
Token ID | 1660 |
Feature activation | +7.38e-03 |
Pos logit contributions | |
inn | +0.021 |
le | +0.020 |
aster | +0.019 |
dog | +0.019 |
eb | +0.019 |
Neg logit contributions | |
yourself | -0.026 |
aj | -0.026 |
majesty | -0.025 |
ich | -0.025 |
yourselves | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +5.46e-03 |
Pos logit contributions | |
inn | +0.014 |
aster | +0.013 |
eb | +0.013 |
le | +0.012 |
war | +0.012 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.010 |
yourselves | -0.009 |
window | -0.009 |
aj | -0.009 |
Token | fill |
Token ID | 6070 |
Feature activation | +8.48e-03 |
Pos logit contributions | |
inn | +0.007 |
aster | +0.007 |
dog | +0.007 |
le | +0.007 |
eb | +0.007 |
Neg logit contributions | |
yourself | -0.010 |
aj | -0.010 |
ich | -0.010 |
blo | -0.010 |
yourselves | -0.010 |
Token | his |
Token ID | 465 |
Feature activation | -2.10e-03 |
Pos logit contributions | |
ah | +0.015 |
aster | +0.014 |
war | +0.014 |
inn | +0.014 |
ited | +0.013 |
Neg logit contributions | |
yourself | -0.014 |
yourselves | -0.012 |
blo | -0.012 |
myself | -0.011 |
most | -0.011 |
Token | p |
Token ID | 279 |
Feature activation | -8.05e-02 |
Pos logit contributions | |
yourself | +0.004 |
aj | +0.004 |
reetings | +0.003 |
inas | +0.003 |
yourselves | +0.003 |
Neg logit contributions | |
inn | -0.003 |
aster | -0.002 |
dog | -0.002 |
le | -0.002 |
ny | -0.002 |
Token | ail |
Token ID | 603 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
yourself | +0.119 |
blo | +0.110 |
yourselves | +0.107 |
majesty | +0.102 |
sending | +0.102 |
Neg logit contributions | |
inn | -0.147 |
eb | -0.134 |
le | -0.129 |
aster | -0.128 |
dog | -0.126 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e-03 |
Pos logit contributions | |
yourself | +0.047 |
blo | +0.045 |
aj | +0.044 |
yourselves | +0.043 |
majesty | +0.042 |
Neg logit contributions | |
inn | -0.053 |
eb | -0.050 |
aster | -0.049 |
le | -0.048 |
dog | -0.048 |
Token | He |
Token ID | 679 |
Feature activation | -6.47e-04 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
yourselves | +0.002 |
window | +0.002 |
aj | +0.002 |
Neg logit contributions | |
le | -0.002 |
inn | -0.002 |
aster | -0.002 |
eb | -0.002 |
war | -0.002 |
Token | went |
Token ID | 1816 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
aj | +0.001 |
yourselves | +0.001 |
majesty | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
aster | -0.001 |
le | -0.001 |
dog | -0.001 |
Token | over |
Token ID | 625 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
yourself | +0.021 |
blo | +0.020 |
yourselves | +0.019 |
aj | +0.019 |
majesty | +0.019 |
Neg logit contributions | |
inn | -0.018 |
aster | -0.016 |
eb | -0.016 |
le | -0.016 |
dog | -0.016 |
Token | 's |
Token ID | 338 |
Feature activation | -2.05e-03 |
Pos logit contributions | |
inn | +0.071 |
aster | +0.062 |
ah | +0.062 |
dog | +0.062 |
eb | +0.061 |
Neg logit contributions | |
yourself | -0.038 |
yourselves | -0.032 |
blo | -0.031 |
aj | -0.030 |
window | -0.030 |
Token | go |
Token ID | 467 |
Feature activation | -1.71e-03 |
Pos logit contributions | |
yourself | +0.004 |
aj | +0.004 |
blo | +0.004 |
majesty | +0.004 |
ich | +0.004 |
Neg logit contributions | |
inn | -0.003 |
aster | -0.002 |
le | -0.002 |
eb | -0.002 |
dog | -0.002 |
Token | get |
Token ID | 651 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
aj | +0.003 |
majesty | +0.003 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.002 |
aster | -0.002 |
le | -0.002 |
dog | -0.002 |
Token | your |
Token ID | 534 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
majesty | +0.005 |
ich | +0.005 |
aj | +0.005 |
yourself | +0.005 |
blo | +0.005 |
Neg logit contributions | |
him | -0.003 |
inn | -0.003 |
aster | -0.003 |
le | -0.003 |
dog | -0.003 |
Token | p |
Token ID | 279 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
yourself | +0.006 |
yourselves | +0.006 |
majesty | +0.006 |
ich | +0.006 |
blo | +0.006 |
Neg logit contributions | |
inn | -0.003 |
dog | -0.003 |
Finn | -0.003 |
le | -0.003 |
him | -0.003 |
Token | aj |
Token ID | 1228 |
Feature activation | -8.01e-02 |
Pos logit contributions | |
yourself | +0.096 |
blo | +0.089 |
yourselves | +0.085 |
sending | +0.084 |
receiver | +0.079 |
Neg logit contributions | |
inn | -0.159 |
eb | -0.144 |
le | -0.142 |
dog | -0.140 |
ah | -0.139 |
Token | amas |
Token ID | 17485 |
Feature activation | -5.20e-03 |
Pos logit contributions | |
yourself | +0.083 |
blo | +0.078 |
yourselves | +0.074 |
majesty | +0.071 |
aj | +0.069 |
Neg logit contributions | |
inn | -0.176 |
eb | -0.170 |
le | -0.166 |
dog | -0.166 |
aster | -0.163 |
Token | from |
Token ID | 422 |
Feature activation | +3.48e-03 |
Pos logit contributions | |
yourself | +0.007 |
majesty | +0.007 |
blo | +0.007 |
yourselves | +0.007 |
ich | +0.006 |
Neg logit contributions | |
inn | -0.009 |
le | -0.009 |
eb | -0.009 |
dog | -0.009 |
ny | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +2.40e-03 |
Pos logit contributions | |
inn | +0.005 |
aster | +0.005 |
him | +0.005 |
le | +0.004 |
dog | +0.004 |
Neg logit contributions | |
yourself | -0.006 |
aj | -0.006 |
majesty | -0.006 |
blo | -0.006 |
ich | -0.006 |
Token | drawer |
Token ID | 33451 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
inn | +0.004 |
dog | +0.004 |
aster | +0.004 |
ny | +0.003 |
him | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
aj | -0.004 |
majesty | -0.004 |
blo | -0.004 |
yourselves | -0.003 |
Token | ." |
Token ID | 526 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
inn | +0.020 |
le | +0.019 |
eb | +0.019 |
dog | +0.018 |
ny | +0.018 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.015 |
yourselves | -0.014 |
majesty | -0.014 |
precious | -0.014 |
Token | They |
Token ID | 1119 |
Feature activation | -9.53e-03 |
Pos logit contributions | |
yourself | +0.010 |
yourselves | +0.009 |
aj | +0.009 |
blo | +0.009 |
majesty | +0.009 |
Neg logit contributions | |
inn | -0.009 |
le | -0.009 |
eb | -0.009 |
aster | -0.008 |
ah | -0.008 |
Token | put |
Token ID | 1234 |
Feature activation | +4.58e-05 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.016 |
aj | +0.015 |
yourselves | +0.015 |
ich | +0.015 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.014 |
le | -0.013 |
eb | -0.013 |
dog | -0.013 |
Token | on |
Token ID | 319 |
Feature activation | -5.77e-03 |
Pos logit contributions | |
inn | +0.000 |
war | +0.000 |
ah | +0.000 |
eb | +0.000 |
omp | +0.000 |
Neg logit contributions | |
yourself | -0.000 |
blo | -0.000 |
yourselves | -0.000 |
most | -0.000 |
precious | -0.000 |
Token | their |
Token ID | 511 |
Feature activation | +7.45e-04 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
window | +0.007 |
aj | +0.007 |
Neg logit contributions | |
inn | -0.012 |
omp | -0.011 |
ah | -0.010 |
hot | -0.010 |
le | -0.010 |
Token | p |
Token ID | 279 |
Feature activation | -6.29e-02 |
Pos logit contributions | |
aster | +0.001 |
dog | +0.001 |
him | +0.001 |
inn | +0.001 |
le | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
inas | -0.001 |
yourselves | -0.001 |
ich | -0.001 |
reetings | -0.001 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.94e-02 |
Pos logit contributions | |
yourself | +0.019 |
blo | +0.017 |
yourselves | +0.012 |
ich | +0.007 |
sending | +0.007 |
Neg logit contributions | |
inn | -0.186 |
eb | -0.179 |
aster | -0.178 |
dog | -0.174 |
ah | -0.174 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
yourself | +0.080 |
blo | +0.076 |
yourselves | +0.070 |
majesty | +0.068 |
aj | +0.066 |
Neg logit contributions | |
inn | -0.176 |
eb | -0.169 |
aster | -0.164 |
le | -0.164 |
dog | -0.164 |
Token | and |
Token ID | 290 |
Feature activation | +2.93e-03 |
Pos logit contributions | |
inn | +0.024 |
aster | +0.023 |
eb | +0.022 |
war | +0.022 |
le | +0.022 |
Neg logit contributions | |
yourself | -0.018 |
window | -0.017 |
aj | -0.017 |
blo | -0.017 |
yourselves | -0.016 |
Token | get |
Token ID | 651 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
inn | +0.004 |
aster | +0.004 |
eb | +0.004 |
le | +0.004 |
dog | +0.004 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.005 |
yourselves | -0.005 |
aj | -0.005 |
majesty | -0.005 |
Token | into |
Token ID | 656 |
Feature activation | -3.61e-02 |
Pos logit contributions | |
yourself | +0.025 |
blo | +0.024 |
aj | +0.024 |
yourselves | +0.024 |
majesty | +0.023 |
Neg logit contributions | |
inn | -0.021 |
aster | -0.020 |
eb | -0.020 |
le | -0.019 |
dog | -0.019 |
Token | their |
Token ID | 511 |
Feature activation | -9.51e-03 |
Pos logit contributions | |
yourself | +0.067 |
blo | +0.064 |
yourselves | +0.063 |
aj | +0.062 |
window | +0.060 |
Neg logit contributions | |
inn | -0.051 |
eb | -0.048 |
ah | -0.046 |
le | -0.046 |
war | -0.046 |
Token | and |
Token ID | 290 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
majesty | +0.036 |
ich | +0.035 |
blo | +0.035 |
endant | +0.035 |
aj | +0.034 |
Neg logit contributions | |
aster | -0.031 |
inn | -0.031 |
le | -0.029 |
him | -0.029 |
dog | -0.028 |
Token | put |
Token ID | 1234 |
Feature activation | +6.02e-04 |
Pos logit contributions | |
ich | +0.023 |
blo | +0.022 |
yourself | +0.022 |
aj | +0.022 |
majesty | +0.022 |
Neg logit contributions | |
aster | -0.017 |
inn | -0.016 |
le | -0.016 |
dog | -0.015 |
him | -0.015 |
Token | on |
Token ID | 319 |
Feature activation | -1.50e-02 |
Pos logit contributions | |
inn | +0.001 |
eb | +0.001 |
aster | +0.001 |
dog | +0.001 |
le | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
yourselves | -0.001 |
aj | -0.001 |
majesty | -0.001 |
Token | your |
Token ID | 534 |
Feature activation | -4.24e-03 |
Pos logit contributions | |
yourself | +0.024 |
blo | +0.023 |
aj | +0.022 |
majesty | +0.022 |
yourselves | +0.022 |
Neg logit contributions | |
inn | -0.024 |
aster | -0.023 |
eb | -0.023 |
le | -0.022 |
dog | -0.022 |
Token | p |
Token ID | 279 |
Feature activation | -6.58e-02 |
Pos logit contributions | |
yourself | +0.007 |
ich | +0.007 |
inas | +0.007 |
blo | +0.007 |
yourselves | +0.007 |
Neg logit contributions | |
inn | -0.006 |
dog | -0.006 |
aster | -0.006 |
Finn | -0.005 |
le | -0.005 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.90e-02 |
Pos logit contributions | |
yourself | +0.024 |
blo | +0.022 |
yourselves | +0.015 |
majesty | +0.012 |
ich | +0.012 |
Neg logit contributions | |
inn | -0.193 |
eb | -0.182 |
aster | -0.181 |
le | -0.179 |
dog | -0.179 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
yourself | +0.077 |
blo | +0.073 |
yourselves | +0.067 |
majesty | +0.066 |
aj | +0.064 |
Neg logit contributions | |
inn | -0.179 |
eb | -0.170 |
aster | -0.167 |
le | -0.167 |
dog | -0.167 |
Token | . |
Token ID | 13 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
inn | +0.018 |
eb | +0.017 |
aster | +0.017 |
le | +0.017 |
dog | +0.017 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.015 |
aj | -0.015 |
yourselves | -0.015 |
majesty | -0.014 |
Token | OK |
Token ID | 7477 |
Feature activation | -7.70e-03 |
Pos logit contributions | |
blo | +0.019 |
yourself | +0.018 |
ich | +0.018 |
aj | +0.018 |
majesty | +0.018 |
Neg logit contributions | |
inn | -0.018 |
aster | -0.017 |
dog | -0.017 |
eb | -0.017 |
hot | -0.016 |
Token | ?" |
Token ID | 1701 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
yourself | +0.008 |
majesty | +0.008 |
blo | +0.008 |
aj | +0.008 |
yourselves | +0.008 |
Neg logit contributions | |
inn | -0.016 |
le | -0.016 |
dog | -0.015 |
aster | -0.015 |
eb | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +2.57e-03 |
Pos logit contributions | |
inn | +0.029 |
eb | +0.027 |
le | +0.027 |
aster | +0.026 |
ah | +0.026 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.020 |
yourselves | -0.019 |
aj | -0.019 |
majesty | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | +6.75e-03 |
Pos logit contributions | |
inn | +0.004 |
le | +0.003 |
aster | +0.003 |
dog | +0.003 |
eb | +0.003 |
Neg logit contributions | |
majesty | -0.003 |
blo | -0.003 |
yourself | -0.003 |
aj | -0.003 |
ich | -0.003 |
Token | get |
Token ID | 651 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
aster | +0.009 |
him | +0.009 |
dog | +0.008 |
le | +0.008 |
inn | +0.008 |
Neg logit contributions | |
ich | -0.012 |
blo | -0.012 |
aj | -0.012 |
endant | -0.011 |
yourself | -0.011 |
Token | into |
Token ID | 656 |
Feature activation | -3.51e-02 |
Pos logit contributions | |
majesty | +0.029 |
ich | +0.028 |
blo | +0.027 |
yourself | +0.027 |
aj | +0.027 |
Neg logit contributions | |
inn | -0.024 |
aster | -0.023 |
him | -0.023 |
le | -0.021 |
dog | -0.021 |
Token | your |
Token ID | 534 |
Feature activation | -5.22e-03 |
Pos logit contributions | |
blo | +0.057 |
yourself | +0.057 |
aj | +0.056 |
majesty | +0.056 |
ich | +0.056 |
Neg logit contributions | |
inn | -0.054 |
aster | -0.052 |
eb | -0.049 |
him | -0.049 |
le | -0.048 |
Token | p |
Token ID | 279 |
Feature activation | -6.93e-02 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
ich | +0.008 |
inas | +0.007 |
Neg logit contributions | |
aster | -0.008 |
dog | -0.008 |
inn | -0.008 |
him | -0.007 |
le | -0.007 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.87e-02 |
Pos logit contributions | |
yourself | +0.025 |
blo | +0.021 |
yourselves | +0.017 |
majesty | +0.012 |
ich | +0.012 |
Neg logit contributions | |
inn | -0.201 |
eb | -0.193 |
aster | -0.192 |
le | -0.189 |
dog | -0.189 |
Token | amas |
Token ID | 17485 |
Feature activation | -3.67e-03 |
Pos logit contributions | |
yourself | +0.084 |
blo | +0.080 |
yourselves | +0.076 |
majesty | +0.073 |
precious | +0.073 |
Neg logit contributions | |
inn | -0.167 |
eb | -0.163 |
dog | -0.158 |
le | -0.157 |
aster | -0.155 |
Token | ." |
Token ID | 526 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.005 |
majesty | +0.005 |
yourselves | +0.004 |
aj | +0.004 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.007 |
le | -0.007 |
dog | -0.007 |
aster | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
inn | +0.038 |
aster | +0.036 |
le | +0.036 |
eb | +0.036 |
ah | +0.035 |
Neg logit contributions | |
yourself | -0.038 |
aj | -0.036 |
blo | -0.035 |
yourselves | -0.035 |
window | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
inn | +0.041 |
aster | +0.040 |
ah | +0.039 |
eb | +0.039 |
le | +0.039 |
Neg logit contributions | |
yourself | -0.020 |
aj | -0.019 |
blo | -0.018 |
yourselves | -0.017 |
window | -0.016 |
Token | So |
Token ID | 2396 |
Feature activation | -4.04e-03 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.014 |
le | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.025 |
blo | -0.023 |
yourselves | -0.023 |
aj | -0.023 |
window | -0.021 |
Token | and |
Token ID | 290 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
majesty | +0.041 |
ich | +0.041 |
endant | +0.039 |
blo | +0.039 |
aj | +0.038 |
Neg logit contributions | |
aster | -0.033 |
him | -0.031 |
le | -0.030 |
inn | -0.030 |
dog | -0.028 |
Token | put |
Token ID | 1234 |
Feature activation | +4.58e-04 |
Pos logit contributions | |
ich | +0.020 |
blo | +0.019 |
aj | +0.019 |
majesty | +0.019 |
endant | +0.019 |
Neg logit contributions | |
aster | -0.014 |
him | -0.013 |
le | -0.013 |
inn | -0.012 |
dog | -0.012 |
Token | on |
Token ID | 319 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
inn | +0.001 |
le | +0.001 |
aster | +0.001 |
eb | +0.001 |
dog | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
aj | -0.001 |
majesty | -0.001 |
ich | -0.001 |
Token | your |
Token ID | 534 |
Feature activation | -4.24e-03 |
Pos logit contributions | |
ich | +0.023 |
majesty | +0.022 |
blo | +0.022 |
yourself | +0.022 |
aj | +0.022 |
Neg logit contributions | |
aster | -0.025 |
inn | -0.025 |
him | -0.024 |
le | -0.023 |
dog | -0.023 |
Token | p |
Token ID | 279 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
yourself | +0.008 |
inas | +0.008 |
ich | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
Neg logit contributions | |
dog | -0.005 |
inn | -0.005 |
Finn | -0.004 |
him | -0.004 |
aster | -0.004 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.81e-02 |
Pos logit contributions | |
yourself | +0.041 |
blo | +0.040 |
sending | +0.034 |
yourselves | +0.031 |
receiver | +0.028 |
Neg logit contributions | |
inn | -0.177 |
eb | -0.165 |
le | -0.157 |
dog | -0.157 |
aster | -0.157 |
Token | amas |
Token ID | 17485 |
Feature activation | +8.73e-03 |
Pos logit contributions | |
yourself | +0.082 |
blo | +0.080 |
yourselves | +0.073 |
majesty | +0.072 |
precious | +0.071 |
Neg logit contributions | |
inn | -0.170 |
eb | -0.162 |
dog | -0.158 |
le | -0.157 |
aster | -0.155 |
Token | ." |
Token ID | 526 |
Feature activation | +9.44e-03 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.014 |
le | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.013 |
yourselves | -0.012 |
aj | -0.012 |
majesty | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +8.28e-03 |
Pos logit contributions | |
inn | +0.014 |
eb | +0.013 |
ah | +0.013 |
aster | +0.013 |
le | +0.012 |
Neg logit contributions | |
yourself | -0.017 |
yourselves | -0.016 |
aj | -0.016 |
blo | -0.016 |
majesty | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -2.62e-04 |
Pos logit contributions | |
inn | +0.016 |
eb | +0.016 |
aster | +0.015 |
ah | +0.015 |
le | +0.015 |
Neg logit contributions | |
yourself | -0.011 |
aj | -0.009 |
yourselves | -0.009 |
blo | -0.009 |
majesty | -0.009 |
Token | Anna |
Token ID | 31160 |
Feature activation | +7.61e-03 |
Pos logit contributions | |
yourself | +0.000 |
blo | +0.000 |
aj | +0.000 |
majesty | +0.000 |
yourselves | +0.000 |
Neg logit contributions | |
inn | -0.000 |
aster | -0.000 |
eb | -0.000 |
le | -0.000 |
dog | -0.000 |
Token | and |
Token ID | 290 |
Feature activation | -9.95e-03 |
Pos logit contributions | |
ich | +0.041 |
majesty | +0.041 |
endant | +0.040 |
aj | +0.039 |
blo | +0.039 |
Neg logit contributions | |
aster | -0.034 |
him | -0.032 |
le | -0.032 |
inn | -0.031 |
dog | -0.029 |
Token | put |
Token ID | 1234 |
Feature activation | +2.08e-03 |
Pos logit contributions | |
ich | +0.019 |
blo | +0.018 |
aj | +0.018 |
majesty | +0.018 |
endant | +0.018 |
Neg logit contributions | |
aster | -0.013 |
him | -0.012 |
le | -0.011 |
inn | -0.011 |
dog | -0.011 |
Token | on |
Token ID | 319 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.003 |
eb | +0.003 |
le | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
aj | -0.004 |
majesty | -0.004 |
ich | -0.004 |
Token | your |
Token ID | 534 |
Feature activation | -4.55e-03 |
Pos logit contributions | |
ich | +0.019 |
blo | +0.019 |
majesty | +0.019 |
yourself | +0.018 |
aj | +0.018 |
Neg logit contributions | |
inn | -0.025 |
aster | -0.025 |
him | -0.024 |
le | -0.023 |
dog | -0.023 |
Token | p |
Token ID | 279 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
yourself | +0.009 |
ich | +0.009 |
inas | +0.009 |
blo | +0.009 |
yourselves | +0.009 |
Neg logit contributions | |
dog | -0.005 |
inn | -0.005 |
Finn | -0.004 |
him | -0.004 |
le | -0.004 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.80e-02 |
Pos logit contributions | |
yourself | +0.043 |
blo | +0.041 |
sending | +0.035 |
yourselves | +0.034 |
receiver | +0.032 |
Neg logit contributions | |
inn | -0.176 |
eb | -0.162 |
aster | -0.156 |
le | -0.155 |
dog | -0.155 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
yourself | +0.084 |
blo | +0.082 |
yourselves | +0.075 |
majesty | +0.073 |
precious | +0.073 |
Neg logit contributions | |
inn | -0.168 |
eb | -0.160 |
dog | -0.155 |
le | -0.155 |
aster | -0.151 |
Token | ." |
Token ID | 526 |
Feature activation | +8.99e-03 |
Pos logit contributions | |
inn | +0.018 |
eb | +0.016 |
aster | +0.016 |
le | +0.016 |
dog | +0.016 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.015 |
yourselves | -0.014 |
aj | -0.014 |
majesty | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | +6.09e-03 |
Pos logit contributions | |
inn | +0.013 |
eb | +0.012 |
aster | +0.012 |
dog | +0.012 |
le | +0.011 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.016 |
aj | -0.015 |
yourselves | -0.015 |
majesty | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -2.30e-03 |
Pos logit contributions | |
inn | +0.010 |
eb | +0.010 |
aster | +0.010 |
le | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.009 |
aj | -0.009 |
yourselves | -0.009 |
majesty | -0.009 |
Token | L |
Token ID | 43 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
blo | +0.005 |
majesty | +0.005 |
ich | +0.004 |
aj | +0.004 |
endant | +0.004 |
Neg logit contributions | |
inn | -0.003 |
aster | -0.003 |
ny | -0.003 |
hot | -0.002 |
war | -0.002 |
Token | I |
Token ID | 40 |
Feature activation | +8.07e-03 |
Pos logit contributions | |
yourself | +0.022 |
blo | +0.021 |
majesty | +0.021 |
aj | +0.021 |
yourselves | +0.020 |
Neg logit contributions | |
inn | -0.027 |
aster | -0.025 |
eb | -0.025 |
dog | -0.025 |
le | -0.024 |
Token | love |
Token ID | 1842 |
Feature activation | -3.52e-03 |
Pos logit contributions | |
inn | +0.013 |
le | +0.012 |
aster | +0.012 |
ah | +0.012 |
dog | +0.012 |
Neg logit contributions | |
yourself | -0.014 |
yourselves | -0.014 |
ich | -0.013 |
blo | -0.013 |
aj | -0.012 |
Token | my |
Token ID | 616 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
yourself | +0.005 |
aj | +0.004 |
ich | +0.004 |
majesty | +0.004 |
blo | +0.004 |
Neg logit contributions | |
him | -0.007 |
aster | -0.006 |
dog | -0.006 |
inn | -0.006 |
eb | -0.006 |
Token | new |
Token ID | 649 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
yourself | +0.019 |
yourselves | +0.018 |
ich | +0.016 |
reetings | +0.016 |
Nothing | +0.015 |
Neg logit contributions | |
dog | -0.019 |
him | -0.018 |
aster | -0.017 |
le | -0.017 |
Bob | -0.017 |
Token | p |
Token ID | 279 |
Feature activation | -6.49e-02 |
Pos logit contributions | |
yourself | +0.028 |
yourselves | +0.027 |
ich | +0.025 |
endant | +0.024 |
aj | +0.024 |
Neg logit contributions | |
dog | -0.025 |
ah | -0.022 |
him | -0.022 |
inn | -0.022 |
le | -0.022 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.79e-02 |
Pos logit contributions | |
yourself | +0.054 |
yourselves | +0.047 |
blo | +0.045 |
sending | +0.043 |
receiver | +0.039 |
Neg logit contributions | |
inn | -0.160 |
eb | -0.152 |
ah | -0.149 |
dog | -0.148 |
le | -0.146 |
Token | amas |
Token ID | 17485 |
Feature activation | -6.10e-04 |
Pos logit contributions | |
yourself | +0.094 |
blo | +0.088 |
yourselves | +0.088 |
precious | +0.087 |
majesty | +0.081 |
Neg logit contributions | |
inn | -0.153 |
eb | -0.152 |
dog | -0.148 |
le | -0.146 |
aster | -0.139 |
Token | ," |
Token ID | 553 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
yourselves | +0.001 |
majesty | +0.001 |
aj | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
le | -0.001 |
dog | -0.001 |
aster | -0.001 |
Token | said |
Token ID | 531 |
Feature activation | +1.01e-03 |
Pos logit contributions | |
inn | +0.019 |
aster | +0.018 |
eb | +0.018 |
dog | +0.017 |
le | +0.017 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.020 |
aj | -0.019 |
yourselves | -0.019 |
majesty | -0.019 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
inn | +0.002 |
war | +0.002 |
ah | +0.002 |
eb | +0.002 |
le | +0.002 |
Neg logit contributions | |
yourself | -0.001 |
hugging | -0.001 |
blo | -0.001 |
grandmother | -0.001 |
aj | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
yourself | +0.025 |
blo | +0.024 |
yourselves | +0.023 |
aj | +0.023 |
majesty | +0.022 |
Neg logit contributions | |
inn | -0.022 |
eb | -0.020 |
aster | -0.020 |
le | -0.020 |
dog | -0.020 |
Token | Mia |
Token ID | 32189 |
Feature activation | -1.31e-03 |
Pos logit contributions | |
yourself | +0.052 |
yourselves | +0.049 |
blo | +0.049 |
majesty | +0.047 |
aj | +0.047 |
Neg logit contributions | |
inn | -0.036 |
eb | -0.033 |
aster | -0.032 |
war | -0.032 |
dog | -0.031 |
Token | . |
Token ID | 13 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
aj | +0.002 |
yourselves | +0.002 |
majesty | +0.002 |
Neg logit contributions | |
inn | -0.002 |
eb | -0.002 |
aster | -0.002 |
le | -0.002 |
dog | -0.002 |
Token | That |
Token ID | 1320 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
yourself | +0.018 |
blo | +0.018 |
aj | +0.017 |
yourselves | +0.017 |
majesty | +0.017 |
Neg logit contributions | |
inn | -0.015 |
eb | -0.014 |
aster | -0.014 |
le | -0.014 |
dog | -0.014 |
Token | 's |
Token ID | 338 |
Feature activation | -4.69e-03 |
Pos logit contributions | |
aj | +0.030 |
yourself | +0.029 |
majesty | +0.028 |
yourselves | +0.028 |
blo | +0.027 |
Neg logit contributions | |
le | -0.028 |
ah | -0.028 |
dog | -0.028 |
eb | -0.028 |
ny | -0.027 |
Token | how |
Token ID | 703 |
Feature activation | -3.89e-03 |
Pos logit contributions | |
aj | +0.006 |
majesty | +0.006 |
blo | +0.006 |
yourself | +0.006 |
window | +0.006 |
Neg logit contributions | |
inn | -0.009 |
aster | -0.008 |
le | -0.008 |
him | -0.008 |
dog | -0.008 |
Token | pand |
Token ID | 19798 |
Feature activation | -7.78e-02 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.004 |
aj | +0.004 |
majesty | +0.004 |
yourselves | +0.004 |
Neg logit contributions | |
inn | -0.008 |
aster | -0.007 |
eb | -0.007 |
le | -0.007 |
dog | -0.007 |
Token | as |
Token ID | 292 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
yourself | +0.107 |
blo | +0.101 |
aj | +0.097 |
yourselves | +0.097 |
majesty | +0.097 |
Neg logit contributions | |
inn | -0.146 |
eb | -0.136 |
le | -0.135 |
aster | -0.133 |
dog | -0.131 |
Token | communicate |
Token ID | 10996 |
Feature activation | +3.46e-03 |
Pos logit contributions | |
aj | +0.031 |
yourself | +0.030 |
majesty | +0.029 |
blo | +0.029 |
yourselves | +0.028 |
Neg logit contributions | |
le | -0.027 |
inn | -0.027 |
him | -0.026 |
eb | -0.026 |
aster | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | -8.83e-03 |
Pos logit contributions | |
le | +0.004 |
him | +0.004 |
dog | +0.004 |
inn | +0.004 |
hot | +0.004 |
Neg logit contributions | |
aj | -0.007 |
majesty | -0.007 |
ich | -0.007 |
blo | -0.007 |
window | -0.006 |
Token | They |
Token ID | 1119 |
Feature activation | -7.85e-03 |
Pos logit contributions | |
blo | +0.016 |
yourself | +0.015 |
aj | +0.015 |
ich | +0.015 |
window | +0.015 |
Neg logit contributions | |
inn | -0.012 |
eb | -0.011 |
dog | -0.011 |
aster | -0.011 |
hot | -0.011 |
Token | make |
Token ID | 787 |
Feature activation | -1.99e-05 |
Pos logit contributions | |
aj | +0.015 |
yourself | +0.014 |
ich | +0.014 |
yourselves | +0.014 |
majesty | +0.014 |
Neg logit contributions | |
le | -0.010 |
him | -0.010 |
dog | -0.009 |
ny | -0.009 |
ah | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
inn | +0.022 |
eb | +0.022 |
aster | +0.021 |
dog | +0.020 |
war | +0.020 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.018 |
aj | -0.017 |
yourselves | -0.017 |
window | -0.017 |
Token | put |
Token ID | 1234 |
Feature activation | +9.70e-03 |
Pos logit contributions | |
aster | +0.020 |
inn | +0.019 |
dog | +0.018 |
le | +0.018 |
him | +0.018 |
Neg logit contributions | |
yourself | -0.024 |
blo | -0.024 |
ich | -0.023 |
aj | -0.023 |
yourselves | -0.023 |
Token | on |
Token ID | 319 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
inn | +0.016 |
eb | +0.015 |
omp | +0.015 |
ah | +0.015 |
war | +0.015 |
Neg logit contributions | |
yourself | -0.016 |
yourselves | -0.014 |
blo | -0.014 |
precious | -0.013 |
most | -0.013 |
Token | their |
Token ID | 511 |
Feature activation | +3.93e-03 |
Pos logit contributions | |
yourself | +0.007 |
yourselves | +0.007 |
blo | +0.007 |
aj | +0.006 |
window | +0.006 |
Neg logit contributions | |
inn | -0.008 |
eb | -0.007 |
ah | -0.007 |
ny | -0.007 |
le | -0.007 |
Token | p |
Token ID | 279 |
Feature activation | -6.17e-02 |
Pos logit contributions | |
dog | +0.006 |
aster | +0.006 |
inn | +0.006 |
le | +0.006 |
him | +0.005 |
Neg logit contributions | |
yourself | -0.007 |
blo | -0.006 |
ich | -0.006 |
yourselves | -0.006 |
inas | -0.006 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.77e-02 |
Pos logit contributions | |
yourself | +0.022 |
blo | +0.020 |
yourselves | +0.014 |
ich | +0.010 |
sending | +0.009 |
Neg logit contributions | |
inn | -0.181 |
eb | -0.172 |
aster | -0.171 |
le | -0.169 |
dog | -0.168 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
yourself | +0.081 |
blo | +0.077 |
yourselves | +0.072 |
majesty | +0.070 |
ich | +0.069 |
Neg logit contributions | |
inn | -0.170 |
eb | -0.162 |
le | -0.159 |
dog | -0.159 |
aster | -0.158 |
Token | first |
Token ID | 717 |
Feature activation | +4.43e-03 |
Pos logit contributions | |
inn | +0.018 |
aster | +0.018 |
eb | +0.018 |
omp | +0.017 |
war | +0.017 |
Neg logit contributions | |
yourself | -0.014 |
aj | -0.014 |
blo | -0.014 |
window | -0.013 |
yourselves | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | +3.65e-03 |
Pos logit contributions | |
inn | +0.006 |
le | +0.005 |
aster | +0.005 |
dog | +0.005 |
eb | +0.005 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.008 |
ich | -0.008 |
yourselves | -0.008 |
majesty | -0.008 |
Token | They |
Token ID | 1119 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
inn | +0.005 |
le | +0.005 |
eb | +0.004 |
aster | +0.004 |
ah | +0.004 |
Neg logit contributions | |
yourself | -0.007 |
blo | -0.007 |
yourselves | -0.007 |
aj | -0.007 |
window | -0.007 |
Token | do |
Token ID | 466 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
yourself | +0.009 |
blo | +0.008 |
aj | +0.008 |
window | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
inn | -0.010 |
eb | -0.009 |
war | -0.009 |
aster | -0.009 |
dog | -0.009 |
Token | was |
Token ID | 373 |
Feature activation | +4.32e-03 |
Pos logit contributions | |
yourself | +0.018 |
blo | +0.017 |
aj | +0.016 |
yourselves | +0.016 |
majesty | +0.016 |
Neg logit contributions | |
inn | -0.026 |
eb | -0.025 |
aster | -0.025 |
le | -0.024 |
dog | -0.024 |
Token | still |
Token ID | 991 |
Feature activation | +2.57e-03 |
Pos logit contributions | |
inn | +0.008 |
aster | +0.007 |
le | +0.007 |
dog | +0.007 |
eb | +0.007 |
Neg logit contributions | |
aj | -0.006 |
yourself | -0.006 |
majesty | -0.006 |
yourselves | -0.006 |
blo | -0.006 |
Token | wearing |
Token ID | 5762 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
inn | +0.004 |
aster | +0.004 |
Jim | +0.004 |
him | +0.004 |
dog | +0.004 |
Neg logit contributions | |
majesty | -0.004 |
aj | -0.004 |
yourself | -0.004 |
yourselves | -0.004 |
blo | -0.003 |
Token | her |
Token ID | 607 |
Feature activation | -6.04e-03 |
Pos logit contributions | |
yourself | +0.030 |
blo | +0.028 |
aj | +0.028 |
yourselves | +0.028 |
majesty | +0.028 |
Neg logit contributions | |
inn | -0.022 |
aster | -0.020 |
eb | -0.020 |
le | -0.019 |
dog | -0.019 |
Token | p |
Token ID | 279 |
Feature activation | -6.78e-02 |
Pos logit contributions | |
yourselves | +0.009 |
yourself | +0.009 |
inas | +0.008 |
majesty | +0.008 |
ich | +0.008 |
Neg logit contributions | |
inn | -0.009 |
dog | -0.009 |
aster | -0.009 |
ah | -0.009 |
le | -0.009 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.73e-02 |
Pos logit contributions | |
yourself | +0.047 |
yourselves | +0.041 |
blo | +0.039 |
sending | +0.038 |
receiver | +0.033 |
Neg logit contributions | |
inn | -0.177 |
eb | -0.166 |
ah | -0.162 |
dog | -0.159 |
war | -0.159 |
Token | amas |
Token ID | 17485 |
Feature activation | +3.08e-03 |
Pos logit contributions | |
yourself | +0.082 |
blo | +0.076 |
yourselves | +0.075 |
majesty | +0.073 |
precious | +0.069 |
Neg logit contributions | |
inn | -0.167 |
eb | -0.160 |
le | -0.156 |
dog | -0.156 |
aster | -0.152 |
Token | . |
Token ID | 13 |
Feature activation | -1.13e-05 |
Pos logit contributions | |
inn | +0.005 |
aster | +0.005 |
eb | +0.005 |
war | +0.005 |
dog | +0.005 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.004 |
aj | -0.004 |
window | -0.004 |
yourselves | -0.004 |
Token | |
Token ID | 220 |
Feature activation | -2.69e-02 |
Pos logit contributions | |
yourself | +0.000 |
blo | +0.000 |
yourselves | +0.000 |
ich | +0.000 |
aj | +0.000 |
Neg logit contributions | |
inn | -0.000 |
eb | -0.000 |
aster | -0.000 |
dog | -0.000 |
war | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +9.24e-03 |
Pos logit contributions | |
yourself | +0.048 |
blo | +0.048 |
majesty | +0.046 |
yourselves | +0.045 |
aj | +0.045 |
Neg logit contributions | |
inn | -0.039 |
eb | -0.035 |
him | -0.034 |
aster | -0.034 |
war | -0.033 |
Token |
|
Token ID | 198 |
Feature activation | +1.69e-03 |
Pos logit contributions | |
inn | +0.016 |
eb | +0.015 |
aster | +0.015 |
le | +0.015 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
aj | -0.013 |
yourselves | -0.013 |
majesty | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +9.29e-03 |
Pos logit contributions | |
inn | +0.031 |
eb | +0.029 |
aster | +0.028 |
war | +0.028 |
ah | +0.028 |
Neg logit contributions | |
blo | -0.020 |
yourself | -0.020 |
window | -0.019 |
aj | -0.017 |
hugging | -0.017 |
Token | put |
Token ID | 1234 |
Feature activation | +8.43e-03 |
Pos logit contributions | |
inn | +0.013 |
aster | +0.013 |
le | +0.013 |
dog | +0.013 |
eb | +0.013 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.015 |
aj | -0.015 |
yourselves | -0.015 |
ich | -0.015 |
Token | on |
Token ID | 319 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
inn | +0.014 |
eb | +0.014 |
omp | +0.013 |
war | +0.013 |
ah | +0.013 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.012 |
yourselves | -0.012 |
most | -0.011 |
window | -0.011 |
Token | their |
Token ID | 511 |
Feature activation | +6.14e-03 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.005 |
yourselves | +0.005 |
window | +0.004 |
living | +0.004 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.006 |
hot | -0.006 |
ah | -0.006 |
omp | -0.006 |
Token | p |
Token ID | 279 |
Feature activation | -6.17e-02 |
Pos logit contributions | |
dog | +0.009 |
aster | +0.009 |
inn | +0.009 |
le | +0.009 |
him | +0.008 |
Neg logit contributions | |
yourself | -0.011 |
yourselves | -0.010 |
blo | -0.010 |
ich | -0.010 |
inas | -0.009 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.67e-02 |
Pos logit contributions | |
yourself | +0.023 |
blo | +0.020 |
yourselves | +0.015 |
sending | +0.010 |
ich | +0.010 |
Neg logit contributions | |
inn | -0.179 |
eb | -0.172 |
aster | -0.169 |
le | -0.168 |
dog | -0.167 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
yourself | +0.079 |
blo | +0.073 |
yourselves | +0.069 |
majesty | +0.067 |
ich | +0.065 |
Neg logit contributions | |
inn | -0.169 |
eb | -0.162 |
le | -0.158 |
dog | -0.158 |
aster | -0.158 |
Token | . |
Token ID | 13 |
Feature activation | -1.51e-03 |
Pos logit contributions | |
inn | +0.025 |
aster | +0.024 |
eb | +0.023 |
omp | +0.023 |
war | +0.023 |
Neg logit contributions | |
window | -0.015 |
blo | -0.014 |
yourself | -0.014 |
aj | -0.014 |
living | -0.012 |
Token | They |
Token ID | 1119 |
Feature activation | -7.79e-03 |
Pos logit contributions | |
yourself | +0.003 |
aj | +0.002 |
yourselves | +0.002 |
majesty | +0.002 |
window | +0.002 |
Neg logit contributions | |
inn | -0.002 |
eb | -0.002 |
ah | -0.002 |
le | -0.002 |
aster | -0.002 |
Token | hug |
Token ID | 16225 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
yourself | +0.013 |
blo | +0.013 |
aj | +0.012 |
yourselves | +0.012 |
majesty | +0.012 |
Neg logit contributions | |
inn | -0.012 |
aster | -0.011 |
eb | -0.011 |
le | -0.011 |
dog | -0.011 |
Token | their |
Token ID | 511 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
yourself | +0.034 |
yourselves | +0.032 |
window | +0.030 |
blo | +0.030 |
sisters | +0.030 |
Neg logit contributions | |
inn | -0.037 |
war | -0.031 |
eb | -0.030 |
olt | -0.030 |
omp | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
inn | +0.030 |
eb | +0.028 |
aster | +0.028 |
war | +0.027 |
ah | +0.026 |
Neg logit contributions | |
yourself | -0.023 |
blo | -0.022 |
window | -0.021 |
aj | -0.020 |
yourselves | -0.020 |
Token | put |
Token ID | 1234 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
inn | +0.020 |
eb | +0.018 |
aster | +0.018 |
le | +0.018 |
dog | +0.017 |
Neg logit contributions | |
yourself | -0.023 |
blo | -0.022 |
aj | -0.022 |
yourselves | -0.022 |
majesty | -0.021 |
Token | on |
Token ID | 319 |
Feature activation | -5.62e-03 |
Pos logit contributions | |
inn | +0.015 |
war | +0.015 |
omp | +0.015 |
olt | +0.015 |
eb | +0.014 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.016 |
yourselves | -0.015 |
most | -0.015 |
precious | -0.015 |
Token | their |
Token ID | 511 |
Feature activation | +5.47e-03 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
window | +0.007 |
precious | +0.007 |
Neg logit contributions | |
inn | -0.011 |
hot | -0.010 |
omp | -0.010 |
olt | -0.010 |
war | -0.010 |
Token | p |
Token ID | 279 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
inn | +0.007 |
aster | +0.007 |
dog | +0.007 |
eb | +0.007 |
le | +0.006 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.010 |
yourselves | -0.010 |
aj | -0.010 |
ich | -0.010 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
yourself | +0.007 |
aj | +0.006 |
blo | +0.001 |
majesty | +0.001 |
yourselves | -0.000 |
Neg logit contributions | |
inn | -0.183 |
aster | -0.177 |
le | -0.176 |
eb | -0.176 |
dog | -0.174 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
yourself | +0.070 |
blo | +0.064 |
aj | +0.061 |
yourselves | +0.060 |
majesty | +0.058 |
Neg logit contributions | |
inn | -0.180 |
eb | -0.171 |
aster | -0.170 |
le | -0.168 |
dog | -0.167 |
Token | . |
Token ID | 13 |
Feature activation | +2.86e-04 |
Pos logit contributions | |
inn | +0.028 |
aster | +0.027 |
omp | +0.026 |
eb | +0.026 |
war | +0.026 |
Neg logit contributions | |
window | -0.017 |
yourself | -0.017 |
aj | -0.017 |
blo | -0.016 |
yourselves | -0.015 |
Token | They |
Token ID | 1119 |
Feature activation | -5.04e-03 |
Pos logit contributions | |
inn | +0.000 |
eb | +0.000 |
aster | +0.000 |
le | +0.000 |
dog | +0.000 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
aj | -0.001 |
yourselves | -0.001 |
majesty | -0.000 |
Token | hug |
Token ID | 16225 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
aj | +0.007 |
majesty | +0.007 |
yourselves | +0.007 |
Neg logit contributions | |
inn | -0.008 |
eb | -0.008 |
aster | -0.008 |
le | -0.007 |
war | -0.007 |
Token | their |
Token ID | 511 |
Feature activation | +4.99e-03 |
Pos logit contributions | |
yourself | +0.035 |
yourselves | +0.033 |
blo | +0.031 |
window | +0.030 |
hugging | +0.029 |
Neg logit contributions | |
inn | -0.033 |
war | -0.029 |
omp | -0.028 |
ah | -0.027 |
olt | -0.027 |
Token | let |
Token ID | 1309 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
yourself | +0.029 |
blo | +0.027 |
yourselves | +0.026 |
aj | +0.026 |
majesty | +0.025 |
Neg logit contributions | |
inn | -0.040 |
eb | -0.037 |
aster | -0.037 |
le | -0.036 |
dog | -0.036 |
Token | 's |
Token ID | 338 |
Feature activation | -2.05e-03 |
Pos logit contributions | |
inn | +0.071 |
aster | +0.062 |
ah | +0.062 |
dog | +0.062 |
eb | +0.061 |
Neg logit contributions | |
yourself | -0.038 |
yourselves | -0.032 |
blo | -0.031 |
aj | -0.030 |
window | -0.030 |
Token | go |
Token ID | 467 |
Feature activation | -1.71e-03 |
Pos logit contributions | |
yourself | +0.004 |
aj | +0.004 |
blo | +0.004 |
majesty | +0.004 |
ich | +0.004 |
Neg logit contributions | |
inn | -0.003 |
aster | -0.002 |
le | -0.002 |
eb | -0.002 |
dog | -0.002 |
Token | get |
Token ID | 651 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
aj | +0.003 |
majesty | +0.003 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.002 |
aster | -0.002 |
le | -0.002 |
dog | -0.002 |
Token | your |
Token ID | 534 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
majesty | +0.005 |
ich | +0.005 |
aj | +0.005 |
yourself | +0.005 |
blo | +0.005 |
Neg logit contributions | |
him | -0.003 |
inn | -0.003 |
aster | -0.003 |
le | -0.003 |
dog | -0.003 |
Token | p |
Token ID | 279 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
yourself | +0.006 |
yourselves | +0.006 |
majesty | +0.006 |
ich | +0.006 |
blo | +0.006 |
Neg logit contributions | |
inn | -0.003 |
dog | -0.003 |
Finn | -0.003 |
le | -0.003 |
him | -0.003 |
Token | aj |
Token ID | 1228 |
Feature activation | -8.01e-02 |
Pos logit contributions | |
yourself | +0.096 |
blo | +0.089 |
yourselves | +0.085 |
sending | +0.084 |
receiver | +0.079 |
Neg logit contributions | |
inn | -0.159 |
eb | -0.144 |
le | -0.142 |
dog | -0.140 |
ah | -0.139 |
Token | amas |
Token ID | 17485 |
Feature activation | -5.20e-03 |
Pos logit contributions | |
yourself | +0.083 |
blo | +0.078 |
yourselves | +0.074 |
majesty | +0.071 |
aj | +0.069 |
Neg logit contributions | |
inn | -0.176 |
eb | -0.170 |
le | -0.166 |
dog | -0.166 |
aster | -0.163 |
Token | from |
Token ID | 422 |
Feature activation | +3.48e-03 |
Pos logit contributions | |
yourself | +0.007 |
majesty | +0.007 |
blo | +0.007 |
yourselves | +0.007 |
ich | +0.006 |
Neg logit contributions | |
inn | -0.009 |
le | -0.009 |
eb | -0.009 |
dog | -0.009 |
ny | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +2.40e-03 |
Pos logit contributions | |
inn | +0.005 |
aster | +0.005 |
him | +0.005 |
le | +0.004 |
dog | +0.004 |
Neg logit contributions | |
yourself | -0.006 |
aj | -0.006 |
majesty | -0.006 |
blo | -0.006 |
ich | -0.006 |
Token | drawer |
Token ID | 33451 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
inn | +0.004 |
dog | +0.004 |
aster | +0.004 |
ny | +0.003 |
him | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
aj | -0.004 |
majesty | -0.004 |
blo | -0.004 |
yourselves | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +9.68e-03 |
Pos logit contributions | |
inn | +0.035 |
eb | +0.034 |
aster | +0.032 |
omp | +0.032 |
ah | +0.032 |
Neg logit contributions | |
yourself | -0.026 |
blo | -0.025 |
window | -0.024 |
aj | -0.023 |
yourselves | -0.022 |
Token | put |
Token ID | 1234 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
inn | +0.015 |
aster | +0.015 |
le | +0.014 |
dog | +0.014 |
eb | +0.014 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.015 |
yourselves | -0.015 |
aj | -0.015 |
ich | -0.015 |
Token | on |
Token ID | 319 |
Feature activation | -7.80e-04 |
Pos logit contributions | |
inn | +0.023 |
eb | +0.021 |
war | +0.021 |
omp | +0.021 |
ah | +0.021 |
Neg logit contributions | |
yourself | -0.023 |
blo | -0.021 |
yourselves | -0.021 |
most | -0.020 |
precious | -0.020 |
Token | their |
Token ID | 511 |
Feature activation | +3.86e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
yourselves | +0.001 |
window | +0.001 |
precious | +0.001 |
Neg logit contributions | |
inn | -0.002 |
omp | -0.001 |
hot | -0.001 |
eb | -0.001 |
ny | -0.001 |
Token | p |
Token ID | 279 |
Feature activation | -6.33e-02 |
Pos logit contributions | |
aster | +0.006 |
dog | +0.005 |
inn | +0.005 |
him | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.007 |
inas | -0.006 |
yourselves | -0.006 |
ich | -0.006 |
aj | -0.006 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.62e-02 |
Pos logit contributions | |
yourself | +0.042 |
blo | +0.037 |
yourselves | +0.033 |
sending | +0.029 |
receiver | +0.028 |
Neg logit contributions | |
inn | -0.166 |
eb | -0.158 |
aster | -0.157 |
ah | -0.152 |
dog | -0.152 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
yourself | +0.080 |
blo | +0.076 |
yourselves | +0.071 |
majesty | +0.069 |
precious | +0.068 |
Neg logit contributions | |
inn | -0.164 |
eb | -0.159 |
le | -0.154 |
dog | -0.153 |
aster | -0.152 |
Token | . |
Token ID | 13 |
Feature activation | +4.29e-03 |
Pos logit contributions | |
inn | +0.032 |
aster | +0.030 |
eb | +0.030 |
omp | +0.029 |
war | +0.029 |
Neg logit contributions | |
yourself | -0.024 |
blo | -0.024 |
aj | -0.023 |
window | -0.023 |
yourselves | -0.022 |
Token | They |
Token ID | 1119 |
Feature activation | -1.56e-03 |
Pos logit contributions | |
inn | +0.006 |
eb | +0.006 |
aster | +0.006 |
le | +0.006 |
dog | +0.006 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.007 |
aj | -0.007 |
yourselves | -0.007 |
majesty | -0.007 |
Token | said |
Token ID | 531 |
Feature activation | -9.02e-03 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
yourselves | +0.002 |
aj | +0.002 |
majesty | +0.002 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.003 |
aster | -0.003 |
le | -0.002 |
dog | -0.002 |
Token | good |
Token ID | 922 |
Feature activation | +9.70e-03 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.015 |
aj | +0.015 |
yourselves | +0.015 |
majesty | +0.015 |
Neg logit contributions | |
inn | -0.014 |
eb | -0.013 |
aster | -0.012 |
le | -0.012 |
dog | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +9.71e-03 |
Pos logit contributions | |
inn | +0.047 |
eb | +0.043 |
aster | +0.043 |
omp | +0.042 |
ah | +0.042 |
Neg logit contributions | |
blo | -0.030 |
yourself | -0.030 |
window | -0.029 |
aj | -0.028 |
precious | -0.026 |
Token | put |
Token ID | 1234 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
inn | +0.015 |
aster | +0.015 |
le | +0.015 |
dog | +0.015 |
eb | +0.015 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.014 |
yourselves | -0.014 |
ich | -0.014 |
aj | -0.014 |
Token | on |
Token ID | 319 |
Feature activation | +6.69e-04 |
Pos logit contributions | |
inn | +0.025 |
war | +0.023 |
eb | +0.022 |
ah | +0.022 |
Jim | +0.022 |
Neg logit contributions | |
yourself | -0.031 |
blo | -0.030 |
yourselves | -0.030 |
precious | -0.028 |
window | -0.028 |
Token | their |
Token ID | 511 |
Feature activation | +3.45e-03 |
Pos logit contributions | |
inn | +0.001 |
hot | +0.001 |
omp | +0.001 |
olt | +0.001 |
ah | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
yourselves | -0.001 |
blo | -0.001 |
window | -0.001 |
aj | -0.001 |
Token | p |
Token ID | 279 |
Feature activation | -5.94e-02 |
Pos logit contributions | |
dog | +0.006 |
aster | +0.005 |
inn | +0.005 |
him | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.005 |
ich | -0.005 |
blo | -0.005 |
inas | -0.005 |
yourselves | -0.005 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.59e-02 |
Pos logit contributions | |
yourself | +0.031 |
blo | +0.028 |
yourselves | +0.022 |
sending | +0.021 |
ich | +0.018 |
Neg logit contributions | |
inn | -0.166 |
eb | -0.157 |
aster | -0.154 |
ah | -0.153 |
dog | -0.152 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
yourself | +0.087 |
blo | +0.083 |
yourselves | +0.077 |
precious | +0.076 |
majesty | +0.075 |
Neg logit contributions | |
inn | -0.157 |
eb | -0.151 |
le | -0.147 |
dog | -0.147 |
aster | -0.143 |
Token | . |
Token ID | 13 |
Feature activation | -8.18e-04 |
Pos logit contributions | |
inn | +0.030 |
aster | +0.028 |
eb | +0.027 |
war | +0.027 |
omp | +0.027 |
Neg logit contributions | |
yourself | -0.022 |
blo | -0.021 |
aj | -0.021 |
window | -0.021 |
yourselves | -0.019 |
Token | They |
Token ID | 1119 |
Feature activation | -1.87e-03 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
ich | +0.002 |
majesty | +0.002 |
yourselves | +0.002 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
aster | -0.001 |
dog | -0.001 |
him | -0.001 |
Token | climbed |
Token ID | 19952 |
Feature activation | -2.71e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
aj | +0.003 |
majesty | +0.002 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.003 |
aster | -0.003 |
le | -0.003 |
dog | -0.003 |
Token | into |
Token ID | 656 |
Feature activation | -3.06e-02 |
Pos logit contributions | |
blo | +0.004 |
yourself | +0.004 |
window | +0.004 |
aj | +0.004 |
yourselves | +0.004 |
Neg logit contributions | |
inn | -0.005 |
aster | -0.005 |
eb | -0.005 |
war | -0.004 |
dog | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
inn | +0.014 |
eb | +0.013 |
aster | +0.013 |
dog | +0.013 |
le | +0.013 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
aj | -0.013 |
yourselves | -0.012 |
window | -0.012 |
Token | put |
Token ID | 1234 |
Feature activation | +6.62e-03 |
Pos logit contributions | |
aster | +0.018 |
inn | +0.017 |
dog | +0.017 |
le | +0.017 |
eb | +0.016 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.020 |
ich | -0.020 |
aj | -0.020 |
yourselves | -0.020 |
Token | on |
Token ID | 319 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
inn | +0.010 |
aster | +0.009 |
eb | +0.009 |
war | +0.009 |
ah | +0.009 |
Neg logit contributions | |
blo | -0.012 |
yourself | -0.011 |
yourselves | -0.011 |
precious | -0.010 |
window | -0.010 |
Token | their |
Token ID | 511 |
Feature activation | +3.05e-03 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
yourselves | +0.004 |
window | +0.004 |
aj | +0.004 |
Neg logit contributions | |
inn | -0.005 |
ah | -0.005 |
war | -0.005 |
hot | -0.005 |
omp | -0.005 |
Token | p |
Token ID | 279 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
him | +0.004 |
inn | +0.004 |
dog | +0.004 |
ny | +0.004 |
aster | +0.004 |
Neg logit contributions | |
yourself | -0.005 |
ich | -0.005 |
yourselves | -0.005 |
inas | -0.005 |
Nothing | -0.005 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.57e-02 |
Pos logit contributions | |
yourself | +0.060 |
blo | +0.054 |
yourselves | +0.052 |
sending | +0.052 |
hugging | +0.048 |
Neg logit contributions | |
inn | -0.143 |
eb | -0.134 |
ah | -0.127 |
aster | -0.125 |
le | -0.125 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
yourself | +0.082 |
blo | +0.076 |
yourselves | +0.074 |
precious | +0.070 |
majesty | +0.070 |
Neg logit contributions | |
inn | -0.162 |
eb | -0.156 |
dog | -0.151 |
le | -0.150 |
aster | -0.148 |
Token | . |
Token ID | 13 |
Feature activation | -4.70e-03 |
Pos logit contributions | |
inn | +0.021 |
aster | +0.021 |
eb | +0.020 |
omp | +0.020 |
war | +0.020 |
Neg logit contributions | |
window | -0.014 |
blo | -0.014 |
yourself | -0.013 |
aj | -0.013 |
ich | -0.012 |
Token | They |
Token ID | 1119 |
Feature activation | -9.62e-03 |
Pos logit contributions | |
yourself | +0.007 |
yourselves | +0.007 |
aj | +0.007 |
window | +0.007 |
majesty | +0.007 |
Neg logit contributions | |
ah | -0.008 |
le | -0.008 |
inn | -0.007 |
aster | -0.007 |
eb | -0.007 |
Token | each |
Token ID | 1123 |
Feature activation | +6.37e-03 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.016 |
aj | +0.015 |
yourselves | +0.015 |
majesty | +0.015 |
Neg logit contributions | |
inn | -0.015 |
eb | -0.014 |
aster | -0.014 |
dog | -0.013 |
le | -0.013 |
Token | pick |
Token ID | 2298 |
Feature activation | -4.72e-03 |
Pos logit contributions | |
inn | +0.011 |
eb | +0.010 |
aster | +0.010 |
le | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.009 |
aj | -0.009 |
majesty | -0.009 |
window | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
inn | +0.000 |
aster | +0.000 |
le | +0.000 |
dog | +0.000 |
eb | +0.000 |
Neg logit contributions | |
blo | -0.001 |
yourself | -0.001 |
aj | -0.001 |
ich | -0.001 |
yourselves | -0.001 |
Token | you |
Token ID | 345 |
Feature activation | +6.23e-03 |
Pos logit contributions | |
yourself | +0.014 |
aj | +0.013 |
blo | +0.013 |
yourselves | +0.012 |
majesty | +0.012 |
Neg logit contributions | |
inn | -0.022 |
eb | -0.022 |
aster | -0.022 |
dog | -0.021 |
le | -0.021 |
Token | will |
Token ID | 481 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
le | +0.009 |
inn | +0.009 |
ny | +0.009 |
eb | +0.009 |
ah | +0.009 |
Neg logit contributions | |
aj | -0.011 |
yourself | -0.011 |
yourselves | -0.010 |
ich | -0.010 |
blo | -0.010 |
Token | be |
Token ID | 307 |
Feature activation | -5.75e-03 |
Pos logit contributions | |
aj | +0.022 |
ich | +0.020 |
endant | +0.020 |
yourselves | +0.020 |
yourself | +0.019 |
Neg logit contributions | |
aster | -0.018 |
him | -0.018 |
le | -0.018 |
dog | -0.018 |
inn | -0.017 |
Token | my |
Token ID | 616 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
aj | +0.008 |
yourself | +0.008 |
blo | +0.008 |
majesty | +0.008 |
ich | +0.008 |
Neg logit contributions | |
inn | -0.010 |
aster | -0.009 |
le | -0.009 |
eb | -0.009 |
him | -0.009 |
Token | royal |
Token ID | 15100 |
Feature activation | -7.56e-02 |
Pos logit contributions | |
yourself | +0.027 |
yourselves | +0.026 |
aj | +0.026 |
blo | +0.025 |
endant | +0.023 |
Neg logit contributions | |
inn | -0.040 |
dog | -0.039 |
ah | -0.038 |
le | -0.038 |
aster | -0.038 |
Token | helper |
Token ID | 31904 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
yourselves | +0.122 |
yourself | +0.121 |
aj | +0.107 |
Nothing | +0.106 |
endant | +0.104 |
Neg logit contributions | |
le | -0.112 |
dog | -0.109 |
eb | -0.105 |
ah | -0.102 |
ny | -0.102 |
Token | ." |
Token ID | 526 |
Feature activation | +7.70e-03 |
Pos logit contributions | |
yourself | +0.041 |
blo | +0.041 |
aj | +0.040 |
yourselves | +0.039 |
endant | +0.038 |
Neg logit contributions | |
inn | -0.042 |
le | -0.042 |
eb | -0.041 |
dog | -0.041 |
ah | -0.041 |
Token | And |
Token ID | 843 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
inn | +0.013 |
eb | +0.012 |
aster | +0.012 |
le | +0.012 |
dog | +0.011 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.012 |
aj | -0.011 |
yourselves | -0.011 |
majesty | -0.011 |
Token | so |
Token ID | 523 |
Feature activation | +4.58e-03 |
Pos logit contributions | |
yourself | +0.030 |
blo | +0.028 |
yourselves | +0.027 |
aj | +0.027 |
majesty | +0.027 |
Neg logit contributions | |
inn | -0.027 |
aster | -0.025 |
eb | -0.025 |
le | -0.025 |
dog | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | -7.36e-03 |
Pos logit contributions | |
inn | +0.007 |
eb | +0.007 |
aster | +0.007 |
le | +0.007 |
dog | +0.006 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.007 |
aj | -0.007 |
yourselves | -0.007 |
majesty | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
inn | +0.031 |
eb | +0.029 |
aster | +0.028 |
ah | +0.028 |
war | +0.028 |
Neg logit contributions | |
yourself | -0.024 |
blo | -0.023 |
window | -0.022 |
aj | -0.022 |
yourselves | -0.021 |
Token | put |
Token ID | 1234 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
inn | +0.016 |
aster | +0.015 |
dog | +0.015 |
le | +0.015 |
eb | +0.015 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.018 |
aj | -0.017 |
yourselves | -0.017 |
ich | -0.017 |
Token | on |
Token ID | 319 |
Feature activation | -4.35e-03 |
Pos logit contributions | |
inn | +0.014 |
eb | +0.014 |
aster | +0.013 |
war | +0.013 |
ah | +0.013 |
Neg logit contributions | |
yourself | -0.021 |
blo | -0.021 |
yourselves | -0.020 |
window | -0.019 |
most | -0.019 |
Token | their |
Token ID | 511 |
Feature activation | +2.98e-03 |
Pos logit contributions | |
yourself | +0.007 |
blo | +0.007 |
yourselves | +0.006 |
aj | +0.006 |
window | +0.006 |
Neg logit contributions | |
inn | -0.008 |
eb | -0.007 |
hot | -0.007 |
le | -0.007 |
omp | -0.007 |
Token | p |
Token ID | 279 |
Feature activation | -6.01e-02 |
Pos logit contributions | |
dog | +0.004 |
him | +0.004 |
aster | +0.004 |
inn | +0.004 |
war | +0.004 |
Neg logit contributions | |
yourself | -0.005 |
ich | -0.005 |
blo | -0.005 |
reetings | -0.005 |
inas | -0.004 |
Token | aj |
Token ID | 1228 |
Feature activation | -7.56e-02 |
Pos logit contributions | |
yourself | +0.032 |
blo | +0.031 |
sending | +0.021 |
yourselves | +0.021 |
ich | +0.020 |
Neg logit contributions | |
inn | -0.166 |
eb | -0.156 |
aster | -0.154 |
ah | -0.153 |
war | -0.151 |
Token | amas |
Token ID | 17485 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
yourself | +0.081 |
blo | +0.078 |
yourselves | +0.071 |
majesty | +0.070 |
precious | +0.069 |
Neg logit contributions | |
inn | -0.162 |
eb | -0.156 |
le | -0.152 |
dog | -0.151 |
aster | -0.150 |
Token | . |
Token ID | 13 |
Feature activation | +1.98e-03 |
Pos logit contributions | |
inn | +0.030 |
aster | +0.029 |
eb | +0.029 |
omp | +0.028 |
war | +0.028 |
Neg logit contributions | |
yourself | -0.019 |
window | -0.019 |
blo | -0.019 |
aj | -0.019 |
hugging | -0.017 |
Token | They |
Token ID | 1119 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.002 |
eb | +0.002 |
dog | +0.002 |
le | +0.002 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
majesty | -0.004 |
Token | get |
Token ID | 651 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
aj | +0.004 |
yourselves | +0.004 |
majesty | +0.004 |
Neg logit contributions | |
inn | -0.004 |
eb | -0.004 |
aster | -0.004 |
le | -0.004 |
dog | -0.004 |
Token | into |
Token ID | 656 |
Feature activation | -3.85e-02 |
Pos logit contributions | |
yourself | +0.022 |
blo | +0.021 |
majesty | +0.020 |
aj | +0.020 |
yourselves | +0.020 |
Neg logit contributions | |
inn | -0.021 |
aster | -0.020 |
eb | -0.019 |
le | -0.019 |
dog | -0.019 |
Token | nice |
Token ID | 3621 |
Feature activation | -8.42e-03 |
Pos logit contributions | |
inn | +0.001 |
le | +0.001 |
him | +0.001 |
aster | +0.001 |
ny | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
ich | -0.001 |
majesty | -0.001 |
blo | -0.001 |
yourselves | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -7.19e-03 |
Pos logit contributions | |
yourself | +0.016 |
majesty | +0.015 |
blo | +0.015 |
ich | +0.015 |
yourselves | +0.015 |
Neg logit contributions | |
inn | -0.011 |
le | -0.010 |
him | -0.010 |
eb | -0.010 |
dog | -0.010 |
Token | not |
Token ID | 407 |
Feature activation | +2.09e-03 |
Pos logit contributions | |
yourself | +0.011 |
ich | +0.011 |
aj | +0.011 |
blo | +0.011 |
majesty | +0.011 |
Neg logit contributions | |
him | -0.011 |
aster | -0.011 |
inn | -0.011 |
dog | -0.010 |
le | -0.010 |
Token | be |
Token ID | 307 |
Feature activation | -9.67e-04 |
Pos logit contributions | |
him | +0.003 |
aster | +0.003 |
inn | +0.003 |
dog | +0.003 |
ny | +0.003 |
Neg logit contributions | |
aj | -0.004 |
yourself | -0.004 |
majesty | -0.003 |
ich | -0.003 |
yourselves | -0.003 |
Token | too |
Token ID | 1165 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
aj | +0.001 |
majesty | +0.001 |
yourselves | +0.001 |
Neg logit contributions | |
inn | -0.002 |
aster | -0.002 |
eb | -0.002 |
le | -0.002 |
dog | -0.002 |
Token | long |
Token ID | 890 |
Feature activation | +4.69e-02 |
Pos logit contributions | |
inn | +0.007 |
aster | +0.007 |
eb | +0.007 |
le | +0.007 |
dog | +0.007 |
Neg logit contributions | |
yourself | -0.006 |
blo | -0.005 |
yourselves | -0.005 |
aj | -0.005 |
majesty | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
inn | +0.066 |
le | +0.060 |
eb | +0.059 |
aster | +0.059 |
dog | +0.059 |
Neg logit contributions | |
yourself | -0.086 |
blo | -0.082 |
majesty | -0.081 |
yourselves | -0.081 |
aj | -0.081 |
Token | Tim |
Token ID | 5045 |
Feature activation | -2.26e-03 |
Pos logit contributions | |
le | +0.017 |
inn | +0.016 |
aster | +0.016 |
eb | +0.015 |
ah | +0.014 |
Neg logit contributions | |
yourself | -0.027 |
aj | -0.027 |
yourselves | -0.026 |
window | -0.026 |
blo | -0.025 |
Token | my |
Token ID | 1820 |
Feature activation | -5.21e-03 |
Pos logit contributions | |
yourself | +0.003 |
aj | +0.003 |
blo | +0.003 |
yourselves | +0.002 |
window | +0.002 |
Neg logit contributions | |
inn | -0.005 |
aster | -0.004 |
eb | -0.004 |
dog | -0.004 |
war | -0.004 |
Token | realized |
Token ID | 6939 |
Feature activation | -1.60e-03 |
Pos logit contributions | |
yourself | +0.007 |
blo | +0.007 |
aj | +0.007 |
yourselves | +0.006 |
majesty | +0.006 |
Neg logit contributions | |
inn | -0.010 |
aster | -0.009 |
eb | -0.009 |
le | -0.009 |
dog | -0.009 |
Token | that |
Token ID | 326 |
Feature activation | +2.83e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
aj | +0.003 |
ich | +0.003 |
Neg logit contributions | |
inn | -0.002 |
war | -0.002 |
le | -0.002 |
eb | -0.002 |
ny | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.19e-02 |
Pos logit contributions | |
yourself | +0.010 |
blo | +0.009 |
aj | +0.009 |
yourselves | +0.009 |
ich | +0.009 |
Neg logit contributions | |
inn | -0.007 |
aster | -0.007 |
dog | -0.007 |
eb | -0.007 |
le | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +6.86e-03 |
Pos logit contributions | |
yourself | +0.033 |
blo | +0.031 |
aj | +0.029 |
yourselves | +0.029 |
window | +0.029 |
Neg logit contributions | |
inn | -0.040 |
eb | -0.037 |
aster | -0.036 |
ah | -0.035 |
le | -0.035 |
Token | He |
Token ID | 679 |
Feature activation | -4.55e-04 |
Pos logit contributions | |
inn | +0.006 |
aster | +0.005 |
eb | +0.005 |
dog | +0.005 |
him | +0.005 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.016 |
aj | -0.015 |
majesty | -0.015 |
yourselves | -0.015 |
Token | did |
Token ID | 750 |
Feature activation | -6.01e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
yourselves | +0.001 |
aj | +0.001 |
majesty | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
le | -0.001 |
dog | -0.001 |
aster | -0.001 |
Token | not |
Token ID | 407 |
Feature activation | +9.42e-03 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.005 |
aj | +0.005 |
majesty | +0.004 |
yourselves | +0.004 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.014 |
eb | -0.014 |
le | -0.014 |
dog | -0.013 |
Token | mean |
Token ID | 1612 |
Feature activation | +4.61e-02 |
Pos logit contributions | |
inn | +0.016 |
eb | +0.015 |
aster | +0.014 |
war | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.014 |
yourselves | -0.013 |
majesty | -0.013 |
aj | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
inn | +0.103 |
eb | +0.090 |
ah | +0.088 |
aster | +0.088 |
le | +0.087 |
Neg logit contributions | |
yourself | -0.064 |
yourselves | -0.057 |
window | -0.046 |
blo | -0.043 |
precious | -0.042 |
Token | . |
Token ID | 13 |
Feature activation | +2.14e-03 |
Pos logit contributions | |
inn | +0.029 |
eb | +0.027 |
aster | +0.027 |
le | +0.026 |
dog | +0.025 |
Neg logit contributions | |
yourself | -0.027 |
blo | -0.025 |
yourselves | -0.025 |
aj | -0.024 |
window | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | -8.50e-04 |
Pos logit contributions | |
inn | +0.002 |
eb | +0.002 |
aster | +0.002 |
le | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.005 |
aj | -0.005 |
yourselves | -0.005 |
majesty | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -7.73e-03 |
Pos logit contributions | |
yourself | +0.001 |
aj | +0.001 |
yourselves | +0.001 |
blo | +0.001 |
window | +0.001 |
Neg logit contributions | |
inn | -0.002 |
le | -0.002 |
eb | -0.002 |
ah | -0.002 |
aster | -0.002 |
Token | Tom |
Token ID | 13787 |
Feature activation | +8.77e-03 |
Pos logit contributions | |
yourself | +0.013 |
yourselves | +0.012 |
aj | +0.012 |
blo | +0.012 |
majesty | +0.011 |
Neg logit contributions | |
inn | -0.012 |
le | -0.012 |
eb | -0.012 |
aster | -0.011 |
dog | -0.011 |
Token | of |
Token ID | 286 |
Feature activation | +7.44e-03 |
Pos logit contributions | |
inn | +0.012 |
aster | +0.011 |
eb | +0.011 |
war | +0.010 |
dog | +0.010 |
Neg logit contributions | |
blo | -0.010 |
yourself | -0.010 |
window | -0.010 |
precious | -0.009 |
aj | -0.009 |
Token | them |
Token ID | 606 |
Feature activation | -4.27e-03 |
Pos logit contributions | |
war | +0.010 |
inn | +0.010 |
le | +0.009 |
ny | +0.009 |
hot | +0.009 |
Neg logit contributions | |
yourself | -0.015 |
yourselves | -0.013 |
blo | -0.013 |
myself | -0.012 |
my | -0.012 |
Token | was |
Token ID | 373 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
yourself | +0.007 |
blo | +0.006 |
aj | +0.006 |
yourselves | +0.006 |
majesty | +0.006 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.007 |
aster | -0.007 |
le | -0.007 |
dog | -0.006 |
Token | as |
Token ID | 355 |
Feature activation | +4.13e-02 |
Pos logit contributions | |
inn | +0.038 |
eb | +0.035 |
aster | +0.035 |
le | +0.035 |
dog | +0.035 |
Neg logit contributions | |
yourself | -0.027 |
aj | -0.025 |
yourselves | -0.025 |
blo | -0.025 |
majesty | -0.025 |
Token | nice |
Token ID | 3621 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
inn | +0.081 |
eb | +0.076 |
aster | +0.076 |
le | +0.074 |
dog | +0.074 |
Neg logit contributions | |
yourself | -0.053 |
blo | -0.050 |
aj | -0.049 |
yourselves | -0.048 |
majesty | -0.047 |
Token | as |
Token ID | 355 |
Feature activation | +4.87e-02 |
Pos logit contributions | |
inn | +0.025 |
eb | +0.023 |
dog | +0.023 |
le | +0.023 |
aster | +0.023 |
Neg logit contributions | |
yourself | -0.034 |
aj | -0.032 |
blo | -0.032 |
yourselves | -0.032 |
majesty | -0.032 |
Token | Bob |
Token ID | 5811 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
inn | +0.061 |
eb | +0.055 |
aster | +0.055 |
le | +0.053 |
dog | +0.052 |
Neg logit contributions | |
yourself | -0.099 |
blo | -0.095 |
yourselves | -0.092 |
aj | -0.092 |
majesty | -0.091 |
Token | o |
Token ID | 78 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
inn | +0.019 |
aster | +0.018 |
le | +0.016 |
eb | +0.016 |
dog | +0.016 |
Neg logit contributions | |
yourself | -0.024 |
aj | -0.023 |
blo | -0.023 |
ich | -0.022 |
majesty | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +3.55e-03 |
Pos logit contributions | |
inn | +0.031 |
eb | +0.029 |
aster | +0.029 |
le | +0.028 |
dog | +0.028 |
Neg logit contributions | |
yourself | -0.033 |
blo | -0.031 |
aj | -0.030 |
yourselves | -0.030 |
majesty | -0.030 |
Token | Then |
Token ID | 3244 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
le | +0.005 |
inn | +0.005 |
aster | +0.005 |
eb | +0.005 |
ah | +0.005 |
Neg logit contributions | |
yourself | -0.006 |
yourselves | -0.006 |
majesty | -0.006 |
aj | -0.006 |
window | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
yourself | +0.042 |
blo | +0.039 |
yourselves | +0.038 |
majesty | +0.037 |
aj | +0.036 |
Neg logit contributions | |
inn | -0.042 |
aster | -0.038 |
war | -0.037 |
eb | -0.037 |
le | -0.037 |
Token | happy |
Token ID | 3772 |
Feature activation | -1.12e-03 |
Pos logit contributions | |
ich | +0.024 |
aj | +0.022 |
majesty | +0.022 |
yourselves | +0.022 |
inas | +0.021 |
Neg logit contributions | |
him | -0.018 |
inn | -0.018 |
aster | -0.018 |
le | -0.017 |
he | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | -4.36e-03 |
Pos logit contributions | |
yourself | +0.002 |
aj | +0.002 |
majesty | +0.002 |
yourselves | +0.002 |
ich | +0.002 |
Neg logit contributions | |
him | -0.001 |
inn | -0.001 |
eb | -0.001 |
dog | -0.001 |
le | -0.001 |
Token | wore |
Token ID | 12408 |
Feature activation | +1.04e-03 |
Pos logit contributions | |
aj | +0.008 |
yourselves | +0.008 |
yourself | +0.008 |
ich | +0.007 |
majesty | +0.007 |
Neg logit contributions | |
him | -0.006 |
Jim | -0.005 |
hot | -0.005 |
Bob | -0.005 |
aster | -0.005 |
Token | her |
Token ID | 607 |
Feature activation | -2.60e-03 |
Pos logit contributions | |
inn | +0.001 |
aster | +0.001 |
eb | +0.001 |
him | +0.001 |
le | +0.001 |
Neg logit contributions | |
yourself | -0.002 |
aj | -0.002 |
ich | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
Token | jacket |
Token ID | 15224 |
Feature activation | -8.45e-03 |
Pos logit contributions | |
majesty | +0.004 |
yourselves | +0.004 |
yourself | +0.004 |
blo | +0.004 |
inas | +0.004 |
Neg logit contributions | |
him | -0.004 |
inn | -0.004 |
eb | -0.004 |
dog | -0.004 |
ah | -0.003 |
Token | every |
Token ID | 790 |
Feature activation | +4.79e-02 |
Pos logit contributions | |
yourself | +0.015 |
blo | +0.014 |
aj | +0.014 |
yourselves | +0.014 |
majesty | +0.014 |
Neg logit contributions | |
inn | -0.012 |
eb | -0.011 |
aster | -0.011 |
le | -0.011 |
dog | -0.011 |
Token | day |
Token ID | 1110 |
Feature activation | +8.20e-03 |
Pos logit contributions | |
inn | +0.072 |
eb | +0.067 |
aster | +0.066 |
le | +0.065 |
dog | +0.064 |
Neg logit contributions | |
yourself | -0.083 |
blo | -0.080 |
aj | -0.077 |
yourselves | -0.076 |
majesty | -0.075 |
Token | . |
Token ID | 13 |
Feature activation | +1.89e-03 |
Pos logit contributions | |
inn | +0.014 |
aster | +0.013 |
eb | +0.013 |
le | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.012 |
aj | -0.011 |
window | -0.011 |
yourselves | -0.011 |
Token | She |
Token ID | 1375 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.002 |
eb | +0.002 |
him | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.003 |
yourselves | -0.003 |
ich | -0.003 |
aj | -0.003 |
Token | never |
Token ID | 1239 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
yourselves | +0.030 |
yourself | +0.030 |
ich | +0.026 |
majesty | +0.026 |
receiver | +0.026 |
Neg logit contributions | |
eb | -0.023 |
ah | -0.022 |
inn | -0.022 |
him | -0.021 |
dog | -0.021 |
Token | twisted |
Token ID | 19074 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
yourself | +0.018 |
yourselves | +0.017 |
blo | +0.017 |
aj | +0.017 |
ich | +0.016 |
Neg logit contributions | |
inn | -0.020 |
eb | -0.019 |
aster | -0.018 |
le | -0.018 |
dog | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | -4.89e-04 |
Pos logit contributions | |
inn | +0.008 |
eb | +0.008 |
aster | +0.008 |
le | +0.008 |
war | +0.007 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.008 |
yourselves | -0.008 |
window | -0.007 |
majesty | -0.007 |
Token | bird |
Token ID | 6512 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
yourself | +0.001 |
yourselves | +0.001 |
aj | +0.001 |
majesty | +0.001 |
blo | +0.001 |
Neg logit contributions | |
inn | -0.001 |
dog | -0.001 |
eb | -0.001 |
ah | -0.001 |
aster | -0.001 |
Token | perched |
Token ID | 49264 |
Feature activation | +2.59e-02 |
Pos logit contributions | |
inn | +0.039 |
eb | +0.037 |
aster | +0.037 |
le | +0.037 |
dog | +0.037 |
Neg logit contributions | |
yourself | -0.028 |
aj | -0.026 |
blo | -0.026 |
yourselves | -0.026 |
majesty | -0.026 |
Token | on |
Token ID | 319 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
inn | +0.046 |
aster | +0.045 |
war | +0.043 |
eb | +0.043 |
dog | +0.042 |
Neg logit contributions | |
yourself | -0.039 |
blo | -0.037 |
ich | -0.034 |
yourselves | -0.034 |
window | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
inn | +0.036 |
war | +0.033 |
omp | +0.033 |
eb | +0.032 |
le | +0.032 |
Neg logit contributions | |
yourself | -0.020 |
blo | -0.018 |
yourselves | -0.017 |
window | -0.016 |
most | -0.015 |
Token | branch |
Token ID | 8478 |
Feature activation | +5.29e-02 |
Pos logit contributions | |
inn | +0.026 |
eb | +0.024 |
aster | +0.024 |
le | +0.023 |
dog | +0.023 |
Neg logit contributions | |
yourself | -0.031 |
blo | -0.030 |
aj | -0.029 |
yourselves | -0.029 |
majesty | -0.029 |
Token | . |
Token ID | 13 |
Feature activation | +7.73e-03 |
Pos logit contributions | |
inn | +0.094 |
eb | +0.087 |
aster | +0.086 |
war | +0.084 |
le | +0.083 |
Neg logit contributions | |
blo | -0.075 |
yourself | -0.075 |
window | -0.072 |
yourselves | -0.065 |
aj | -0.064 |
Token | " |
Token ID | 366 |
Feature activation | -8.24e-03 |
Pos logit contributions | |
inn | +0.011 |
le | +0.010 |
eb | +0.010 |
aster | +0.010 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.015 |
blo | -0.014 |
aj | -0.014 |
yourselves | -0.014 |
majesty | -0.013 |
Token | Yes |
Token ID | 5297 |
Feature activation | -5.08e-03 |
Pos logit contributions | |
yourself | +0.012 |
blo | +0.011 |
yourselves | +0.011 |
aj | +0.010 |
majesty | +0.010 |
Neg logit contributions | |
inn | -0.015 |
eb | -0.014 |
aster | -0.014 |
le | -0.014 |
dog | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
yourself | +0.007 |
majesty | +0.006 |
blo | +0.006 |
window | +0.006 |
yourselves | +0.006 |
Neg logit contributions | |
inn | -0.010 |
war | -0.009 |
aster | -0.009 |
eb | -0.009 |
dog | -0.009 |
Token | I |
Token ID | 314 |
Feature activation | +3.85e-02 |
Pos logit contributions | |
yourself | +0.034 |
blo | +0.032 |
yourselves | +0.031 |
aj | +0.030 |
majesty | +0.030 |
Neg logit contributions | |
inn | -0.048 |
eb | -0.044 |
aster | -0.044 |
le | -0.043 |
dog | -0.042 |
Token | hot |
Token ID | 3024 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
inn | +0.016 |
aster | +0.016 |
eb | +0.015 |
ah | +0.014 |
omp | +0.014 |
Neg logit contributions | |
blo | -0.015 |
yourself | -0.015 |
window | -0.014 |
most | -0.014 |
yourselves | -0.013 |
Token | cocoa |
Token ID | 35845 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
inn | +0.020 |
eb | +0.019 |
aster | +0.019 |
ah | +0.018 |
war | +0.018 |
Neg logit contributions | |
yourself | -0.018 |
blo | -0.018 |
yourselves | -0.016 |
aj | -0.016 |
window | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
blo | +0.025 |
yourself | +0.025 |
window | +0.023 |
aj | +0.023 |
yourselves | +0.023 |
Neg logit contributions | |
inn | -0.030 |
aster | -0.028 |
eb | -0.028 |
war | -0.027 |
le | -0.026 |
Token | feeling |
Token ID | 4203 |
Feature activation | -3.09e-03 |
Pos logit contributions | |
inn | +0.016 |
aster | +0.015 |
eb | +0.015 |
le | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.017 |
blo | -0.016 |
aj | -0.016 |
yourselves | -0.015 |
majesty | -0.015 |
Token | much |
Token ID | 881 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
yourselves | +0.003 |
aj | +0.003 |
precious | +0.003 |
Neg logit contributions | |
inn | -0.006 |
eb | -0.006 |
aster | -0.006 |
ah | -0.006 |
dog | -0.006 |
Token | better |
Token ID | 1365 |
Feature activation | +4.34e-03 |
Pos logit contributions | |
inn | +0.031 |
eb | +0.029 |
aster | +0.029 |
le | +0.028 |
dog | +0.028 |
Neg logit contributions | |
yourself | -0.024 |
blo | -0.023 |
aj | -0.022 |
yourselves | -0.022 |
majesty | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | -1.41e-03 |
Pos logit contributions | |
inn | +0.006 |
le | +0.006 |
eb | +0.005 |
aster | +0.005 |
dog | +0.005 |
Neg logit contributions | |
yourself | -0.008 |
aj | -0.008 |
majesty | -0.008 |
blo | -0.008 |
yourselves | -0.007 |
Token | The |
Token ID | 383 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
ich | +0.003 |
majesty | +0.003 |
yourselves | +0.003 |
Neg logit contributions | |
inn | -0.002 |
Jim | -0.002 |
aster | -0.001 |
him | -0.001 |
eb | -0.001 |
Token | rain |
Token ID | 6290 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
yourself | +0.019 |
yourselves | +0.018 |
majesty | +0.017 |
ich | +0.017 |
blo | +0.017 |
Neg logit contributions | |
inn | -0.015 |
dog | -0.015 |
aster | -0.014 |
le | -0.014 |
ah | -0.013 |
Token | outside |
Token ID | 2354 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
yourself | +0.059 |
blo | +0.056 |
aj | +0.054 |
yourselves | +0.053 |
majesty | +0.052 |
Neg logit contributions | |
inn | -0.076 |
eb | -0.071 |
aster | -0.071 |
le | -0.069 |
dog | -0.069 |
Token | stopped |
Token ID | 5025 |
Feature activation | -9.38e-03 |
Pos logit contributions | |
yourself | +0.020 |
blo | +0.019 |
aj | +0.019 |
yourselves | +0.019 |
majesty | +0.018 |
Neg logit contributions | |
inn | -0.021 |
eb | -0.020 |
aster | -0.020 |
le | -0.019 |
dog | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | +6.74e-03 |
Pos logit contributions | |
aj | +0.012 |
majesty | +0.011 |
yourself | +0.011 |
ich | +0.011 |
yourselves | +0.011 |
Neg logit contributions | |
him | -0.007 |
Bob | -0.006 |
dog | -0.006 |
aster | -0.006 |
Jim | -0.006 |
Token | big |
Token ID | 1263 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
dog | +0.010 |
ah | +0.010 |
ny | +0.010 |
aster | +0.009 |
eb | +0.009 |
Neg logit contributions | |
yourself | -0.012 |
yourselves | -0.011 |
aj | -0.011 |
myself | -0.009 |
endant | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
inn | +0.037 |
eb | +0.033 |
aster | +0.033 |
le | +0.033 |
war | +0.032 |
Neg logit contributions | |
yourself | -0.032 |
blo | -0.031 |
majesty | -0.029 |
window | -0.029 |
aj | -0.029 |
Token | friendly |
Token ID | 8030 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
inn | +0.023 |
dog | +0.023 |
aster | +0.022 |
le | +0.022 |
eb | +0.021 |
Neg logit contributions | |
yourself | -0.018 |
yourselves | -0.017 |
aj | -0.016 |
majesty | -0.016 |
blo | -0.016 |
Token | bear |
Token ID | 6842 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
inn | +0.024 |
aster | +0.022 |
eb | +0.022 |
le | +0.021 |
war | +0.021 |
Neg logit contributions | |
yourself | -0.018 |
blo | -0.018 |
majesty | -0.017 |
window | -0.017 |
yourselves | -0.017 |
Token | who |
Token ID | 508 |
Feature activation | +5.34e-03 |
Pos logit contributions | |
inn | +0.017 |
aster | +0.016 |
war | +0.016 |
eb | +0.015 |
le | +0.015 |
Neg logit contributions | |
blo | -0.012 |
yourself | -0.012 |
ich | -0.012 |
window | -0.011 |
aj | -0.011 |
Token | lived |
Token ID | 5615 |
Feature activation | -8.04e-03 |
Pos logit contributions | |
inn | +0.009 |
eb | +0.009 |
le | +0.009 |
aster | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.008 |
aj | -0.007 |
yourselves | -0.007 |
blo | -0.007 |
majesty | -0.007 |
Token | in |
Token ID | 287 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
yourself | +0.014 |
blo | +0.013 |
aj | +0.013 |
yourselves | +0.013 |
majesty | +0.013 |
Neg logit contributions | |
inn | -0.013 |
eb | -0.011 |
aster | -0.011 |
le | -0.011 |
dog | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
yourself | +0.046 |
blo | +0.043 |
yourselves | +0.043 |
aj | +0.041 |
window | +0.040 |
Neg logit contributions | |
inn | -0.043 |
eb | -0.039 |
le | -0.039 |
aster | -0.038 |
war | -0.038 |
Token | forest |
Token ID | 8222 |
Feature activation | +6.42e-03 |
Pos logit contributions | |
yourself | +0.028 |
aj | +0.027 |
yourselves | +0.026 |
majesty | +0.026 |
blo | +0.026 |
Neg logit contributions | |
aster | -0.029 |
inn | -0.029 |
dog | -0.029 |
eb | -0.028 |
ah | -0.027 |
Token | . |
Token ID | 13 |
Feature activation | +8.17e-04 |
Pos logit contributions | |
inn | +0.010 |
eb | +0.009 |
aster | +0.009 |
le | +0.009 |
dog | +0.009 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.010 |
aj | -0.010 |
yourselves | -0.010 |
majesty | -0.010 |
Token | joined |
Token ID | 5399 |
Feature activation | -9.46e-03 |
Pos logit contributions | |
yourself | +0.015 |
blo | +0.015 |
window | +0.014 |
yourselves | +0.013 |
aj | +0.013 |
Neg logit contributions | |
inn | -0.018 |
eb | -0.016 |
aster | -0.016 |
le | -0.016 |
dog | -0.015 |
Token | him |
Token ID | 683 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
yourself | +0.017 |
yourselves | +0.015 |
sisters | +0.015 |
hugging | +0.015 |
receiver | +0.015 |
Neg logit contributions | |
eb | -0.013 |
ah | -0.013 |
inn | -0.013 |
aster | -0.013 |
omp | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +2.01e-03 |
Pos logit contributions | |
inn | +0.022 |
eb | +0.020 |
aster | +0.020 |
le | +0.019 |
dog | +0.019 |
Neg logit contributions | |
yourself | -0.025 |
blo | -0.024 |
yourselves | -0.024 |
aj | -0.024 |
majesty | -0.023 |
Token | They |
Token ID | 1119 |
Feature activation | -6.90e-03 |
Pos logit contributions | |
inn | +0.002 |
dog | +0.002 |
aster | +0.002 |
eb | +0.002 |
war | +0.002 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
ich | -0.004 |
aj | -0.004 |
Token | played |
Token ID | 2826 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
blo | +0.008 |
singing | +0.006 |
window | +0.006 |
reminded | +0.006 |
sisters | +0.006 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.014 |
eb | -0.014 |
le | -0.013 |
dog | -0.013 |
Token | together |
Token ID | 1978 |
Feature activation | +3.49e-03 |
Pos logit contributions | |
yourself | +0.029 |
blo | +0.026 |
yourselves | +0.025 |
most | +0.024 |
living | +0.023 |
Neg logit contributions | |
eb | -0.051 |
inn | -0.051 |
aster | -0.049 |
ah | -0.047 |
le | -0.046 |
Token | for |
Token ID | 329 |
Feature activation | +3.34e-03 |
Pos logit contributions | |
eb | +0.007 |
inn | +0.007 |
aster | +0.007 |
hot | +0.007 |
war | +0.006 |
Neg logit contributions | |
blo | -0.004 |
window | -0.004 |
yourself | -0.004 |
living | -0.004 |
singing | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
inn | +0.008 |
eb | +0.007 |
omp | +0.007 |
ah | +0.007 |
le | +0.007 |
Neg logit contributions | |
yourself | -0.004 |
yourselves | -0.003 |
blo | -0.003 |
precious | -0.003 |
sending | -0.003 |
Token | while |
Token ID | 981 |
Feature activation | +4.19e-02 |
Pos logit contributions | |
eb | +0.024 |
inn | +0.023 |
omp | +0.023 |
le | +0.022 |
hot | +0.022 |
Neg logit contributions | |
blo | -0.016 |
precious | -0.016 |
window | -0.015 |
ich | -0.015 |
majesty | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
inn | +0.072 |
eb | +0.069 |
aster | +0.067 |
war | +0.067 |
le | +0.066 |
Neg logit contributions | |
yourself | -0.063 |
blo | -0.061 |
window | -0.059 |
yourselves | -0.057 |
aj | -0.056 |
Token | had |
Token ID | 550 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
inn | +0.019 |
eb | +0.018 |
aster | +0.018 |
le | +0.017 |
dog | +0.017 |
Neg logit contributions | |
yourself | -0.016 |
blo | -0.016 |
yourselves | -0.015 |
aj | -0.015 |
majesty | -0.014 |
Token | down |
Token ID | 866 |
Feature activation | +1.09e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
window | +0.003 |
ich | +0.003 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.003 |
aster | -0.003 |
war | -0.003 |
le | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
inn | +0.002 |
eb | +0.001 |
aster | +0.001 |
le | +0.001 |
dog | +0.001 |
Neg logit contributions | |
yourself | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
window | -0.002 |
aj | -0.002 |
Token | but |
Token ID | 475 |
Feature activation | -5.78e-03 |
Pos logit contributions | |
yourself | +0.020 |
blo | +0.019 |
aj | +0.019 |
yourselves | +0.019 |
majesty | +0.019 |
Neg logit contributions | |
inn | -0.016 |
aster | -0.014 |
eb | -0.014 |
dog | -0.014 |
le | -0.014 |
Token | Max |
Token ID | 5436 |
Feature activation | -6.37e-03 |
Pos logit contributions | |
yourself | +0.011 |
blo | +0.011 |
aj | +0.010 |
majesty | +0.010 |
yourselves | +0.010 |
Neg logit contributions | |
inn | -0.008 |
aster | -0.007 |
eb | -0.007 |
him | -0.007 |
le | -0.007 |
Token | knew |
Token ID | 2993 |
Feature activation | -7.79e-03 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
aj | +0.008 |
yourselves | +0.007 |
ich | +0.007 |
Neg logit contributions | |
inn | -0.012 |
aster | -0.012 |
eb | -0.011 |
war | -0.011 |
le | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
yourself | +0.014 |
blo | +0.014 |
aj | +0.013 |
yourselves | +0.013 |
majesty | +0.013 |
Neg logit contributions | |
inn | -0.011 |
eb | -0.010 |
aster | -0.010 |
le | -0.010 |
dog | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
inn | +0.028 |
aster | +0.028 |
eb | +0.026 |
le | +0.025 |
war | +0.025 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.012 |
precious | -0.010 |
aj | -0.010 |
yourselves | -0.010 |
Token | too |
Token ID | 1165 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
inn | +0.021 |
ny | +0.018 |
dog | +0.018 |
le | +0.018 |
aster | +0.018 |
Neg logit contributions | |
yourself | -0.021 |
majesty | -0.021 |
aj | -0.021 |
yourselves | -0.020 |
blo | -0.020 |
Token | dangerous |
Token ID | 4923 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
inn | +0.030 |
eb | +0.029 |
aster | +0.028 |
le | +0.028 |
dog | +0.027 |
Neg logit contributions | |
yourself | -0.020 |
blo | -0.020 |
aj | -0.019 |
precious | -0.018 |
window | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +7.17e-04 |
Pos logit contributions | |
inn | +0.071 |
aster | +0.071 |
eb | +0.066 |
ah | +0.066 |
war | +0.065 |
Neg logit contributions | |
yourself | -0.043 |
blo | -0.038 |
yourselves | -0.036 |
window | -0.034 |
living | -0.034 |
Token | Max |
Token ID | 5436 |
Feature activation | -7.89e-03 |
Pos logit contributions | |
inn | +0.001 |
aster | +0.001 |
eb | +0.001 |
le | +0.001 |
dog | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
aj | -0.001 |
blo | -0.001 |
yourselves | -0.001 |
majesty | -0.001 |
Token | 't |
Token ID | 470 |
Feature activation | -1.35e-03 |
Pos logit contributions | |
inn | +0.005 |
aster | +0.005 |
eb | +0.005 |
le | +0.005 |
him | +0.005 |
Neg logit contributions | |
aj | -0.004 |
yourself | -0.004 |
majesty | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
Token | stay |
Token ID | 2652 |
Feature activation | +2.70e-03 |
Pos logit contributions | |
yourself | +0.002 |
aj | +0.002 |
blo | +0.002 |
yourselves | +0.002 |
majesty | +0.002 |
Neg logit contributions | |
inn | -0.002 |
aster | -0.002 |
le | -0.002 |
eb | -0.002 |
dog | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -4.13e-03 |
Pos logit contributions | |
inn | +0.004 |
eb | +0.004 |
aster | +0.004 |
le | +0.004 |
dog | +0.004 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
majesty | -0.004 |
Token | She |
Token ID | 1375 |
Feature activation | -3.90e-03 |
Pos logit contributions | |
yourself | +0.006 |
blo | +0.006 |
aj | +0.006 |
yourselves | +0.006 |
majesty | +0.006 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.007 |
aster | -0.007 |
le | -0.007 |
dog | -0.006 |
Token | tried |
Token ID | 3088 |
Feature activation | +1.37e-03 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
aj | +0.004 |
window | +0.004 |
precious | +0.004 |
Neg logit contributions | |
inn | -0.008 |
war | -0.008 |
aster | -0.007 |
eb | -0.007 |
hot | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +2.98e-03 |
Pos logit contributions | |
inn | +0.002 |
eb | +0.002 |
aster | +0.002 |
le | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.002 |
blo | -0.002 |
yourselves | -0.002 |
aj | -0.002 |
window | -0.002 |
Token | tried |
Token ID | 3088 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
inn | +0.005 |
war | +0.005 |
eb | +0.005 |
dog | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
hugging | -0.004 |
sending | -0.003 |
Token | until |
Token ID | 1566 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
inn | +0.007 |
eb | +0.007 |
aster | +0.007 |
le | +0.007 |
dog | +0.007 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.008 |
yourselves | -0.008 |
aj | -0.007 |
majesty | -0.007 |
Token | she |
Token ID | 673 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
blo | +0.011 |
yourself | +0.011 |
window | +0.009 |
yourselves | +0.009 |
hugging | +0.008 |
Neg logit contributions | |
inn | -0.028 |
le | -0.028 |
eb | -0.027 |
dog | -0.027 |
ny | -0.027 |
Token | felt |
Token ID | 2936 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
inn | +0.023 |
aster | +0.022 |
war | +0.021 |
dog | +0.021 |
eb | +0.021 |
Neg logit contributions | |
yourself | -0.014 |
blo | -0.013 |
aj | -0.013 |
majesty | -0.012 |
yourselves | -0.012 |
Token | something |
Token ID | 1223 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
inn | +0.019 |
eb | +0.018 |
aster | +0.018 |
dog | +0.017 |
le | +0.017 |
Neg logit contributions | |
yourself | -0.018 |
blo | -0.017 |
yourselves | -0.016 |
aj | -0.016 |
majesty | -0.015 |
Token | toys |
Token ID | 14958 |
Feature activation | -3.96e-02 |
Pos logit contributions | |
him | +0.012 |
inn | +0.012 |
dog | +0.011 |
ny | +0.011 |
Bob | +0.011 |
Neg logit contributions | |
yourself | -0.010 |
blo | -0.010 |
yourselves | -0.009 |
ich | -0.009 |
majesty | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +2.51e-03 |
Pos logit contributions | |
yourself | +0.069 |
blo | +0.066 |
yourselves | +0.063 |
aj | +0.063 |
majesty | +0.061 |
Neg logit contributions | |
inn | -0.060 |
aster | -0.055 |
eb | -0.055 |
le | -0.054 |
dog | -0.054 |
Token | make |
Token ID | 787 |
Feature activation | +2.17e-03 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.003 |
eb | +0.003 |
dog | +0.003 |
him | +0.003 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.004 |
aj | -0.004 |
yourselves | -0.004 |
ich | -0.004 |
Token | his |
Token ID | 465 |
Feature activation | -9.75e-03 |
Pos logit contributions | |
inn | +0.004 |
eb | +0.003 |
ah | +0.003 |
dog | +0.003 |
hot | +0.003 |
Neg logit contributions | |
yourself | -0.004 |
yourselves | -0.003 |
precious | -0.003 |
blo | -0.003 |
majesty | -0.003 |
Token | mom |
Token ID | 1995 |
Feature activation | -2.82e-02 |
Pos logit contributions | |
yourself | +0.013 |
blo | +0.012 |
yourselves | +0.011 |
aj | +0.011 |
majesty | +0.011 |
Neg logit contributions | |
inn | -0.019 |
aster | -0.018 |
eb | -0.018 |
le | -0.018 |
dog | -0.018 |
Token | upset |
Token ID | 9247 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
yourself | +0.034 |
blo | +0.032 |
aj | +0.030 |
window | +0.029 |
yourselves | +0.029 |
Neg logit contributions | |
inn | -0.060 |
eb | -0.055 |
aster | -0.054 |
dog | -0.052 |
war | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
yourself | +0.030 |
blo | +0.028 |
yourselves | +0.027 |
aj | +0.027 |
majesty | +0.026 |
Neg logit contributions | |
inn | -0.027 |
aster | -0.025 |
eb | -0.025 |
dog | -0.024 |
le | -0.024 |
Token | From |
Token ID | 3574 |
Feature activation | -6.13e-03 |
Pos logit contributions | |
inn | +0.013 |
eb | +0.012 |
aster | +0.012 |
dog | +0.012 |
le | +0.012 |
Neg logit contributions | |
yourself | -0.019 |
blo | -0.019 |
aj | -0.018 |
yourselves | -0.018 |
majesty | -0.018 |
Token | then |
Token ID | 788 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
yourself | +0.012 |
blo | +0.012 |
majesty | +0.011 |
aj | +0.011 |
yourselves | +0.011 |
Neg logit contributions | |
inn | -0.008 |
aster | -0.007 |
eb | -0.007 |
le | -0.007 |
dog | -0.007 |
Token | on |
Token ID | 319 |
Feature activation | +3.47e-03 |
Pos logit contributions | |
inn | +0.018 |
le | +0.018 |
eb | +0.018 |
aster | +0.018 |
dog | +0.018 |
Neg logit contributions | |
yourself | -0.013 |
blo | -0.013 |
yourselves | -0.011 |
sending | -0.011 |
aj | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -3.16e-03 |
Pos logit contributions | |
inn | +0.006 |
war | +0.005 |
le | +0.005 |
aster | +0.005 |
eb | +0.005 |
Neg logit contributions | |
yourself | -0.006 |
blo | -0.005 |
aj | -0.005 |
yourselves | -0.005 |
majesty | -0.005 |
Token | so |
Token ID | 523 |
Feature activation | -4.74e-03 |
Pos logit contributions | |
inn | +0.010 |
aster | +0.010 |
Jim | +0.010 |
Noah | +0.009 |
eb | +0.009 |
Neg logit contributions | |
yourself | -0.010 |
yourselves | -0.010 |
aj | -0.010 |
majesty | -0.010 |
ich | -0.009 |
Token | excited |
Token ID | 6568 |
Feature activation | +2.93e-04 |
Pos logit contributions | |
yourself | +0.008 |
aj | +0.008 |
yourselves | +0.008 |
majesty | +0.008 |
ich | +0.008 |
Neg logit contributions | |
inn | -0.007 |
Jim | -0.006 |
Bob | -0.006 |
aster | -0.006 |
Noah | -0.006 |
Token | that |
Token ID | 326 |
Feature activation | +7.21e-03 |
Pos logit contributions | |
inn | +0.000 |
eb | +0.000 |
le | +0.000 |
dog | +0.000 |
aster | +0.000 |
Neg logit contributions | |
yourself | -0.001 |
aj | -0.001 |
majesty | -0.001 |
blo | -0.001 |
yourselves | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
inn | +0.012 |
aster | +0.012 |
him | +0.012 |
eb | +0.012 |
Jim | +0.011 |
Neg logit contributions | |
aj | -0.011 |
yourself | -0.010 |
majesty | -0.010 |
yourselves | -0.010 |
blo | -0.010 |
Token | started |
Token ID | 2067 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
yourself | +0.029 |
yourselves | +0.028 |
aj | +0.027 |
blo | +0.026 |
ich | +0.026 |
Neg logit contributions | |
inn | -0.020 |
le | -0.020 |
eb | -0.019 |
ny | -0.019 |
dog | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
yourself | +0.019 |
aj | +0.019 |
majesty | +0.019 |
yourselves | +0.018 |
blo | +0.018 |
Neg logit contributions | |
inn | -0.016 |
aster | -0.016 |
dog | -0.015 |
him | -0.015 |
eb | -0.015 |
Token | climb |
Token ID | 12080 |
Feature activation | +8.70e-04 |
Pos logit contributions | |
yourself | +0.022 |
aj | +0.021 |
yourselves | +0.021 |
blo | +0.020 |
ich | +0.020 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.014 |
dog | -0.014 |
eb | -0.013 |
le | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
inn | +0.001 |
aster | +0.001 |
eb | +0.001 |
le | +0.001 |
dog | +0.001 |
Neg logit contributions | |
yourself | -0.002 |
blo | -0.002 |
yourselves | -0.001 |
aj | -0.001 |
window | -0.001 |
Token | with |
Token ID | 351 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
inn | +0.005 |
le | +0.005 |
eb | +0.005 |
dog | +0.005 |
ny | +0.005 |
Neg logit contributions | |
yourself | -0.007 |
aj | -0.007 |
majesty | -0.007 |
yourselves | -0.007 |
blo | -0.007 |
Token | no |
Token ID | 645 |
Feature activation | +7.17e-03 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.013 |
le | +0.013 |
dog | +0.013 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.012 |
yourselves | -0.011 |
window | -0.011 |
aj | -0.011 |
Token | fear |
Token ID | 3252 |
Feature activation | -7.94e-03 |
Pos logit contributions | |
inn | +0.012 |
aster | +0.011 |
eb | +0.011 |
le | +0.011 |
dog | +0.011 |
Neg logit contributions | |
yourself | -0.011 |
blo | -0.011 |
aj | -0.011 |
yourselves | -0.011 |
majesty | -0.010 |
Token | money |
Token ID | 1637 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
yourself | +0.018 |
yourselves | +0.017 |
ich | +0.016 |
aj | +0.016 |
blo | +0.016 |
Neg logit contributions | |
aster | -0.020 |
dog | -0.020 |
him | -0.019 |
le | -0.019 |
ah | -0.019 |
Token | ," |
Token ID | 553 |
Feature activation | -3.19e-03 |
Pos logit contributions | |
aj | +0.035 |
majesty | +0.035 |
blo | +0.035 |
yourself | +0.034 |
ich | +0.034 |
Neg logit contributions | |
him | -0.022 |
dog | -0.021 |
le | -0.020 |
eb | -0.020 |
ny | -0.019 |
Token | she |
Token ID | 673 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
yourself | +0.005 |
blo | +0.005 |
yourselves | +0.005 |
aj | +0.005 |
majesty | +0.005 |
Neg logit contributions | |
inn | -0.005 |
eb | -0.005 |
le | -0.005 |
aster | -0.004 |
war | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
yourself | +0.010 |
ich | +0.010 |
yourselves | +0.010 |
blo | +0.009 |
aj | +0.009 |
Neg logit contributions | |
inn | -0.008 |
le | -0.008 |
aster | -0.008 |
eb | -0.008 |
Jim | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +8.82e-04 |
Pos logit contributions | |
inn | +0.003 |
eb | +0.003 |
aster | +0.003 |
le | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
aj | -0.003 |
yourselves | -0.003 |
majesty | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +7.42e-04 |
Pos logit contributions | |
inn | +0.001 |
eb | +0.001 |
aster | +0.001 |
dog | +0.001 |
le | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
yourselves | -0.001 |
aj | -0.001 |
majesty | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -8.21e-03 |
Pos logit contributions | |
inn | +0.001 |
eb | +0.001 |
aster | +0.001 |
dog | +0.001 |
le | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
aj | -0.001 |
yourselves | -0.001 |
majesty | -0.001 |
Token | The |
Token ID | 464 |
Feature activation | -5.47e-03 |
Pos logit contributions | |
yourself | +0.013 |
blo | +0.012 |
aj | +0.012 |
majesty | +0.012 |
yourselves | +0.012 |
Neg logit contributions | |
inn | -0.014 |
aster | -0.013 |
eb | -0.013 |
dog | -0.013 |
war | -0.012 |
Token | shop |
Token ID | 6128 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
yourself | +0.009 |
aj | +0.008 |
yourselves | +0.008 |
blo | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
dog | -0.008 |
aster | -0.008 |
inn | -0.008 |
le | -0.008 |
ny | -0.008 |
Token | keeper |
Token ID | 13884 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
yourself | +0.014 |
blo | +0.014 |
aj | +0.013 |
window | +0.013 |
majesty | +0.013 |
Neg logit contributions | |
inn | -0.023 |
aster | -0.021 |
eb | -0.021 |
le | -0.021 |
war | -0.021 |
Token | was |
Token ID | 373 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
inn | +0.048 |
war | +0.045 |
aster | +0.044 |
eb | +0.043 |
hot | +0.042 |
Neg logit contributions | |
blo | -0.024 |
aj | -0.022 |
window | -0.022 |
yourself | -0.021 |
hugging | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | -5.31e-03 |
Pos logit contributions | |
inn | +0.036 |
aster | +0.034 |
eb | +0.034 |
le | +0.033 |
ah | +0.033 |
Neg logit contributions | |
yourself | -0.030 |
blo | -0.030 |
window | -0.028 |
aj | -0.027 |
yourselves | -0.027 |
Token | She |
Token ID | 1375 |
Feature activation | -8.11e-03 |
Pos logit contributions | |
yourself | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
aj | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
inn | -0.009 |
eb | -0.008 |
aster | -0.008 |
le | -0.008 |
dog | -0.008 |
Token | ran |
Token ID | 4966 |
Feature activation | +3.10e-03 |
Pos logit contributions | |
yourself | +0.015 |
yourselves | +0.014 |
aj | +0.014 |
majesty | +0.013 |
blo | +0.013 |
Neg logit contributions | |
inn | -0.012 |
aster | -0.011 |
eb | -0.011 |
le | -0.011 |
dog | -0.011 |
Token | around |
Token ID | 1088 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
aster | +0.005 |
inn | +0.005 |
eb | +0.005 |
omp | +0.005 |
le | +0.005 |
Neg logit contributions | |
yourself | -0.004 |
window | -0.004 |
blo | -0.004 |
yourselves | -0.004 |
aj | -0.004 |
Token | with |
Token ID | 351 |
Feature activation | -2.01e-03 |
Pos logit contributions | |
yourself | +0.019 |
blo | +0.019 |
yourselves | +0.017 |
window | +0.017 |
majesty | +0.017 |
Neg logit contributions | |
inn | -0.018 |
eb | -0.017 |
war | -0.016 |
aster | -0.016 |
le | -0.016 |
Token | it |
Token ID | 340 |
Feature activation | -3.30e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
window | +0.003 |
yourselves | +0.003 |
precious | +0.003 |
Neg logit contributions | |
inn | -0.003 |
eb | -0.003 |
le | -0.003 |
ah | -0.003 |
aster | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -1.34e-03 |
Pos logit contributions | |
yourself | +0.007 |
yourselves | +0.007 |
aj | +0.006 |
majesty | +0.006 |
ich | +0.006 |
Neg logit contributions | |
inn | -0.004 |
le | -0.004 |
dog | -0.004 |
ny | -0.004 |
eb | -0.003 |
Token | swung |
Token ID | 28507 |
Feature activation | -1.75e-03 |
Pos logit contributions | |
yourself | +0.002 |
aj | +0.002 |
yourselves | +0.002 |
majesty | +0.002 |
blo | +0.002 |
Neg logit contributions | |
inn | -0.002 |
dog | -0.002 |
aster | -0.002 |
eb | -0.002 |
le | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | +1.74e-03 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
window | +0.003 |
yourselves | +0.003 |
precious | +0.002 |
Neg logit contributions | |
aster | -0.003 |
inn | -0.003 |
eb | -0.003 |
le | -0.003 |
dog | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | -3.44e-03 |
Pos logit contributions | |
inn | +0.002 |
eb | +0.002 |
le | +0.002 |
aster | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
yourselves | -0.003 |
aj | -0.003 |
majesty | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
yourself | +0.006 |
blo | +0.006 |
yourselves | +0.005 |
window | +0.005 |
myself | +0.005 |
Neg logit contributions | |
inn | -0.006 |
eb | -0.005 |
le | -0.005 |
war | -0.005 |
dog | -0.005 |
Token | said |
Token ID | 531 |
Feature activation | +7.33e-04 |
Pos logit contributions | |
yourself | +0.018 |
aj | +0.017 |
blo | +0.017 |
precious | +0.016 |
window | +0.016 |
Neg logit contributions | |
inn | -0.032 |
aster | -0.031 |
eb | -0.030 |
le | -0.029 |
dog | -0.029 |
Token | . |
Token ID | 13 |
Feature activation | +1.39e-03 |
Pos logit contributions | |
inn | +0.001 |
eb | +0.001 |
ah | +0.001 |
aster | +0.001 |
war | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
hugging | -0.001 |
window | -0.001 |
aj | -0.001 |
Token | " |
Token ID | 366 |
Feature activation | +1.57e-03 |
Pos logit contributions | |
inn | +0.002 |
him | +0.002 |
ny | +0.002 |
hot | +0.002 |
dog | +0.002 |
Neg logit contributions | |
yourself | -0.003 |
blo | -0.003 |
ich | -0.003 |
yourselves | -0.002 |
majesty | -0.002 |
Token | I |
Token ID | 40 |
Feature activation | +8.23e-03 |
Pos logit contributions | |
inn | +0.003 |
aster | +0.003 |
dog | +0.003 |
eb | +0.003 |
le | +0.003 |
Neg logit contributions | |
blo | -0.002 |
yourself | -0.002 |
aj | -0.002 |
majesty | -0.002 |
yourselves | -0.002 |
Token | have |
Token ID | 423 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
inn | +0.015 |
eb | +0.014 |
aster | +0.014 |
le | +0.014 |
dog | +0.014 |
Neg logit contributions | |
yourself | -0.012 |
blo | -0.011 |
aj | -0.011 |
yourselves | -0.010 |
majesty | -0.010 |
Token | an |
Token ID | 281 |
Feature activation | -9.98e-04 |
Pos logit contributions | |
ich | +0.027 |
blo | +0.027 |
majesty | +0.026 |
inas | +0.026 |
aj | +0.025 |
Neg logit contributions | |
him | -0.015 |
aster | -0.015 |
inn | -0.013 |
dog | -0.013 |
Jim | -0.013 |
Token | extra |
Token ID | 3131 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
aj | +0.002 |
yourselves | +0.002 |
majesty | +0.001 |
Neg logit contributions | |
inn | -0.002 |
eb | -0.001 |
aster | -0.001 |
le | -0.001 |
dog | -0.001 |
Token | belt |
Token ID | 10999 |
Feature activation | +8.56e-03 |
Pos logit contributions | |
yourself | +0.023 |
yourselves | +0.023 |
blo | +0.023 |
ich | +0.021 |
hugging | +0.020 |
Neg logit contributions | |
inn | -0.022 |
aster | -0.021 |
dog | -0.020 |
ah | -0.020 |
war | -0.020 |
Token | in |
Token ID | 287 |
Feature activation | -6.75e-03 |
Pos logit contributions | |
hot | +0.009 |
inn | +0.009 |
him | +0.009 |
le | +0.009 |
dog | +0.009 |
Neg logit contributions | |
blo | -0.018 |
majesty | -0.018 |
yourself | -0.017 |
aj | -0.017 |
ich | -0.017 |
Token | my |
Token ID | 616 |
Feature activation | -2.64e-03 |
Pos logit contributions | |
aj | +0.008 |
majesty | +0.008 |
ich | +0.008 |
blo | +0.007 |
endant | +0.007 |
Neg logit contributions | |
aster | -0.013 |
inn | -0.013 |
him | -0.013 |
eb | -0.012 |
dog | -0.012 |
Token | bag |
Token ID | 6131 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
yourself | +0.003 |
blo | +0.003 |
aj | +0.003 |
yourselves | +0.003 |
majesty | +0.003 |
Neg logit contributions | |
inn | -0.005 |
eb | -0.005 |
aster | -0.005 |
le | -0.005 |
dog | -0.005 |
Token | boy |
Token ID | 2933 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
inn | +0.009 |
war | +0.009 |
eb | +0.008 |
le | +0.008 |
omp | +0.008 |
Neg logit contributions | |
window | -0.007 |
blo | -0.006 |
yourself | -0.006 |
ich | -0.006 |
yourselves | -0.006 |
Token | came |
Token ID | 1625 |
Feature activation | -4.67e-03 |
Pos logit contributions | |
inn | +0.038 |
war | +0.034 |
aster | +0.033 |
eb | +0.033 |
le | +0.033 |
Neg logit contributions | |
yourself | -0.026 |
blo | -0.026 |
window | -0.024 |
ich | -0.024 |
yourselves | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
yourself | +0.008 |
majesty | +0.008 |
aj | +0.008 |
blo | +0.008 |
yourselves | +0.008 |
Neg logit contributions | |
inn | -0.007 |
eb | -0.006 |
le | -0.006 |
dog | -0.006 |
aster | -0.006 |
Token | snatched |
Token ID | 43276 |
Feature activation | -1.53e-03 |
Pos logit contributions | |
yourself | +0.021 |
yourselves | +0.020 |
aj | +0.020 |
majesty | +0.019 |
blo | +0.019 |
Neg logit contributions | |
inn | -0.015 |
dog | -0.014 |
aster | -0.014 |
ny | -0.014 |
him | -0.014 |
Token | her |
Token ID | 607 |
Feature activation | -6.12e-03 |
Pos logit contributions | |
yourself | +0.002 |
my | +0.002 |
yourselves | +0.002 |
myself | +0.001 |
precious | +0.001 |
Neg logit contributions | |
inn | -0.003 |
ah | -0.003 |
aster | -0.003 |
dog | -0.003 |
rost | -0.003 |
Token | t |
Token ID | 256 |
Feature activation | -4.22e-02 |
Pos logit contributions | |
yourself | +0.010 |
blo | +0.010 |
majesty | +0.010 |
aj | +0.010 |
yourselves | +0.010 |
Neg logit contributions | |
inn | -0.010 |
le | -0.009 |
eb | -0.009 |
dog | -0.009 |
him | -0.009 |
Token | eddy |
Token ID | 21874 |
Feature activation | -2.95e-03 |
Pos logit contributions | |
yourself | +0.048 |
aj | +0.043 |
blo | +0.043 |
yourselves | +0.043 |
ich | +0.041 |
Neg logit contributions | |
inn | -0.088 |
aster | -0.085 |
eb | -0.082 |
dog | -0.082 |
le | -0.081 |
Token | bear |
Token ID | 6842 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
yourself | +0.004 |
blo | +0.004 |
aj | +0.004 |
window | +0.004 |
yourselves | +0.004 |
Neg logit contributions | |
inn | -0.005 |
aster | -0.005 |
eb | -0.005 |
war | -0.005 |
omp | -0.005 |
Token | away |
Token ID | 1497 |
Feature activation | -1.90e-03 |
Pos logit contributions | |
inn | +0.020 |
aster | +0.019 |
ah | +0.018 |
omp | +0.018 |
Jim | +0.018 |
Neg logit contributions | |
yourself | -0.015 |
window | -0.013 |
blo | -0.013 |
aj | -0.013 |
yourselves | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | +8.14e-03 |
Pos logit contributions | |
yourself | +0.004 |
majesty | +0.003 |
aj | +0.003 |
blo | +0.003 |
yourselves | +0.003 |
Neg logit contributions | |
inn | -0.003 |
le | -0.002 |
eb | -0.002 |
dog | -0.002 |
aster | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
inn | +0.011 |
eb | +0.011 |
le | +0.011 |
aster | +0.010 |
ah | +0.010 |
Neg logit contributions | |
yourself | -0.015 |
aj | -0.014 |
majesty | -0.014 |
window | -0.014 |
yourselves | -0.014 |
Token | welcome |
Token ID | 7062 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
aj | +0.017 |
ich | +0.015 |
majesty | +0.015 |
endant | +0.015 |
yourself | +0.015 |
Neg logit contributions | |
inn | -0.021 |
him | -0.021 |
aster | -0.020 |
Bob | -0.020 |
Jim | -0.020 |
Token | to |
Token ID | 284 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
yourself | +0.017 |
blo | +0.016 |
aj | +0.016 |
yourselves | +0.016 |
majesty | +0.016 |
Neg logit contributions | |
inn | -0.015 |
eb | -0.015 |
dog | -0.015 |
le | -0.014 |
him | -0.014 |
Token | play |
Token ID | 711 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
yourself | +0.021 |
blo | +0.021 |
aj | +0.020 |
yourselves | +0.020 |
majesty | +0.019 |
Neg logit contributions | |
inn | -0.026 |
aster | -0.025 |
eb | -0.025 |
dog | -0.024 |
le | -0.024 |
Token | in |
Token ID | 287 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
yourself | +0.049 |
blo | +0.049 |
aj | +0.048 |
majesty | +0.046 |
ich | +0.045 |
Neg logit contributions | |
inn | -0.051 |
le | -0.049 |
aster | -0.048 |
dog | -0.048 |
eb | -0.048 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
aj | +0.046 |
blo | +0.046 |
yourself | +0.045 |
majesty | +0.045 |
ich | +0.044 |
Neg logit contributions | |
inn | -0.043 |
aster | -0.043 |
eb | -0.041 |
him | -0.040 |
le | -0.040 |
Token | p |
Token ID | 279 |
Feature activation | -4.87e-02 |
Pos logit contributions | |
yourself | +0.021 |
aj | +0.021 |
majesty | +0.020 |
blo | +0.020 |
yourselves | +0.020 |
Neg logit contributions | |
aster | -0.023 |
inn | -0.023 |
dog | -0.023 |
eb | -0.022 |
le | -0.022 |
Token | udd |
Token ID | 4185 |
Feature activation | +2.90e-03 |
Pos logit contributions | |
yourself | +0.072 |
blo | +0.067 |
yourselves | +0.065 |
majesty | +0.062 |
sending | +0.062 |
Neg logit contributions | |
inn | -0.087 |
eb | -0.081 |
le | -0.079 |
aster | -0.078 |
ah | -0.078 |
Token | les |
Token ID | 829 |
Feature activation | +5.18e-04 |
Pos logit contributions | |
inn | +0.004 |
aster | +0.003 |
war | +0.003 |
Noah | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.006 |
blo | -0.006 |
yourselves | -0.006 |
aj | -0.005 |
window | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
inn | +0.001 |
le | +0.001 |
eb | +0.001 |
aster | +0.001 |
dog | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
blo | -0.001 |
aj | -0.001 |
majesty | -0.001 |
yourselves | -0.001 |
Token | but |
Token ID | 475 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
yourself | +0.023 |
aj | +0.023 |
majesty | +0.023 |
blo | +0.023 |
yourselves | +0.022 |
Neg logit contributions | |
inn | -0.016 |
him | -0.015 |
aster | -0.015 |
dog | -0.015 |
Jim | -0.015 |
Token | please |
Token ID | 3387 |
Feature activation | -7.28e-03 |
Pos logit contributions | |
aj | +0.015 |
majesty | +0.013 |
yourself | +0.013 |
ich | +0.013 |
blo | +0.013 |
Neg logit contributions | |
him | -0.020 |
inn | -0.020 |
aster | -0.019 |
Bob | -0.019 |
Finn | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
blo | +0.003 |
yourself | +0.003 |
aj | +0.003 |
window | +0.003 |
ich | +0.002 |
Neg logit contributions | |
inn | -0.004 |
aster | -0.004 |
eb | -0.003 |
war | -0.003 |
omp | -0.003 |
Token | said |
Token ID | 531 |
Feature activation | +2.63e-03 |
Pos logit contributions | |
inn | +0.028 |
eb | +0.028 |
aster | +0.028 |
le | +0.027 |
dog | +0.027 |
Neg logit contributions | |
yourself | -0.029 |
yourselves | -0.027 |
aj | -0.027 |
blo | -0.027 |
ich | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
inn | +0.003 |
eb | +0.003 |
aster | +0.003 |
le | +0.003 |
dog | +0.003 |
Neg logit contributions | |
yourself | -0.005 |
blo | -0.005 |
yourselves | -0.005 |
aj | -0.005 |
ich | -0.005 |
Token | " |
Token ID | 366 |
Feature activation | +5.98e-03 |
Pos logit contributions | |
inn | +0.002 |
dog | +0.001 |
eb | +0.001 |
him | +0.001 |
aster | +0.001 |
Neg logit contributions | |
yourself | -0.002 |
yourselves | -0.002 |
aj | -0.002 |
majesty | -0.002 |
blo | -0.002 |
Token | Good |
Token ID | 10248 |
Feature activation | -1.06e-03 |
Pos logit contributions | |
inn | +0.012 |
aster | +0.011 |
eb | +0.011 |
le | +0.011 |
war | +0.011 |
Neg logit contributions | |
yourself | -0.008 |
blo | -0.007 |
yourselves | -0.007 |
aj | -0.007 |
ich | -0.007 |
Token | bye |
Token ID | 16390 |
Feature activation | -4.23e-02 |
Pos logit contributions | |
yourself | +0.002 |
blo | +0.002 |
aj | +0.002 |
yourselves | +0.002 |
majesty | +0.002 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
le | -0.001 |
dog | -0.001 |
ah | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -3.60e-02 |
Pos logit contributions | |
yourself | +0.070 |
blo | +0.066 |
yourselves | +0.065 |
aj | +0.064 |
majesty | +0.062 |
Neg logit contributions | |
inn | -0.066 |
eb | -0.063 |
aster | -0.062 |
dog | -0.062 |
le | -0.062 |
Token | clumsy |
Token ID | 39120 |
Feature activation | -5.95e-03 |
Pos logit contributions | |
yourself | +0.077 |
blo | +0.074 |
aj | +0.073 |
yourselves | +0.072 |
majesty | +0.071 |
Neg logit contributions | |
inn | -0.040 |
eb | -0.036 |
aster | -0.036 |
dog | -0.035 |
le | -0.035 |
Token | beetle |
Token ID | 45489 |
Feature activation | -4.56e-04 |
Pos logit contributions | |
yourself | +0.009 |
blo | +0.009 |
yourselves | +0.008 |
aj | +0.008 |
majesty | +0.008 |
Neg logit contributions | |
inn | -0.010 |
eb | -0.009 |
aster | -0.009 |
le | -0.009 |
war | -0.009 |
Token | ! |
Token ID | 0 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
yourself | +0.001 |
yourselves | +0.001 |
aj | +0.001 |
blo | +0.001 |
ich | +0.001 |
Neg logit contributions | |
le | -0.001 |
ah | -0.001 |
ny | -0.001 |
eb | -0.001 |
dog | -0.001 |
Token | I |
Token ID | 314 |
Feature activation | +6.00e-03 |
Pos logit contributions | |
blo | +0.020 |
yourself | +0.020 |
aj | +0.019 |
yourselves | +0.018 |
window | +0.018 |
Neg logit contributions | |
inn | -0.029 |
eb | -0.028 |
dog | -0.027 |
aster | -0.027 |
hot | -0.026 |
Token | why |
Token ID | 1521 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
yourself | +0.039 |
blo | +0.038 |
aj | +0.038 |
yourselves | +0.037 |
ich | +0.036 |
Neg logit contributions | |
inn | -0.039 |
aster | -0.038 |
eb | -0.037 |
him | -0.037 |
dog | -0.036 |
Token | are |
Token ID | 389 |
Feature activation | -9.85e-04 |
Pos logit contributions | |
inn | +0.029 |
aster | +0.028 |
eb | +0.028 |
le | +0.027 |
dog | +0.027 |
Neg logit contributions | |
yourself | -0.023 |
blo | -0.022 |
aj | -0.021 |
majesty | -0.021 |
yourselves | -0.021 |
Token | you |
Token ID | 345 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
aj | +0.001 |
majesty | +0.001 |
yourselves | +0.001 |
Neg logit contributions | |
inn | -0.002 |
aster | -0.002 |
eb | -0.002 |
dog | -0.002 |
le | -0.002 |
Token | moving |
Token ID | 3867 |
Feature activation | -3.13e-03 |
Pos logit contributions | |
inn | +0.034 |
him | +0.032 |
aster | +0.031 |
eb | +0.031 |
omp | +0.031 |
Neg logit contributions | |
majesty | -0.024 |
endant | -0.023 |
yourself | -0.023 |
aj | -0.022 |
blo | -0.022 |
Token | my |
Token ID | 616 |
Feature activation | -8.99e-03 |
Pos logit contributions | |
blo | +0.005 |
majesty | +0.005 |
yourself | +0.005 |
aj | +0.005 |
ich | +0.005 |
Neg logit contributions | |
inn | -0.005 |
aster | -0.005 |
him | -0.005 |
le | -0.005 |
dog | -0.005 |
Token | bed |
Token ID | 3996 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
yourself | +0.015 |
blo | +0.014 |
yourselves | +0.014 |
Nothing | +0.013 |
endant | +0.013 |
Neg logit contributions | |
dog | -0.013 |
aster | -0.013 |
inn | -0.013 |
le | -0.013 |
him | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | -4.41e-03 |
Pos logit contributions | |
blo | +0.048 |
majesty | +0.048 |
yourself | +0.047 |
ich | +0.044 |
yourselves | +0.043 |
Neg logit contributions | |
inn | -0.077 |
le | -0.075 |
aster | -0.072 |
dog | -0.072 |
eb | -0.071 |
Token | my |
Token ID | 616 |
Feature activation | -4.97e-03 |
Pos logit contributions | |
ich | +0.006 |
aj | +0.006 |
blo | +0.006 |
endant | +0.006 |
reetings | +0.006 |
Neg logit contributions | |
him | -0.007 |
aster | -0.007 |
Bob | -0.007 |
Jim | -0.006 |
dog | -0.006 |
Token | toys |
Token ID | 14958 |
Feature activation | -4.43e-02 |
Pos logit contributions | |
yourself | +0.008 |
yourselves | +0.007 |
blo | +0.007 |
ich | +0.007 |
endant | +0.006 |
Neg logit contributions | |
dog | -0.008 |
aster | -0.008 |
inn | -0.008 |
le | -0.007 |
him | -0.007 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
majesty | +0.059 |
blo | +0.056 |
ich | +0.055 |
yourself | +0.053 |
aj | +0.052 |
Neg logit contributions | |
him | -0.081 |
le | -0.078 |
aster | -0.077 |
inn | -0.077 |
dog | -0.076 |
Token | His |
Token ID | 2399 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
inn | +0.027 |
eb | +0.024 |
aster | +0.024 |
dog | +0.024 |
le | +0.023 |
Neg logit contributions | |
yourself | -0.040 |
blo | -0.038 |
aj | -0.037 |
yourselves | -0.037 |
majesty | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | -6.67e-04 |
Pos logit contributions | |
le | +0.001 |
inn | +0.001 |
him | +0.001 |
dog | +0.001 |
eb | +0.001 |
Neg logit contributions | |
yourself | -0.001 |
aj | -0.001 |
majesty | -0.001 |
yourselves | -0.001 |
blo | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -5.97e-03 |
Pos logit contributions | |
yourself | +0.001 |
blo | +0.001 |
yourselves | +0.001 |
aj | +0.001 |
majesty | +0.001 |
Neg logit contributions | |
inn | -0.001 |
eb | -0.001 |
aster | -0.001 |
le | -0.001 |
ah | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
yourself | +0.010 |
blo | +0.009 |
aj | +0.009 |
majesty | +0.009 |
yourselves | +0.009 |
Neg logit contributions | |
inn | -0.010 |
aster | -0.009 |
eb | -0.009 |
dog | -0.009 |
le | -0.009 |
Token | " |
Token ID | 1 |
Feature activation | -3.93e-03 |
Pos logit contributions | |
yourself | +0.016 |
blo | +0.016 |
aj | +0.016 |
majesty | +0.016 |
yourselves | +0.015 |
Neg logit contributions | |
inn | -0.019 |
aster | -0.018 |
eb | -0.018 |
le | -0.017 |
dog | -0.017 |
Token | Wow |
Token ID | 22017 |
Feature activation | -7.23e-03 |
Pos logit contributions | |
yourself | +0.006 |
aj | +0.006 |
blo | +0.005 |
majesty | +0.005 |
yourselves | +0.005 |
Neg logit contributions | |
inn | -0.007 |
dog | -0.007 |
eb | -0.007 |
le | -0.007 |
aster | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -4.35e-02 |
Pos logit contributions | |
yourself | +0.012 |
blo | +0.012 |
aj | +0.012 |
yourselves | +0.011 |
majesty | +0.011 |
Neg logit contributions | |
inn | -0.011 |
eb | -0.010 |
aster | -0.010 |
le | -0.010 |
dog | -0.010 |
Token | you |
Token ID | 345 |
Feature activation | +5.33e-03 |
Pos logit contributions | |
yourself | +0.072 |
blo | +0.068 |
yourselves | +0.066 |
majesty | +0.065 |
aj | +0.064 |
Neg logit contributions | |
inn | -0.073 |
eb | -0.066 |
aster | -0.065 |
le | -0.065 |
dog | -0.064 |
Token | can |
Token ID | 460 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
eb | +0.007 |
le | +0.007 |
ah | +0.007 |
him | +0.007 |
inn | +0.006 |
Neg logit contributions | |
aj | -0.010 |
yourself | -0.009 |
yourselves | -0.009 |
ich | -0.009 |
blo | -0.009 |
Token | talk |
Token ID | 1561 |
Feature activation | -9.98e-03 |
Pos logit contributions | |
aj | +0.019 |
yourself | +0.019 |
yourselves | +0.018 |
blo | +0.018 |
majesty | +0.018 |
Neg logit contributions | |
inn | -0.019 |
le | -0.019 |
aster | -0.018 |
dog | -0.018 |
eb | -0.018 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
aj | +0.017 |
majesty | +0.017 |
yourself | +0.017 |
blo | +0.017 |
ich | +0.017 |
Neg logit contributions | |
le | -0.014 |
him | -0.014 |
inn | -0.014 |
dog | -0.013 |
eb | -0.013 |
Token | Lily |
Token ID | 20037 |
Feature activation | -7.33e-03 |
Pos logit contributions | |
inn | +0.035 |
eb | +0.032 |
le | +0.031 |
war | +0.030 |
ah | +0.030 |
Neg logit contributions | |
yourself | -0.042 |
blo | -0.041 |
yourselves | -0.040 |
window | -0.039 |
aj | -0.039 |