Token | had |
Token ID | 550 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
storm | +0.010 |
liv | +0.010 |
ugg | +0.010 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.012 |
forward | -0.011 |
out | -0.010 |
Token | saved |
Token ID | 7448 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ller | +0.029 |
xt | +0.028 |
liv | +0.027 |
ugg | +0.026 |
storm | +0.026 |
Neg logit contributions | |
questions | -0.028 |
groups | -0.027 |
triple | -0.025 |
forward | -0.024 |
out | -0.024 |
Token | him |
Token ID | 683 |
Feature activation | -1.92e-03 |
Pos logit contributions | |
Twe | +0.021 |
ller | +0.020 |
xt | +0.020 |
Karen | +0.019 |
Stella | +0.019 |
Neg logit contributions | |
groups | -0.018 |
triple | -0.017 |
questions | -0.017 |
increasingly | -0.016 |
ibr | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +1.14e-03 |
Pos logit contributions | |
triple | +0.003 |
questions | +0.003 |
cabinets | +0.003 |
groups | +0.003 |
iam | +0.003 |
Neg logit contributions | |
ller | -0.003 |
Twe | -0.002 |
xt | -0.002 |
bye | -0.002 |
Blue | -0.002 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.88e-03 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
storm | +0.002 |
liv | +0.002 |
leanor | +0.002 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
brothers | -0.001 |
forward | -0.001 |
Token | Charl |
Token ID | 24453 |
Feature activation | +7.69e-02 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.003 |
liv | +0.003 |
ugg | +0.003 |
storm | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | otte |
Token ID | 11404 |
Feature activation | +2.71e-02 |
Pos logit contributions | |
ller | +0.107 |
storm | +0.097 |
bye | +0.097 |
mm | +0.096 |
liv | +0.095 |
Neg logit contributions | |
groups | -0.131 |
questions | -0.127 |
triple | -0.121 |
forward | -0.119 |
into | -0.118 |
Token | and |
Token ID | 290 |
Feature activation | -3.44e-04 |
Pos logit contributions | |
ller | +0.056 |
xt | +0.055 |
liv | +0.053 |
ugg | +0.051 |
storm | +0.051 |
Neg logit contributions | |
questions | -0.031 |
groups | -0.029 |
triple | -0.027 |
forward | -0.025 |
out | -0.025 |
Token | her |
Token ID | 607 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
forward | +0.000 |
out | +0.000 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.001 |
ugg | -0.001 |
leanor | -0.001 |
Token | mom |
Token ID | 1995 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
xt | +0.036 |
ller | +0.036 |
ugg | +0.033 |
leanor | +0.033 |
liv | +0.033 |
Neg logit contributions | |
groups | -0.022 |
questions | -0.021 |
triple | -0.019 |
forward | -0.018 |
increasingly | -0.018 |
Token | were |
Token ID | 547 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
ller | +0.031 |
xt | +0.031 |
liv | +0.029 |
ugg | +0.029 |
storm | +0.028 |
Neg logit contributions | |
questions | -0.024 |
groups | -0.023 |
triple | -0.021 |
forward | -0.020 |
out | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
ller | +0.046 |
xt | +0.045 |
liv | +0.043 |
ugg | +0.042 |
leanor | +0.042 |
Neg logit contributions | |
questions | -0.025 |
groups | -0.025 |
triple | -0.023 |
out | -0.022 |
into | -0.021 |
Token | green |
Token ID | 4077 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
ller | +0.049 |
xt | +0.048 |
liv | +0.046 |
ugg | +0.045 |
storm | +0.045 |
Neg logit contributions | |
questions | -0.027 |
groups | -0.026 |
triple | -0.024 |
out | -0.023 |
forward | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
ller | +0.021 |
xt | +0.020 |
storm | +0.019 |
liv | +0.019 |
ugg | +0.019 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
forward | -0.009 |
brothers | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.021 |
storm | +0.020 |
liv | +0.020 |
bye | +0.020 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.014 |
out | -0.013 |
forward | -0.013 |
into | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +5.35e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
out | +0.002 |
forward | +0.002 |
triple | +0.002 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.007 |
storm | -0.007 |
sed | -0.007 |
bye | -0.007 |
Token | Charl |
Token ID | 24453 |
Feature activation | +7.23e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.009 |
ugg | +0.009 |
storm | +0.009 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.006 |
forward | -0.006 |
out | -0.006 |
Token | otte |
Token ID | 11404 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
ller | +0.124 |
mm | +0.119 |
bye | +0.118 |
storm | +0.117 |
Twe | +0.116 |
Neg logit contributions | |
groups | -0.094 |
forward | -0.093 |
questions | -0.092 |
into | -0.087 |
triple | -0.085 |
Token | 's |
Token ID | 338 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
ller | +0.033 |
xt | +0.032 |
liv | +0.031 |
storm | +0.030 |
ugg | +0.030 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
triple | -0.017 |
out | -0.016 |
into | -0.016 |
Token | mom |
Token ID | 1995 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
triple | +0.006 |
increasingly | +0.006 |
iece | +0.006 |
Neg logit contributions | |
sed | -0.005 |
xt | -0.005 |
ller | -0.005 |
ugg | -0.005 |
bye | -0.004 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.018 |
liv | +0.017 |
ugg | +0.016 |
storm | +0.016 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.019 |
triple | -0.018 |
forward | -0.017 |
out | -0.017 |
Token | at |
Token ID | 379 |
Feature activation | +2.67e-03 |
Pos logit contributions | |
triple | +0.016 |
groups | +0.015 |
questions | +0.014 |
ibr | +0.014 |
cabinets | +0.014 |
Neg logit contributions | |
ller | -0.018 |
xt | -0.016 |
bye | -0.016 |
Twe | -0.015 |
Raven | -0.014 |
Token | that |
Token ID | 326 |
Feature activation | +5.48e-03 |
Pos logit contributions | |
questions | +0.036 |
groups | +0.036 |
triple | +0.035 |
forward | +0.032 |
brothers | +0.032 |
Neg logit contributions | |
ller | -0.029 |
xt | -0.028 |
storm | -0.025 |
liv | -0.025 |
seven | -0.025 |
Token | !" |
Token ID | 2474 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.007 |
storm | +0.007 |
liv | +0.007 |
bye | +0.007 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.009 |
forward | -0.009 |
brothers | -0.008 |
Token | |
Token ID | 220 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
ller | +0.030 |
xt | +0.030 |
storm | +0.029 |
liv | +0.028 |
seven | +0.027 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
out | -0.017 |
forward | -0.017 |
into | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +7.30e-03 |
Pos logit contributions | |
ller | +0.026 |
xt | +0.025 |
liv | +0.024 |
storm | +0.024 |
ugg | +0.024 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.016 |
triple | -0.015 |
forward | -0.014 |
out | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.017 |
storm | +0.016 |
bye | +0.016 |
round | +0.016 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
out | -0.005 |
forward | -0.005 |
into | -0.005 |
Token | Charl |
Token ID | 24453 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
ller | +0.020 |
xt | +0.019 |
storm | +0.018 |
liv | +0.017 |
ugg | +0.017 |
Neg logit contributions | |
questions | -0.025 |
groups | -0.024 |
triple | -0.023 |
forward | -0.022 |
out | -0.022 |
Token | otte |
Token ID | 11404 |
Feature activation | +5.81e-03 |
Pos logit contributions | |
ller | +0.120 |
bye | +0.115 |
storm | +0.115 |
Twe | +0.115 |
mm | +0.114 |
Neg logit contributions | |
groups | -0.077 |
forward | -0.077 |
questions | -0.074 |
into | -0.071 |
at | -0.067 |
Token | thanked |
Token ID | 26280 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.009 |
ugg | +0.009 |
storm | +0.009 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.008 |
triple | -0.008 |
forward | -0.007 |
out | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | +1.18e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.021 |
liv | +0.020 |
ugg | +0.020 |
leanor | +0.020 |
Neg logit contributions | |
groups | -0.011 |
questions | -0.011 |
triple | -0.011 |
forward | -0.009 |
out | -0.009 |
Token | mother |
Token ID | 2802 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
bye | +0.002 |
Stella | +0.002 |
Dove | +0.002 |
Neg logit contributions | |
triple | -0.002 |
groups | -0.002 |
questions | -0.002 |
and | -0.002 |
increasingly | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | -9.40e-03 |
Pos logit contributions | |
groups | +0.016 |
triple | +0.016 |
increasingly | +0.014 |
ibr | +0.014 |
ports | +0.014 |
Neg logit contributions | |
ller | -0.019 |
ugg | -0.018 |
bye | -0.018 |
xt | -0.018 |
zy | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | +5.94e-03 |
Pos logit contributions | |
questions | +0.019 |
groups | +0.018 |
triple | +0.016 |
forward | +0.015 |
out | +0.015 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.037 |
liv | -0.035 |
ugg | -0.034 |
storm | -0.034 |
Token | shed |
Token ID | 14999 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
ller | +0.010 |
storm | +0.010 |
xt | +0.009 |
bow | +0.009 |
liv | +0.009 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.007 |
ac | -0.007 |
ices | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ller | +0.024 |
xt | +0.024 |
liv | +0.022 |
storm | +0.022 |
ugg | +0.022 |
Neg logit contributions | |
questions | -0.017 |
triple | -0.016 |
groups | -0.016 |
forward | -0.014 |
increasingly | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -2.31e-04 |
Pos logit contributions | |
ller | +0.020 |
xt | +0.020 |
liv | +0.019 |
storm | +0.018 |
ugg | +0.018 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.020 |
triple | -0.019 |
out | -0.018 |
forward | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | +9.97e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
forward | +0.000 |
out | +0.000 |
Neg logit contributions | |
ller | -0.000 |
xt | -0.000 |
storm | -0.000 |
liv | -0.000 |
ugg | -0.000 |
Token | Charl |
Token ID | 24453 |
Feature activation | +6.60e-02 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.018 |
liv | +0.017 |
ugg | +0.016 |
storm | +0.016 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.013 |
triple | -0.012 |
forward | -0.012 |
out | -0.012 |
Token | otte |
Token ID | 11404 |
Feature activation | +9.91e-03 |
Pos logit contributions | |
ller | +0.115 |
bye | +0.112 |
mm | +0.111 |
storm | +0.110 |
Twe | +0.110 |
Neg logit contributions | |
questions | -0.085 |
groups | -0.083 |
forward | -0.082 |
into | -0.076 |
at | -0.074 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.017 |
liv | +0.016 |
ugg | +0.015 |
leanor | +0.015 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.014 |
triple | -0.013 |
forward | -0.013 |
out | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +5.41e-03 |
Pos logit contributions | |
xt | +0.019 |
ller | +0.019 |
liv | +0.018 |
ugg | +0.018 |
round | +0.018 |
Neg logit contributions | |
groups | -0.012 |
questions | -0.012 |
triple | -0.011 |
brothers | -0.011 |
ac | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | -3.80e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.011 |
ugg | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
triple | -0.005 |
forward | -0.005 |
out | -0.005 |
Token | shed |
Token ID | 14999 |
Feature activation | +4.88e-03 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
ac | +0.005 |
triple | +0.004 |
forward | +0.004 |
Neg logit contributions | |
ller | -0.006 |
liv | -0.006 |
leanor | -0.006 |
Karen | -0.006 |
xt | -0.006 |
Token | full |
Token ID | 1336 |
Feature activation | +6.19e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
triple | +0.007 |
forward | +0.006 |
brothers | +0.006 |
Neg logit contributions | |
ller | -0.014 |
xt | -0.013 |
liv | -0.013 |
Twe | -0.012 |
storm | -0.012 |
Token | of |
Token ID | 286 |
Feature activation | -5.12e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
ugg | +0.012 |
bye | +0.012 |
storm | +0.012 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
triple | -0.006 |
increasingly | -0.005 |
forward | -0.005 |
Token | love |
Token ID | 1842 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
triple | +0.007 |
groups | +0.007 |
forward | +0.007 |
questions | +0.006 |
into | +0.006 |
Neg logit contributions | |
xt | -0.008 |
ller | -0.008 |
Twe | -0.008 |
Karen | -0.008 |
ugg | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +8.24e-03 |
Pos logit contributions | |
ller | +0.030 |
xt | +0.029 |
storm | +0.028 |
ugg | +0.027 |
bye | +0.027 |
Neg logit contributions | |
groups | -0.020 |
questions | -0.019 |
triple | -0.019 |
increasingly | -0.017 |
forward | -0.017 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.49e-03 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.017 |
storm | +0.016 |
liv | +0.016 |
ugg | +0.015 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.008 |
forward | -0.007 |
out | -0.007 |
Token | Sad |
Token ID | 26699 |
Feature activation | +6.32e-02 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.010 |
liv | +0.010 |
ugg | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.006 |
forward | -0.006 |
out | -0.006 |
Token | ie |
Token ID | 494 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
ller | +0.111 |
xt | +0.110 |
liv | +0.106 |
storm | +0.103 |
ugg | +0.103 |
Neg logit contributions | |
questions | -0.087 |
groups | -0.083 |
triple | -0.076 |
out | -0.074 |
brothers | -0.074 |
Token | was |
Token ID | 373 |
Feature activation | +1.75e-03 |
Pos logit contributions | |
ller | +0.038 |
xt | +0.037 |
liv | +0.036 |
storm | +0.035 |
ugg | +0.034 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.019 |
triple | -0.018 |
out | -0.017 |
into | -0.016 |
Token | feeling |
Token ID | 4203 |
Feature activation | +4.33e-03 |
Pos logit contributions | |
xt | +0.003 |
ller | +0.003 |
liv | +0.003 |
Twe | +0.003 |
ugg | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
cabinets | -0.002 |
ports | -0.002 |
Token | angry |
Token ID | 7954 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
xt | +0.009 |
ller | +0.009 |
ugg | +0.008 |
liv | +0.008 |
Twe | +0.008 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.004 |
forward | -0.004 |
brothers | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ller | +0.014 |
xt | +0.014 |
storm | +0.013 |
ugg | +0.012 |
bye | +0.012 |
Neg logit contributions | |
groups | -0.010 |
questions | -0.010 |
triple | -0.010 |
increasingly | -0.008 |
forward | -0.008 |
Token | found |
Token ID | 1043 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
liv | +0.000 |
ugg | +0.000 |
storm | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
out | -0.000 |
Token | it |
Token ID | 340 |
Feature activation | +1.70e-03 |
Pos logit contributions | |
questions | +0.025 |
groups | +0.024 |
triple | +0.023 |
out | +0.022 |
forward | +0.022 |
Neg logit contributions | |
ller | -0.026 |
xt | -0.026 |
liv | -0.024 |
ugg | -0.024 |
storm | -0.024 |
Token | !" |
Token ID | 2474 |
Feature activation | +3.16e-03 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
liv | +0.002 |
storm | +0.002 |
ugg | +0.002 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
brothers | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.005 |
storm | +0.005 |
ugg | +0.005 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.004 |
triple | -0.004 |
out | -0.004 |
forward | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -3.27e-03 |
Pos logit contributions | |
questions | +0.012 |
groups | +0.011 |
out | +0.010 |
forward | +0.010 |
into | +0.010 |
Neg logit contributions | |
ller | -0.025 |
xt | -0.025 |
storm | -0.024 |
liv | -0.023 |
seven | -0.023 |
Token | Charl |
Token ID | 24453 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.004 |
forward | +0.004 |
out | +0.004 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.005 |
liv | -0.005 |
ugg | -0.005 |
storm | -0.005 |
Token | otte |
Token ID | 11404 |
Feature activation | +7.31e-03 |
Pos logit contributions | |
ller | +0.109 |
storm | +0.106 |
Twe | +0.105 |
bye | +0.105 |
mm | +0.105 |
Neg logit contributions | |
forward | -0.073 |
questions | -0.073 |
groups | -0.072 |
into | -0.067 |
at | -0.064 |
Token | and |
Token ID | 290 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
liv | +0.012 |
ugg | +0.011 |
storm | +0.011 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.010 |
triple | -0.010 |
forward | -0.009 |
out | -0.009 |
Token | her |
Token ID | 607 |
Feature activation | -7.06e-03 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.012 |
triple | +0.011 |
out | +0.010 |
forward | +0.010 |
Neg logit contributions | |
ller | -0.034 |
xt | -0.034 |
liv | -0.032 |
storm | -0.032 |
ugg | -0.032 |
Token | mom |
Token ID | 1995 |
Feature activation | -4.61e-03 |
Pos logit contributions | |
questions | +0.009 |
groups | +0.008 |
triple | +0.008 |
forward | +0.007 |
out | +0.007 |
Neg logit contributions | |
ller | -0.014 |
xt | -0.014 |
liv | -0.013 |
ugg | -0.013 |
storm | -0.013 |
Token | brought |
Token ID | 3181 |
Feature activation | -7.06e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.007 |
triple | +0.007 |
increasingly | +0.006 |
forward | +0.006 |
Neg logit contributions | |
xt | -0.007 |
liv | -0.007 |
ller | -0.007 |
ugg | -0.007 |
Karen | -0.006 |
Token | â |
Token ID | 22940 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.010 |
triple | +0.010 |
forward | +0.009 |
out | +0.009 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.008 |
liv | -0.007 |
storm | -0.007 |
ugg | -0.007 |
Token | € |
Token ID | 26391 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
ller | +0.007 |
xt | +0.006 |
sed | +0.006 |
llers | +0.006 |
spe | +0.006 |
Neg logit contributions | |
forward | -0.007 |
questions | -0.007 |
out | -0.006 |
un | -0.006 |
at | -0.006 |
Token | |
Token ID | 220 |
Feature activation | +2.55e-03 |
Pos logit contributions | |
ller | +0.030 |
storm | +0.029 |
ugg | +0.029 |
xt | +0.029 |
seven | +0.029 |
Neg logit contributions | |
at | -0.026 |
triple | -0.025 |
groups | -0.025 |
� | -0.025 |
un | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.005 |
liv | +0.005 |
storm | +0.005 |
ugg | +0.004 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
out | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e-03 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.012 |
triple | +0.011 |
out | +0.010 |
forward | +0.010 |
Neg logit contributions | |
ller | -0.026 |
xt | -0.025 |
storm | -0.024 |
liv | -0.024 |
ugg | -0.023 |
Token | Charl |
Token ID | 24453 |
Feature activation | +6.03e-02 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.002 |
ugg | -0.002 |
storm | -0.002 |
Token | otte |
Token ID | 11404 |
Feature activation | +6.07e-03 |
Pos logit contributions | |
ller | +0.119 |
bye | +0.115 |
hy | +0.111 |
mm | +0.111 |
Twe | +0.109 |
Neg logit contributions | |
groups | -0.064 |
forward | -0.055 |
questions | -0.052 |
at | -0.051 |
into | -0.051 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.50e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.009 |
storm | +0.009 |
ugg | +0.009 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.009 |
out | -0.008 |
forward | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -5.92e-03 |
Pos logit contributions | |
triple | +0.020 |
groups | +0.019 |
questions | +0.019 |
cabinets | +0.018 |
ports | +0.016 |
Neg logit contributions | |
ller | -0.027 |
bye | -0.025 |
xt | -0.025 |
Twe | -0.024 |
ugg | -0.023 |
Token | said |
Token ID | 531 |
Feature activation | -3.48e-03 |
Pos logit contributions | |
questions | +0.008 |
at | +0.007 |
out | +0.007 |
into | +0.007 |
triple | +0.007 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.010 |
storm | -0.010 |
llers | -0.010 |
liv | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.003 |
triple | +0.003 |
out | +0.003 |
forward | +0.003 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
liv | -0.007 |
storm | -0.007 |
leanor | -0.007 |
Token | park |
Token ID | 3952 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
liv | +0.010 |
xt | +0.010 |
storm | +0.009 |
ugg | +0.009 |
Twe | +0.009 |
Neg logit contributions | |
questions | -0.012 |
ac | -0.011 |
forward | -0.011 |
iers | -0.010 |
groups | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
ller | +0.052 |
xt | +0.052 |
liv | +0.048 |
bye | +0.048 |
storm | +0.047 |
Neg logit contributions | |
questions | -0.046 |
groups | -0.042 |
triple | -0.041 |
forward | -0.039 |
increasingly | -0.038 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.06e-04 |
Pos logit contributions | |
ller | +0.020 |
xt | +0.019 |
ugg | +0.018 |
storm | +0.018 |
leanor | +0.017 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.017 |
triple | -0.015 |
out | -0.015 |
at | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +5.07e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
forward | +0.000 |
triple | +0.000 |
increasingly | +0.000 |
Neg logit contributions | |
ller | -0.000 |
xt | -0.000 |
liv | -0.000 |
leanor | -0.000 |
storm | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | +5.37e-03 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.008 |
liv | +0.008 |
seven | +0.008 |
leanor | +0.008 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.006 |
ices | -0.006 |
triple | -0.006 |
invitations | -0.005 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.87e-02 |
Pos logit contributions | |
ller | +0.005 |
liv | +0.005 |
leanor | +0.005 |
storm | +0.005 |
bye | +0.005 |
Neg logit contributions | |
groups | -0.011 |
questions | -0.011 |
triple | -0.010 |
ices | -0.010 |
forward | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +5.37e-03 |
Pos logit contributions | |
ller | +0.150 |
xt | +0.149 |
liv | +0.145 |
ugg | +0.144 |
leanor | +0.141 |
Neg logit contributions | |
questions | -0.033 |
groups | -0.030 |
triple | -0.026 |
out | -0.025 |
at | -0.025 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.009 |
storm | +0.008 |
bow | +0.008 |
ugg | +0.008 |
Neg logit contributions | |
questions | -0.008 |
triple | -0.008 |
groups | -0.008 |
out | -0.007 |
brothers | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | +6.69e-04 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
liv | +0.002 |
ugg | +0.002 |
leanor | +0.002 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +4.57e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
leanor | +0.001 |
ugg | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
forward | -0.001 |
out | -0.001 |
Token | h |
Token ID | 289 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
liv | +0.008 |
leanor | +0.007 |
ller | +0.007 |
storm | +0.007 |
xt | +0.007 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
triple | -0.005 |
forward | -0.005 |
ices | -0.005 |
Token | park |
Token ID | 3952 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
xt | +0.016 |
liv | +0.016 |
Twe | +0.015 |
storm | +0.015 |
Raven | +0.015 |
Neg logit contributions | |
questions | -0.018 |
ac | -0.016 |
ices | -0.016 |
triple | -0.015 |
forward | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
xt | +0.035 |
ller | +0.034 |
bye | +0.033 |
lla | +0.032 |
bow | +0.032 |
Neg logit contributions | |
questions | -0.043 |
triple | -0.041 |
groups | -0.038 |
increasingly | -0.037 |
ey | -0.037 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.65e-03 |
Pos logit contributions | |
xt | +0.015 |
ller | +0.014 |
liv | +0.013 |
Stella | +0.013 |
bow | +0.013 |
Neg logit contributions | |
questions | -0.026 |
forward | -0.025 |
triple | -0.024 |
groups | -0.023 |
out | -0.023 |
Token | was |
Token ID | 373 |
Feature activation | +5.10e-03 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
liv | +0.003 |
ugg | +0.002 |
storm | +0.002 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +8.67e-03 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.010 |
leanor | +0.009 |
seven | +0.009 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.005 |
triple | -0.005 |
forward | -0.005 |
brothers | -0.004 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.83e-02 |
Pos logit contributions | |
liv | +0.011 |
ller | +0.010 |
Raven | +0.010 |
leanor | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.015 |
triple | -0.014 |
ices | -0.014 |
into | -0.014 |
Token | and |
Token ID | 290 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ller | +0.147 |
xt | +0.145 |
liv | +0.141 |
ugg | +0.140 |
seven | +0.138 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.034 |
triple | -0.028 |
out | -0.027 |
into | -0.026 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.51e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.021 |
storm | +0.020 |
llers | +0.019 |
ugg | +0.019 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.015 |
triple | -0.015 |
forward | -0.014 |
out | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +1.27e-04 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
xt | -0.004 |
ller | -0.004 |
liv | -0.004 |
leanor | -0.004 |
ugg | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +6.35e-03 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
liv | +0.000 |
ugg | +0.000 |
storm | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
out | -0.000 |
Token | h |
Token ID | 289 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
liv | +0.010 |
storm | +0.010 |
leanor | +0.010 |
seven | +0.010 |
Raven | +0.010 |
Neg logit contributions | |
groups | -0.009 |
questions | -0.009 |
ices | -0.008 |
forward | -0.008 |
ports | -0.008 |
Token | park |
Token ID | 3952 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
liv | +0.015 |
xt | +0.015 |
storm | +0.014 |
Twe | +0.014 |
bye | +0.014 |
Neg logit contributions | |
questions | -0.019 |
ac | -0.017 |
ices | -0.016 |
iers | -0.016 |
forward | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
xt | +0.036 |
ller | +0.035 |
bye | +0.033 |
lla | +0.032 |
bow | +0.032 |
Neg logit contributions | |
questions | -0.042 |
triple | -0.040 |
groups | -0.037 |
increasingly | -0.036 |
ey | -0.035 |
Token | Tim |
Token ID | 5045 |
Feature activation | -2.68e-03 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.023 |
liv | +0.021 |
storm | +0.020 |
ugg | +0.020 |
Neg logit contributions | |
questions | -0.030 |
groups | -0.028 |
triple | -0.027 |
forward | -0.027 |
out | -0.026 |
Token | was |
Token ID | 373 |
Feature activation | +5.80e-03 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.004 |
out | +0.004 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.004 |
leanor | -0.004 |
storm | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +6.88e-03 |
Pos logit contributions | |
xt | +0.010 |
ller | +0.010 |
liv | +0.010 |
Twe | +0.010 |
seven | +0.010 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
ices | -0.006 |
triple | -0.006 |
invitations | -0.006 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.82e-02 |
Pos logit contributions | |
liv | +0.008 |
Raven | +0.008 |
storm | +0.007 |
ller | +0.007 |
leanor | +0.007 |
Neg logit contributions | |
groups | -0.013 |
questions | -0.013 |
ices | -0.012 |
triple | -0.012 |
into | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +7.28e-03 |
Pos logit contributions | |
ller | +0.144 |
xt | +0.142 |
liv | +0.137 |
ugg | +0.136 |
leanor | +0.134 |
Neg logit contributions | |
questions | -0.040 |
groups | -0.037 |
triple | -0.033 |
out | -0.030 |
into | -0.028 |
Token | Lily |
Token ID | 20037 |
Feature activation | +5.91e-04 |
Pos logit contributions | |
ller | +0.012 |
xt | +0.012 |
liv | +0.011 |
storm | +0.011 |
ugg | +0.011 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
out | -0.010 |
forward | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | +2.07e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
ugg | +0.001 |
leanor | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
forward | -0.001 |
out | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +5.87e-03 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.004 |
liv | +0.004 |
ugg | +0.004 |
storm | +0.004 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | h |
Token ID | 289 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
liv | +0.010 |
leanor | +0.010 |
storm | +0.009 |
seven | +0.009 |
xt | +0.009 |
Neg logit contributions | |
groups | -0.008 |
questions | -0.008 |
ices | -0.007 |
ports | -0.007 |
triple | -0.007 |
Token | park |
Token ID | 3952 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
liv | +0.013 |
xt | +0.013 |
bye | +0.011 |
storm | +0.011 |
leanor | +0.011 |
Neg logit contributions | |
questions | -0.016 |
ac | -0.014 |
iers | -0.014 |
forward | -0.013 |
ices | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | +9.15e-03 |
Pos logit contributions | |
xt | +0.043 |
ller | +0.043 |
bye | +0.040 |
seven | +0.039 |
lla | +0.039 |
Neg logit contributions | |
questions | -0.043 |
triple | -0.041 |
groups | -0.039 |
increasingly | -0.036 |
forward | -0.036 |
Token | Tom |
Token ID | 4186 |
Feature activation | +4.60e-04 |
Pos logit contributions | |
ller | +0.012 |
xt | +0.012 |
liv | +0.011 |
seven | +0.010 |
bow | +0.010 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.016 |
triple | -0.016 |
forward | -0.015 |
out | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | +6.30e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
leanor | +0.001 |
seven | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
forward | -0.001 |
triple | -0.001 |
out | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +7.05e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.011 |
seven | +0.011 |
leanor | +0.010 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
ices | -0.007 |
triple | -0.007 |
invitations | -0.006 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.80e-02 |
Pos logit contributions | |
liv | +0.008 |
ller | +0.008 |
Raven | +0.008 |
bye | +0.008 |
leanor | +0.008 |
Neg logit contributions | |
groups | -0.012 |
questions | -0.012 |
ices | -0.012 |
triple | -0.011 |
increasingly | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +7.36e-03 |
Pos logit contributions | |
ller | +0.142 |
xt | +0.141 |
liv | +0.136 |
ugg | +0.134 |
leanor | +0.132 |
Neg logit contributions | |
questions | -0.041 |
groups | -0.038 |
triple | -0.034 |
out | -0.030 |
into | -0.029 |
Token | Mia |
Token ID | 32189 |
Feature activation | +6.04e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.011 |
ugg | +0.010 |
leanor | +0.010 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.011 |
forward | -0.011 |
out | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -2.65e-04 |
Pos logit contributions | |
xt | +0.010 |
ller | +0.010 |
liv | +0.009 |
leanor | +0.009 |
ugg | +0.009 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.009 |
forward | -0.008 |
out | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +6.36e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
forward | +0.000 |
out | +0.000 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.000 |
leanor | -0.000 |
seven | -0.000 |
Token | h |
Token ID | 289 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
liv | +0.011 |
leanor | +0.010 |
seven | +0.010 |
storm | +0.010 |
bye | +0.010 |
Neg logit contributions | |
groups | -0.008 |
questions | -0.008 |
ices | -0.007 |
ports | -0.007 |
triple | -0.007 |
Token | garden |
Token ID | 11376 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
xt | +0.015 |
liv | +0.015 |
storm | +0.014 |
Twe | +0.014 |
ller | +0.014 |
Neg logit contributions | |
questions | -0.017 |
ac | -0.015 |
groups | -0.014 |
forward | -0.014 |
ices | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
xt | +0.029 |
ller | +0.027 |
bye | +0.025 |
storm | +0.024 |
bow | +0.024 |
Neg logit contributions | |
questions | -0.034 |
triple | -0.033 |
increasingly | -0.030 |
forward | -0.030 |
groups | -0.029 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.27e-03 |
Pos logit contributions | |
xt | +0.013 |
ller | +0.013 |
liv | +0.012 |
bow | +0.012 |
Twe | +0.012 |
Neg logit contributions | |
questions | -0.021 |
forward | -0.020 |
groups | -0.020 |
triple | -0.020 |
out | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +3.55e-03 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
liv | +0.002 |
ugg | +0.002 |
storm | +0.002 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +7.70e-03 |
Pos logit contributions | |
ller | +0.007 |
xt | +0.007 |
liv | +0.007 |
leanor | +0.007 |
seven | +0.007 |
Neg logit contributions | |
questions | -0.004 |
groups | -0.004 |
triple | -0.003 |
forward | -0.003 |
brothers | -0.003 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.78e-02 |
Pos logit contributions | |
Raven | +0.009 |
storm | +0.009 |
ller | +0.009 |
liv | +0.009 |
leanor | +0.009 |
Neg logit contributions | |
groups | -0.014 |
questions | -0.014 |
triple | -0.013 |
ices | -0.013 |
into | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ller | +0.147 |
xt | +0.145 |
liv | +0.141 |
ugg | +0.140 |
seven | +0.138 |
Neg logit contributions | |
questions | -0.034 |
groups | -0.032 |
triple | -0.026 |
out | -0.026 |
at | -0.025 |
Token | Tom |
Token ID | 4186 |
Feature activation | -6.50e-04 |
Pos logit contributions | |
ller | +0.019 |
xt | +0.018 |
storm | +0.017 |
llers | +0.017 |
ugg | +0.017 |
Neg logit contributions | |
questions | -0.018 |
triple | -0.017 |
groups | -0.017 |
out | -0.016 |
forward | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | -5.48e-04 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
triple | +0.001 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
xt | -0.001 |
ller | -0.001 |
liv | -0.001 |
leanor | -0.001 |
ugg | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +5.62e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
triple | +0.001 |
out | +0.000 |
forward | +0.000 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.001 |
ugg | -0.001 |
storm | -0.001 |
Token | h |
Token ID | 289 |
Feature activation | +2.29e-02 |
Pos logit contributions | |
liv | +0.009 |
storm | +0.009 |
leanor | +0.009 |
Raven | +0.009 |
seven | +0.009 |
Neg logit contributions | |
groups | -0.007 |
questions | -0.007 |
forward | -0.007 |
ices | -0.007 |
triple | -0.007 |
Token | park |
Token ID | 3952 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
liv | +0.018 |
xt | +0.017 |
ller | +0.017 |
storm | +0.017 |
Twe | +0.017 |
Neg logit contributions | |
questions | -0.019 |
triple | -0.016 |
groups | -0.016 |
ices | -0.016 |
forward | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | +9.20e-03 |
Pos logit contributions | |
xt | +0.029 |
ller | +0.029 |
bye | +0.028 |
storm | +0.026 |
lla | +0.026 |
Neg logit contributions | |
questions | -0.030 |
triple | -0.029 |
groups | -0.027 |
increasingly | -0.026 |
brothers | -0.025 |
Token | Anna |
Token ID | 11735 |
Feature activation | +8.81e-03 |
Pos logit contributions | |
xt | +0.011 |
ller | +0.011 |
liv | +0.010 |
bow | +0.010 |
storm | +0.009 |
Neg logit contributions | |
questions | -0.018 |
groups | -0.017 |
forward | -0.017 |
triple | -0.016 |
out | -0.016 |
Token | is |
Token ID | 318 |
Feature activation | +5.63e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
liv | +0.012 |
ugg | +0.012 |
leanor | +0.012 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.014 |
triple | -0.014 |
forward | -0.013 |
out | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.011 |
leanor | +0.011 |
seven | +0.010 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
triple | -0.006 |
forward | -0.005 |
brothers | -0.005 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
Raven | +0.009 |
liv | +0.009 |
ller | +0.009 |
leanor | +0.008 |
storm | +0.008 |
Neg logit contributions | |
groups | -0.014 |
questions | -0.014 |
triple | -0.013 |
ices | -0.013 |
into | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +8.87e-03 |
Pos logit contributions | |
ller | +0.145 |
xt | +0.144 |
liv | +0.139 |
ugg | +0.139 |
seven | +0.136 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.032 |
out | -0.028 |
triple | -0.027 |
at | -0.026 |
Token | Ben |
Token ID | 3932 |
Feature activation | -4.06e-03 |
Pos logit contributions | |
ller | +0.016 |
xt | +0.015 |
storm | +0.015 |
llers | +0.014 |
ugg | +0.014 |
Neg logit contributions | |
questions | -0.013 |
triple | -0.012 |
groups | -0.012 |
out | -0.011 |
forward | -0.011 |
Token | is |
Token ID | 318 |
Feature activation | -2.38e-03 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
triple | +0.006 |
forward | +0.006 |
out | +0.006 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.006 |
ugg | -0.006 |
leanor | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +4.87e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.005 |
xt | -0.005 |
liv | -0.005 |
storm | -0.005 |
ugg | -0.005 |
Token | h |
Token ID | 289 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
liv | +0.008 |
storm | +0.008 |
leanor | +0.008 |
sed | +0.008 |
Raven | +0.008 |
Neg logit contributions | |
groups | -0.007 |
questions | -0.006 |
forward | -0.006 |
ices | -0.006 |
triple | -0.006 |
Token | park |
Token ID | 3952 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
liv | +0.017 |
xt | +0.016 |
storm | +0.015 |
Twe | +0.015 |
bye | +0.015 |
Neg logit contributions | |
questions | -0.020 |
ac | -0.017 |
iers | -0.017 |
ices | -0.017 |
forward | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
xt | +0.042 |
ller | +0.042 |
bye | +0.039 |
lla | +0.038 |
seven | +0.037 |
Neg logit contributions | |
questions | -0.043 |
triple | -0.041 |
groups | -0.039 |
increasingly | -0.037 |
forward | -0.036 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.28e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
liv | +0.012 |
seven | +0.011 |
bow | +0.011 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
triple | -0.018 |
forward | -0.017 |
out | -0.017 |
Token | was |
Token ID | 373 |
Feature activation | +8.94e-03 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
forward | +0.002 |
triple | +0.002 |
out | +0.002 |
Neg logit contributions | |
xt | -0.002 |
ller | -0.002 |
liv | -0.002 |
leanor | -0.002 |
seven | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +8.06e-03 |
Pos logit contributions | |
ller | +0.015 |
xt | +0.015 |
liv | +0.015 |
seven | +0.015 |
leanor | +0.015 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
ices | -0.010 |
triple | -0.009 |
invitations | -0.009 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
Raven | +0.010 |
liv | +0.010 |
ller | +0.010 |
bye | +0.009 |
leanor | +0.009 |
Neg logit contributions | |
groups | -0.014 |
questions | -0.014 |
ices | -0.013 |
triple | -0.013 |
into | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +8.00e-03 |
Pos logit contributions | |
ller | +0.141 |
xt | +0.139 |
liv | +0.135 |
ugg | +0.133 |
leanor | +0.131 |
Neg logit contributions | |
questions | -0.041 |
groups | -0.038 |
triple | -0.034 |
out | -0.030 |
into | -0.029 |
Token | Mia |
Token ID | 32189 |
Feature activation | +5.60e-03 |
Pos logit contributions | |
ller | +0.012 |
xt | +0.012 |
liv | +0.011 |
ugg | +0.011 |
leanor | +0.011 |
Neg logit contributions | |
questions | -0.013 |
groups | -0.013 |
triple | -0.012 |
forward | -0.012 |
out | -0.012 |
Token | was |
Token ID | 373 |
Feature activation | +2.81e-03 |
Pos logit contributions | |
xt | +0.009 |
ller | +0.009 |
liv | +0.009 |
leanor | +0.008 |
ugg | +0.008 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.008 |
triple | -0.008 |
forward | -0.008 |
out | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +7.11e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.005 |
liv | +0.005 |
leanor | +0.005 |
seven | +0.005 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
out | -0.003 |
Token | h |
Token ID | 289 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
liv | +0.012 |
leanor | +0.011 |
seven | +0.011 |
storm | +0.011 |
Raven | +0.011 |
Neg logit contributions | |
groups | -0.009 |
questions | -0.009 |
ports | -0.008 |
ices | -0.008 |
triple | -0.008 |
Token | Because |
Token ID | 4362 |
Feature activation | +3.54e-03 |
Pos logit contributions | |
questions | +0.015 |
groups | +0.014 |
triple | +0.013 |
forward | +0.013 |
out | +0.013 |
Neg logit contributions | |
ller | -0.017 |
xt | -0.016 |
liv | -0.016 |
storm | -0.015 |
ugg | -0.015 |
Token | I |
Token ID | 314 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.004 |
liv | +0.003 |
ugg | +0.003 |
seven | +0.003 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.007 |
forward | -0.006 |
increasingly | -0.006 |
Token | am |
Token ID | 716 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
groups | +0.010 |
questions | +0.010 |
triple | +0.009 |
forward | +0.009 |
brothers | +0.008 |
Neg logit contributions | |
xt | -0.009 |
ller | -0.009 |
ugg | -0.009 |
storm | -0.008 |
liv | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
ller | +0.033 |
xt | +0.032 |
liv | +0.031 |
ugg | +0.031 |
storm | +0.031 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.019 |
out | -0.017 |
triple | -0.017 |
forward | -0.017 |
Token | good |
Token ID | 922 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
ller | +0.029 |
xt | +0.028 |
storm | +0.027 |
leanor | +0.027 |
liv | +0.026 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.019 |
triple | -0.018 |
forward | -0.017 |
into | -0.016 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
bye | +0.036 |
leanor | +0.035 |
ller | +0.035 |
sed | +0.034 |
xt | +0.034 |
Neg logit contributions | |
groups | -0.035 |
questions | -0.034 |
increasingly | -0.033 |
triple | -0.031 |
forward | -0.031 |
Token | too |
Token ID | 1165 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
xt | +0.119 |
ller | +0.119 |
liv | +0.119 |
ugg | +0.115 |
leanor | +0.112 |
Neg logit contributions | |
questions | -0.062 |
groups | -0.059 |
at | -0.054 |
out | -0.053 |
into | -0.052 |
Token | ." |
Token ID | 526 |
Feature activation | -4.91e-03 |
Pos logit contributions | |
liv | +0.029 |
ller | +0.028 |
xt | +0.028 |
ugg | +0.028 |
leanor | +0.027 |
Neg logit contributions | |
questions | -0.013 |
groups | -0.012 |
at | -0.011 |
out | -0.011 |
brothers | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.007 |
triple | +0.006 |
forward | +0.006 |
out | +0.006 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.009 |
liv | -0.008 |
ugg | -0.008 |
seven | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -7.39e-03 |
Pos logit contributions | |
questions | +0.020 |
groups | +0.019 |
triple | +0.018 |
forward | +0.017 |
out | +0.017 |
Neg logit contributions | |
ller | -0.032 |
xt | -0.031 |
liv | -0.030 |
storm | -0.029 |
ugg | -0.029 |
Token | They |
Token ID | 2990 |
Feature activation | +1.56e-03 |
Pos logit contributions | |
questions | +0.016 |
groups | +0.016 |
triple | +0.015 |
out | +0.015 |
forward | +0.015 |
Neg logit contributions | |
xt | -0.007 |
ller | -0.007 |
liv | -0.007 |
ugg | -0.006 |
live | -0.006 |
Token | garden |
Token ID | 11376 |
Feature activation | +2.00e-02 |
Pos logit contributions | |
liv | +0.015 |
xt | +0.015 |
Twe | +0.014 |
storm | +0.014 |
ller | +0.014 |
Neg logit contributions | |
questions | -0.018 |
ac | -0.015 |
forward | -0.015 |
ices | -0.015 |
triple | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
xt | +0.028 |
ller | +0.026 |
bye | +0.024 |
lla | +0.023 |
ugg | +0.023 |
Neg logit contributions | |
questions | -0.033 |
triple | -0.032 |
forward | -0.029 |
increasingly | -0.029 |
groups | -0.028 |
Token | Lily |
Token ID | 20037 |
Feature activation | -7.98e-04 |
Pos logit contributions | |
xt | +0.015 |
ller | +0.013 |
liv | +0.013 |
Stella | +0.013 |
Twe | +0.013 |
Neg logit contributions | |
questions | -0.025 |
forward | -0.023 |
triple | -0.022 |
groups | -0.022 |
out | -0.022 |
Token | was |
Token ID | 373 |
Feature activation | +4.76e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
triple | +0.001 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.001 |
ugg | -0.001 |
storm | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +6.72e-03 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.009 |
liv | +0.009 |
leanor | +0.009 |
seven | +0.009 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.005 |
forward | -0.004 |
brothers | -0.004 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.72e-02 |
Pos logit contributions | |
liv | +0.008 |
storm | +0.008 |
Raven | +0.008 |
ller | +0.008 |
leanor | +0.008 |
Neg logit contributions | |
groups | -0.012 |
questions | -0.011 |
triple | -0.011 |
ices | -0.011 |
into | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +9.09e-03 |
Pos logit contributions | |
ller | +0.142 |
xt | +0.140 |
liv | +0.136 |
ugg | +0.135 |
seven | +0.133 |
Neg logit contributions | |
questions | -0.037 |
groups | -0.035 |
triple | -0.030 |
out | -0.029 |
into | -0.028 |
Token | Ben |
Token ID | 3932 |
Feature activation | -4.10e-03 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.016 |
storm | +0.015 |
ugg | +0.015 |
llers | +0.015 |
Neg logit contributions | |
questions | -0.013 |
groups | -0.012 |
triple | -0.012 |
out | -0.011 |
forward | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | +4.79e-04 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
triple | +0.006 |
forward | +0.006 |
out | +0.005 |
Neg logit contributions | |
xt | -0.007 |
ller | -0.007 |
liv | -0.006 |
leanor | -0.006 |
ugg | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +4.69e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
ugg | +0.001 |
storm | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.000 |
forward | -0.000 |
out | -0.000 |
Token | h |
Token ID | 289 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
liv | +0.008 |
storm | +0.008 |
leanor | +0.007 |
Raven | +0.007 |
sed | +0.007 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
ices | -0.006 |
ports | -0.006 |
forward | -0.006 |
Token | " |
Token ID | 1 |
Feature activation | +7.19e-03 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.009 |
forward | +0.009 |
out | +0.009 |
Neg logit contributions | |
ller | -0.014 |
xt | -0.014 |
liv | -0.014 |
ugg | -0.013 |
leanor | -0.013 |
Token | You |
Token ID | 1639 |
Feature activation | -6.69e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
liv | +0.011 |
llers | +0.011 |
storm | +0.011 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.010 |
brothers | -0.009 |
forward | -0.009 |
Token | are |
Token ID | 389 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
questions | +0.009 |
groups | +0.009 |
triple | +0.008 |
forward | +0.008 |
out | +0.008 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.012 |
liv | -0.011 |
ugg | -0.011 |
storm | -0.011 |
Token | a |
Token ID | 257 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.008 |
ugg | +0.008 |
storm | +0.008 |
Neg logit contributions | |
questions | -0.004 |
groups | -0.004 |
triple | -0.004 |
forward | -0.003 |
out | -0.003 |
Token | good |
Token ID | 922 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
ller | +0.024 |
xt | +0.023 |
leanor | +0.022 |
storm | +0.022 |
Twe | +0.022 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.016 |
triple | -0.014 |
into | -0.014 |
forward | -0.013 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
bye | +0.030 |
ller | +0.030 |
ugg | +0.030 |
xt | +0.030 |
leanor | +0.029 |
Neg logit contributions | |
groups | -0.028 |
questions | -0.026 |
increasingly | -0.026 |
forward | -0.024 |
into | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
xt | +0.091 |
ller | +0.091 |
liv | +0.090 |
ugg | +0.088 |
leanor | +0.085 |
Neg logit contributions | |
questions | -0.085 |
groups | -0.083 |
at | -0.079 |
out | -0.078 |
triple | -0.078 |
Token | Tom |
Token ID | 4186 |
Feature activation | -3.98e-04 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.023 |
liv | +0.021 |
seven | +0.020 |
storm | +0.020 |
Neg logit contributions | |
groups | -0.027 |
questions | -0.027 |
triple | -0.026 |
forward | -0.025 |
out | -0.025 |
Token | !" |
Token ID | 2474 |
Feature activation | +3.73e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
out | +0.001 |
at | +0.001 |
brothers | +0.001 |
Neg logit contributions | |
xt | -0.001 |
ller | -0.001 |
liv | -0.001 |
ugg | -0.001 |
storm | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | -9.57e-03 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.005 |
liv | +0.005 |
seven | +0.004 |
leanor | +0.004 |
Neg logit contributions | |
groups | -0.007 |
questions | -0.007 |
triple | -0.007 |
forward | -0.006 |
ac | -0.006 |
Token | said |
Token ID | 531 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
questions | +0.018 |
groups | +0.017 |
triple | +0.017 |
forward | +0.017 |
out | +0.016 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.012 |
liv | -0.011 |
leanor | -0.011 |
ugg | -0.011 |
Token | park |
Token ID | 3952 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
liv | +0.016 |
xt | +0.016 |
storm | +0.015 |
ller | +0.015 |
Twe | +0.015 |
Neg logit contributions | |
questions | -0.018 |
groups | -0.015 |
ac | -0.015 |
forward | -0.015 |
triple | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
xt | +0.032 |
ller | +0.031 |
bye | +0.030 |
storm | +0.029 |
Twe | +0.028 |
Neg logit contributions | |
questions | -0.035 |
triple | -0.034 |
groups | -0.032 |
increasingly | -0.030 |
scientists | -0.029 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
ller | +0.015 |
xt | +0.015 |
liv | +0.014 |
storm | +0.013 |
bow | +0.013 |
Neg logit contributions | |
questions | -0.022 |
groups | -0.020 |
forward | -0.020 |
triple | -0.020 |
out | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +2.96e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.002 |
out | +0.002 |
into | +0.002 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.003 |
ugg | -0.003 |
storm | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +5.59e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.006 |
leanor | +0.006 |
seven | +0.006 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.002 |
brothers | -0.002 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
liv | +0.007 |
ller | +0.007 |
storm | +0.006 |
leanor | +0.006 |
xt | +0.006 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.010 |
ices | -0.009 |
into | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +9.45e-03 |
Pos logit contributions | |
ller | +0.145 |
xt | +0.143 |
liv | +0.139 |
ugg | +0.138 |
seven | +0.135 |
Neg logit contributions | |
questions | -0.034 |
groups | -0.032 |
triple | -0.027 |
out | -0.027 |
at | -0.025 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.75e-03 |
Pos logit contributions | |
ller | +0.016 |
xt | +0.015 |
storm | +0.014 |
llers | +0.014 |
ugg | +0.013 |
Neg logit contributions | |
questions | -0.015 |
triple | -0.014 |
out | -0.014 |
groups | -0.014 |
forward | -0.013 |
Token | was |
Token ID | 373 |
Feature activation | +1.39e-04 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.005 |
xt | -0.005 |
liv | -0.005 |
ugg | -0.004 |
leanor | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +4.15e-03 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
liv | +0.000 |
ugg | +0.000 |
storm | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
out | -0.000 |
Token | h |
Token ID | 289 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
liv | +0.007 |
storm | +0.007 |
leanor | +0.007 |
seven | +0.007 |
Raven | +0.007 |
Neg logit contributions | |
groups | -0.005 |
questions | -0.005 |
ports | -0.005 |
ices | -0.005 |
invitations | -0.005 |
Token | room |
Token ID | 2119 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
xt | +0.028 |
ller | +0.027 |
liv | +0.027 |
sed | +0.026 |
ugg | +0.026 |
Neg logit contributions | |
questions | -0.021 |
triple | -0.018 |
groups | -0.018 |
forward | -0.018 |
increasingly | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +9.38e-03 |
Pos logit contributions | |
xt | +0.026 |
ller | +0.026 |
storm | +0.023 |
ugg | +0.023 |
liv | +0.023 |
Neg logit contributions | |
triple | -0.026 |
questions | -0.026 |
groups | -0.024 |
increasingly | -0.023 |
forward | -0.023 |
Token | Sara |
Token ID | 24799 |
Feature activation | +6.34e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.010 |
ugg | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
triple | -0.017 |
forward | -0.017 |
out | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | +1.64e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.010 |
storm | +0.010 |
ugg | +0.010 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.009 |
out | -0.008 |
forward | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +4.58e-03 |
Pos logit contributions | |
xt | +0.003 |
ller | +0.003 |
liv | +0.003 |
leanor | +0.003 |
seven | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.001 |
brothers | -0.001 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.69e-02 |
Pos logit contributions | |
liv | +0.005 |
leanor | +0.005 |
storm | +0.005 |
ller | +0.005 |
Raven | +0.005 |
Neg logit contributions | |
groups | -0.009 |
questions | -0.008 |
triple | -0.008 |
ices | -0.008 |
increasingly | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ller | +0.142 |
xt | +0.140 |
liv | +0.136 |
ugg | +0.135 |
seven | +0.133 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.033 |
triple | -0.029 |
out | -0.028 |
at | -0.027 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.13e-03 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.016 |
storm | +0.016 |
llers | +0.015 |
bow | +0.015 |
Neg logit contributions | |
questions | -0.016 |
triple | -0.016 |
out | -0.015 |
groups | -0.015 |
forward | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | -3.13e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.004 |
ugg | -0.003 |
leanor | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +3.06e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.006 |
liv | -0.006 |
ugg | -0.006 |
storm | -0.006 |
Token | h |
Token ID | 289 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
liv | +0.005 |
storm | +0.005 |
leanor | +0.005 |
seven | +0.005 |
sed | +0.005 |
Neg logit contributions | |
groups | -0.004 |
questions | -0.004 |
ports | -0.004 |
ices | -0.003 |
triple | -0.003 |
Token | park |
Token ID | 3952 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
xt | +0.015 |
liv | +0.015 |
Twe | +0.015 |
bye | +0.014 |
storm | +0.014 |
Neg logit contributions | |
questions | -0.019 |
ac | -0.016 |
iers | -0.016 |
ices | -0.016 |
forward | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
ller | +0.036 |
xt | +0.036 |
bye | +0.034 |
lla | +0.033 |
bow | +0.033 |
Neg logit contributions | |
questions | -0.042 |
triple | -0.040 |
groups | -0.037 |
increasingly | -0.036 |
forward | -0.035 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.98e-03 |
Pos logit contributions | |
xt | +0.012 |
ller | +0.011 |
Twe | +0.011 |
Stella | +0.011 |
bow | +0.011 |
Neg logit contributions | |
questions | -0.024 |
forward | -0.022 |
triple | -0.021 |
groups | -0.021 |
out | -0.020 |
Token | was |
Token ID | 373 |
Feature activation | +6.80e-03 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
liv | +0.003 |
ugg | +0.003 |
storm | +0.003 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
out | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +7.88e-03 |
Pos logit contributions | |
ller | +0.014 |
xt | +0.014 |
liv | +0.013 |
leanor | +0.013 |
seven | +0.013 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.006 |
forward | -0.006 |
brothers | -0.006 |
Token | seeker |
Token ID | 45993 |
Feature activation | +5.67e-02 |
Pos logit contributions | |
ller | +0.010 |
liv | +0.010 |
leanor | +0.010 |
Raven | +0.010 |
xt | +0.010 |
Neg logit contributions | |
groups | -0.014 |
questions | -0.014 |
triple | -0.013 |
ices | -0.012 |
into | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
ller | +0.144 |
xt | +0.143 |
liv | +0.139 |
ugg | +0.138 |
seven | +0.136 |
Neg logit contributions | |
questions | -0.033 |
groups | -0.030 |
triple | -0.025 |
out | -0.025 |
at | -0.024 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.98e-03 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.022 |
storm | +0.021 |
liv | +0.020 |
llers | +0.020 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.013 |
triple | -0.012 |
forward | -0.012 |
out | -0.012 |
Token | was |
Token ID | 373 |
Feature activation | +1.73e-03 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.004 |
triple | +0.004 |
forward | +0.004 |
out | +0.004 |
Neg logit contributions | |
xt | -0.005 |
ller | -0.005 |
liv | -0.005 |
leanor | -0.004 |
storm | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +6.36e-03 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.004 |
liv | +0.003 |
ugg | +0.003 |
storm | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | h |
Token ID | 289 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
liv | +0.010 |
leanor | +0.010 |
storm | +0.010 |
seven | +0.010 |
Raven | +0.010 |
Neg logit contributions | |
groups | -0.009 |
questions | -0.009 |
ices | -0.008 |
ports | -0.008 |
triple | -0.008 |
Token | box |
Token ID | 3091 |
Feature activation | +1.11e-04 |
Pos logit contributions | |
triple | +0.026 |
increasingly | +0.025 |
questions | +0.023 |
groups | +0.023 |
and | +0.023 |
Neg logit contributions | |
ller | -0.020 |
seven | -0.019 |
endant | -0.019 |
bow | -0.019 |
sed | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -1.61e-03 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
seven | +0.000 |
ugg | +0.000 |
liv | +0.000 |
Neg logit contributions | |
triple | -0.000 |
questions | -0.000 |
groups | -0.000 |
increasingly | -0.000 |
scientists | -0.000 |
Token | share |
Token ID | 2648 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.003 |
and | +0.002 |
ices | +0.002 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
seven | -0.002 |
leanor | -0.002 |
Raven | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +3.93e-04 |
Pos logit contributions | |
ller | +0.030 |
xt | +0.030 |
liv | +0.028 |
ugg | +0.027 |
storm | +0.027 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.016 |
triple | -0.016 |
forward | -0.014 |
out | -0.014 |
Token | ch |
Token ID | 442 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
mm | +0.001 |
bow | +0.001 |
seven | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
forward | -0.001 |
increasingly | -0.000 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.81e-02 |
Pos logit contributions | |
questions | +0.032 |
groups | +0.031 |
triple | +0.030 |
increasingly | +0.030 |
forward | +0.029 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.034 |
ugg | -0.031 |
mm | -0.031 |
seven | -0.031 |
Token | ates |
Token ID | 689 |
Feature activation | -2.60e-02 |
Pos logit contributions | |
questions | +0.113 |
groups | +0.110 |
triple | +0.104 |
forward | +0.100 |
out | +0.097 |
Neg logit contributions | |
ller | -0.137 |
xt | -0.132 |
ugg | -0.125 |
liv | -0.123 |
mm | -0.121 |
Token | . |
Token ID | 13 |
Feature activation | -4.19e-03 |
Pos logit contributions | |
questions | +0.034 |
triple | +0.033 |
groups | +0.033 |
forward | +0.029 |
increasingly | +0.029 |
Neg logit contributions | |
ller | -0.049 |
xt | -0.047 |
seven | -0.044 |
liv | -0.043 |
ugg | -0.043 |
Token | They |
Token ID | 1119 |
Feature activation | +5.37e-03 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
out | +0.004 |
triple | +0.004 |
into | +0.004 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.008 |
liv | -0.008 |
storm | -0.008 |
leanor | -0.008 |
Token | are |
Token ID | 389 |
Feature activation | +9.46e-03 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.009 |
liv | +0.008 |
ugg | +0.008 |
bow | +0.008 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.007 |
triple | -0.007 |
forward | -0.007 |
out | -0.006 |
Token | happy |
Token ID | 3772 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.016 |
liv | +0.015 |
seven | +0.015 |
Twe | +0.015 |
Neg logit contributions | |
questions | -0.013 |
groups | -0.012 |
triple | -0.011 |
ices | -0.010 |
forward | -0.010 |
Token | started |
Token ID | 2067 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.004 |
forward | +0.004 |
brothers | +0.004 |
Neg logit contributions | |
xt | -0.005 |
ller | -0.005 |
ugg | -0.005 |
liv | -0.005 |
Twe | -0.005 |
Token | eating |
Token ID | 6600 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
xt | +0.021 |
ller | +0.020 |
seven | +0.018 |
Karen | +0.018 |
llers | +0.018 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.019 |
ac | -0.019 |
forward | -0.018 |
aky | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | -9.76e-03 |
Pos logit contributions | |
questions | +0.016 |
triple | +0.016 |
groups | +0.016 |
forward | +0.015 |
ac | +0.015 |
Neg logit contributions | |
ller | -0.019 |
xt | -0.019 |
Twe | -0.019 |
seven | -0.018 |
Stella | -0.018 |
Token | delicious |
Token ID | 12625 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.013 |
triple | +0.012 |
forward | +0.012 |
brothers | +0.011 |
Neg logit contributions | |
ller | -0.018 |
xt | -0.017 |
liv | -0.016 |
ugg | -0.016 |
leanor | -0.016 |
Token | ch |
Token ID | 442 |
Feature activation | -2.83e-02 |
Pos logit contributions | |
questions | +0.036 |
groups | +0.035 |
triple | +0.032 |
forward | +0.032 |
out | +0.030 |
Neg logit contributions | |
ller | -0.044 |
xt | -0.042 |
liv | -0.040 |
storm | -0.039 |
ugg | -0.039 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.62e-02 |
Pos logit contributions | |
questions | +0.042 |
groups | +0.042 |
triple | +0.039 |
forward | +0.038 |
increasingly | +0.038 |
Neg logit contributions | |
ller | -0.047 |
xt | -0.045 |
ugg | -0.042 |
leanor | -0.041 |
liv | -0.041 |
Token | ates |
Token ID | 689 |
Feature activation | -2.93e-02 |
Pos logit contributions | |
questions | +0.106 |
groups | +0.104 |
triple | +0.098 |
forward | +0.092 |
out | +0.090 |
Neg logit contributions | |
ller | -0.137 |
xt | -0.134 |
liv | -0.127 |
ugg | -0.126 |
leanor | -0.122 |
Token | . |
Token ID | 13 |
Feature activation | +3.23e-03 |
Pos logit contributions | |
questions | +0.045 |
groups | +0.044 |
triple | +0.044 |
increasingly | +0.038 |
brothers | +0.037 |
Neg logit contributions | |
ller | -0.048 |
xt | -0.046 |
liv | -0.042 |
lla | -0.042 |
seven | -0.042 |
Token | She |
Token ID | 1375 |
Feature activation | +5.38e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
storm | +0.006 |
liv | +0.006 |
rob | +0.006 |
Neg logit contributions | |
questions | -0.004 |
out | -0.004 |
groups | -0.004 |
forward | -0.004 |
into | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.008 |
liv | +0.008 |
ugg | +0.007 |
seven | +0.007 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.008 |
forward | -0.008 |
triple | -0.008 |
out | -0.007 |
Token | so |
Token ID | 523 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
ller | +0.024 |
xt | +0.024 |
liv | +0.023 |
seven | +0.022 |
Karen | +0.022 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
triple | -0.016 |
ports | -0.015 |
ices | -0.015 |
Token | find |
Token ID | 1064 |
Feature activation | -5.08e-03 |
Pos logit contributions | |
xt | +0.010 |
ller | +0.010 |
bow | +0.010 |
ugg | +0.009 |
leanor | +0.009 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.009 |
forward | -0.008 |
and | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
triple | +0.005 |
questions | +0.005 |
groups | +0.005 |
forward | +0.005 |
increasingly | +0.005 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.009 |
liv | -0.009 |
seven | -0.009 |
Twe | -0.009 |
Token | box |
Token ID | 3091 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
ller | +0.019 |
bow | +0.018 |
storm | +0.017 |
sed | +0.017 |
Raven | +0.017 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.015 |
forward | -0.015 |
triple | -0.015 |
iece | -0.014 |
Token | of |
Token ID | 286 |
Feature activation | -2.87e-02 |
Pos logit contributions | |
ller | +0.035 |
xt | +0.034 |
storm | +0.032 |
ugg | +0.032 |
liv | +0.032 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.019 |
triple | -0.019 |
increasingly | -0.017 |
forward | -0.015 |
Token | ch |
Token ID | 442 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
forward | +0.041 |
triple | +0.038 |
iece | +0.037 |
increasingly | +0.036 |
questions | +0.035 |
Neg logit contributions | |
ller | -0.044 |
Twe | -0.042 |
xt | -0.042 |
seven | -0.042 |
Karen | -0.039 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.34e-02 |
Pos logit contributions | |
increasingly | +0.042 |
triple | +0.040 |
questions | +0.040 |
decide | +0.039 |
from | +0.037 |
Neg logit contributions | |
ller | -0.033 |
xt | -0.030 |
llers | -0.027 |
ugg | -0.027 |
seven | -0.026 |
Token | ates |
Token ID | 689 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
questions | +0.110 |
groups | +0.105 |
triple | +0.100 |
forward | +0.098 |
increasingly | +0.095 |
Neg logit contributions | |
ller | -0.123 |
xt | -0.121 |
ugg | -0.113 |
mm | -0.111 |
liv | -0.110 |
Token | . |
Token ID | 13 |
Feature activation | -5.44e-03 |
Pos logit contributions | |
questions | +0.025 |
triple | +0.024 |
groups | +0.024 |
increasingly | +0.021 |
forward | +0.020 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.035 |
seven | -0.033 |
bow | -0.033 |
liv | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.007 |
triple | +0.007 |
out | +0.006 |
forward | +0.006 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
liv | -0.010 |
storm | -0.009 |
leanor | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -8.23e-03 |
Pos logit contributions | |
questions | +0.018 |
groups | +0.017 |
triple | +0.015 |
out | +0.015 |
into | +0.014 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.037 |
storm | -0.036 |
liv | -0.036 |
ugg | -0.035 |
Token | " |
Token ID | 1 |
Feature activation | +8.73e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.010 |
triple | +0.010 |
forward | +0.009 |
out | +0.009 |
Neg logit contributions | |
ller | -0.015 |
xt | -0.015 |
liv | -0.014 |
ugg | -0.014 |
leanor | -0.014 |
Token | bled |
Token ID | 9342 |
Feature activation | -7.59e-03 |
Pos logit contributions | |
groups | +0.026 |
questions | +0.025 |
triple | +0.024 |
un | +0.022 |
scientists | +0.021 |
Neg logit contributions | |
ller | -0.015 |
xt | -0.014 |
mm | -0.014 |
ugg | -0.014 |
liv | -0.013 |
Token | up |
Token ID | 510 |
Feature activation | +4.22e-03 |
Pos logit contributions | |
groups | +0.011 |
questions | +0.010 |
triple | +0.010 |
brothers | +0.010 |
scientists | +0.009 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.012 |
Twe | -0.012 |
seven | -0.011 |
Raven | -0.011 |
Token | all |
Token ID | 477 |
Feature activation | +2.03e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.007 |
Twe | +0.007 |
liv | +0.007 |
seven | +0.007 |
Neg logit contributions | |
groups | -0.005 |
questions | -0.005 |
triple | -0.005 |
forward | -0.005 |
brothers | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.004 |
storm | +0.004 |
liv | +0.004 |
ugg | +0.004 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
out | -0.002 |
forward | -0.002 |
Token | ch |
Token ID | 442 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
questions | +0.012 |
groups | +0.012 |
triple | +0.011 |
forward | +0.010 |
brothers | +0.010 |
Neg logit contributions | |
ller | -0.020 |
xt | -0.019 |
liv | -0.018 |
leanor | -0.018 |
seven | -0.018 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.32e-02 |
Pos logit contributions | |
questions | +0.043 |
groups | +0.042 |
triple | +0.041 |
out | +0.039 |
forward | +0.039 |
Neg logit contributions | |
ller | -0.041 |
xt | -0.041 |
ugg | -0.038 |
mm | -0.037 |
leanor | -0.036 |
Token | ates |
Token ID | 689 |
Feature activation | -3.41e-02 |
Pos logit contributions | |
questions | +0.101 |
groups | +0.098 |
triple | +0.092 |
forward | +0.087 |
out | +0.085 |
Neg logit contributions | |
ller | -0.133 |
xt | -0.130 |
liv | -0.123 |
ugg | -0.123 |
leanor | -0.119 |
Token | , |
Token ID | 11 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
questions | +0.041 |
groups | +0.038 |
triple | +0.037 |
brothers | +0.031 |
scientists | +0.030 |
Neg logit contributions | |
ller | -0.070 |
xt | -0.068 |
ugg | -0.064 |
liv | -0.064 |
bow | -0.062 |
Token | and |
Token ID | 290 |
Feature activation | -1.23e-03 |
Pos logit contributions | |
questions | +0.017 |
groups | +0.016 |
triple | +0.015 |
forward | +0.014 |
out | +0.014 |
Neg logit contributions | |
ller | -0.027 |
xt | -0.026 |
liv | -0.025 |
ugg | -0.024 |
storm | -0.024 |
Token | she |
Token ID | 673 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
forward | +0.002 |
brothers | +0.002 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
ugg | -0.002 |
Twe | -0.002 |
Token | was |
Token ID | 373 |
Feature activation | +8.44e-03 |
Pos logit contributions | |
questions | +0.017 |
groups | +0.017 |
forward | +0.015 |
triple | +0.015 |
out | +0.014 |
Neg logit contributions | |
ller | -0.017 |
xt | -0.017 |
liv | -0.016 |
ugg | -0.015 |
leanor | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | +7.11e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.021 |
liv | +0.020 |
storm | +0.019 |
bow | +0.019 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.019 |
triple | -0.018 |
forward | -0.018 |
out | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | +9.32e-03 |
Pos logit contributions | |
ller | +0.011 |
Twe | +0.011 |
sed | +0.011 |
Blue | +0.010 |
hy | +0.010 |
Neg logit contributions | |
questions | -0.010 |
arre | -0.010 |
ices | -0.010 |
groups | -0.009 |
triple | -0.009 |
Token | box |
Token ID | 3091 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
ller | +0.016 |
storm | +0.015 |
sed | +0.014 |
bow | +0.014 |
Twe | +0.014 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.013 |
ices | -0.012 |
triple | -0.012 |
forward | -0.012 |
Token | of |
Token ID | 286 |
Feature activation | -2.87e-02 |
Pos logit contributions | |
ller | +0.052 |
xt | +0.049 |
storm | +0.048 |
liv | +0.046 |
ugg | +0.046 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.033 |
triple | -0.031 |
increasingly | -0.029 |
forward | -0.028 |
Token | ch |
Token ID | 442 |
Feature activation | -2.76e-02 |
Pos logit contributions | |
forward | +0.042 |
triple | +0.040 |
questions | +0.039 |
increasingly | +0.038 |
iece | +0.038 |
Neg logit contributions | |
Twe | -0.044 |
ller | -0.043 |
xt | -0.040 |
Blue | -0.039 |
hy | -0.039 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.28e-02 |
Pos logit contributions | |
questions | +0.047 |
increasingly | +0.045 |
triple | +0.044 |
plan | +0.042 |
decide | +0.042 |
Neg logit contributions | |
ller | -0.038 |
xt | -0.037 |
ugg | -0.034 |
llers | -0.031 |
seven | -0.031 |
Token | ates |
Token ID | 689 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
questions | +0.118 |
groups | +0.113 |
triple | +0.108 |
forward | +0.105 |
increasingly | +0.102 |
Neg logit contributions | |
ller | -0.114 |
xt | -0.114 |
mm | -0.103 |
ugg | -0.103 |
seven | -0.102 |
Token | . |
Token ID | 13 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
questions | +0.036 |
groups | +0.034 |
triple | +0.033 |
increasingly | +0.032 |
ang | +0.029 |
Neg logit contributions | |
ller | -0.034 |
xt | -0.032 |
storm | -0.030 |
seven | -0.029 |
liv | -0.029 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.53e-03 |
Pos logit contributions | |
questions | +0.020 |
groups | +0.019 |
triple | +0.018 |
forward | +0.017 |
invitations | +0.017 |
Neg logit contributions | |
ller | -0.016 |
xt | -0.016 |
Twe | -0.015 |
mm | -0.015 |
ugg | -0.015 |
Token | loved |
Token ID | 6151 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.004 |
ugg | -0.004 |
storm | -0.004 |
Token | ch |
Token ID | 442 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
groups | +0.013 |
questions | +0.013 |
triple | +0.013 |
forward | +0.013 |
increasingly | +0.011 |
Neg logit contributions | |
ller | -0.020 |
xt | -0.019 |
seven | -0.017 |
Twe | -0.017 |
liv | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | -6.84e-03 |
Pos logit contributions | |
questions | +0.001 |
triple | +0.001 |
groups | +0.001 |
increasingly | +0.001 |
scientists | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.001 |
ugg | -0.001 |
seven | -0.001 |
Token | started |
Token ID | 2067 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
questions | +0.012 |
groups | +0.012 |
triple | +0.010 |
forward | +0.010 |
ices | +0.010 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.009 |
Twe | -0.009 |
ugg | -0.009 |
liv | -0.009 |
Token | eating |
Token ID | 6600 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
xt | +0.016 |
ller | +0.015 |
seven | +0.014 |
chief | +0.014 |
Twe | +0.013 |
Neg logit contributions | |
ac | -0.017 |
groups | -0.017 |
questions | -0.017 |
aky | -0.017 |
forward | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | -7.54e-03 |
Pos logit contributions | |
triple | +0.019 |
questions | +0.019 |
groups | +0.019 |
ac | +0.018 |
ibr | +0.018 |
Neg logit contributions | |
ller | -0.017 |
Twe | -0.016 |
xt | -0.016 |
seven | -0.016 |
mm | -0.016 |
Token | ch |
Token ID | 442 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
groups | +0.011 |
questions | +0.011 |
triple | +0.011 |
forward | +0.010 |
increasingly | +0.010 |
Neg logit contributions | |
ller | -0.011 |
liv | -0.010 |
bow | -0.010 |
xt | -0.010 |
storm | -0.010 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.17e-02 |
Pos logit contributions | |
questions | +0.038 |
groups | +0.037 |
triple | +0.035 |
forward | +0.035 |
increasingly | +0.035 |
Neg logit contributions | |
ller | -0.041 |
xt | -0.039 |
ugg | -0.037 |
leanor | -0.035 |
liv | -0.035 |
Token | ates |
Token ID | 689 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
questions | +0.107 |
groups | +0.105 |
triple | +0.097 |
forward | +0.094 |
out | +0.091 |
Neg logit contributions | |
ller | -0.123 |
xt | -0.120 |
ugg | -0.114 |
liv | -0.113 |
live | -0.110 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-03 |
Pos logit contributions | |
questions | +0.045 |
groups | +0.043 |
triple | +0.043 |
increasingly | +0.038 |
scientists | +0.038 |
Neg logit contributions | |
ller | -0.042 |
xt | -0.040 |
seven | -0.037 |
lla | -0.037 |
bow | -0.037 |
Token | The |
Token ID | 383 |
Feature activation | -3.50e-03 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
ugg | +0.002 |
liv | +0.002 |
seven | +0.002 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.002 |
forward | -0.002 |
ac | -0.002 |
Token | shop |
Token ID | 6128 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
groups | +0.006 |
questions | +0.006 |
forward | +0.006 |
packs | +0.005 |
out | +0.005 |
Neg logit contributions | |
ller | -0.005 |
seven | -0.004 |
bow | -0.004 |
liv | -0.004 |
xt | -0.004 |
Token | keeper |
Token ID | 13884 |
Feature activation | -5.36e-03 |
Pos logit contributions | |
ller | +0.020 |
xt | +0.019 |
liv | +0.018 |
ugg | +0.017 |
bow | +0.017 |
Neg logit contributions | |
questions | -0.024 |
groups | -0.023 |
forward | -0.021 |
triple | -0.020 |
out | -0.020 |
Token | was |
Token ID | 373 |
Feature activation | +9.92e-03 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.023 |
liv | +0.022 |
ugg | +0.021 |
storm | +0.021 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.016 |
triple | -0.015 |
forward | -0.014 |
out | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | -1.09e-03 |
Pos logit contributions | |
ller | +0.019 |
liv | +0.019 |
xt | +0.019 |
seven | +0.018 |
Karen | +0.018 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
forward | -0.009 |
brothers | -0.009 |
Token | box |
Token ID | 3091 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.001 |
ac | +0.001 |
ices | +0.001 |
iece | +0.001 |
Neg logit contributions | |
ller | -0.002 |
storm | -0.002 |
bow | -0.002 |
Twe | -0.002 |
Stella | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
ller | +0.039 |
xt | +0.037 |
storm | +0.035 |
liv | +0.035 |
ugg | +0.035 |
Neg logit contributions | |
questions | -0.027 |
groups | -0.025 |
triple | -0.024 |
increasingly | -0.022 |
forward | -0.021 |
Token | ch |
Token ID | 442 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
triple | +0.040 |
forward | +0.039 |
groups | +0.038 |
questions | +0.037 |
increasingly | +0.037 |
Neg logit contributions | |
Twe | -0.036 |
ller | -0.036 |
hy | -0.033 |
Karen | -0.033 |
Stella | -0.033 |
Token | ocol |
Token ID | 4668 |
Feature activation | -7.10e-02 |
Pos logit contributions | |
triple | +0.037 |
questions | +0.037 |
increasingly | +0.036 |
groups | +0.036 |
from | +0.034 |
Neg logit contributions | |
xt | -0.031 |
ller | -0.030 |
ugg | -0.027 |
seven | -0.026 |
leanor | -0.026 |
Token | ates |
Token ID | 689 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
questions | +0.098 |
groups | +0.096 |
triple | +0.091 |
forward | +0.086 |
out | +0.082 |
Neg logit contributions | |
ller | -0.127 |
xt | -0.125 |
liv | -0.118 |
ugg | -0.117 |
live | -0.114 |
Token | ! |
Token ID | 0 |
Feature activation | +3.01e-03 |
Pos logit contributions | |
questions | +0.027 |
groups | +0.027 |
triple | +0.027 |
increasingly | +0.023 |
forward | +0.022 |
Neg logit contributions | |
ller | -0.033 |
xt | -0.031 |
seven | -0.029 |
liv | -0.028 |
storm | -0.028 |
Token | Alice |
Token ID | 14862 |
Feature activation | +7.76e-03 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.004 |
storm | +0.004 |
liv | +0.004 |
ugg | +0.004 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
out | -0.005 |
forward | -0.005 |
into | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
liv | +0.012 |
ugg | +0.012 |
seven | +0.012 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.011 |
triple | -0.010 |
forward | -0.010 |
out | -0.010 |
Token | her |
Token ID | 607 |
Feature activation | -5.68e-03 |
Pos logit contributions | |
groups | +0.017 |
questions | +0.017 |
triple | +0.016 |
forward | +0.014 |
increasingly | +0.014 |
Neg logit contributions | |
ller | -0.032 |
xt | -0.031 |
liv | -0.030 |
leanor | -0.029 |
ugg | -0.029 |
Token | son |
Token ID | 3367 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
groups | +0.005 |
questions | +0.004 |
forward | +0.004 |
triple | +0.004 |
increasingly | +0.004 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
sed | -0.006 |
ugg | -0.006 |
liv | -0.006 |
Token | is |
Token ID | 318 |
Feature activation | +7.32e-03 |
Pos logit contributions | |
questions | +0.028 |
groups | +0.027 |
triple | +0.025 |
forward | +0.024 |
out | +0.024 |
Neg logit contributions | |
ller | -0.025 |
xt | -0.024 |
liv | -0.023 |
ugg | -0.022 |
storm | -0.022 |
Token | eating |
Token ID | 6600 |
Feature activation | -1.89e-02 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
storm | +0.011 |
liv | +0.011 |
Twe | +0.011 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.009 |
ices | -0.009 |
forward | -0.008 |
Token | our |
Token ID | 674 |
Feature activation | +1.46e-03 |
Pos logit contributions | |
questions | +0.028 |
groups | +0.028 |
triple | +0.027 |
forward | +0.024 |
brothers | +0.024 |
Neg logit contributions | |
ller | -0.030 |
xt | -0.029 |
Twe | -0.027 |
seven | -0.027 |
mm | -0.027 |
Token | ch |
Token ID | 442 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
liv | +0.002 |
ugg | +0.002 |
bow | +0.002 |
Neg logit contributions | |
groups | -0.002 |
questions | -0.002 |
triple | -0.002 |
forward | -0.002 |
increasingly | -0.002 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.99e-02 |
Pos logit contributions | |
questions | +0.039 |
groups | +0.038 |
triple | +0.036 |
forward | +0.036 |
out | +0.035 |
Neg logit contributions | |
ller | -0.048 |
xt | -0.046 |
ugg | -0.043 |
liv | -0.042 |
bow | -0.041 |
Token | ates |
Token ID | 689 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
questions | +0.105 |
groups | +0.104 |
triple | +0.097 |
forward | +0.093 |
out | +0.091 |
Neg logit contributions | |
ller | -0.119 |
xt | -0.116 |
liv | -0.109 |
ugg | -0.109 |
live | -0.106 |
Token | !" |
Token ID | 2474 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
questions | +0.053 |
groups | +0.052 |
triple | +0.051 |
increasingly | +0.046 |
brothers | +0.046 |
Neg logit contributions | |
ller | -0.030 |
xt | -0.028 |
liv | -0.026 |
storm | -0.025 |
ugg | -0.025 |
Token | |
Token ID | 220 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.023 |
liv | +0.021 |
ugg | +0.021 |
storm | +0.020 |
Neg logit contributions | |
questions | -0.027 |
groups | -0.026 |
triple | -0.025 |
forward | -0.023 |
out | -0.023 |
Token |
|
Token ID | 198 |
Feature activation | +6.93e-03 |
Pos logit contributions | |
ller | +0.020 |
xt | +0.020 |
liv | +0.019 |
ugg | +0.018 |
bow | +0.018 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.015 |
triple | -0.014 |
forward | -0.013 |
out | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
ller | +0.012 |
xt | +0.012 |
liv | +0.011 |
storm | +0.011 |
ugg | +0.011 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.009 |
forward | -0.009 |
out | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | +3.09e-03 |
Pos logit contributions | |
questions | +0.017 |
triple | +0.017 |
groups | +0.017 |
forward | +0.015 |
increasingly | +0.014 |
Neg logit contributions | |
xt | -0.034 |
ller | -0.033 |
liv | -0.032 |
Twe | -0.031 |
Karen | -0.031 |
Token | big |
Token ID | 1263 |
Feature activation | -4.82e-03 |
Pos logit contributions | |
ller | +0.005 |
storm | +0.005 |
bow | +0.005 |
Raven | +0.005 |
xt | +0.005 |
Neg logit contributions | |
questions | -0.004 |
groups | -0.004 |
triple | -0.004 |
iece | -0.004 |
ices | -0.004 |
Token | box |
Token ID | 3091 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.007 |
triple | +0.007 |
forward | +0.006 |
into | +0.006 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.008 |
storm | -0.007 |
ugg | -0.007 |
liv | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
ller | +0.036 |
xt | +0.035 |
storm | +0.034 |
ugg | +0.033 |
liv | +0.033 |
Neg logit contributions | |
questions | -0.022 |
groups | -0.020 |
triple | -0.020 |
increasingly | -0.017 |
brothers | -0.017 |
Token | ch |
Token ID | 442 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
triple | +0.035 |
groups | +0.033 |
forward | +0.033 |
increasingly | +0.032 |
questions | +0.032 |
Neg logit contributions | |
Twe | -0.036 |
ller | -0.036 |
xt | -0.036 |
hy | -0.034 |
Karen | -0.034 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.97e-02 |
Pos logit contributions | |
triple | +0.041 |
questions | +0.040 |
increasingly | +0.039 |
groups | +0.038 |
from | +0.038 |
Neg logit contributions | |
xt | -0.027 |
ller | -0.024 |
ugg | -0.023 |
irst | -0.021 |
hy | -0.021 |
Token | ates |
Token ID | 689 |
Feature activation | -2.04e-02 |
Pos logit contributions | |
questions | +0.102 |
groups | +0.099 |
triple | +0.095 |
forward | +0.091 |
out | +0.088 |
Neg logit contributions | |
xt | -0.118 |
ller | -0.117 |
ugg | -0.109 |
liv | -0.109 |
live | -0.105 |
Token | ! |
Token ID | 0 |
Feature activation | -3.05e-03 |
Pos logit contributions | |
questions | +0.029 |
triple | +0.029 |
groups | +0.029 |
increasingly | +0.024 |
brothers | +0.024 |
Neg logit contributions | |
ller | -0.035 |
xt | -0.035 |
liv | -0.032 |
ugg | -0.032 |
storm | -0.032 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +4.34e-03 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.004 |
out | +0.003 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.005 |
storm | -0.005 |
ugg | -0.005 |
Token | Once |
Token ID | 7454 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
xt | +0.008 |
ller | +0.008 |
liv | +0.008 |
ugg | +0.008 |
bow | +0.008 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.005 |
triple | -0.005 |
forward | -0.005 |
out | -0.004 |
Token | upon |
Token ID | 2402 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
ller | +0.054 |
xt | +0.053 |
liv | +0.051 |
storm | +0.051 |
ugg | +0.051 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.007 |
triple | -0.005 |
forward | -0.005 |
out | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +2.06e-03 |
Pos logit contributions | |
questions | +0.016 |
groups | +0.016 |
triple | +0.015 |
forward | +0.015 |
ac | +0.013 |
Neg logit contributions | |
ller | -0.026 |
xt | -0.025 |
liv | -0.025 |
Twe | -0.024 |
seven | -0.023 |
Token | big |
Token ID | 1263 |
Feature activation | -5.91e-03 |
Pos logit contributions | |
ller | +0.004 |
storm | +0.003 |
bow | +0.003 |
xt | +0.003 |
Twe | +0.003 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
forward | -0.002 |
ac | -0.002 |
into | -0.002 |
Token | box |
Token ID | 3091 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
triple | +0.007 |
forward | +0.007 |
increasingly | +0.007 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.010 |
storm | -0.010 |
bow | -0.009 |
liv | -0.009 |
Token | of |
Token ID | 286 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
ller | +0.040 |
xt | +0.039 |
storm | +0.037 |
liv | +0.036 |
ugg | +0.036 |
Neg logit contributions | |
questions | -0.028 |
groups | -0.025 |
triple | -0.025 |
increasingly | -0.022 |
forward | -0.021 |
Token | ch |
Token ID | 442 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
forward | +0.037 |
triple | +0.036 |
iece | +0.034 |
questions | +0.034 |
ac | +0.033 |
Neg logit contributions | |
Twe | -0.041 |
ller | -0.039 |
Karen | -0.038 |
xt | -0.038 |
Stella | -0.037 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.93e-02 |
Pos logit contributions | |
questions | +0.047 |
triple | +0.045 |
increasingly | +0.044 |
plan | +0.043 |
decide | +0.042 |
Neg logit contributions | |
xt | -0.034 |
ller | -0.032 |
ugg | -0.028 |
irst | -0.026 |
round | -0.026 |
Token | ates |
Token ID | 689 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
questions | +0.106 |
groups | +0.101 |
triple | +0.096 |
forward | +0.093 |
out | +0.089 |
Neg logit contributions | |
ller | -0.117 |
xt | -0.116 |
ugg | -0.107 |
liv | -0.107 |
live | -0.104 |
Token | . |
Token ID | 13 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
questions | +0.039 |
triple | +0.038 |
groups | +0.037 |
increasingly | +0.033 |
ac | +0.031 |
Neg logit contributions | |
ller | -0.040 |
xt | -0.038 |
storm | -0.035 |
seven | -0.035 |
liv | -0.034 |
Token | It |
Token ID | 632 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.007 |
Twe | +0.007 |
ugg | +0.007 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.007 |
forward | -0.007 |
out | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.022 |
liv | +0.021 |
storm | +0.021 |
ugg | +0.021 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.016 |
triple | -0.015 |
forward | -0.014 |
out | -0.014 |
Token | so |
Token ID | 523 |
Feature activation | +5.86e-03 |
Pos logit contributions | |
ller | +0.024 |
Twe | +0.024 |
Karen | +0.022 |
Stella | +0.022 |
liv | +0.022 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.018 |
ices | -0.018 |
and | -0.018 |
forward | -0.017 |
Token | saw |
Token ID | 2497 |
Feature activation | -7.63e-03 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.005 |
forward | +0.005 |
triple | +0.005 |
out | +0.005 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.005 |
ugg | -0.005 |
leanor | -0.005 |
Token | all |
Token ID | 477 |
Feature activation | +8.68e-03 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.009 |
forward | +0.009 |
brothers | +0.008 |
Neg logit contributions | |
ller | -0.014 |
xt | -0.014 |
liv | -0.013 |
leanor | -0.013 |
ugg | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | +3.88e-03 |
Pos logit contributions | |
xt | +0.016 |
ller | +0.016 |
liv | +0.015 |
Karen | +0.014 |
Twe | +0.014 |
Neg logit contributions | |
questions | -0.011 |
triple | -0.011 |
groups | -0.011 |
forward | -0.010 |
increasingly | -0.009 |
Token | tasty |
Token ID | 25103 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.007 |
leanor | +0.007 |
liv | +0.007 |
seven | +0.007 |
Neg logit contributions | |
groups | -0.004 |
questions | -0.004 |
triple | -0.004 |
forward | -0.004 |
increasingly | -0.004 |
Token | ch |
Token ID | 442 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
groups | +0.024 |
questions | +0.023 |
forward | +0.022 |
triple | +0.021 |
increasingly | +0.020 |
Neg logit contributions | |
ller | -0.039 |
xt | -0.037 |
mm | -0.035 |
Twe | -0.035 |
Raven | -0.034 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.93e-02 |
Pos logit contributions | |
questions | +0.042 |
groups | +0.040 |
triple | +0.039 |
increasingly | +0.037 |
forward | +0.037 |
Neg logit contributions | |
ller | -0.041 |
xt | -0.040 |
ugg | -0.036 |
mm | -0.036 |
leanor | -0.035 |
Token | ates |
Token ID | 689 |
Feature activation | -3.00e-02 |
Pos logit contributions | |
questions | +0.095 |
groups | +0.091 |
triple | +0.086 |
forward | +0.081 |
out | +0.079 |
Neg logit contributions | |
ller | -0.127 |
xt | -0.125 |
liv | -0.118 |
ugg | -0.116 |
storm | -0.113 |
Token | inside |
Token ID | 2641 |
Feature activation | +4.19e-03 |
Pos logit contributions | |
questions | +0.045 |
triple | +0.044 |
groups | +0.043 |
increasingly | +0.037 |
brothers | +0.036 |
Neg logit contributions | |
ller | -0.051 |
xt | -0.049 |
storm | -0.045 |
liv | -0.045 |
seven | -0.044 |
Token | . |
Token ID | 13 |
Feature activation | -7.32e-03 |
Pos logit contributions | |
ller | +0.007 |
xt | +0.007 |
liv | +0.007 |
storm | +0.006 |
seven | +0.006 |
Neg logit contributions | |
questions | -0.006 |
triple | -0.006 |
groups | -0.006 |
forward | -0.005 |
increasingly | -0.005 |
Token | She |
Token ID | 1375 |
Feature activation | -7.38e-04 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
out | +0.007 |
into | +0.007 |
triple | +0.007 |
Neg logit contributions | |
ller | -0.016 |
storm | -0.015 |
xt | -0.015 |
liv | -0.014 |
rob | -0.014 |
Token | couldn |
Token ID | 3521 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
forward | +0.001 |
triple | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
liv | -0.001 |
ugg | -0.001 |
leanor | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +7.66e-03 |
Pos logit contributions | |
groups | +0.022 |
triple | +0.021 |
increasingly | +0.020 |
cabinets | +0.020 |
questions | +0.019 |
Neg logit contributions | |
Blue | -0.021 |
Twe | -0.021 |
bye | -0.021 |
Dove | -0.019 |
xt | -0.019 |
Token | big |
Token ID | 1263 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
ller | +0.013 |
Twe | +0.012 |
Raven | +0.011 |
storm | +0.011 |
xt | +0.011 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
iece | -0.011 |
triple | -0.010 |
ices | -0.010 |
Token | box |
Token ID | 3091 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.007 |
triple | +0.007 |
forward | +0.007 |
increasingly | +0.007 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.009 |
storm | -0.008 |
ugg | -0.008 |
Twe | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | -2.37e-02 |
Pos logit contributions | |
ller | +0.025 |
xt | +0.024 |
ugg | +0.024 |
bye | +0.023 |
storm | +0.023 |
Neg logit contributions | |
questions | -0.013 |
triple | -0.012 |
groups | -0.012 |
increasingly | -0.010 |
cabinets | -0.010 |
Token | ch |
Token ID | 442 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
forward | +0.038 |
triple | +0.037 |
groups | +0.037 |
increasingly | +0.036 |
questions | +0.036 |
Neg logit contributions | |
Twe | -0.034 |
ller | -0.032 |
xt | -0.030 |
Karen | -0.028 |
Raven | -0.028 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.85e-02 |
Pos logit contributions | |
increasingly | +0.040 |
questions | +0.039 |
triple | +0.039 |
groups | +0.038 |
from | +0.038 |
Neg logit contributions | |
xt | -0.024 |
ller | -0.023 |
ugg | -0.022 |
irst | -0.019 |
endant | -0.019 |
Token | ates |
Token ID | 689 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
questions | +0.094 |
groups | +0.091 |
triple | +0.087 |
forward | +0.082 |
out | +0.080 |
Neg logit contributions | |
ller | -0.124 |
xt | -0.122 |
ugg | -0.114 |
liv | -0.114 |
leanor | -0.110 |
Token | to |
Token ID | 284 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
triple | +0.030 |
groups | +0.030 |
questions | +0.029 |
increasingly | +0.025 |
scientists | +0.023 |
Neg logit contributions | |
ller | -0.041 |
xt | -0.039 |
ugg | -0.037 |
round | -0.037 |
seven | -0.036 |
Token | share |
Token ID | 2648 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
questions | +0.018 |
groups | +0.018 |
triple | +0.017 |
forward | +0.016 |
out | +0.015 |
Neg logit contributions | |
ller | -0.023 |
xt | -0.022 |
liv | -0.021 |
ugg | -0.021 |
storm | -0.021 |
Token | with |
Token ID | 351 |
Feature activation | -1.75e-04 |
Pos logit contributions | |
ller | +0.035 |
xt | +0.032 |
seven | +0.031 |
Twe | +0.031 |
Raven | +0.030 |
Neg logit contributions | |
triple | -0.027 |
questions | -0.026 |
groups | -0.026 |
increasingly | -0.024 |
forward | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | +9.50e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
out | +0.000 |
brothers | +0.000 |
Neg logit contributions | |
ller | -0.000 |
xt | -0.000 |
liv | -0.000 |
storm | -0.000 |
ugg | -0.000 |
Token | thumb |
Token ID | 15683 |
Feature activation | +2.88e-04 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.005 |
forward | +0.005 |
out | +0.004 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
liv | -0.006 |
llers | -0.006 |
ugg | -0.006 |
Token | tried |
Token ID | 3088 |
Feature activation | -1.01e-03 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
liv | +0.000 |
storm | +0.000 |
bow | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
invitations | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | -9.72e-03 |
Pos logit contributions | |
groups | +0.001 |
triple | +0.001 |
questions | +0.001 |
brothers | +0.001 |
ac | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
seven | -0.002 |
llers | -0.002 |
Twe | -0.001 |
Token | grab |
Token ID | 5552 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
questions | +0.014 |
groups | +0.013 |
triple | +0.013 |
forward | +0.012 |
brothers | +0.011 |
Neg logit contributions | |
ller | -0.017 |
xt | -0.017 |
liv | -0.016 |
storm | -0.016 |
bow | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
ller | +0.003 |
Twe | +0.003 |
xt | +0.003 |
seven | +0.002 |
Dove | +0.002 |
Neg logit contributions | |
groups | -0.005 |
triple | -0.004 |
questions | -0.004 |
brothers | -0.004 |
scientists | -0.004 |
Token | pe |
Token ID | 613 |
Feature activation | -6.84e-02 |
Pos logit contributions | |
groups | +0.023 |
questions | +0.023 |
triple | +0.022 |
forward | +0.021 |
scientists | +0.019 |
Neg logit contributions | |
ller | -0.023 |
xt | -0.022 |
bow | -0.021 |
liv | -0.020 |
seven | -0.020 |
Token | b |
Token ID | 65 |
Feature activation | -5.46e-02 |
Pos logit contributions | |
groups | +0.111 |
questions | +0.104 |
triple | +0.101 |
scientists | +0.096 |
soldiers | +0.094 |
Neg logit contributions | |
ller | -0.114 |
xt | -0.101 |
seven | -0.100 |
liv | -0.098 |
chief | -0.095 |
Token | ble |
Token ID | 903 |
Feature activation | -3.74e-02 |
Pos logit contributions | |
groups | +0.101 |
questions | +0.099 |
triple | +0.093 |
cabinets | +0.087 |
chambers | +0.087 |
Neg logit contributions | |
ller | -0.080 |
bow | -0.067 |
xt | -0.067 |
uch | -0.065 |
chief | -0.064 |
Token | . |
Token ID | 13 |
Feature activation | -4.80e-03 |
Pos logit contributions | |
triple | +0.063 |
questions | +0.061 |
groups | +0.061 |
brothers | +0.057 |
scientists | +0.057 |
Neg logit contributions | |
Twe | -0.051 |
ller | -0.050 |
Stella | -0.048 |
round | -0.047 |
Dove | -0.047 |
Token | She |
Token ID | 1375 |
Feature activation | -3.42e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.007 |
triple | +0.007 |
out | +0.007 |
into | +0.007 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.008 |
liv | -0.007 |
storm | -0.007 |
leanor | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | +9.31e-03 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.005 |
forward | +0.005 |
out | +0.005 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.005 |
leanor | -0.005 |
ugg | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | -9.48e-04 |
Pos logit contributions | |
groups | +0.033 |
triple | +0.033 |
questions | +0.032 |
ices | +0.029 |
brothers | +0.029 |
Neg logit contributions | |
Twe | -0.037 |
ller | -0.036 |
Stella | -0.035 |
Karen | -0.035 |
Raven | -0.035 |
Token | big |
Token ID | 1263 |
Feature activation | -1.13e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
ices | +0.001 |
forward | +0.001 |
triple | +0.001 |
Neg logit contributions | |
ller | -0.002 |
storm | -0.001 |
Raven | -0.001 |
sed | -0.001 |
bow | -0.001 |
Token | box |
Token ID | 3091 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.001 |
triple | +0.001 |
forward | +0.001 |
increasingly | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
storm | -0.002 |
liv | -0.002 |
bow | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | -2.69e-02 |
Pos logit contributions | |
ller | +0.041 |
xt | +0.041 |
liv | +0.038 |
storm | +0.038 |
ugg | +0.037 |
Neg logit contributions | |
questions | -0.039 |
groups | -0.037 |
triple | -0.035 |
forward | -0.032 |
increasingly | -0.032 |
Token | ch |
Token ID | 442 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
triple | +0.040 |
forward | +0.038 |
groups | +0.037 |
questions | +0.037 |
increasingly | +0.035 |
Neg logit contributions | |
Twe | -0.041 |
ller | -0.040 |
xt | -0.038 |
Karen | -0.038 |
Stella | -0.038 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.80e-02 |
Pos logit contributions | |
questions | +0.035 |
triple | +0.035 |
increasingly | +0.033 |
groups | +0.033 |
from | +0.032 |
Neg logit contributions | |
xt | -0.029 |
ller | -0.029 |
ugg | -0.026 |
seven | -0.025 |
leanor | -0.025 |
Token | ates |
Token ID | 689 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
questions | +0.095 |
groups | +0.091 |
triple | +0.086 |
forward | +0.082 |
out | +0.079 |
Neg logit contributions | |
ller | -0.122 |
xt | -0.120 |
liv | -0.113 |
ugg | -0.112 |
leanor | -0.109 |
Token | ! |
Token ID | 0 |
Feature activation | -7.04e-03 |
Pos logit contributions | |
questions | +0.030 |
groups | +0.029 |
triple | +0.028 |
increasingly | +0.025 |
forward | +0.025 |
Neg logit contributions | |
ller | -0.028 |
xt | -0.027 |
liv | -0.025 |
storm | -0.025 |
seven | -0.024 |
Token | |
Token ID | 220 |
Feature activation | +6.03e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.011 |
triple | +0.010 |
out | +0.010 |
forward | +0.010 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.011 |
liv | -0.011 |
storm | -0.011 |
leanor | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.011 |
ugg | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.007 |
forward | -0.007 |
out | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -3.13e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.010 |
out | +0.009 |
triple | +0.009 |
into | +0.009 |
Neg logit contributions | |
ller | -0.027 |
xt | -0.026 |
storm | -0.026 |
liv | -0.025 |
sed | -0.025 |
Token | It |
Token ID | 632 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
questions | +0.015 |
groups | +0.015 |
triple | +0.014 |
forward | +0.014 |
brothers | +0.013 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
ugg | -0.010 |
Twe | -0.009 |
liv | -0.009 |
Token | was |
Token ID | 373 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.022 |
liv | +0.022 |
storm | +0.021 |
bow | +0.020 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.019 |
triple | -0.018 |
forward | -0.017 |
out | -0.016 |
Token | filled |
Token ID | 5901 |
Feature activation | +1.55e-03 |
Pos logit contributions | |
ller | +0.025 |
Twe | +0.025 |
Karen | +0.024 |
Stella | +0.024 |
xt | +0.024 |
Neg logit contributions | |
questions | -0.019 |
groups | -0.017 |
forward | -0.017 |
and | -0.016 |
triple | -0.016 |
Token | with |
Token ID | 351 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
xt | +0.003 |
ller | +0.003 |
liv | +0.003 |
Twe | +0.003 |
lla | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
brothers | -0.002 |
increasingly | -0.002 |
Token | ch |
Token ID | 442 |
Feature activation | -2.86e-02 |
Pos logit contributions | |
questions | +0.011 |
triple | +0.010 |
forward | +0.010 |
groups | +0.010 |
ices | +0.010 |
Neg logit contributions | |
Twe | -0.011 |
hy | -0.010 |
Stella | -0.010 |
Karen | -0.010 |
ller | -0.010 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.75e-02 |
Pos logit contributions | |
questions | +0.047 |
out | +0.044 |
triple | +0.043 |
groups | +0.043 |
forward | +0.042 |
Neg logit contributions | |
ller | -0.039 |
xt | -0.038 |
ugg | -0.035 |
llers | -0.034 |
mm | -0.033 |
Token | ates |
Token ID | 689 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
questions | +0.099 |
groups | +0.096 |
triple | +0.091 |
forward | +0.088 |
out | +0.084 |
Neg logit contributions | |
ller | -0.116 |
xt | -0.114 |
ugg | -0.106 |
liv | -0.105 |
mm | -0.103 |
Token | and |
Token ID | 290 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
questions | +0.025 |
groups | +0.024 |
triple | +0.023 |
forward | +0.021 |
increasingly | +0.020 |
Neg logit contributions | |
ller | -0.032 |
xt | -0.030 |
bow | -0.028 |
liv | -0.028 |
storm | -0.027 |
Token | coins |
Token ID | 10796 |
Feature activation | -5.89e-03 |
Pos logit contributions | |
ller | +0.019 |
xt | +0.018 |
liv | +0.017 |
seven | +0.017 |
llers | +0.016 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.015 |
forward | -0.015 |
triple | -0.014 |
ac | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -3.39e-03 |
Pos logit contributions | |
questions | +0.009 |
groups | +0.008 |
triple | +0.008 |
forward | +0.007 |
brothers | +0.007 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
liv | -0.009 |
storm | -0.009 |
bow | -0.009 |
Token | She |
Token ID | 1375 |
Feature activation | -1.49e-03 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
triple | +0.006 |
forward | +0.005 |
brothers | +0.005 |
Neg logit contributions | |
ller | -0.005 |
xt | -0.004 |
ugg | -0.004 |
Twe | -0.004 |
liv | -0.004 |
Token | her |
Token ID | 607 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
groups | +0.007 |
triple | +0.007 |
questions | +0.007 |
increasingly | +0.006 |
brothers | +0.006 |
Neg logit contributions | |
xt | -0.010 |
Twe | -0.010 |
ller | -0.010 |
ugg | -0.010 |
liv | -0.009 |
Token | a |
Token ID | 257 |
Feature activation | +9.25e-03 |
Pos logit contributions | |
xt | +0.024 |
ugg | +0.022 |
liv | +0.022 |
Twe | +0.021 |
ller | +0.021 |
Neg logit contributions | |
triple | -0.019 |
groups | -0.019 |
questions | -0.019 |
forward | -0.018 |
iece | -0.017 |
Token | box |
Token ID | 3091 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
ugg | +0.016 |
ller | +0.015 |
xt | +0.015 |
liv | +0.015 |
bow | +0.015 |
Neg logit contributions | |
groups | -0.012 |
questions | -0.012 |
iece | -0.011 |
triple | -0.011 |
forward | -0.010 |
Token | of |
Token ID | 286 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
ller | +0.026 |
xt | +0.026 |
ugg | +0.025 |
liv | +0.025 |
storm | +0.024 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.011 |
triple | -0.011 |
increasingly | -0.009 |
forward | -0.009 |
Token | ch |
Token ID | 442 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
forward | +0.034 |
iece | +0.033 |
triple | +0.032 |
and | +0.031 |
increasingly | +0.031 |
Neg logit contributions | |
Twe | -0.033 |
ller | -0.032 |
xt | -0.032 |
oof | -0.031 |
Betsy | -0.031 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.73e-02 |
Pos logit contributions | |
questions | +0.033 |
groups | +0.032 |
triple | +0.032 |
out | +0.031 |
increasingly | +0.031 |
Neg logit contributions | |
xt | -0.025 |
ller | -0.023 |
ugg | -0.022 |
bye | -0.020 |
mm | -0.020 |
Token | ates |
Token ID | 689 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
questions | +0.090 |
groups | +0.087 |
triple | +0.081 |
forward | +0.078 |
out | +0.076 |
Neg logit contributions | |
ller | -0.124 |
xt | -0.123 |
liv | -0.116 |
ugg | -0.115 |
storm | -0.111 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
groups | +0.026 |
triple | +0.026 |
questions | +0.025 |
increasingly | +0.022 |
forward | +0.021 |
Neg logit contributions | |
ller | -0.033 |
xt | -0.032 |
ugg | -0.031 |
seven | -0.030 |
liv | -0.029 |
Token | Lily |
Token ID | 20037 |
Feature activation | -7.88e-03 |
Pos logit contributions | |
ller | +0.030 |
xt | +0.029 |
liv | +0.028 |
leanor | +0.027 |
rob | +0.027 |
Neg logit contributions | |
questions | -0.028 |
groups | -0.028 |
triple | -0.026 |
out | -0.026 |
into | -0.025 |
Token | opened |
Token ID | 4721 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.010 |
triple | +0.010 |
forward | +0.010 |
out | +0.009 |
Neg logit contributions | |
ller | -0.014 |
xt | -0.014 |
liv | -0.013 |
ugg | -0.013 |
storm | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.012 |
out | +0.012 |
into | +0.011 |
at | +0.011 |
Neg logit contributions | |
ller | -0.025 |
xt | -0.025 |
storm | -0.025 |
liv | -0.024 |
ugg | -0.024 |
Token | a |
Token ID | 257 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.016 |
liv | +0.016 |
ugg | +0.015 |
storm | +0.015 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.007 |
forward | -0.007 |
out | -0.006 |
Token | large |
Token ID | 1588 |
Feature activation | +1.19e-04 |
Pos logit contributions | |
ller | +0.011 |
storm | +0.010 |
liv | +0.010 |
xt | +0.010 |
bow | +0.010 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
iece | -0.008 |
triple | -0.008 |
ac | -0.008 |
Token | selection |
Token ID | 6356 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
storm | +0.000 |
bow | +0.000 |
Twe | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
and | -0.000 |
Token | of |
Token ID | 286 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
questions | +0.015 |
groups | +0.014 |
triple | +0.014 |
increasingly | +0.012 |
brothers | +0.011 |
Neg logit contributions | |
xt | -0.028 |
ller | -0.027 |
lla | -0.026 |
ugg | -0.026 |
seven | -0.026 |
Token | ch |
Token ID | 442 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
questions | +0.026 |
triple | +0.025 |
forward | +0.025 |
groups | +0.025 |
iece | +0.023 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.037 |
Twe | -0.034 |
liv | -0.034 |
seven | -0.034 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.70e-02 |
Pos logit contributions | |
questions | +0.042 |
increasingly | +0.040 |
out | +0.039 |
forward | +0.039 |
triple | +0.039 |
Neg logit contributions | |
xt | -0.035 |
ller | -0.035 |
ugg | -0.031 |
round | -0.030 |
seven | -0.030 |
Token | ates |
Token ID | 689 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
questions | +0.104 |
groups | +0.103 |
triple | +0.097 |
forward | +0.094 |
out | +0.091 |
Neg logit contributions | |
xt | -0.107 |
ller | -0.107 |
ugg | -0.099 |
seven | -0.097 |
mm | -0.096 |
Token | . |
Token ID | 13 |
Feature activation | +9.92e-03 |
Pos logit contributions | |
questions | +0.034 |
triple | +0.033 |
groups | +0.033 |
increasingly | +0.030 |
brothers | +0.028 |
Neg logit contributions | |
ller | -0.037 |
xt | -0.035 |
seven | -0.033 |
bow | -0.033 |
liv | -0.032 |
Token | Ell |
Token ID | 7122 |
Feature activation | +6.30e-03 |
Pos logit contributions | |
ller | +0.015 |
xt | +0.014 |
liv | +0.013 |
storm | +0.013 |
ugg | +0.013 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.017 |
triple | -0.016 |
forward | -0.015 |
out | -0.015 |
Token | a |
Token ID | 64 |
Feature activation | -5.29e-03 |
Pos logit contributions | |
xt | +0.014 |
ller | +0.014 |
liv | +0.013 |
ugg | +0.013 |
leanor | +0.013 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.006 |
triple | -0.006 |
forward | -0.005 |
out | -0.005 |
Token | picked |
Token ID | 6497 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.007 |
forward | +0.007 |
triple | +0.007 |
out | +0.007 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.009 |
liv | -0.008 |
ugg | -0.008 |
leanor | -0.008 |
Token | as |
Token ID | 355 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ller | +0.026 |
storm | +0.024 |
xt | +0.024 |
bye | +0.022 |
bow | +0.022 |
Neg logit contributions | |
triple | -0.024 |
groups | -0.023 |
questions | -0.023 |
ac | -0.022 |
increasingly | -0.021 |
Token | he |
Token ID | 339 |
Feature activation | -7.94e-03 |
Pos logit contributions | |
groups | +0.027 |
questions | +0.026 |
triple | +0.026 |
ac | +0.023 |
increasingly | +0.023 |
Neg logit contributions | |
ller | -0.025 |
xt | -0.023 |
Twe | -0.022 |
liv | -0.022 |
storm | -0.021 |
Token | opened |
Token ID | 4721 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.013 |
triple | +0.012 |
forward | +0.012 |
out | +0.012 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.012 |
liv | -0.011 |
storm | -0.011 |
leanor | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
triple | +0.013 |
questions | +0.013 |
groups | +0.012 |
brothers | +0.011 |
scientists | +0.011 |
Neg logit contributions | |
ller | -0.020 |
xt | -0.019 |
Twe | -0.018 |
liv | -0.018 |
seven | -0.018 |
Token | ch |
Token ID | 442 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
triple | +0.020 |
groups | +0.020 |
ices | +0.019 |
questions | +0.019 |
and | +0.019 |
Neg logit contributions | |
ller | -0.024 |
storm | -0.022 |
hy | -0.022 |
Raven | -0.021 |
sed | -0.021 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.66e-02 |
Pos logit contributions | |
questions | +0.041 |
groups | +0.041 |
triple | +0.040 |
out | +0.038 |
cabinets | +0.037 |
Neg logit contributions | |
ller | -0.039 |
xt | -0.038 |
ugg | -0.034 |
storm | -0.033 |
round | -0.033 |
Token | ates |
Token ID | 689 |
Feature activation | -3.41e-02 |
Pos logit contributions | |
groups | +0.106 |
questions | +0.106 |
triple | +0.100 |
forward | +0.094 |
out | +0.091 |
Neg logit contributions | |
ller | -0.105 |
xt | -0.104 |
ugg | -0.096 |
seven | -0.095 |
liv | -0.095 |
Token | and |
Token ID | 290 |
Feature activation | +2.17e-03 |
Pos logit contributions | |
triple | +0.053 |
questions | +0.051 |
groups | +0.049 |
increasingly | +0.044 |
scientists | +0.043 |
Neg logit contributions | |
ller | -0.054 |
xt | -0.051 |
round | -0.049 |
storm | -0.048 |
seven | -0.047 |
Token | started |
Token ID | 2067 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
storm | +0.003 |
Twe | +0.003 |
liv | +0.003 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
ices | -0.003 |
Token | eating |
Token ID | 6600 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ller | +0.019 |
xt | +0.019 |
llers | +0.017 |
seven | +0.017 |
Karen | +0.016 |
Neg logit contributions | |
groups | -0.017 |
ac | -0.017 |
questions | -0.017 |
triple | -0.016 |
forward | -0.015 |
Token | them |
Token ID | 606 |
Feature activation | -5.39e-03 |
Pos logit contributions | |
triple | +0.017 |
groups | +0.017 |
questions | +0.016 |
ac | +0.016 |
scientists | +0.015 |
Neg logit contributions | |
Twe | -0.019 |
ller | -0.018 |
Stella | -0.018 |
xt | -0.018 |
Blue | -0.017 |
Token | was |
Token ID | 373 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.005 |
bow | +0.005 |
storm | +0.005 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.005 |
forward | -0.004 |
brothers | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +8.55e-04 |
Pos logit contributions | |
ller | +0.011 |
liv | +0.011 |
xt | +0.011 |
Twe | +0.010 |
Karen | +0.010 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
forward | -0.006 |
triple | -0.006 |
ac | -0.005 |
Token | box |
Token ID | 3091 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
ller | +0.002 |
storm | +0.001 |
xt | +0.001 |
bow | +0.001 |
liv | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
ac | -0.001 |
ices | -0.001 |
aked | -0.001 |
Token | of |
Token ID | 286 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
ller | +0.045 |
xt | +0.043 |
storm | +0.041 |
liv | +0.040 |
hy | +0.040 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.032 |
triple | -0.031 |
increasingly | -0.029 |
brothers | -0.027 |
Token | ch |
Token ID | 442 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
forward | +0.034 |
triple | +0.033 |
iece | +0.031 |
groups | +0.031 |
questions | +0.031 |
Neg logit contributions | |
Karen | -0.033 |
Twe | -0.033 |
ller | -0.033 |
xt | -0.031 |
hy | -0.030 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
questions | +0.036 |
triple | +0.035 |
groups | +0.034 |
increasingly | +0.034 |
decide | +0.033 |
Neg logit contributions | |
xt | -0.028 |
ller | -0.028 |
ugg | -0.025 |
leanor | -0.024 |
seven | -0.023 |
Token | ates |
Token ID | 689 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
questions | +0.101 |
groups | +0.097 |
triple | +0.092 |
forward | +0.088 |
increasingly | +0.084 |
Neg logit contributions | |
ller | -0.111 |
xt | -0.110 |
ugg | -0.102 |
liv | -0.102 |
seven | -0.099 |
Token | . |
Token ID | 13 |
Feature activation | +5.69e-03 |
Pos logit contributions | |
questions | +0.025 |
groups | +0.024 |
triple | +0.023 |
increasingly | +0.020 |
ac | +0.020 |
Neg logit contributions | |
ller | -0.027 |
xt | -0.026 |
storm | -0.024 |
liv | -0.024 |
bow | -0.024 |
Token | " |
Token ID | 366 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.007 |
bow | +0.007 |
Twe | +0.007 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.010 |
forward | -0.009 |
out | -0.009 |
Token | For |
Token ID | 1890 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
xt | +0.022 |
seven | +0.021 |
ller | +0.021 |
bow | +0.021 |
ugg | +0.020 |
Neg logit contributions | |
questions | -0.031 |
groups | -0.030 |
triple | -0.028 |
out | -0.027 |
brothers | -0.027 |
Token | me |
Token ID | 502 |
Feature activation | -7.04e-03 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.017 |
liv | +0.016 |
seven | +0.016 |
storm | +0.016 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.014 |
triple | -0.013 |
forward | -0.012 |
out | -0.012 |
Token | she |
Token ID | 673 |
Feature activation | -3.10e-03 |
Pos logit contributions | |
questions | +0.018 |
groups | +0.017 |
triple | +0.016 |
forward | +0.015 |
ac | +0.015 |
Neg logit contributions | |
xt | -0.015 |
ller | -0.015 |
liv | -0.014 |
ugg | -0.014 |
Stella | -0.013 |
Token | paid |
Token ID | 3432 |
Feature activation | -9.75e-03 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
forward | +0.005 |
triple | +0.005 |
and | +0.005 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
ugg | -0.003 |
liv | -0.003 |
seven | -0.003 |
Token | for |
Token ID | 329 |
Feature activation | -3.47e-03 |
Pos logit contributions | |
groups | +0.013 |
triple | +0.011 |
increasingly | +0.011 |
questions | +0.011 |
ey | +0.010 |
Neg logit contributions | |
ller | -0.017 |
xt | -0.017 |
liv | -0.016 |
Stella | -0.016 |
Karen | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | +1.53e-05 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
liv | -0.007 |
ugg | -0.007 |
storm | -0.007 |
Token | ch |
Token ID | 442 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
storm | +0.000 |
bow | +0.000 |
liv | +0.000 |
Neg logit contributions | |
groups | -0.000 |
questions | -0.000 |
triple | -0.000 |
forward | -0.000 |
into | -0.000 |
Token | ocol |
Token ID | 4668 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
groups | +0.032 |
questions | +0.032 |
triple | +0.030 |
forward | +0.029 |
out | +0.028 |
Neg logit contributions | |
ller | -0.038 |
xt | -0.036 |
ugg | -0.034 |
bow | -0.033 |
seven | -0.033 |
Token | ates |
Token ID | 689 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
groups | +0.099 |
questions | +0.098 |
triple | +0.091 |
forward | +0.087 |
out | +0.085 |
Neg logit contributions | |
ller | -0.113 |
xt | -0.110 |
ugg | -0.105 |
liv | -0.103 |
bow | -0.101 |
Token | and |
Token ID | 290 |
Feature activation | +3.54e-03 |
Pos logit contributions | |
groups | +0.031 |
questions | +0.031 |
triple | +0.030 |
brothers | +0.026 |
increasingly | +0.026 |
Neg logit contributions | |
ller | -0.042 |
xt | -0.040 |
ugg | -0.039 |
liv | -0.039 |
storm | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | -4.95e-03 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.005 |
liv | +0.005 |
Twe | +0.004 |
ugg | +0.004 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
forward | -0.006 |
triple | -0.006 |
ac | -0.005 |
Token | two |
Token ID | 734 |
Feature activation | -2.19e-02 |
Pos logit contributions | |
groups | +0.008 |
questions | +0.007 |
forward | +0.007 |
triple | +0.007 |
into | +0.007 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.007 |
Raven | -0.007 |
bow | -0.007 |
storm | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
questions | +0.024 |
groups | +0.023 |
increasingly | +0.022 |
forward | +0.021 |
triple | +0.021 |
Neg logit contributions | |
xt | -0.041 |
ller | -0.038 |
hy | -0.038 |
Karen | -0.037 |
lla | -0.036 |
Token | to |
Token ID | 284 |
Feature activation | -8.27e-03 |
Pos logit contributions | |
xt | +0.023 |
ller | +0.023 |
Karen | +0.020 |
llers | +0.020 |
Twe | +0.020 |
Neg logit contributions | |
ac | -0.025 |
groups | -0.025 |
invitations | -0.023 |
triple | -0.022 |
questions | -0.022 |
Token | run |
Token ID | 1057 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ac | +0.015 |
groups | +0.014 |
triple | +0.014 |
questions | +0.014 |
invitations | +0.014 |
Neg logit contributions | |
xt | -0.010 |
ller | -0.010 |
storm | -0.010 |
Karen | -0.010 |
Twe | -0.010 |
Token | fast |
Token ID | 3049 |
Feature activation | +9.44e-03 |
Pos logit contributions | |
ller | +0.025 |
bye | +0.025 |
Twe | +0.025 |
xt | +0.025 |
round | +0.024 |
Neg logit contributions | |
groups | -0.021 |
questions | -0.020 |
triple | -0.019 |
brothers | -0.019 |
ac | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +4.24e-03 |
Pos logit contributions | |
xt | +0.015 |
ller | +0.015 |
storm | +0.013 |
seven | +0.012 |
Twe | +0.012 |
Neg logit contributions | |
triple | -0.014 |
groups | -0.013 |
questions | -0.013 |
ac | -0.013 |
increasingly | -0.013 |
Token | He |
Token ID | 679 |
Feature activation | -1.47e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.006 |
ugg | +0.006 |
Twe | +0.005 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.007 |
forward | -0.006 |
invitations | -0.006 |
Token | bumped |
Token ID | 38034 |
Feature activation | +3.80e-02 |
Pos logit contributions | |
groups | +0.002 |
questions | +0.002 |
triple | +0.002 |
forward | +0.002 |
invitations | +0.002 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
leanor | -0.002 |
storm | -0.002 |
Token | into |
Token ID | 656 |
Feature activation | +8.39e-04 |
Pos logit contributions | |
ller | +0.089 |
xt | +0.085 |
Twe | +0.082 |
llers | +0.078 |
seven | +0.078 |
Neg logit contributions | |
questions | -0.035 |
groups | -0.034 |
triple | -0.030 |
invitations | -0.030 |
cabinets | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | -3.54e-03 |
Pos logit contributions | |
ller | +0.001 |
Twe | +0.001 |
Kitty | +0.001 |
Karen | +0.001 |
xt | +0.001 |
Neg logit contributions | |
forward | -0.001 |
triple | -0.001 |
questions | -0.001 |
groups | -0.001 |
ac | -0.001 |
Token | tree |
Token ID | 5509 |
Feature activation | +2.51e-02 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.005 |
forward | +0.004 |
ac | +0.004 |
Neg logit contributions | |
ller | -0.006 |
storm | -0.006 |
xt | -0.005 |
bow | -0.005 |
Raven | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +5.74e-05 |
Pos logit contributions | |
ller | +0.051 |
xt | +0.048 |
storm | +0.047 |
bow | +0.044 |
liv | +0.044 |
Neg logit contributions | |
questions | -0.031 |
groups | -0.029 |
triple | -0.028 |
invitations | -0.026 |
brothers | -0.025 |
Token | looked |
Token ID | 3114 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
liv | +0.000 |
storm | +0.000 |
ugg | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
brothers | -0.000 |
Token | Everyone |
Token ID | 11075 |
Feature activation | -6.39e-04 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
liv | +0.012 |
ugg | +0.012 |
storm | +0.012 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.014 |
triple | -0.013 |
forward | -0.013 |
out | -0.013 |
Token | was |
Token ID | 373 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
groups | +0.001 |
questions | +0.001 |
triple | +0.001 |
invitations | +0.001 |
cabinets | +0.001 |
Neg logit contributions | |
xt | -0.001 |
ller | -0.001 |
liv | -0.001 |
lla | -0.001 |
leanor | -0.001 |
Token | shocked |
Token ID | 11472 |
Feature activation | -5.74e-04 |
Pos logit contributions | |
ller | +0.021 |
xt | +0.020 |
liv | +0.019 |
Karen | +0.019 |
Twe | +0.019 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.013 |
triple | -0.012 |
forward | -0.011 |
cabinets | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
triple | +0.001 |
increasingly | +0.001 |
forward | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
storm | -0.001 |
Twe | -0.001 |
bye | -0.001 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.58e-02 |
Pos logit contributions | |
ller | +0.025 |
xt | +0.024 |
liv | +0.023 |
storm | +0.022 |
leanor | +0.022 |
Neg logit contributions | |
questions | -0.018 |
groups | -0.018 |
triple | -0.017 |
forward | -0.016 |
out | -0.015 |
Token | away |
Token ID | 1497 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
ller | +0.029 |
xt | +0.029 |
Twe | +0.028 |
Karen | +0.028 |
liv | +0.028 |
Neg logit contributions | |
groups | -0.020 |
questions | -0.019 |
triple | -0.018 |
brothers | -0.017 |
ac | -0.016 |
Token | quickly |
Token ID | 2952 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
ller | +0.075 |
xt | +0.072 |
liv | +0.069 |
storm | +0.068 |
Twe | +0.067 |
Neg logit contributions | |
questions | -0.048 |
groups | -0.046 |
triple | -0.045 |
brothers | -0.040 |
forward | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.016 |
storm | +0.016 |
Karen | +0.015 |
seven | +0.015 |
Neg logit contributions | |
triple | -0.015 |
questions | -0.015 |
groups | -0.015 |
ac | -0.013 |
brothers | -0.013 |
Token | But |
Token ID | 887 |
Feature activation | +6.49e-03 |
Pos logit contributions | |
ller | +0.021 |
xt | +0.021 |
storm | +0.020 |
liv | +0.019 |
ugg | +0.019 |
Neg logit contributions | |
questions | -0.014 |
groups | -0.014 |
triple | -0.012 |
out | -0.012 |
forward | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | -2.23e-03 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.010 |
storm | +0.009 |
ugg | +0.009 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.010 |
triple | -0.010 |
forward | -0.009 |
brothers | -0.009 |
Token | vendor |
Token ID | 18371 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
groups | +0.004 |
questions | +0.004 |
triple | +0.004 |
into | +0.003 |
ac | +0.003 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
storm | -0.003 |
bye | -0.003 |
Stella | -0.003 |
Token | too |
Token ID | 1165 |
Feature activation | +4.07e-03 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
liv | +0.002 |
Twe | +0.002 |
ugg | +0.002 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
forward | -0.001 |
brothers | -0.001 |
Token | many |
Token ID | 867 |
Feature activation | +9.30e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.008 |
storm | +0.008 |
ugg | +0.007 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.004 |
forward | -0.004 |
out | -0.004 |
Token | berries |
Token ID | 36322 |
Feature activation | -5.24e-03 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.018 |
liv | +0.017 |
ugg | +0.016 |
storm | +0.016 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
forward | -0.010 |
out | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.007 |
triple | +0.006 |
brothers | +0.005 |
invitations | +0.005 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
storm | -0.009 |
liv | -0.009 |
ugg | -0.009 |
Token | his |
Token ID | 465 |
Feature activation | -1.64e-03 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.017 |
liv | +0.016 |
storm | +0.016 |
Twe | +0.016 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.016 |
forward | -0.015 |
triple | -0.015 |
out | -0.014 |
Token | tum |
Token ID | 11814 |
Feature activation | +3.94e-02 |
Pos logit contributions | |
groups | +0.002 |
questions | +0.002 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
sed | -0.003 |
storm | -0.003 |
ugg | -0.003 |
Token | my |
Token ID | 1820 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
ller | +0.086 |
xt | +0.086 |
leanor | +0.083 |
storm | +0.082 |
sed | +0.080 |
Neg logit contributions | |
questions | -0.035 |
out | -0.032 |
groups | -0.031 |
brothers | -0.030 |
into | -0.030 |
Token | hurt |
Token ID | 5938 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.009 |
forward | +0.008 |
invitations | +0.008 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
storm | -0.009 |
liv | -0.009 |
ugg | -0.009 |
Token | so |
Token ID | 523 |
Feature activation | +7.22e-04 |
Pos logit contributions | |
ller | +0.043 |
xt | +0.042 |
Twe | +0.041 |
liv | +0.039 |
storm | +0.039 |
Neg logit contributions | |
questions | -0.036 |
groups | -0.035 |
triple | -0.033 |
invitations | -0.030 |
ports | -0.028 |
Token | much |
Token ID | 881 |
Feature activation | -5.88e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
ugg | +0.001 |
storm | +0.001 |
Neg logit contributions | |
questions | -0.001 |
groups | -0.001 |
triple | -0.001 |
forward | -0.001 |
out | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +1.97e-03 |
Pos logit contributions | |
groups | +0.009 |
questions | +0.009 |
triple | +0.008 |
ac | +0.008 |
forward | +0.008 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.009 |
storm | -0.009 |
Twe | -0.009 |
liv | -0.009 |
Token | threw |
Token ID | 9617 |
Feature activation | -2.25e-03 |
Pos logit contributions | |
ller | +0.000 |
xt | +0.000 |
Twe | +0.000 |
liv | +0.000 |
sed | +0.000 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
ices | -0.000 |
Token | them |
Token ID | 606 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
triple | +0.004 |
questions | +0.003 |
groups | +0.003 |
ibr | +0.003 |
ices | +0.003 |
Neg logit contributions | |
Twe | -0.003 |
Stella | -0.003 |
xt | -0.003 |
Blue | -0.003 |
Dove | -0.003 |
Token | outside |
Token ID | 2354 |
Feature activation | +4.03e-04 |
Pos logit contributions | |
triple | +0.018 |
questions | +0.015 |
groups | +0.014 |
increasingly | +0.014 |
scientists | +0.014 |
Neg logit contributions | |
xt | -0.020 |
Blue | -0.018 |
Twe | -0.018 |
ugg | -0.018 |
ller | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | -5.15e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.000 |
seven | +0.000 |
storm | +0.000 |
Twe | +0.000 |
Neg logit contributions | |
triple | -0.001 |
questions | -0.001 |
groups | -0.001 |
increasingly | -0.001 |
servants | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.007 |
triple | +0.007 |
forward | +0.007 |
out | +0.007 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.009 |
liv | -0.008 |
storm | -0.008 |
ugg | -0.008 |
Token | slammed |
Token ID | 21376 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.022 |
liv | +0.020 |
ugg | +0.020 |
storm | +0.020 |
Neg logit contributions | |
questions | -0.025 |
groups | -0.024 |
triple | -0.023 |
forward | -0.022 |
out | -0.021 |
Token | the |
Token ID | 262 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
ller | +0.094 |
xt | +0.093 |
liv | +0.090 |
ugg | +0.089 |
mm | +0.088 |
Neg logit contributions | |
groups | -0.034 |
questions | -0.034 |
out | -0.031 |
into | -0.031 |
triple | -0.029 |
Token | door |
Token ID | 3420 |
Feature activation | -1.13e-03 |
Pos logit contributions | |
triple | +0.027 |
questions | +0.025 |
groups | +0.024 |
ices | +0.023 |
increasingly | +0.023 |
Neg logit contributions | |
ller | -0.028 |
sed | -0.026 |
storm | -0.026 |
xt | -0.025 |
hy | -0.025 |
Token | behind |
Token ID | 2157 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
questions | +0.001 |
triple | +0.001 |
groups | +0.001 |
brothers | +0.001 |
increasingly | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
storm | -0.002 |
liv | -0.002 |
hy | -0.002 |
Token | them |
Token ID | 606 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
xt | +0.020 |
ller | +0.019 |
liv | +0.018 |
storm | +0.018 |
Twe | +0.018 |
Neg logit contributions | |
questions | -0.015 |
triple | -0.014 |
groups | -0.013 |
forward | -0.012 |
increasingly | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -6.41e-03 |
Pos logit contributions | |
triple | +0.020 |
questions | +0.020 |
groups | +0.019 |
increasingly | +0.018 |
ac | +0.017 |
Neg logit contributions | |
ller | -0.020 |
xt | -0.019 |
storm | -0.018 |
bow | -0.018 |
hy | -0.017 |
Token | she |
Token ID | 673 |
Feature activation | -3.94e-03 |
Pos logit contributions | |
groups | +0.006 |
questions | +0.005 |
triple | +0.005 |
invitations | +0.005 |
brothers | +0.005 |
Neg logit contributions | |
ller | -0.005 |
xt | -0.005 |
liv | -0.005 |
Twe | -0.005 |
ugg | -0.005 |
Token | also |
Token ID | 635 |
Feature activation | -2.24e-03 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.006 |
triple | +0.006 |
forward | +0.006 |
out | +0.006 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.006 |
leanor | -0.005 |
ugg | -0.005 |
Token | didn |
Token ID | 1422 |
Feature activation | +9.69e-03 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.004 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.003 |
ugg | -0.003 |
leanor | -0.003 |
Token | â |
Token ID | 22940 |
Feature activation | +1.69e-06 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.005 |
storm | +0.004 |
bow | +0.004 |
Neg logit contributions | |
questions | -0.025 |
groups | -0.024 |
triple | -0.024 |
forward | -0.023 |
brothers | -0.022 |
Token | € |
Token ID | 26391 |
Feature activation | +1.22e-02 |
Token | ™ |
Token ID | 8151 |
Feature activation | +3.94e-02 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.017 |
storm | +0.016 |
ugg | +0.016 |
liv | +0.016 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.020 |
triple | -0.019 |
forward | -0.018 |
out | -0.018 |
Token | t |
Token ID | 83 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
ller | +0.030 |
xt | +0.030 |
liv | +0.027 |
ugg | +0.025 |
storm | +0.024 |
Neg logit contributions | |
questions | -0.095 |
groups | -0.093 |
triple | -0.090 |
forward | -0.085 |
out | -0.085 |
Token | want |
Token ID | 765 |
Feature activation | +4.04e-03 |
Pos logit contributions | |
ller | +0.017 |
xt | +0.016 |
storm | +0.015 |
seven | +0.015 |
liv | +0.015 |
Neg logit contributions | |
groups | -0.015 |
questions | -0.014 |
triple | -0.014 |
forward | -0.012 |
brothers | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | -6.07e-05 |
Pos logit contributions | |
xt | +0.008 |
ller | +0.008 |
liv | +0.008 |
ugg | +0.008 |
seven | +0.007 |
Neg logit contributions | |
groups | -0.004 |
questions | -0.004 |
triple | -0.004 |
forward | -0.004 |
brothers | -0.004 |
Token | special |
Token ID | 2041 |
Feature activation | -1.12e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
forward | +0.000 |
out | +0.000 |
Neg logit contributions | |
ller | -0.000 |
xt | -0.000 |
liv | -0.000 |
storm | -0.000 |
leanor | -0.000 |
Token | thing |
Token ID | 1517 |
Feature activation | +1.21e-03 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
storm | -0.002 |
ugg | -0.002 |
Token | playing |
Token ID | 2712 |
Feature activation | +1.54e-03 |
Pos logit contributions | |
groups | +0.001 |
questions | +0.001 |
triple | +0.001 |
forward | +0.001 |
increasingly | +0.001 |
Neg logit contributions | |
xt | -0.001 |
ller | -0.001 |
liv | -0.001 |
storm | -0.001 |
ugg | -0.001 |
Token | with |
Token ID | 351 |
Feature activation | +6.26e-03 |
Pos logit contributions | |
xt | +0.003 |
liv | +0.002 |
ller | +0.002 |
storm | +0.002 |
leanor | +0.002 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
ac | -0.002 |
older | -0.002 |
Token | his |
Token ID | 465 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
xt | +0.013 |
ller | +0.013 |
liv | +0.013 |
Twe | +0.013 |
ugg | +0.012 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
triple | -0.005 |
forward | -0.005 |
out | -0.004 |
Token | tie |
Token ID | 9839 |
Feature activation | +3.82e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.022 |
liv | +0.021 |
ugg | +0.020 |
storm | +0.020 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
forward | -0.009 |
out | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
ller | +0.007 |
xt | +0.006 |
liv | +0.006 |
bow | +0.006 |
storm | +0.006 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.005 |
increasingly | -0.004 |
cabinets | -0.004 |
Token | being |
Token ID | 852 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
ller | +0.018 |
xt | +0.018 |
liv | +0.018 |
ugg | +0.016 |
leanor | +0.016 |
Neg logit contributions | |
questions | -0.017 |
groups | -0.017 |
triple | -0.015 |
forward | -0.015 |
ac | -0.014 |
Token | obedient |
Token ID | 41652 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
xt | +0.025 |
ller | +0.025 |
liv | +0.024 |
seven | +0.023 |
leanor | +0.023 |
Neg logit contributions | |
questions | -0.016 |
groups | -0.015 |
triple | -0.013 |
forward | -0.012 |
cabinets | -0.012 |
Token | that |
Token ID | 326 |
Feature activation | -1.23e-03 |
Pos logit contributions | |
ller | +0.026 |
xt | +0.026 |
liv | +0.024 |
storm | +0.024 |
ugg | +0.024 |
Neg logit contributions | |
questions | -0.018 |
groups | -0.018 |
triple | -0.017 |
increasingly | -0.015 |
forward | -0.015 |
Token | day |
Token ID | 1110 |
Feature activation | +5.36e-03 |
Pos logit contributions | |
groups | +0.002 |
questions | +0.002 |
triple | +0.002 |
invitations | +0.002 |
cabinets | +0.002 |
Neg logit contributions | |
xt | -0.002 |
ller | -0.002 |
liv | -0.002 |
bye | -0.002 |
storm | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -1.76e-03 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.010 |
liv | +0.010 |
storm | +0.010 |
ugg | +0.010 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
triple | -0.006 |
invitations | -0.005 |
increasingly | -0.005 |
Token | He |
Token ID | 679 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.003 |
ugg | -0.003 |
leanor | -0.003 |
Token | all |
Token ID | 477 |
Feature activation | +7.41e-03 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.022 |
Twe | +0.021 |
Karen | +0.020 |
Stella | +0.020 |
Neg logit contributions | |
triple | -0.023 |
groups | -0.022 |
ac | -0.021 |
questions | -0.020 |
aked | -0.019 |
Token | about |
Token ID | 546 |
Feature activation | +4.74e-03 |
Pos logit contributions | |
xt | +0.011 |
ller | +0.011 |
liv | +0.010 |
Karen | +0.010 |
Stella | +0.010 |
Neg logit contributions | |
triple | -0.012 |
groups | -0.011 |
questions | -0.011 |
forward | -0.010 |
ac | -0.010 |
Token | being |
Token ID | 852 |
Feature activation | +4.66e-03 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.009 |
liv | +0.008 |
Twe | +0.008 |
llers | +0.008 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
triple | -0.006 |
forward | -0.005 |
out | -0.005 |
Token | en |
Token ID | 551 |
Feature activation | -8.47e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.007 |
seven | +0.007 |
Twe | +0.007 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
triple | -0.006 |
forward | -0.005 |
cabinets | -0.005 |
Token | vious |
Token ID | 1442 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
questions | +0.013 |
triple | +0.013 |
groups | +0.013 |
cabinets | +0.012 |
out | +0.012 |
Neg logit contributions | |
xt | -0.013 |
ller | -0.012 |
ugg | -0.012 |
bye | -0.012 |
bow | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e-03 |
Pos logit contributions | |
ller | +0.026 |
xt | +0.025 |
storm | +0.024 |
bow | +0.023 |
bye | +0.023 |
Neg logit contributions | |
questions | -0.016 |
triple | -0.015 |
groups | -0.015 |
forward | -0.013 |
increasingly | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -3.03e-03 |
Pos logit contributions | |
questions | +0.001 |
groups | +0.001 |
triple | +0.001 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
storm | -0.002 |
ugg | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | +3.44e-03 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.004 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.005 |
ugg | -0.005 |
storm | -0.005 |
Token | The |
Token ID | 464 |
Feature activation | -6.59e-04 |
Pos logit contributions | |
liv | +0.005 |
xt | +0.005 |
ller | +0.005 |
leanor | +0.005 |
live | +0.005 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
out | -0.006 |
into | -0.005 |
triple | -0.005 |
Token | two |
Token ID | 734 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
groups | +0.001 |
forward | +0.001 |
into | +0.001 |
out | +0.001 |
triple | +0.001 |
Neg logit contributions | |
ller | -0.001 |
bye | -0.001 |
xt | -0.001 |
sed | -0.001 |
storm | -0.001 |
Token | friends |
Token ID | 2460 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
questions | +0.017 |
triple | +0.016 |
cabinets | +0.016 |
increasingly | +0.016 |
forward | +0.015 |
Neg logit contributions | |
xt | -0.034 |
ller | -0.031 |
mm | -0.030 |
bye | -0.030 |
ue | -0.029 |
Token | The |
Token ID | 383 |
Feature activation | +3.59e-03 |
Pos logit contributions | |
ller | +0.015 |
xt | +0.014 |
liv | +0.014 |
ugg | +0.013 |
storm | +0.013 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.011 |
forward | -0.010 |
out | -0.010 |
Token | boy |
Token ID | 2933 |
Feature activation | -9.74e-03 |
Pos logit contributions | |
Twe | +0.005 |
ller | +0.005 |
storm | +0.005 |
Dove | +0.005 |
Raven | +0.005 |
Neg logit contributions | |
and | -0.005 |
packs | -0.005 |
groups | -0.005 |
forward | -0.005 |
into | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | +7.91e-03 |
Pos logit contributions | |
questions | +0.016 |
groups | +0.016 |
forward | +0.015 |
triple | +0.014 |
out | +0.014 |
Neg logit contributions | |
ller | -0.015 |
xt | -0.015 |
liv | -0.013 |
leanor | -0.013 |
ugg | -0.013 |
Token | sad |
Token ID | 6507 |
Feature activation | -3.87e-04 |
Pos logit contributions | |
ller | +0.014 |
xt | +0.014 |
liv | +0.013 |
Twe | +0.013 |
Stella | +0.012 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.010 |
triple | -0.010 |
ices | -0.009 |
cabinets | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
groups | +0.001 |
triple | +0.001 |
questions | +0.001 |
ac | +0.001 |
invitations | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
storm | -0.001 |
ugg | -0.001 |
Twe | -0.001 |
Token | knew |
Token ID | 2993 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
liv | +0.011 |
Twe | +0.011 |
storm | +0.011 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.010 |
forward | -0.010 |
ices | -0.009 |
Token | he |
Token ID | 339 |
Feature activation | +1.97e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
liv | +0.012 |
Twe | +0.012 |
Karen | +0.011 |
Neg logit contributions | |
groups | -0.016 |
questions | -0.015 |
triple | -0.015 |
forward | -0.014 |
ac | -0.013 |
Token | had |
Token ID | 550 |
Feature activation | +4.81e-03 |
Pos logit contributions | |
ller | +0.003 |
xt | +0.003 |
liv | +0.003 |
ugg | +0.003 |
storm | +0.003 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
out | -0.003 |
Token | made |
Token ID | 925 |
Feature activation | -2.84e-03 |
Pos logit contributions | |
xt | +0.008 |
ller | +0.008 |
liv | +0.007 |
ugg | +0.007 |
storm | +0.007 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
triple | -0.007 |
forward | -0.006 |
out | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
groups | +0.004 |
questions | +0.003 |
triple | +0.003 |
forward | +0.003 |
packs | +0.003 |
Neg logit contributions | |
Twe | -0.005 |
ller | -0.005 |
xt | -0.005 |
liv | -0.005 |
Karen | -0.005 |
Token | mistake |
Token ID | 7457 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
ller | +0.025 |
Twe | +0.023 |
str | +0.022 |
storm | +0.021 |
bye | +0.021 |
Neg logit contributions | |
groups | -0.028 |
iece | -0.028 |
ibr | -0.028 |
questions | -0.028 |
aked | -0.027 |
Token | Shark |
Token ID | 28616 |
Feature activation | -4.63e-03 |
Pos logit contributions | |
ller | +0.021 |
xt | +0.020 |
liv | +0.019 |
storm | +0.018 |
ugg | +0.018 |
Neg logit contributions | |
questions | -0.027 |
groups | -0.027 |
triple | -0.026 |
forward | -0.025 |
increasingly | -0.024 |
Token | y |
Token ID | 88 |
Feature activation | -1.02e-04 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.006 |
triple | +0.006 |
forward | +0.006 |
increasingly | +0.006 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.008 |
liv | -0.007 |
ugg | -0.007 |
bow | -0.007 |
Token | !" |
Token ID | 2474 |
Feature activation | +9.63e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
forward | +0.000 |
increasingly | +0.000 |
Neg logit contributions | |
ller | -0.000 |
xt | -0.000 |
bye | -0.000 |
bow | -0.000 |
storm | -0.000 |
Token | |
Token ID | 220 |
Feature activation | +4.89e-03 |
Pos logit contributions | |
ller | +0.015 |
xt | +0.015 |
liv | +0.014 |
bow | +0.014 |
ugg | +0.014 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.015 |
triple | -0.014 |
forward | -0.013 |
out | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -1.99e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.007 |
ugg | +0.007 |
bow | +0.007 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.007 |
triple | -0.007 |
forward | -0.007 |
invitations | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +5.19e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.003 |
ugg | -0.003 |
storm | -0.003 |
Token | Joe |
Token ID | 19585 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
xt | +0.007 |
ller | +0.007 |
liv | +0.007 |
leanor | +0.007 |
seven | +0.007 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
out | -0.009 |
into | -0.008 |
forward | -0.008 |
Token | y |
Token ID | 88 |
Feature activation | -6.08e-03 |
Pos logit contributions | |
questions | +0.019 |
groups | +0.018 |
triple | +0.017 |
forward | +0.016 |
out | +0.016 |
Neg logit contributions | |
ller | -0.022 |
xt | -0.022 |
liv | -0.020 |
ugg | -0.020 |
bow | -0.020 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.009 |
forward | +0.009 |
out | +0.009 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.009 |
liv | -0.009 |
ugg | -0.008 |
storm | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -1.25e-03 |
Pos logit contributions | |
groups | +0.020 |
questions | +0.020 |
triple | +0.019 |
cabinets | +0.017 |
scientists | +0.016 |
Neg logit contributions | |
ller | -0.032 |
xt | -0.030 |
Twe | -0.028 |
bye | -0.028 |
ugg | -0.027 |
Token | asked |
Token ID | 1965 |
Feature activation | +4.94e-03 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
out | +0.002 |
into | +0.002 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
storm | -0.002 |
ugg | -0.002 |
Token | like |
Token ID | 588 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
ller | +0.021 |
xt | +0.021 |
liv | +0.019 |
storm | +0.019 |
seven | +0.019 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.021 |
triple | -0.019 |
forward | -0.019 |
brothers | -0.018 |
Token | for |
Token ID | 329 |
Feature activation | -7.76e-03 |
Pos logit contributions | |
groups | +0.025 |
questions | +0.025 |
triple | +0.024 |
forward | +0.023 |
increasingly | +0.022 |
Neg logit contributions | |
ller | -0.023 |
xt | -0.022 |
seven | -0.020 |
storm | -0.020 |
liv | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
questions | +0.012 |
groups | +0.012 |
triple | +0.011 |
forward | +0.010 |
out | +0.010 |
Neg logit contributions | |
ller | -0.013 |
xt | -0.012 |
liv | -0.012 |
ugg | -0.011 |
storm | -0.011 |
Token | treat |
Token ID | 2190 |
Feature activation | +7.37e-04 |
Pos logit contributions | |
xt | +0.020 |
ller | +0.019 |
storm | +0.019 |
bow | +0.018 |
ugg | +0.018 |
Neg logit contributions | |
groups | -0.019 |
questions | -0.018 |
iece | -0.017 |
brothers | -0.017 |
triple | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | +7.45e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
storm | +0.001 |
seven | +0.001 |
bye | +0.001 |
Neg logit contributions | |
groups | -0.001 |
questions | -0.001 |
triple | -0.001 |
increasingly | -0.001 |
forward | -0.001 |
Token | Ell |
Token ID | 7122 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
ller | +0.012 |
Twe | +0.011 |
xt | +0.011 |
Stella | +0.011 |
Karen | +0.011 |
Neg logit contributions | |
groups | -0.011 |
questions | -0.010 |
triple | -0.010 |
ices | -0.010 |
forward | -0.009 |
Token | a |
Token ID | 64 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.022 |
liv | +0.021 |
ugg | +0.021 |
leanor | +0.020 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.011 |
out | -0.010 |
forward | -0.010 |
Token | ." |
Token ID | 526 |
Feature activation | +1.74e-02 |
Pos logit contributions | |
questions | +0.020 |
groups | +0.019 |
triple | +0.018 |
forward | +0.018 |
out | +0.017 |
Neg logit contributions | |
ller | -0.013 |
xt | -0.012 |
liv | -0.011 |
ugg | -0.011 |
seven | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | +3.27e-04 |
Pos logit contributions | |
ller | +0.031 |
xt | +0.030 |
liv | +0.028 |
storm | +0.028 |
leanor | +0.027 |
Neg logit contributions | |
questions | -0.025 |
groups | -0.024 |
triple | -0.023 |
out | -0.021 |
forward | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | +6.82e-03 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
liv | +0.001 |
storm | +0.001 |
ugg | +0.001 |
Neg logit contributions | |
questions | -0.000 |
groups | -0.000 |
triple | -0.000 |
forward | -0.000 |
out | -0.000 |
Token | E |
Token ID | 36 |
Feature activation | +4.60e-03 |
Pos logit contributions | |
xt | +0.010 |
ller | +0.009 |
liv | +0.009 |
ugg | +0.009 |
leanor | +0.009 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.011 |
out | -0.011 |
forward | -0.011 |
Token | a |
Token ID | 257 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
questions | +0.019 |
groups | +0.019 |
triple | +0.018 |
forward | +0.017 |
increasingly | +0.016 |
Neg logit contributions | |
ller | -0.030 |
xt | -0.029 |
storm | -0.027 |
liv | -0.026 |
seven | -0.026 |
Token | pirate |
Token ID | 25868 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
ller | +0.020 |
storm | +0.018 |
xt | +0.018 |
bye | +0.017 |
bow | +0.017 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.014 |
triple | -0.014 |
forward | -0.013 |
into | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | +5.13e-03 |
Pos logit contributions | |
ller | +0.026 |
xt | +0.024 |
storm | +0.024 |
bye | +0.023 |
Raven | +0.023 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.020 |
triple | -0.019 |
increasingly | -0.018 |
forward | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | +8.97e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.007 |
seven | +0.007 |
Twe | +0.007 |
storm | +0.007 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.008 |
forward | -0.008 |
ices | -0.007 |
Token | treasure |
Token ID | 14068 |
Feature activation | +7.80e-03 |
Pos logit contributions | |
ller | +0.016 |
storm | +0.015 |
xt | +0.014 |
sed | +0.014 |
Raven | +0.014 |
Neg logit contributions | |
questions | -0.012 |
groups | -0.012 |
triple | -0.012 |
ices | -0.011 |
forward | -0.011 |
Token | ." |
Token ID | 526 |
Feature activation | -6.61e-03 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.012 |
storm | +0.012 |
bye | +0.012 |
seven | +0.012 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.011 |
triple | -0.011 |
increasingly | -0.010 |
forward | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.010 |
forward | +0.009 |
out | +0.009 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.010 |
liv | -0.010 |
ugg | -0.010 |
seven | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -9.90e-03 |
Pos logit contributions | |
questions | +0.021 |
groups | +0.020 |
triple | +0.019 |
out | +0.018 |
forward | +0.018 |
Neg logit contributions | |
ller | -0.035 |
xt | -0.034 |
liv | -0.033 |
storm | -0.032 |
ugg | -0.032 |
Token | They |
Token ID | 2990 |
Feature activation | -1.15e-05 |
Pos logit contributions | |
questions | +0.017 |
groups | +0.016 |
triple | +0.015 |
out | +0.015 |
forward | +0.015 |
Neg logit contributions | |
ller | -0.015 |
xt | -0.015 |
liv | -0.014 |
leanor | -0.014 |
seven | -0.014 |
Token | take |
Token ID | 1011 |
Feature activation | -6.27e-03 |
Pos logit contributions | |
questions | +0.000 |
groups | +0.000 |
triple | +0.000 |
and | +0.000 |
brothers | +0.000 |
Neg logit contributions | |
xt | -0.000 |
ller | -0.000 |
bow | -0.000 |
leanor | -0.000 |
storm | -0.000 |
Token | turns |
Token ID | 4962 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
questions | +0.009 |
groups | +0.009 |
triple | +0.009 |
increasingly | +0.008 |
mage | +0.008 |
Neg logit contributions | |
xt | -0.009 |
bye | -0.009 |
ller | -0.009 |
Twe | -0.009 |
Dove | -0.009 |
Token | toys |
Token ID | 14958 |
Feature activation | -3.98e-03 |
Pos logit contributions | |
xt | +0.042 |
ller | +0.040 |
sed | +0.040 |
liv | +0.039 |
ugg | +0.037 |
Neg logit contributions | |
questions | -0.032 |
forward | -0.031 |
triple | -0.031 |
increasingly | -0.030 |
iece | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +6.32e-03 |
Pos logit contributions | |
triple | +0.006 |
questions | +0.006 |
groups | +0.005 |
increasingly | +0.005 |
forward | +0.005 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
bow | -0.006 |
storm | -0.006 |
ugg | -0.005 |
Token | books |
Token ID | 3835 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
Twe | +0.009 |
storm | +0.009 |
Karen | +0.009 |
Neg logit contributions | |
forward | -0.009 |
questions | -0.009 |
groups | -0.009 |
triple | -0.008 |
increasingly | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +4.89e-03 |
Pos logit contributions | |
ller | +0.035 |
xt | +0.034 |
liv | +0.032 |
storm | +0.032 |
ugg | +0.032 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.020 |
triple | -0.020 |
forward | -0.017 |
out | -0.017 |
Token | One |
Token ID | 1881 |
Feature activation | -7.82e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.008 |
liv | +0.008 |
storm | +0.008 |
leanor | +0.007 |
Neg logit contributions | |
questions | -0.008 |
groups | -0.008 |
triple | -0.007 |
out | -0.007 |
forward | -0.007 |
Token | day |
Token ID | 1110 |
Feature activation | -3.03e-03 |
Pos logit contributions | |
groups | +0.012 |
questions | +0.012 |
triple | +0.011 |
forward | +0.011 |
increasingly | +0.011 |
Neg logit contributions | |
xt | -0.012 |
ller | -0.012 |
liv | -0.012 |
bye | -0.011 |
ugg | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | +2.24e-03 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.003 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.006 |
storm | -0.006 |
ugg | -0.005 |
Token | they |
Token ID | 484 |
Feature activation | +8.88e-03 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.004 |
liv | +0.003 |
storm | +0.003 |
ugg | +0.003 |
Neg logit contributions | |
questions | -0.004 |
groups | -0.003 |
triple | -0.003 |
out | -0.003 |
forward | -0.003 |
Token | find |
Token ID | 1064 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
xt | +0.011 |
bye | +0.011 |
Twe | +0.011 |
Stella | +0.010 |
storm | +0.010 |
Neg logit contributions | |
questions | -0.014 |
ices | -0.013 |
and | -0.013 |
triple | -0.013 |
increasingly | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | +5.74e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.010 |
triple | +0.009 |
forward | +0.009 |
increasingly | +0.008 |
Neg logit contributions | |
xt | -0.023 |
ller | -0.023 |
liv | -0.022 |
ugg | -0.022 |
leanor | -0.021 |
Token | huge |
Token ID | 3236 |
Feature activation | -5.59e-03 |
Pos logit contributions | |
ller | +0.011 |
storm | +0.010 |
xt | +0.010 |
liv | +0.010 |
Raven | +0.010 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
iece | -0.006 |
forward | -0.006 |
triple | -0.006 |
Token | train |
Token ID | 4512 |
Feature activation | +7.03e-03 |
Pos logit contributions | |
ller | +0.012 |
xt | +0.011 |
storm | +0.011 |
liv | +0.011 |
bye | +0.011 |
Neg logit contributions | |
questions | -0.009 |
groups | -0.009 |
triple | -0.008 |
forward | -0.008 |
into | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +3.51e-03 |
Pos logit contributions | |
ller | +0.013 |
storm | +0.012 |
xt | +0.012 |
bye | +0.012 |
bow | +0.011 |
Neg logit contributions | |
questions | -0.010 |
groups | -0.009 |
triple | -0.009 |
increasingly | -0.008 |
brothers | -0.008 |
Token | |
Token ID | 220 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
ller | +0.006 |
xt | +0.006 |
liv | +0.006 |
storm | +0.006 |
leanor | +0.006 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.005 |
triple | -0.005 |
out | -0.005 |
forward | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -2.11e-03 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.009 |
liv | +0.009 |
storm | +0.009 |
ugg | +0.009 |
Neg logit contributions | |
questions | -0.006 |
groups | -0.006 |
triple | -0.006 |
forward | -0.005 |
out | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +7.20e-03 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
out | +0.002 |
forward | +0.002 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.004 |
storm | -0.004 |
ugg | -0.004 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | -1.92e-02 |
Pos logit contributions | |
xt | +0.012 |
liv | +0.012 |
ller | +0.012 |
leanor | +0.011 |
storm | +0.011 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.010 |
out | -0.009 |
forward | -0.009 |
triple | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -5.38e-03 |
Pos logit contributions | |
questions | +0.027 |
groups | +0.025 |
triple | +0.024 |
forward | +0.022 |
brothers | +0.021 |
Neg logit contributions | |
ller | -0.034 |
xt | -0.034 |
liv | -0.032 |
storm | -0.031 |
ugg | -0.031 |
Token | the |
Token ID | 262 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.009 |
triple | +0.009 |
forward | +0.008 |
ac | +0.008 |
Neg logit contributions | |
ller | -0.008 |
xt | -0.007 |
liv | -0.007 |
Twe | -0.007 |
storm | -0.007 |
Token | train |
Token ID | 4512 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.009 |
triple | +0.009 |
forward | +0.009 |
into | +0.008 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.009 |
storm | -0.009 |
liv | -0.009 |
leanor | -0.009 |
Token | arrived |
Token ID | 5284 |
Feature activation | -1.92e-02 |
Pos logit contributions | |
ller | +0.023 |
xt | +0.022 |
storm | +0.022 |
liv | +0.021 |
bow | +0.020 |
Neg logit contributions | |
questions | -0.021 |
groups | -0.020 |
triple | -0.019 |
forward | -0.018 |
out | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
questions | +0.025 |
triple | +0.021 |
groups | +0.020 |
ibr | +0.019 |
ac | +0.019 |
Neg logit contributions | |
ller | -0.034 |
xt | -0.033 |
liv | -0.031 |
sed | -0.030 |
llers | -0.030 |
Token | loved |
Token ID | 6151 |
Feature activation | -3.41e-03 |
Pos logit contributions | |
ller | +0.009 |
xt | +0.009 |
seven | +0.008 |
liv | +0.008 |
storm | +0.008 |
Neg logit contributions | |
questions | -0.007 |
triple | -0.007 |
groups | -0.006 |
at | -0.006 |
brothers | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
questions | +0.004 |
groups | +0.003 |
triple | +0.003 |
out | +0.003 |
forward | +0.003 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
liv | -0.007 |
storm | -0.007 |
ugg | -0.007 |
Token | cocoa |
Token ID | 35845 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
ller | +0.038 |
xt | +0.037 |
storm | +0.035 |
seven | +0.034 |
liv | +0.034 |
Neg logit contributions | |
questions | -0.020 |
groups | -0.018 |
triple | -0.017 |
out | -0.017 |
brothers | -0.016 |
Token | very |
Token ID | 845 |
Feature activation | -7.67e-04 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.003 |
liv | +0.003 |
storm | +0.003 |
ugg | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
forward | -0.002 |
out | -0.002 |
Token | much |
Token ID | 881 |
Feature activation | -8.64e-03 |
Pos logit contributions | |
questions | +0.000 |
at | +0.000 |
groups | +0.000 |
very | +0.000 |
out | +0.000 |
Neg logit contributions | |
sed | -0.002 |
ller | -0.002 |
bow | -0.002 |
storm | -0.002 |
seven | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -2.31e-03 |
Pos logit contributions | |
questions | +0.005 |
from | +0.005 |
at | +0.005 |
out | +0.005 |
into | +0.004 |
Neg logit contributions | |
xt | -0.023 |
liv | -0.022 |
ller | -0.022 |
bow | -0.021 |
llers | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
questions | +0.001 |
out | +0.001 |
groups | +0.001 |
at | +0.001 |
from | +0.001 |
Neg logit contributions | |
ller | -0.006 |
storm | -0.006 |
liv | -0.006 |
xt | -0.006 |
uch | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -2.47e-03 |
Pos logit contributions | |
questions | +0.012 |
groups | +0.010 |
out | +0.009 |
at | +0.009 |
forward | +0.008 |
Neg logit contributions | |
ller | -0.029 |
xt | -0.028 |
storm | -0.028 |
liv | -0.027 |
sed | -0.027 |
Token | One |
Token ID | 3198 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
at | +0.002 |
out | +0.002 |
date | +0.002 |
Neg logit contributions | |
ller | -0.006 |
sed | -0.005 |
chief | -0.005 |
ses | -0.005 |
llers | -0.005 |
Token | day |
Token ID | 1110 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
questions | +0.015 |
groups | +0.015 |
triple | +0.014 |
forward | +0.013 |
out | +0.013 |
Neg logit contributions | |
ller | -0.021 |
xt | -0.020 |
liv | -0.019 |
ugg | -0.019 |
storm | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | +4.17e-03 |
Pos logit contributions | |
ller | +0.004 |
liv | +0.004 |
xt | +0.004 |
llers | +0.004 |
seven | +0.004 |
Neg logit contributions | |
out | -0.001 |
at | -0.001 |
questions | -0.001 |
into | -0.001 |
from | -0.001 |
Token | � |
Token ID | 241 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
ugg | +0.034 |
ller | +0.033 |
storm | +0.032 |
xt | +0.032 |
irst | +0.032 |
Neg logit contributions | |
questions | -0.037 |
triple | -0.033 |
forward | -0.032 |
at | -0.032 |
un | -0.032 |
Token | Hello |
Token ID | 15496 |
Feature activation | -2.46e-03 |
Pos logit contributions | |
ller | +0.019 |
xt | +0.018 |
storm | +0.017 |
liv | +0.017 |
ugg | +0.016 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.014 |
triple | -0.014 |
forward | -0.013 |
out | -0.013 |
Token | , |
Token ID | 11 |
Feature activation | -1.84e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.004 |
xt | -0.004 |
liv | -0.004 |
ugg | -0.004 |
storm | -0.004 |
Token | â |
Token ID | 22940 |
Feature activation | +8.58e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.003 |
triple | +0.003 |
forward | +0.003 |
out | +0.003 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.003 |
storm | -0.002 |
ugg | -0.002 |
Token | € |
Token ID | 26391 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
sed | +0.013 |
ller | +0.013 |
llers | +0.012 |
xt | +0.012 |
ses | +0.012 |
Neg logit contributions | |
forward | -0.012 |
� | -0.012 |
questions | -0.012 |
by | -0.012 |
un | -0.012 |
Token | said |
Token ID | 531 |
Feature activation | -4.96e-03 |
Pos logit contributions | |
ller | +0.033 |
xt | +0.033 |
seven | +0.032 |
liv | +0.032 |
ugg | +0.031 |
Neg logit contributions | |
groups | -0.025 |
triple | -0.024 |
questions | -0.024 |
at | -0.023 |
out | -0.023 |
Token | Daisy |
Token ID | 40355 |
Feature activation | -6.03e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
triple | +0.008 |
forward | +0.007 |
out | +0.007 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
liv | -0.007 |
ugg | -0.007 |
storm | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
triple | +0.008 |
forward | +0.007 |
out | +0.007 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.011 |
liv | -0.010 |
ugg | -0.010 |
storm | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -8.58e-03 |
Pos logit contributions | |
questions | +0.017 |
groups | +0.016 |
triple | +0.015 |
forward | +0.014 |
out | +0.014 |
Neg logit contributions | |
ller | -0.019 |
xt | -0.018 |
liv | -0.017 |
storm | -0.017 |
ugg | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +1.33e-03 |
Pos logit contributions | |
questions | +0.010 |
groups | +0.010 |
triple | +0.009 |
forward | +0.009 |
out | +0.008 |
Neg logit contributions | |
ller | -0.017 |
xt | -0.017 |
liv | -0.016 |
storm | -0.016 |
ugg | -0.016 |
Token | The |
Token ID | 464 |
Feature activation | -6.45e-03 |
Pos logit contributions | |
ller | +0.002 |
xt | +0.002 |
liv | +0.002 |
ugg | +0.002 |
storm | +0.002 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
out | -0.002 |
forward | -0.002 |
Token | ble |
Token ID | 903 |
Feature activation | -2.06e-02 |
Pos logit contributions | |
groups | +0.066 |
questions | +0.063 |
triple | +0.059 |
forward | +0.055 |
cabinets | +0.054 |
Neg logit contributions | |
ller | -0.070 |
xt | -0.064 |
seven | -0.062 |
mm | -0.061 |
bow | -0.061 |
Token | ." |
Token ID | 526 |
Feature activation | +6.84e-03 |
Pos logit contributions | |
questions | +0.037 |
groups | +0.037 |
triple | +0.036 |
increasingly | +0.032 |
cabinets | +0.032 |
Neg logit contributions | |
ller | -0.028 |
xt | -0.026 |
storm | -0.024 |
bye | -0.024 |
ugg | -0.024 |
Token | Sam |
Token ID | 3409 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
ller | +0.011 |
xt | +0.011 |
liv | +0.010 |
ugg | +0.010 |
bow | +0.010 |
Neg logit contributions | |
questions | -0.011 |
groups | -0.010 |
triple | -0.010 |
forward | -0.010 |
out | -0.009 |
Token | took |
Token ID | 1718 |
Feature activation | -8.81e-03 |
Pos logit contributions | |
questions | +0.024 |
groups | +0.023 |
triple | +0.022 |
forward | +0.022 |
out | +0.021 |
Neg logit contributions | |
ller | -0.023 |
xt | -0.023 |
liv | -0.021 |
ugg | -0.020 |
bow | -0.020 |
Token | the |
Token ID | 262 |
Feature activation | -5.36e-03 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.012 |
triple | +0.011 |
increasingly | +0.011 |
cabinets | +0.010 |
Neg logit contributions | |
xt | -0.014 |
ller | -0.014 |
Twe | -0.014 |
bye | -0.013 |
liv | -0.013 |
Token | pe |
Token ID | 613 |
Feature activation | -6.11e-02 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.004 |
forward | +0.004 |
out | +0.004 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.012 |
liv | -0.011 |
seven | -0.011 |
ugg | -0.011 |
Token | b |
Token ID | 65 |
Feature activation | -4.66e-02 |
Pos logit contributions | |
groups | +0.106 |
questions | +0.096 |
triple | +0.096 |
scientists | +0.094 |
soldiers | +0.092 |
Neg logit contributions | |
ller | -0.091 |
seven | -0.084 |
xt | -0.080 |
mm | -0.074 |
round | -0.074 |
Token | ble |
Token ID | 903 |
Feature activation | -3.45e-02 |
Pos logit contributions | |
groups | +0.088 |
questions | +0.081 |
triple | +0.077 |
scientists | +0.075 |
cabinets | +0.075 |
Neg logit contributions | |
ller | -0.065 |
seven | -0.058 |
xt | -0.057 |
mm | -0.057 |
bow | -0.056 |
Token | and |
Token ID | 290 |
Feature activation | -3.49e-03 |
Pos logit contributions | |
triple | +0.055 |
groups | +0.055 |
cabinets | +0.055 |
scientists | +0.051 |
ibr | +0.051 |
Neg logit contributions | |
bye | -0.053 |
round | -0.051 |
Twe | -0.049 |
ugg | -0.046 |
ller | -0.045 |
Token | said |
Token ID | 531 |
Feature activation | -4.82e-03 |
Pos logit contributions | |
questions | +0.005 |
groups | +0.005 |
triple | +0.005 |
forward | +0.005 |
out | +0.005 |
Neg logit contributions | |
ller | -0.006 |
xt | -0.006 |
liv | -0.005 |
ugg | -0.005 |
storm | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
questions | +0.006 |
groups | +0.005 |
triple | +0.005 |
forward | +0.005 |
out | +0.005 |
Neg logit contributions | |
ller | -0.010 |
xt | -0.010 |
liv | -0.009 |
storm | -0.009 |
ugg | -0.009 |
Token | was |
Token ID | 373 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
groups | +0.025 |
questions | +0.024 |
triple | +0.023 |
invitations | +0.021 |
forward | +0.021 |
Neg logit contributions | |
ller | -0.030 |
xt | -0.027 |
Twe | -0.027 |
llers | -0.026 |
seven | -0.026 |
Token | able |
Token ID | 1498 |
Feature activation | +4.44e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.021 |
liv | +0.021 |
seven | +0.021 |
Karen | +0.020 |
Neg logit contributions | |
groups | -0.018 |
questions | -0.017 |
triple | -0.016 |
ices | -0.014 |
invitations | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -6.10e-03 |
Pos logit contributions | |
ller | +0.008 |
xt | +0.007 |
Twe | +0.007 |
liv | +0.007 |
Karen | +0.007 |
Neg logit contributions | |
groups | -0.006 |
questions | -0.006 |
triple | -0.006 |
forward | -0.005 |
increasingly | -0.005 |
Token | move |
Token ID | 1445 |
Feature activation | +5.05e-03 |
Pos logit contributions | |
questions | +0.008 |
groups | +0.008 |
triple | +0.008 |
forward | +0.008 |
invitations | +0.007 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.010 |
storm | -0.010 |
bow | -0.009 |
liv | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | -7.92e-03 |
Pos logit contributions | |
Twe | +0.009 |
ller | +0.008 |
Karen | +0.008 |
hy | +0.008 |
xt | +0.008 |
Neg logit contributions | |
triple | -0.007 |
groups | -0.007 |
questions | -0.006 |
invitations | -0.006 |
ibr | -0.006 |
Token | je |
Token ID | 11223 |
Feature activation | -4.58e-02 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.013 |
triple | +0.012 |
forward | +0.012 |
increasingly | +0.012 |
Neg logit contributions | |
ller | -0.012 |
xt | -0.011 |
Twe | -0.011 |
hy | -0.010 |
storm | -0.010 |
Token | ep |
Token ID | 538 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
questions | +0.072 |
groups | +0.068 |
triple | +0.064 |
forward | +0.059 |
out | +0.058 |
Neg logit contributions | |
ller | -0.078 |
xt | -0.074 |
liv | -0.069 |
leanor | -0.066 |
llers | -0.066 |
Token | and |
Token ID | 290 |
Feature activation | +6.41e-04 |
Pos logit contributions | |
groups | +0.014 |
questions | +0.013 |
triple | +0.013 |
cabinets | +0.012 |
invitations | +0.012 |
Neg logit contributions | |
ller | -0.018 |
bye | -0.016 |
xt | -0.016 |
hy | -0.016 |
storm | -0.016 |
Token | help |
Token ID | 1037 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
ller | +0.001 |
xt | +0.001 |
Twe | +0.001 |
bye | +0.001 |
storm | +0.001 |
Neg logit contributions | |
groups | -0.001 |
questions | -0.001 |
triple | -0.001 |
forward | -0.001 |
ac | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +5.36e-03 |
Pos logit contributions | |
ller | +0.030 |
Twe | +0.029 |
Karen | +0.028 |
Kitty | +0.027 |
xt | +0.026 |
Neg logit contributions | |
groups | -0.026 |
questions | -0.025 |
triple | -0.024 |
increasingly | -0.023 |
invitations | -0.023 |
Token | old |
Token ID | 1468 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.009 |
bye | +0.009 |
Twe | +0.009 |
storm | +0.008 |
Neg logit contributions | |
questions | -0.007 |
groups | -0.007 |
forward | -0.006 |
triple | -0.006 |
out | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
ller | +0.038 |
xt | +0.037 |
storm | +0.036 |
ugg | +0.036 |
liv | +0.035 |
Neg logit contributions | |
questions | -0.030 |
groups | -0.027 |
out | -0.025 |
triple | -0.025 |
at | -0.025 |
Token |
|
Token ID | 198 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
ller | +0.013 |
xt | +0.013 |
storm | +0.013 |
ugg | +0.013 |
sed | +0.012 |
Neg logit contributions | |
questions | -0.005 |
groups | -0.004 |
out | -0.004 |
at | -0.004 |
triple | -0.003 |
Token | Mary |
Token ID | 24119 |
Feature activation | -4.04e-03 |
Pos logit contributions | |
ller | +0.022 |
xt | +0.022 |
ugg | +0.020 |
storm | +0.020 |
liv | +0.020 |
Neg logit contributions | |
questions | -0.024 |
groups | -0.023 |
triple | -0.022 |
forward | -0.021 |
out | -0.021 |
Token | put |
Token ID | 1234 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
questions | +0.007 |
groups | +0.007 |
forward | +0.006 |
triple | +0.006 |
out | +0.006 |
Neg logit contributions | |
xt | -0.006 |
ller | -0.006 |
liv | -0.006 |
ugg | -0.005 |
bow | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
groups | +0.013 |
questions | +0.012 |
triple | +0.012 |
forward | +0.009 |
brothers | +0.009 |
Neg logit contributions | |
ller | -0.028 |
xt | -0.027 |
liv | -0.027 |
ugg | -0.027 |
leanor | -0.026 |
Token | squ |
Token ID | 2809 |
Feature activation | -4.01e-02 |
Pos logit contributions | |
questions | +0.016 |
groups | +0.016 |
triple | +0.015 |
forward | +0.015 |
invitations | +0.014 |
Neg logit contributions | |
ller | -0.016 |
xt | -0.016 |
bow | -0.015 |
ugg | -0.015 |
liv | -0.015 |
Token | ishy |
Token ID | 49785 |
Feature activation | -2.06e-02 |
Pos logit contributions | |
groups | +0.073 |
questions | +0.072 |
triple | +0.067 |
scientists | +0.066 |
soldiers | +0.065 |
Neg logit contributions | |
xt | -0.047 |
ugg | -0.047 |
ller | -0.045 |
mm | -0.042 |
liv | -0.041 |
Token | material |
Token ID | 2587 |
Feature activation | -9.51e-03 |
Pos logit contributions | |
groups | +0.031 |
questions | +0.030 |
triple | +0.028 |
forward | +0.027 |
brothers | +0.026 |
Neg logit contributions | |
ller | -0.033 |
xt | -0.031 |
ugg | -0.030 |
bow | -0.030 |
seven | -0.029 |
Token | on |
Token ID | 319 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
triple | +0.013 |
groups | +0.011 |
ibr | +0.010 |
questions | +0.010 |
date | +0.010 |
Neg logit contributions | |
xt | -0.016 |
ller | -0.015 |
chief | -0.015 |
ugg | -0.015 |
Twe | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | -5.80e-03 |
Pos logit contributions | |
ller | +0.005 |
xt | +0.004 |
Twe | +0.004 |
liv | +0.004 |
bow | +0.004 |
Neg logit contributions | |
groups | -0.004 |
questions | -0.004 |
triple | -0.004 |
brothers | -0.003 |
forward | -0.003 |
Token | floor |
Token ID | 4314 |
Feature activation | -4.11e-03 |
Pos logit contributions | |
groups | +0.009 |
questions | +0.009 |
triple | +0.009 |
forward | +0.008 |
packs | +0.008 |
Neg logit contributions | |
ller | -0.009 |
xt | -0.008 |
bow | -0.008 |
ugg | -0.007 |
seven | -0.007 |
Token | The |
Token ID | 464 |
Feature activation | -7.80e-04 |
Pos logit contributions | |
questions | +0.009 |
groups | +0.009 |
out | +0.009 |
invitations | +0.008 |
into | +0.008 |
Neg logit contributions | |
ller | -0.007 |
xt | -0.007 |
leanor | -0.007 |
liv | -0.007 |
seven | -0.007 |
Token | little |
Token ID | 1310 |
Feature activation | -1.45e-03 |
Pos logit contributions | |
groups | +0.001 |
questions | +0.001 |
forward | +0.001 |
triple | +0.001 |
into | +0.001 |
Neg logit contributions | |
ller | -0.001 |
xt | -0.001 |
Twe | -0.001 |
storm | -0.001 |
ugg | -0.001 |
Token | boy |
Token ID | 2933 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.001 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
storm | -0.003 |
ugg | -0.003 |
liv | -0.003 |
Token | squeezed |
Token ID | 29650 |
Feature activation | -4.53e-03 |
Pos logit contributions | |
questions | +0.030 |
groups | +0.029 |
forward | +0.027 |
triple | +0.026 |
invitations | +0.024 |
Neg logit contributions | |
ller | -0.026 |
xt | -0.026 |
ugg | -0.023 |
bye | -0.022 |
lla | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
groups | +0.008 |
triple | +0.008 |
questions | +0.007 |
arre | +0.007 |
plan | +0.007 |
Neg logit contributions | |
Twe | -0.006 |
Blue | -0.005 |
ller | -0.005 |
Red | -0.005 |
Raven | -0.005 |
Token | ash |
Token ID | 12530 |
Feature activation | -4.04e-02 |
Pos logit contributions | |
questions | +0.013 |
groups | +0.012 |
triple | +0.011 |
forward | +0.011 |
out | +0.010 |
Neg logit contributions | |
ller | -0.019 |
xt | -0.019 |
liv | -0.018 |
ugg | -0.018 |
storm | -0.018 |
Token | tr |
Token ID | 2213 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
groups | +0.094 |
questions | +0.092 |
triple | +0.089 |
brothers | +0.082 |
increasingly | +0.082 |
Neg logit contributions | |
ller | -0.041 |
storm | -0.035 |
bow | -0.033 |
xt | -0.032 |
ugg | -0.032 |
Token | ay |
Token ID | 323 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
questions | +0.051 |
groups | +0.049 |
triple | +0.047 |
forward | +0.046 |
out | +0.045 |
Neg logit contributions | |
ller | -0.064 |
xt | -0.063 |
liv | -0.059 |
storm | -0.058 |
ugg | -0.057 |
Token | close |
Token ID | 1969 |
Feature activation | +1.80e-03 |
Pos logit contributions | |
questions | +0.017 |
groups | +0.016 |
triple | +0.015 |
forward | +0.013 |
out | +0.013 |
Neg logit contributions | |
ller | -0.035 |
xt | -0.035 |
liv | -0.033 |
ugg | -0.033 |
storm | -0.032 |
Token | and |
Token ID | 290 |
Feature activation | -6.86e-03 |
Pos logit contributions | |
ller | +0.004 |
xt | +0.004 |
bye | +0.003 |
ugg | +0.003 |
liv | +0.003 |
Neg logit contributions | |
questions | -0.002 |
groups | -0.002 |
triple | -0.002 |
brothers | -0.002 |
increasingly | -0.001 |
Token | gave |
Token ID | 2921 |
Feature activation | -7.11e-03 |
Pos logit contributions | |
questions | +0.011 |
groups | +0.011 |
triple | +0.011 |
forward | +0.010 |
brothers | +0.009 |
Neg logit contributions | |
ller | -0.011 |
xt | -0.010 |
liv | -0.010 |
storm | -0.009 |
ugg | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | +4.40e-03 |
Pos logit contributions | |
triple | +0.044 |
groups | +0.042 |
ibr | +0.038 |
ices | +0.037 |
scientists | +0.037 |
Neg logit contributions | |
ller | -0.042 |
xt | -0.042 |
seven | -0.041 |
bye | -0.039 |
Twe | -0.037 |
Token | a |
Token ID | 257 |
Feature activation | -6.33e-03 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.010 |
liv | +0.009 |
ugg | +0.009 |
storm | +0.009 |
Neg logit contributions | |
questions | -0.004 |
groups | -0.004 |
triple | -0.004 |
out | -0.003 |
forward | -0.003 |
Token | lady |
Token ID | 10846 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
questions | +0.010 |
forward | +0.009 |
groups | +0.009 |
triple | +0.009 |
ibr | +0.009 |
Neg logit contributions | |
ller | -0.009 |
bow | -0.009 |
storm | -0.008 |
sed | -0.008 |
drop | -0.008 |
Token | who |
Token ID | 508 |
Feature activation | -1.08e-03 |
Pos logit contributions | |
triple | +0.019 |
groups | +0.019 |
questions | +0.019 |
increasingly | +0.018 |
scientists | +0.018 |
Neg logit contributions | |
ller | -0.018 |
xt | -0.018 |
hy | -0.016 |
seven | -0.016 |
Raven | -0.015 |
Token | is |
Token ID | 318 |
Feature activation | +5.32e-06 |
Pos logit contributions | |
questions | +0.002 |
groups | +0.002 |
triple | +0.002 |
forward | +0.001 |
out | +0.001 |
Neg logit contributions | |
ller | -0.002 |
xt | -0.002 |
liv | -0.002 |
ugg | -0.002 |
storm | -0.002 |
Token | sitting |
Token ID | 5586 |
Feature activation | -4.08e-02 |
Token | on |
Token ID | 319 |
Feature activation | +3.25e-03 |
Pos logit contributions | |
triple | +0.035 |
groups | +0.034 |
questions | +0.033 |
plan | +0.026 |
invitations | +0.025 |
Neg logit contributions | |
ller | -0.089 |
xt | -0.086 |
ugg | -0.085 |
seven | -0.084 |
liv | -0.083 |
Token | a |
Token ID | 257 |
Feature activation | +7.62e-03 |
Pos logit contributions | |
ller | +0.007 |
xt | +0.007 |
liv | +0.007 |
storm | +0.006 |
bow | +0.006 |
Neg logit contributions | |
questions | -0.003 |
groups | -0.003 |
triple | -0.003 |
forward | -0.003 |
out | -0.002 |
Token | bench |
Token ID | 7624 |
Feature activation | +2.14e-02 |
Pos logit contributions | |
ller | +0.010 |
xt | +0.009 |
liv | +0.009 |
storm | +0.009 |
ugg | +0.008 |
Neg logit contributions | |
questions | -0.015 |
groups | -0.014 |
triple | -0.014 |
forward | -0.013 |
brothers | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
ller | +0.042 |
xt | +0.041 |
liv | +0.038 |
storm | +0.038 |
ugg | +0.038 |
Neg logit contributions | |
questions | -0.026 |
groups | -0.025 |
triple | -0.024 |
forward | -0.022 |
out | -0.021 |
Token | She |
Token ID | 1375 |
Feature activation | +5.64e-03 |
Pos logit contributions | |
questions | +0.003 |
groups | +0.002 |
triple | +0.002 |
forward | +0.002 |
out | +0.002 |
Neg logit contributions | |
ller | -0.003 |
xt | -0.003 |
liv | -0.003 |
storm | -0.003 |
ugg | -0.003 |