Token | yellow |
Token ID | 7872 |
Feature activation | +4.24e-02 |
Pos logit contributions | |
ever | +0.030 |
tow | +0.030 |
aroo | +0.028 |
Sue | +0.028 |
Bill | +0.027 |
Neg logit contributions | |
arre | -0.046 |
homework | -0.044 |
laptop | -0.042 |
chores | -0.041 |
tant | -0.039 |
Token | flower |
Token ID | 15061 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
tow | +0.050 |
free | +0.047 |
ever | +0.044 |
Sue | +0.042 |
Zip | +0.042 |
Neg logit contributions | |
arre | -0.077 |
homework | -0.074 |
laptop | -0.074 |
chores | -0.070 |
apr | -0.070 |
Token | with |
Token ID | 351 |
Feature activation | +3.54e-02 |
Pos logit contributions | |
tow | +0.038 |
Sue | +0.032 |
Zip | +0.032 |
free | +0.031 |
Bill | +0.030 |
Neg logit contributions | |
arre | -0.050 |
homework | -0.048 |
laptop | -0.047 |
chores | -0.044 |
apr | -0.041 |
Token | a |
Token ID | 257 |
Feature activation | +3.70e-02 |
Pos logit contributions | |
tow | +0.058 |
aroo | +0.057 |
oe | +0.055 |
oot | +0.054 |
tted | +0.053 |
Neg logit contributions | |
apr | -0.042 |
chores | -0.041 |
dishes | -0.038 |
sheets | -0.038 |
arre | -0.037 |
Token | red |
Token ID | 2266 |
Feature activation | +4.06e-02 |
Pos logit contributions | |
tow | +0.046 |
ever | +0.045 |
Sue | +0.044 |
Bill | +0.042 |
aroo | +0.041 |
Neg logit contributions | |
arre | -0.068 |
homework | -0.060 |
laptop | -0.060 |
tant | -0.059 |
chores | -0.057 |
Token | center |
Token ID | 3641 |
Feature activation | +6.96e-02 |
Pos logit contributions | |
tow | +0.053 |
ever | +0.047 |
free | +0.047 |
Sue | +0.047 |
Zip | +0.044 |
Neg logit contributions | |
arre | -0.071 |
apr | -0.063 |
homework | -0.062 |
tant | -0.062 |
laptop | -0.062 |
Token | . |
Token ID | 13 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
tow | +0.108 |
Zip | +0.106 |
Dove | +0.102 |
aroo | +0.100 |
Tweet | +0.100 |
Neg logit contributions | |
arre | -0.103 |
laptop | -0.093 |
homework | -0.088 |
chores | -0.084 |
sheets | -0.083 |
Token | She |
Token ID | 1375 |
Feature activation | +9.69e-03 |
Pos logit contributions | |
ever | +0.012 |
swoop | +0.010 |
tow | +0.010 |
free | +0.010 |
aroo | +0.010 |
Neg logit contributions | |
arre | -0.016 |
homework | -0.013 |
laptop | -0.012 |
idents | -0.012 |
chores | -0.012 |
Token | wanted |
Token ID | 2227 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
tow | +0.014 |
aroo | +0.013 |
ever | +0.013 |
Dove | +0.012 |
free | +0.012 |
Neg logit contributions | |
arre | -0.018 |
apr | -0.015 |
homework | -0.015 |
laptop | -0.014 |
laptops | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
tow | +0.029 |
aroo | +0.029 |
Zip | +0.027 |
swoop | +0.027 |
tted | +0.027 |
Neg logit contributions | |
homework | -0.024 |
chores | -0.023 |
arre | -0.021 |
apr | -0.021 |
jobs | -0.021 |
Token | pick |
Token ID | 2298 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
aroo | +0.036 |
tow | +0.036 |
igi | +0.034 |
ull | +0.033 |
oe | +0.033 |
Neg logit contributions | |
homework | -0.036 |
chores | -0.035 |
arre | -0.033 |
argue | -0.032 |
apr | -0.032 |
Token | flower |
Token ID | 15061 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.007 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.007 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.010 |
laptop | -0.010 |
chores | -0.010 |
jobs | -0.009 |
Token | with |
Token ID | 351 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
tow | +0.024 |
Sue | +0.021 |
free | +0.021 |
Zip | +0.021 |
Bill | +0.020 |
Neg logit contributions | |
arre | -0.031 |
laptop | -0.029 |
homework | -0.029 |
chores | -0.027 |
dining | -0.026 |
Token | a |
Token ID | 257 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
tow | +0.046 |
aroo | +0.045 |
oe | +0.044 |
Zip | +0.041 |
oot | +0.041 |
Neg logit contributions | |
arre | -0.039 |
apr | -0.037 |
chores | -0.037 |
sheets | -0.037 |
computers | -0.036 |
Token | bright |
Token ID | 6016 |
Feature activation | +3.72e-02 |
Pos logit contributions | |
tow | +0.027 |
ever | +0.025 |
Sue | +0.025 |
aroo | +0.025 |
Zip | +0.024 |
Neg logit contributions | |
arre | -0.043 |
homework | -0.037 |
laptop | -0.037 |
chores | -0.036 |
tant | -0.034 |
Token | yellow |
Token ID | 7872 |
Feature activation | +3.99e-02 |
Pos logit contributions | |
ever | +0.049 |
Zip | +0.048 |
tow | +0.047 |
aroo | +0.046 |
Sue | +0.043 |
Neg logit contributions | |
arre | -0.065 |
tant | -0.053 |
sheets | -0.053 |
mess | -0.052 |
laptop | -0.051 |
Token | center |
Token ID | 3641 |
Feature activation | +6.39e-02 |
Pos logit contributions | |
tow | +0.051 |
free | +0.046 |
Zip | +0.045 |
Sue | +0.045 |
ever | +0.045 |
Neg logit contributions | |
arre | -0.073 |
laptop | -0.063 |
homework | -0.061 |
chores | -0.061 |
dishes | -0.060 |
Token | . |
Token ID | 13 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
tow | +0.099 |
Zip | +0.097 |
Dove | +0.094 |
aroo | +0.092 |
Claw | +0.092 |
Neg logit contributions | |
arre | -0.094 |
laptop | -0.084 |
sheets | -0.078 |
homework | -0.076 |
beds | -0.074 |
Token | She |
Token ID | 1375 |
Feature activation | +9.73e-03 |
Pos logit contributions | |
ever | +0.003 |
tow | +0.002 |
aroo | +0.002 |
swoop | +0.002 |
free | +0.002 |
Neg logit contributions | |
arre | -0.003 |
apr | -0.003 |
homework | -0.003 |
laptop | -0.002 |
idents | -0.002 |
Token | picked |
Token ID | 6497 |
Feature activation | +4.44e-03 |
Pos logit contributions | |
tow | +0.015 |
Sue | +0.013 |
aroo | +0.013 |
Dove | +0.013 |
ever | +0.013 |
Neg logit contributions | |
arre | -0.018 |
homework | -0.014 |
apr | -0.014 |
laptop | -0.014 |
laptops | -0.014 |
Token | it |
Token ID | 340 |
Feature activation | +1.90e-04 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
Twe | +0.005 |
aroo | +0.005 |
hy | +0.005 |
Neg logit contributions | |
arre | -0.008 |
means | -0.007 |
chores | -0.007 |
homework | -0.007 |
apr | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +8.14e-03 |
Pos logit contributions | |
tow | +0.000 |
ever | +0.000 |
Sue | +0.000 |
aroo | +0.000 |
free | +0.000 |
Neg logit contributions | |
arre | -0.000 |
homework | -0.000 |
chores | -0.000 |
laptop | -0.000 |
apr | -0.000 |
Token | black |
Token ID | 2042 |
Feature activation | +7.66e-03 |
Pos logit contributions | |
tow | +0.010 |
ever | +0.010 |
free | +0.009 |
Sue | +0.008 |
aroo | +0.008 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.017 |
chores | -0.017 |
laptop | -0.017 |
apr | -0.016 |
Token | dog |
Token ID | 3290 |
Feature activation | +5.89e-03 |
Pos logit contributions | |
free | +0.010 |
ever | +0.010 |
tow | +0.010 |
Sue | +0.008 |
itself | +0.008 |
Neg logit contributions | |
arre | -0.015 |
laptop | -0.013 |
homework | -0.013 |
chores | -0.012 |
apr | -0.012 |
Token | with |
Token ID | 351 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
free | +0.005 |
Sue | +0.005 |
Sally | +0.005 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.012 |
laptop | -0.011 |
chores | -0.011 |
ambul | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
tow | +0.034 |
oe | +0.033 |
aroo | +0.032 |
ever | +0.031 |
orse | +0.029 |
Neg logit contributions | |
arre | -0.048 |
chores | -0.042 |
apr | -0.041 |
homework | -0.041 |
ambul | -0.040 |
Token | w |
Token ID | 266 |
Feature activation | -2.44e-03 |
Pos logit contributions | |
ever | +0.029 |
tow | +0.028 |
Sue | +0.025 |
free | +0.024 |
aroo | +0.024 |
Neg logit contributions | |
arre | -0.056 |
homework | -0.050 |
laptop | -0.048 |
chores | -0.047 |
apr | -0.045 |
Token | ag |
Token ID | 363 |
Feature activation | +6.35e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.004 |
chores | +0.004 |
affles | +0.003 |
laptop | +0.003 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
Sue | -0.004 |
free | -0.004 |
Sally | -0.004 |
Token | gy |
Token ID | 1360 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
tow | +0.075 |
ever | +0.071 |
I | +0.065 |
free | +0.062 |
Dove | +0.061 |
Neg logit contributions | |
arre | -0.125 |
tant | -0.101 |
laptop | -0.097 |
organ | -0.096 |
homework | -0.095 |
Token | tail |
Token ID | 7894 |
Feature activation | +3.42e-02 |
Pos logit contributions | |
tow | +0.017 |
ever | +0.016 |
free | +0.014 |
Sue | +0.014 |
aroo | +0.013 |
Neg logit contributions | |
arre | -0.029 |
homework | -0.025 |
laptop | -0.025 |
chores | -0.024 |
apr | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +4.25e-03 |
Pos logit contributions | |
tow | +0.044 |
Sue | +0.041 |
ever | +0.040 |
Sally | +0.039 |
aroo | +0.038 |
Neg logit contributions | |
arre | -0.070 |
laptop | -0.056 |
homework | -0.054 |
chores | -0.053 |
obe | -0.050 |
Token | The |
Token ID | 383 |
Feature activation | +1.97e-02 |
Pos logit contributions | |
ever | +0.004 |
tow | +0.004 |
free | +0.003 |
aroo | +0.003 |
Sue | +0.003 |
Neg logit contributions | |
arre | -0.010 |
homework | -0.009 |
laptop | -0.009 |
chores | -0.009 |
apr | -0.009 |
Token | dog |
Token ID | 3290 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
ever | +0.023 |
tow | +0.023 |
free | +0.021 |
Sue | +0.021 |
aroo | +0.020 |
Neg logit contributions | |
arre | -0.043 |
homework | -0.038 |
chores | -0.037 |
laptop | -0.036 |
apr | -0.035 |
Token | yellow |
Token ID | 7872 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
tow | +0.029 |
aroo | +0.025 |
ever | +0.025 |
oot | +0.023 |
Bill | +0.022 |
Neg logit contributions | |
homework | -0.036 |
arre | -0.036 |
chores | -0.035 |
laptop | -0.033 |
apr | -0.033 |
Token | , |
Token ID | 11 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
tow | +0.037 |
free | +0.033 |
aroo | +0.032 |
ever | +0.031 |
swoop | +0.030 |
Neg logit contributions | |
arre | -0.037 |
homework | -0.034 |
laptop | -0.033 |
chores | -0.032 |
jobs | -0.031 |
Token | with |
Token ID | 351 |
Feature activation | +2.72e-02 |
Pos logit contributions | |
tow | +0.010 |
aroo | +0.009 |
ever | +0.008 |
free | +0.008 |
Zip | +0.007 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.012 |
laptop | -0.011 |
chores | -0.011 |
apr | -0.011 |
Token | a |
Token ID | 257 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
aroo | +0.044 |
oe | +0.044 |
tow | +0.043 |
tted | +0.040 |
oot | +0.039 |
Neg logit contributions | |
chores | -0.036 |
apr | -0.036 |
sheets | -0.034 |
computers | -0.034 |
arre | -0.034 |
Token | brown |
Token ID | 7586 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
ever | +0.031 |
tow | +0.030 |
aroo | +0.029 |
Sue | +0.028 |
Sally | +0.027 |
Neg logit contributions | |
arre | -0.048 |
laptop | -0.042 |
homework | -0.041 |
tant | -0.040 |
chores | -0.040 |
Token | center |
Token ID | 3641 |
Feature activation | +6.23e-02 |
Pos logit contributions | |
tow | +0.032 |
ever | +0.028 |
free | +0.027 |
Zip | +0.026 |
tted | +0.025 |
Neg logit contributions | |
arre | -0.039 |
laptop | -0.038 |
homework | -0.036 |
apr | -0.036 |
idents | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
tow | +0.104 |
Zip | +0.103 |
Twe | +0.103 |
aroo | +0.102 |
Fin | +0.102 |
Neg logit contributions | |
arre | -0.077 |
laptop | -0.072 |
beds | -0.066 |
homework | -0.065 |
sheets | -0.064 |
Token | It |
Token ID | 632 |
Feature activation | +9.91e-03 |
Pos logit contributions | |
ever | +0.009 |
tow | +0.009 |
free | +0.008 |
aroo | +0.007 |
swoop | +0.007 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.024 |
chores | -0.023 |
apr | -0.023 |
laptop | -0.023 |
Token | has |
Token ID | 468 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
tow | +0.018 |
ever | +0.017 |
free | +0.016 |
aroo | +0.016 |
Sue | +0.016 |
Neg logit contributions | |
arre | -0.014 |
homework | -0.013 |
chores | -0.012 |
laptop | -0.011 |
means | -0.011 |
Token | many |
Token ID | 867 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
aroo | +0.038 |
tow | +0.037 |
oe | +0.034 |
ever | +0.031 |
oot | +0.031 |
Neg logit contributions | |
arre | -0.037 |
chores | -0.035 |
apr | -0.035 |
laptops | -0.035 |
homework | -0.034 |
Token | pet |
Token ID | 4273 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
tow | +0.031 |
aroo | +0.029 |
ever | +0.029 |
Zip | +0.027 |
Sue | +0.027 |
Neg logit contributions | |
arre | -0.026 |
chores | -0.024 |
tasks | -0.023 |
homework | -0.023 |
apr | -0.023 |
Token | It |
Token ID | 632 |
Feature activation | +2.22e-02 |
Pos logit contributions | |
arre | +0.026 |
homework | +0.022 |
laptop | +0.021 |
chores | +0.021 |
apr | +0.021 |
Neg logit contributions | |
ever | -0.017 |
tow | -0.015 |
aroo | -0.015 |
free | -0.014 |
swoop | -0.014 |
Token | had |
Token ID | 550 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
tow | +0.035 |
ever | +0.032 |
aroo | +0.030 |
Sue | +0.030 |
free | +0.030 |
Neg logit contributions | |
arre | -0.040 |
homework | -0.032 |
chores | -0.031 |
apr | -0.031 |
laptop | -0.030 |
Token | a |
Token ID | 257 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
aroo | +0.035 |
tow | +0.032 |
oe | +0.027 |
orse | +0.026 |
Zip | +0.026 |
Neg logit contributions | |
arre | -0.039 |
apr | -0.033 |
homework | -0.033 |
laptops | -0.033 |
chores | -0.033 |
Token | bright |
Token ID | 6016 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
ever | +0.029 |
tow | +0.028 |
Sue | +0.027 |
aroo | +0.027 |
free | +0.024 |
Neg logit contributions | |
arre | -0.043 |
homework | -0.038 |
chores | -0.037 |
laptop | -0.036 |
apr | -0.035 |
Token | pink |
Token ID | 11398 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
ever | +0.055 |
tow | +0.050 |
aroo | +0.050 |
Zip | +0.048 |
free | +0.047 |
Neg logit contributions | |
arre | -0.078 |
apr | -0.065 |
homework | -0.064 |
chores | -0.063 |
laundry | -0.062 |
Token | center |
Token ID | 3641 |
Feature activation | +6.15e-02 |
Pos logit contributions | |
tow | +0.065 |
ever | +0.060 |
Sue | +0.059 |
free | +0.058 |
Jerry | +0.058 |
Neg logit contributions | |
arre | -0.072 |
apr | -0.064 |
laptop | -0.064 |
homework | -0.064 |
laundry | -0.063 |
Token | and |
Token ID | 290 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
tow | +0.104 |
Zip | +0.100 |
aroo | +0.100 |
Dove | +0.098 |
Tweet | +0.097 |
Neg logit contributions | |
arre | -0.084 |
laptop | -0.073 |
homework | -0.069 |
sheets | -0.064 |
chores | -0.064 |
Token | its |
Token ID | 663 |
Feature activation | +3.37e-02 |
Pos logit contributions | |
tow | +0.039 |
aroo | +0.036 |
ever | +0.034 |
ir | +0.031 |
ull | +0.030 |
Neg logit contributions | |
arre | -0.050 |
homework | -0.049 |
apr | -0.047 |
chores | -0.045 |
matt | -0.045 |
Token | pet |
Token ID | 4273 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
tow | +0.046 |
ever | +0.041 |
aroo | +0.041 |
Zip | +0.039 |
ull | +0.038 |
Neg logit contributions | |
chores | -0.057 |
homework | -0.056 |
arre | -0.055 |
tasks | -0.053 |
laptop | -0.052 |
Token | als |
Token ID | 874 |
Feature activation | +3.28e-02 |
Pos logit contributions | |
tow | +0.050 |
free | +0.044 |
ull | +0.043 |
ever | +0.041 |
orse | +0.041 |
Neg logit contributions | |
arre | -0.030 |
means | -0.029 |
cuts | -0.028 |
chores | -0.026 |
laundry | -0.025 |
Token | were |
Token ID | 547 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
tow | +0.045 |
aroo | +0.040 |
Zip | +0.040 |
Sue | +0.039 |
Twe | +0.038 |
Neg logit contributions | |
arre | -0.058 |
chores | -0.050 |
homework | -0.048 |
laptop | -0.045 |
sheets | -0.045 |
Token | pet |
Token ID | 4273 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
tow | +0.050 |
aroo | +0.046 |
Sue | +0.043 |
Zip | +0.043 |
Dove | +0.042 |
Neg logit contributions | |
arre | -0.056 |
apr | -0.050 |
tasks | -0.048 |
chores | -0.047 |
jobs | -0.047 |
Token | als |
Token ID | 874 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
tow | +0.061 |
orse | +0.051 |
emo | +0.050 |
free | +0.049 |
Twe | +0.049 |
Neg logit contributions | |
arre | -0.036 |
means | -0.028 |
rises | -0.028 |
nurses | -0.027 |
ambul | -0.027 |
Token | and |
Token ID | 290 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
tow | +0.036 |
Sue | +0.033 |
aroo | +0.031 |
Zip | +0.031 |
Twe | +0.030 |
Neg logit contributions | |
arre | -0.046 |
chores | -0.037 |
homework | -0.035 |
sheets | -0.034 |
rises | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
tow | +0.029 |
aroo | +0.026 |
oe | +0.025 |
Zip | +0.024 |
Twe | +0.024 |
Neg logit contributions | |
arre | -0.034 |
apr | -0.032 |
homework | -0.032 |
computers | -0.032 |
sheets | -0.032 |
Token | large |
Token ID | 1588 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
ever | +0.032 |
aroo | +0.032 |
tow | +0.031 |
Sue | +0.031 |
Zip | +0.030 |
Neg logit contributions | |
arre | -0.048 |
homework | -0.041 |
chores | -0.041 |
laptop | -0.041 |
dining | -0.040 |
Token | centre |
Token ID | 7372 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
Zip | +0.038 |
tow | +0.038 |
aroo | +0.036 |
ever | +0.035 |
Twe | +0.034 |
Neg logit contributions | |
arre | -0.054 |
laptop | -0.047 |
homework | -0.047 |
chores | -0.046 |
dining | -0.045 |
Token | . |
Token ID | 13 |
Feature activation | -8.69e-04 |
Pos logit contributions | |
Dove | +0.080 |
tow | +0.079 |
Zip | +0.078 |
Tweet | +0.073 |
Twe | +0.073 |
Neg logit contributions | |
arre | -0.099 |
homework | -0.090 |
laptop | -0.088 |
jobs | -0.086 |
means | -0.086 |
Token | All |
Token ID | 1439 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
arre | +0.002 |
apr | +0.001 |
chores | +0.001 |
homework | +0.001 |
laptop | +0.001 |
Neg logit contributions | |
ever | -0.001 |
tow | -0.001 |
swoop | -0.001 |
aroo | -0.001 |
free | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
tow | +0.013 |
ever | +0.011 |
Dove | +0.011 |
free | +0.011 |
Sue | +0.010 |
Neg logit contributions | |
arre | -0.028 |
homework | -0.025 |
chores | -0.024 |
apr | -0.023 |
jobs | -0.023 |
Token | other |
Token ID | 584 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
tow | +0.026 |
aroo | +0.024 |
ever | +0.023 |
oot | +0.022 |
Dove | +0.021 |
Neg logit contributions | |
arre | -0.028 |
chores | -0.025 |
tasks | -0.024 |
jobs | -0.024 |
apr | -0.023 |
Token | children |
Token ID | 1751 |
Feature activation | +5.91e-03 |
Pos logit contributions | |
tow | +0.023 |
aroo | +0.021 |
Dove | +0.020 |
hy | +0.019 |
Zip | +0.019 |
Neg logit contributions | |
arre | -0.024 |
jobs | -0.020 |
tasks | -0.020 |
chores | -0.019 |
apr | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
tow | +0.037 |
Zip | +0.034 |
aroo | +0.033 |
Sue | +0.033 |
ever | +0.032 |
Neg logit contributions | |
arre | -0.039 |
chores | -0.030 |
homework | -0.028 |
laptop | -0.028 |
sheets | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
tow | +0.022 |
aroo | +0.021 |
oe | +0.021 |
ever | +0.020 |
ary | +0.018 |
Neg logit contributions | |
arre | -0.029 |
homework | -0.027 |
chores | -0.027 |
apr | -0.026 |
computers | -0.026 |
Token | soft |
Token ID | 2705 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
ever | +0.019 |
tow | +0.018 |
Sue | +0.018 |
aroo | +0.017 |
Zip | +0.016 |
Neg logit contributions | |
arre | -0.032 |
homework | -0.027 |
laptop | -0.027 |
chores | -0.026 |
tant | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | +9.86e-03 |
Pos logit contributions | |
ever | +0.032 |
tow | +0.032 |
Zip | +0.029 |
aroo | +0.027 |
Sue | +0.027 |
Neg logit contributions | |
arre | -0.038 |
laptop | -0.033 |
apr | -0.032 |
homework | -0.031 |
idents | -0.031 |
Token | brown |
Token ID | 7586 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
tow | +0.014 |
aroo | +0.012 |
ever | +0.012 |
oe | +0.011 |
Sue | +0.011 |
Neg logit contributions | |
arre | -0.018 |
homework | -0.016 |
chores | -0.016 |
apr | -0.016 |
laptop | -0.016 |
Token | centre |
Token ID | 7372 |
Feature activation | +6.06e-02 |
Pos logit contributions | |
tow | +0.024 |
ever | +0.022 |
Zip | +0.022 |
Sue | +0.021 |
free | +0.021 |
Neg logit contributions | |
arre | -0.028 |
laptop | -0.025 |
apr | -0.024 |
dishes | -0.024 |
laundry | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
Dove | +0.080 |
Zip | +0.079 |
tow | +0.077 |
Tweet | +0.075 |
aroo | +0.075 |
Neg logit contributions | |
arre | -0.100 |
homework | -0.092 |
laptop | -0.092 |
chores | -0.087 |
jobs | -0.086 |
Token | Sab |
Token ID | 9910 |
Feature activation | -4.31e-03 |
Pos logit contributions | |
arre | +0.016 |
homework | +0.014 |
chores | +0.013 |
laptop | +0.013 |
apr | +0.013 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.009 |
free | -0.008 |
Sue | -0.008 |
aroo | -0.007 |
Token | ina |
Token ID | 1437 |
Feature activation | +1.51e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.005 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.007 |
free | -0.007 |
aroo | -0.007 |
Token | couldn |
Token ID | 3521 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.002 |
Sue | +0.002 |
aroo | +0.002 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.002 |
laptop | -0.002 |
apr | -0.002 |
chores | -0.002 |
Token | 't |
Token ID | 470 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
tow | +0.025 |
ever | +0.023 |
free | +0.022 |
Sue | +0.022 |
swoop | +0.022 |
Neg logit contributions | |
arre | -0.042 |
homework | -0.037 |
chores | -0.036 |
laptop | -0.034 |
idents | -0.032 |
Token | ducks |
Token ID | 39694 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
tow | +0.058 |
aroo | +0.057 |
ary | +0.055 |
oot | +0.054 |
oe | +0.053 |
Neg logit contributions | |
chores | -0.061 |
arre | -0.061 |
matt | -0.060 |
apr | -0.060 |
jobs | -0.059 |
Token | , |
Token ID | 11 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
tow | +0.044 |
free | +0.038 |
ever | +0.037 |
Zip | +0.037 |
Twe | +0.036 |
Neg logit contributions | |
arre | -0.042 |
laptop | -0.036 |
chores | -0.035 |
homework | -0.035 |
ambul | -0.032 |
Token | a |
Token ID | 257 |
Feature activation | +3.30e-02 |
Pos logit contributions | |
tow | +0.028 |
ever | +0.025 |
free | +0.023 |
aroo | +0.023 |
oe | +0.023 |
Neg logit contributions | |
arre | -0.046 |
homework | -0.041 |
chores | -0.041 |
apr | -0.040 |
laptop | -0.040 |
Token | playground |
Token ID | 24817 |
Feature activation | +4.34e-02 |
Pos logit contributions | |
ever | +0.046 |
tow | +0.039 |
itself | +0.038 |
ary | +0.038 |
free | +0.037 |
Neg logit contributions | |
arre | -0.061 |
laptop | -0.056 |
homework | -0.053 |
chores | -0.053 |
dining | -0.050 |
Token | with |
Token ID | 351 |
Feature activation | +4.53e-02 |
Pos logit contributions | |
tow | +0.060 |
free | +0.060 |
Dove | +0.057 |
ever | +0.057 |
aroo | +0.057 |
Neg logit contributions | |
laptop | -0.066 |
arre | -0.061 |
beds | -0.060 |
homework | -0.060 |
chores | -0.056 |
Token | swings |
Token ID | 26728 |
Feature activation | +5.99e-02 |
Pos logit contributions | |
oot | +0.074 |
ary | +0.073 |
tow | +0.072 |
oe | +0.071 |
aroo | +0.070 |
Neg logit contributions | |
beds | -0.055 |
matt | -0.054 |
chores | -0.054 |
movies | -0.053 |
jobs | -0.053 |
Token | , |
Token ID | 11 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
tow | +0.110 |
chie | +0.105 |
aroo | +0.098 |
've | +0.097 |
plet | +0.097 |
Neg logit contributions | |
beds | -0.056 |
arre | -0.052 |
chores | -0.051 |
apr | -0.050 |
laptop | -0.050 |
Token | and |
Token ID | 290 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
tow | +0.029 |
ever | +0.026 |
aroo | +0.024 |
free | +0.024 |
Sue | +0.023 |
Neg logit contributions | |
arre | -0.042 |
homework | -0.036 |
chores | -0.035 |
apr | -0.035 |
laptop | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
tow | +0.018 |
ever | +0.017 |
aroo | +0.016 |
free | +0.015 |
Sue | +0.015 |
Neg logit contributions | |
arre | -0.031 |
homework | -0.027 |
chores | -0.027 |
apr | -0.026 |
laptop | -0.025 |
Token | bench |
Token ID | 7624 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
ever | +0.034 |
tow | +0.029 |
Sue | +0.028 |
ary | +0.028 |
Bill | +0.028 |
Neg logit contributions | |
arre | -0.046 |
laptop | -0.040 |
homework | -0.039 |
chores | -0.039 |
dining | -0.037 |
Token | with |
Token ID | 351 |
Feature activation | +4.46e-02 |
Pos logit contributions | |
tow | +0.046 |
Frank | +0.044 |
Bill | +0.043 |
Sally | +0.043 |
Twe | +0.043 |
Neg logit contributions | |
laptop | -0.056 |
homework | -0.055 |
arre | -0.052 |
chores | -0.050 |
beds | -0.049 |
Token | with |
Token ID | 351 |
Feature activation | +3.38e-02 |
Pos logit contributions | |
tow | +0.046 |
aroo | +0.043 |
ever | +0.042 |
free | +0.041 |
swoop | +0.039 |
Neg logit contributions | |
arre | -0.073 |
homework | -0.069 |
laptop | -0.067 |
chores | -0.063 |
jobs | -0.061 |
Token | a |
Token ID | 257 |
Feature activation | +3.32e-02 |
Pos logit contributions | |
aroo | +0.062 |
oe | +0.059 |
ary | +0.056 |
pper | +0.056 |
inger | +0.055 |
Neg logit contributions | |
computers | -0.043 |
matt | -0.040 |
magazines | -0.039 |
movies | -0.039 |
chores | -0.039 |
Token | big |
Token ID | 1263 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
ever | +0.043 |
aroo | +0.041 |
itself | +0.038 |
tow | +0.037 |
Sue | +0.037 |
Neg logit contributions | |
arre | -0.065 |
homework | -0.058 |
laptop | -0.056 |
chores | -0.055 |
dining | -0.051 |
Token | slide |
Token ID | 10649 |
Feature activation | +3.30e-02 |
Pos logit contributions | |
ever | +0.035 |
aroo | +0.033 |
free | +0.031 |
tow | +0.030 |
p | +0.030 |
Neg logit contributions | |
arre | -0.044 |
homework | -0.040 |
laptop | -0.040 |
chores | -0.038 |
apr | -0.037 |
Token | and |
Token ID | 290 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
tow | +0.049 |
free | +0.046 |
aroo | +0.045 |
ever | +0.043 |
ull | +0.043 |
Neg logit contributions | |
arre | -0.056 |
homework | -0.051 |
laptop | -0.049 |
chores | -0.044 |
cases | -0.042 |
Token | swings |
Token ID | 26728 |
Feature activation | +5.78e-02 |
Pos logit contributions | |
tow | +0.031 |
aroo | +0.030 |
ever | +0.028 |
oe | +0.026 |
ir | +0.026 |
Neg logit contributions | |
arre | -0.041 |
homework | -0.037 |
chores | -0.036 |
matt | -0.035 |
computers | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | +1.05e-03 |
Pos logit contributions | |
tow | +0.081 |
aroo | +0.079 |
Twe | +0.077 |
chie | +0.075 |
ever | +0.074 |
Neg logit contributions | |
homework | -0.081 |
arre | -0.080 |
chores | -0.075 |
beds | -0.071 |
roles | -0.071 |
Token | Tim |
Token ID | 5045 |
Feature activation | -3.27e-03 |
Pos logit contributions | |
ever | +0.001 |
tow | +0.001 |
aroo | +0.001 |
swoop | +0.001 |
free | +0.001 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
idents | -0.002 |
chores | -0.002 |
apr | -0.002 |
Token | learned |
Token ID | 4499 |
Feature activation | -5.46e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.005 |
apr | +0.005 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
Sue | -0.004 |
free | -0.004 |
aroo | -0.004 |
Token | that |
Token ID | 326 |
Feature activation | -4.57e-02 |
Pos logit contributions | |
arre | +0.016 |
laptop | +0.014 |
apr | +0.014 |
homework | +0.014 |
laptops | +0.014 |
Neg logit contributions | |
free | -0.003 |
ever | -0.003 |
Sue | -0.003 |
tow | -0.002 |
its | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | -2.25e-02 |
Pos logit contributions | |
arre | +0.120 |
apr | +0.106 |
laptop | +0.099 |
laptops | +0.099 |
cuts | +0.098 |
Neg logit contributions | |
ever | -0.046 |
it | -0.037 |
free | -0.035 |
tow | -0.035 |
its | -0.034 |
Token | asked |
Token ID | 1965 |
Feature activation | -8.93e-03 |
Pos logit contributions | |
tow | +0.010 |
ever | +0.009 |
free | +0.009 |
aroo | +0.009 |
Sue | +0.009 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.011 |
apr | -0.011 |
laptop | -0.011 |
chores | -0.011 |
Token | him |
Token ID | 683 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
arre | +0.017 |
homework | +0.016 |
chores | +0.016 |
apr | +0.015 |
nurses | +0.015 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.011 |
free | -0.011 |
aroo | -0.010 |
swoop | -0.010 |
Token | if |
Token ID | 611 |
Feature activation | +7.78e-03 |
Pos logit contributions | |
tow | +0.029 |
ever | +0.028 |
free | +0.027 |
aroo | +0.026 |
swoop | +0.025 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.024 |
chores | -0.023 |
laptop | -0.021 |
jobs | -0.021 |
Token | she |
Token ID | 673 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
tow | +0.009 |
free | +0.008 |
ever | +0.008 |
aroo | +0.007 |
Sue | +0.007 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.016 |
chores | -0.015 |
jobs | -0.014 |
laptop | -0.014 |
Token | could |
Token ID | 714 |
Feature activation | +2.72e-02 |
Pos logit contributions | |
tow | +0.063 |
free | +0.059 |
alks | +0.059 |
Dove | +0.057 |
crashing | +0.056 |
Neg logit contributions | |
arre | -0.038 |
means | -0.037 |
homework | -0.035 |
organ | -0.032 |
doesn | -0.032 |
Token | come |
Token ID | 1282 |
Feature activation | +5.75e-02 |
Pos logit contributions | |
Dove | +0.038 |
aroo | +0.038 |
Zip | +0.038 |
itself | +0.037 |
Jerry | +0.037 |
Neg logit contributions | |
chores | -0.043 |
homework | -0.038 |
arre | -0.037 |
laptop | -0.033 |
jobs | -0.032 |
Token | inside |
Token ID | 2641 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
tow | +0.081 |
aroo | +0.077 |
ever | +0.072 |
Zip | +0.071 |
Sue | +0.071 |
Neg logit contributions | |
arre | -0.083 |
chores | -0.082 |
homework | -0.079 |
matt | -0.074 |
laptop | -0.071 |
Token | and |
Token ID | 290 |
Feature activation | +2.25e-02 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.012 |
aroo | +0.012 |
free | +0.012 |
Dove | +0.012 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.025 |
chores | -0.024 |
laptop | -0.023 |
jobs | -0.022 |
Token | play |
Token ID | 711 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
tow | +0.028 |
ever | +0.026 |
aroo | +0.025 |
free | +0.024 |
Dove | +0.024 |
Neg logit contributions | |
arre | -0.043 |
homework | -0.042 |
chores | -0.040 |
laptop | -0.038 |
jobs | -0.037 |
Token | . |
Token ID | 13 |
Feature activation | -3.20e-03 |
Pos logit contributions | |
tow | +0.033 |
ever | +0.030 |
Sue | +0.026 |
free | +0.026 |
aroo | +0.026 |
Neg logit contributions | |
arre | -0.071 |
homework | -0.066 |
chores | -0.064 |
laptop | -0.061 |
apr | -0.061 |
Token |
|
Token ID | 198 |
Feature activation | +2.52e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
laptop | +0.006 |
chores | +0.005 |
apr | +0.005 |
Neg logit contributions | |
ever | -0.004 |
tow | -0.004 |
free | -0.004 |
swoop | -0.003 |
aroo | -0.003 |
Token | big |
Token ID | 1263 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ever | +0.022 |
tow | +0.020 |
Sue | +0.019 |
free | +0.019 |
aroo | +0.017 |
Neg logit contributions | |
arre | -0.044 |
homework | -0.040 |
laptop | -0.038 |
chores | -0.038 |
apr | -0.036 |
Token | structure |
Token ID | 4645 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
ever | +0.014 |
tow | +0.014 |
free | +0.013 |
Sue | +0.012 |
aroo | +0.012 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.021 |
laptop | -0.021 |
chores | -0.020 |
apr | -0.020 |
Token | with |
Token ID | 351 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
tow | +0.020 |
Dove | +0.018 |
free | +0.017 |
ever | +0.017 |
Bill | +0.017 |
Neg logit contributions | |
arre | -0.037 |
homework | -0.035 |
laptop | -0.035 |
chores | -0.033 |
jobs | -0.031 |
Token | slides |
Token ID | 19392 |
Feature activation | +3.43e-02 |
Pos logit contributions | |
aroo | +0.055 |
pper | +0.052 |
orse | +0.052 |
oe | +0.050 |
tow | +0.050 |
Neg logit contributions | |
computers | -0.033 |
jobs | -0.030 |
laptops | -0.030 |
chores | -0.030 |
apr | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
tow | +0.047 |
ever | +0.044 |
aroo | +0.040 |
Sue | +0.038 |
free | +0.038 |
Neg logit contributions | |
arre | -0.067 |
homework | -0.058 |
laptop | -0.057 |
chores | -0.056 |
idents | -0.054 |
Token | swings |
Token ID | 26728 |
Feature activation | +5.68e-02 |
Pos logit contributions | |
tow | +0.017 |
ever | +0.016 |
aroo | +0.015 |
free | +0.015 |
Dove | +0.014 |
Neg logit contributions | |
arre | -0.023 |
homework | -0.020 |
chores | -0.020 |
laptop | -0.019 |
jobs | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | +4.83e-03 |
Pos logit contributions | |
tow | +0.075 |
aroo | +0.068 |
ever | +0.066 |
orse | +0.064 |
Twe | +0.062 |
Neg logit contributions | |
arre | -0.092 |
homework | -0.087 |
chores | -0.087 |
apr | -0.081 |
laptop | -0.081 |
Token | l |
Token ID | 300 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
aroo | +0.006 |
free | +0.006 |
Sue | +0.006 |
Neg logit contributions | |
arre | -0.009 |
homework | -0.008 |
chores | -0.008 |
laptop | -0.008 |
apr | -0.008 |
Token | adders |
Token ID | 45940 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
tow | +0.033 |
swoop | +0.032 |
Frank | +0.031 |
Twe | +0.031 |
aroo | +0.030 |
Neg logit contributions | |
arre | -0.017 |
chores | -0.014 |
homework | -0.014 |
narrative | -0.012 |
laptop | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
tow | +0.027 |
Dove | +0.023 |
aroo | +0.022 |
Sue | +0.022 |
ever | +0.022 |
Neg logit contributions | |
arre | -0.048 |
homework | -0.043 |
chores | -0.042 |
laptop | -0.042 |
jobs | -0.040 |
Token | They |
Token ID | 1119 |
Feature activation | -4.48e-03 |
Pos logit contributions | |
ever | +0.014 |
free | +0.013 |
tow | +0.013 |
aroo | +0.013 |
swoop | +0.012 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.021 |
apr | -0.021 |
laptop | -0.021 |
chores | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
tow | +0.008 |
Zip | +0.007 |
Dove | +0.007 |
swoop | +0.007 |
ever | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.010 |
laptop | -0.010 |
chores | -0.010 |
apr | -0.009 |
Token | He |
Token ID | 679 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
ever | +0.034 |
free | +0.029 |
fallen | +0.028 |
swoop | +0.028 |
yours | +0.028 |
Neg logit contributions | |
arre | -0.030 |
means | -0.027 |
laptop | -0.026 |
matt | -0.025 |
homework | -0.024 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
tow | +0.022 |
ever | +0.021 |
Sue | +0.020 |
free | +0.020 |
Dove | +0.020 |
Neg logit contributions | |
arre | -0.035 |
apr | -0.029 |
homework | -0.028 |
laptop | -0.028 |
laptops | -0.027 |
Token | a |
Token ID | 257 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
ever | +0.016 |
tow | +0.016 |
oe | +0.014 |
free | +0.014 |
aroo | +0.013 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.022 |
chores | -0.022 |
nurses | -0.021 |
apr | -0.020 |
Token | shiny |
Token ID | 22441 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
ever | +0.049 |
tow | +0.042 |
Sue | +0.039 |
Bill | +0.039 |
itself | +0.039 |
Neg logit contributions | |
arre | -0.076 |
laptop | -0.066 |
homework | -0.065 |
chores | -0.063 |
tant | -0.061 |
Token | blue |
Token ID | 4171 |
Feature activation | +5.61e-02 |
Pos logit contributions | |
ever | +0.043 |
tow | +0.041 |
free | +0.039 |
Sue | +0.037 |
Zip | +0.037 |
Neg logit contributions | |
arre | -0.059 |
homework | -0.055 |
tant | -0.053 |
laptop | -0.053 |
chores | -0.052 |
Token | pond |
Token ID | 16723 |
Feature activation | +3.56e-02 |
Pos logit contributions | |
free | +0.075 |
tow | +0.073 |
Sue | +0.071 |
ever | +0.071 |
Zip | +0.067 |
Neg logit contributions | |
arre | -0.095 |
laptop | -0.080 |
tant | -0.079 |
dishes | -0.079 |
chores | -0.078 |
Token | with |
Token ID | 351 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
tow | +0.046 |
ever | +0.041 |
Zip | +0.040 |
Dove | +0.040 |
free | +0.039 |
Neg logit contributions | |
arre | -0.065 |
homework | -0.060 |
laptop | -0.060 |
chores | -0.057 |
apr | -0.052 |
Token | ducks |
Token ID | 39694 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
oot | +0.081 |
ary | +0.081 |
oe | +0.079 |
tow | +0.078 |
aroo | +0.077 |
Neg logit contributions | |
dishes | -0.063 |
arre | -0.063 |
matt | -0.063 |
chores | -0.061 |
beds | -0.058 |
Token | and |
Token ID | 290 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
tow | +0.039 |
Sue | +0.034 |
Zip | +0.033 |
ever | +0.032 |
free | +0.032 |
Neg logit contributions | |
arre | -0.050 |
chores | -0.042 |
homework | -0.041 |
laptop | -0.041 |
dishes | -0.037 |
Token | fish |
Token ID | 5916 |
Feature activation | +3.74e-02 |
Pos logit contributions | |
tow | +0.034 |
ever | +0.031 |
oe | +0.030 |
aroo | +0.029 |
free | +0.028 |
Neg logit contributions | |
arre | -0.054 |
homework | -0.049 |
chores | -0.049 |
apr | -0.048 |
matt | -0.047 |
Token | pink |
Token ID | 11398 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
tow | +0.033 |
ever | +0.028 |
Zip | +0.028 |
aroo | +0.028 |
free | +0.026 |
Neg logit contributions | |
arre | -0.060 |
homework | -0.055 |
chores | -0.053 |
laptop | -0.052 |
tasks | -0.052 |
Token | flower |
Token ID | 15061 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
tow | +0.040 |
free | +0.035 |
Zip | +0.035 |
Bill | +0.034 |
Sue | +0.033 |
Neg logit contributions | |
arre | -0.060 |
homework | -0.057 |
laptop | -0.056 |
chores | -0.055 |
tasks | -0.054 |
Token | with |
Token ID | 351 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
tow | +0.033 |
Zip | +0.029 |
Sue | +0.027 |
aroo | +0.027 |
Bill | +0.027 |
Neg logit contributions | |
arre | -0.040 |
homework | -0.038 |
laptop | -0.037 |
chores | -0.036 |
sheets | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +2.51e-02 |
Pos logit contributions | |
aroo | +0.053 |
tow | +0.050 |
Zip | +0.050 |
oe | +0.049 |
oot | +0.047 |
Neg logit contributions | |
apr | -0.039 |
sheets | -0.039 |
chores | -0.037 |
recipes | -0.037 |
dishes | -0.036 |
Token | yellow |
Token ID | 7872 |
Feature activation | +3.92e-02 |
Pos logit contributions | |
tow | +0.030 |
aroo | +0.030 |
Sue | +0.030 |
Zip | +0.029 |
ever | +0.029 |
Neg logit contributions | |
arre | -0.047 |
homework | -0.041 |
chores | -0.040 |
laptop | -0.040 |
mess | -0.040 |
Token | centre |
Token ID | 7372 |
Feature activation | +5.56e-02 |
Pos logit contributions | |
tow | +0.050 |
Zip | +0.048 |
Sue | +0.044 |
ever | +0.043 |
tted | +0.043 |
Neg logit contributions | |
arre | -0.066 |
sheets | -0.059 |
chores | -0.058 |
dishes | -0.057 |
laundry | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | -2.91e-03 |
Pos logit contributions | |
Zip | +0.083 |
tow | +0.078 |
Tweet | +0.076 |
Dove | +0.076 |
aroo | +0.075 |
Neg logit contributions | |
arre | -0.088 |
laptop | -0.081 |
homework | -0.077 |
sheets | -0.075 |
recipes | -0.075 |
Token | Anna |
Token ID | 11735 |
Feature activation | +1.04e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
Sue | -0.003 |
free | -0.003 |
pet | -0.002 |
Token | asked |
Token ID | 1965 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
tow | +0.001 |
ever | +0.001 |
free | +0.001 |
Sue | +0.001 |
aroo | +0.001 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.002 |
apr | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
arre | +0.034 |
homework | +0.030 |
chores | +0.028 |
laptop | +0.028 |
apr | +0.028 |
Neg logit contributions | |
ever | -0.015 |
tow | -0.015 |
Sue | -0.014 |
free | -0.014 |
aroo | -0.012 |
Token | m |
Token ID | 285 |
Feature activation | +9.95e-04 |
Pos logit contributions | |
tow | +0.015 |
ever | +0.014 |
Sue | +0.013 |
free | +0.013 |
aroo | +0.012 |
Neg logit contributions | |
arre | -0.033 |
homework | -0.030 |
chores | -0.028 |
laptop | -0.028 |
apr | -0.028 |
Token | and |
Token ID | 290 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
tow | +0.003 |
aroo | +0.003 |
ever | +0.003 |
Sue | +0.003 |
Zip | +0.003 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.005 |
laptop | -0.005 |
chores | -0.005 |
jobs | -0.005 |
Token | he |
Token ID | 339 |
Feature activation | +4.11e-03 |
Pos logit contributions | |
tow | +0.011 |
ever | +0.009 |
free | +0.009 |
aroo | +0.009 |
Sue | +0.008 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.015 |
chores | -0.014 |
laptop | -0.014 |
apr | -0.014 |
Token | wanted |
Token ID | 2227 |
Feature activation | +3.05e-02 |
Pos logit contributions | |
tow | +0.006 |
Sue | +0.005 |
ever | +0.005 |
aroo | +0.005 |
free | +0.005 |
Neg logit contributions | |
arre | -0.008 |
homework | -0.007 |
chores | -0.006 |
apr | -0.006 |
laptop | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | +3.66e-02 |
Pos logit contributions | |
tow | +0.058 |
aroo | +0.053 |
plet | +0.050 |
hy | +0.049 |
inger | +0.048 |
Neg logit contributions | |
homework | -0.038 |
chores | -0.037 |
arre | -0.035 |
jobs | -0.035 |
apr | -0.031 |
Token | catch |
Token ID | 4929 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
aroo | +0.050 |
tow | +0.049 |
Dove | +0.048 |
ever | +0.047 |
oe | +0.047 |
Neg logit contributions | |
arre | -0.055 |
chores | -0.053 |
homework | -0.050 |
jobs | -0.048 |
argue | -0.046 |
Token | one |
Token ID | 530 |
Feature activation | +5.55e-02 |
Pos logit contributions | |
tow | +0.041 |
ever | +0.036 |
aroo | +0.032 |
Sue | +0.032 |
free | +0.030 |
Neg logit contributions | |
arre | -0.079 |
homework | -0.069 |
chores | -0.068 |
jobs | -0.064 |
apr | -0.064 |
Token | . |
Token ID | 13 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
tow | +0.075 |
Dove | +0.064 |
Zip | +0.061 |
hy | +0.061 |
Bill | +0.059 |
Neg logit contributions | |
arre | -0.090 |
homework | -0.089 |
chores | -0.085 |
means | -0.084 |
tasks | -0.080 |
Token | But |
Token ID | 887 |
Feature activation | -9.35e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
Sue | -0.001 |
free | -0.001 |
Sally | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.021 |
apr | +0.021 |
laptop | +0.020 |
chores | +0.020 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.008 |
Sue | -0.008 |
free | -0.007 |
Sally | -0.007 |
Token | fish |
Token ID | 5916 |
Feature activation | +2.81e-03 |
Pos logit contributions | |
tow | +0.015 |
ever | +0.014 |
Sue | +0.014 |
free | +0.013 |
Sally | +0.013 |
Neg logit contributions | |
arre | -0.034 |
homework | -0.031 |
chores | -0.030 |
laptop | -0.030 |
apr | -0.029 |
Token | were |
Token ID | 547 |
Feature activation | +4.41e-03 |
Pos logit contributions | |
tow | +0.004 |
ever | +0.004 |
free | +0.004 |
Sue | +0.004 |
aroo | +0.003 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.005 |
chores | -0.005 |
laptop | -0.005 |
apr | -0.005 |
Token | big |
Token ID | 1263 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ever | +0.022 |
tow | +0.021 |
Sue | +0.019 |
free | +0.019 |
aroo | +0.017 |
Neg logit contributions | |
arre | -0.046 |
homework | -0.041 |
laptop | -0.040 |
chores | -0.040 |
apr | -0.038 |
Token | structure |
Token ID | 4645 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
ever | +0.013 |
tow | +0.012 |
free | +0.012 |
Sue | +0.011 |
aroo | +0.011 |
Neg logit contributions | |
arre | -0.021 |
homework | -0.019 |
laptop | -0.019 |
chores | -0.018 |
apr | -0.018 |
Token | with |
Token ID | 351 |
Feature activation | +2.81e-02 |
Pos logit contributions | |
tow | +0.018 |
Dove | +0.016 |
free | +0.016 |
Bill | +0.016 |
ever | +0.015 |
Neg logit contributions | |
arre | -0.034 |
homework | -0.032 |
laptop | -0.031 |
chores | -0.030 |
jobs | -0.028 |
Token | slides |
Token ID | 19392 |
Feature activation | +3.32e-02 |
Pos logit contributions | |
aroo | +0.053 |
pper | +0.051 |
orse | +0.050 |
oe | +0.049 |
tow | +0.049 |
Neg logit contributions | |
computers | -0.032 |
chores | -0.031 |
jobs | -0.030 |
laptops | -0.030 |
apr | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +1.32e-02 |
Pos logit contributions | |
tow | +0.045 |
ever | +0.042 |
aroo | +0.038 |
Sue | +0.037 |
free | +0.036 |
Neg logit contributions | |
arre | -0.066 |
homework | -0.057 |
laptop | -0.056 |
chores | -0.055 |
idents | -0.053 |
Token | swings |
Token ID | 26728 |
Feature activation | +5.54e-02 |
Pos logit contributions | |
tow | +0.019 |
ever | +0.018 |
aroo | +0.017 |
free | +0.016 |
Sue | +0.016 |
Neg logit contributions | |
arre | -0.025 |
homework | -0.022 |
chores | -0.021 |
laptop | -0.021 |
jobs | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +8.14e-03 |
Pos logit contributions | |
tow | +0.074 |
aroo | +0.067 |
ever | +0.065 |
orse | +0.063 |
ethyst | +0.061 |
Neg logit contributions | |
arre | -0.089 |
homework | -0.085 |
chores | -0.085 |
laptop | -0.079 |
apr | -0.078 |
Token | They |
Token ID | 1119 |
Feature activation | -1.74e-03 |
Pos logit contributions | |
ever | +0.011 |
tow | +0.010 |
free | +0.009 |
aroo | +0.009 |
swoop | +0.009 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.015 |
chores | -0.014 |
apr | -0.014 |
laptop | -0.014 |
Token | run |
Token ID | 1057 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
arre | +0.003 |
homework | +0.003 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.002 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.002 |
aroo | -0.002 |
Sue | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.014 |
Sue | +0.012 |
free | +0.012 |
aroo | +0.012 |
Neg logit contributions | |
arre | -0.029 |
homework | -0.025 |
chores | -0.024 |
laptop | -0.024 |
apr | -0.024 |
Token | it |
Token ID | 340 |
Feature activation | +5.85e-03 |
Pos logit contributions | |
ever | +0.016 |
aroo | +0.016 |
tow | +0.016 |
ull | +0.014 |
Tweet | +0.014 |
Neg logit contributions | |
chores | -0.023 |
homework | -0.022 |
arre | -0.021 |
apr | -0.021 |
jobs | -0.020 |
Token | pond |
Token ID | 16723 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
ever | +0.029 |
Sue | +0.026 |
Bill | +0.026 |
Sally | +0.026 |
tow | +0.025 |
Neg logit contributions | |
arre | -0.043 |
chores | -0.039 |
homework | -0.037 |
jobs | -0.036 |
laptop | -0.036 |
Token | had |
Token ID | 550 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
tow | +0.016 |
free | +0.014 |
Dove | +0.014 |
Sue | +0.014 |
ever | +0.014 |
Neg logit contributions | |
arre | -0.021 |
homework | -0.017 |
chores | -0.016 |
laptop | -0.016 |
jobs | -0.016 |
Token | become |
Token ID | 1716 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
aroo | +0.043 |
tow | +0.039 |
Zip | +0.036 |
Sue | +0.034 |
Dove | +0.034 |
Neg logit contributions | |
arre | -0.059 |
jobs | -0.049 |
chores | -0.049 |
homework | -0.049 |
apr | -0.048 |
Token | a |
Token ID | 257 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
aroo | +0.027 |
tow | +0.026 |
ever | +0.025 |
Zip | +0.024 |
Sue | +0.024 |
Neg logit contributions | |
arre | -0.036 |
chores | -0.031 |
homework | -0.031 |
jobs | -0.030 |
apr | -0.029 |
Token | safe |
Token ID | 3338 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
Sue | +0.031 |
aroo | +0.030 |
ever | +0.030 |
tow | +0.029 |
Jen | +0.028 |
Neg logit contributions | |
arre | -0.042 |
homework | -0.038 |
chores | -0.037 |
laptop | -0.035 |
jobs | -0.034 |
Token | haven |
Token ID | 4398 |
Feature activation | +5.53e-02 |
Pos logit contributions | |
Sue | +0.037 |
tow | +0.037 |
free | +0.037 |
Zip | +0.037 |
ever | +0.037 |
Neg logit contributions | |
arre | -0.057 |
homework | -0.048 |
laptop | -0.048 |
chores | -0.048 |
jobs | -0.046 |
Token | for |
Token ID | 329 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
tow | +0.038 |
coconut | +0.037 |
Sue | +0.034 |
pet | +0.034 |
squirrel | +0.033 |
Neg logit contributions | |
arre | -0.130 |
homework | -0.115 |
chores | -0.114 |
means | -0.110 |
ambul | -0.108 |
Token | ducks |
Token ID | 39694 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
homework | +0.018 |
chores | +0.018 |
tasks | +0.016 |
jobs | +0.016 |
ambul | +0.016 |
Neg logit contributions | |
tow | -0.016 |
Zip | -0.014 |
aroo | -0.014 |
tie | -0.014 |
pole | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | +9.45e-03 |
Pos logit contributions | |
tow | +0.020 |
Sue | +0.017 |
free | +0.016 |
aroo | +0.016 |
Zip | +0.016 |
Neg logit contributions | |
arre | -0.035 |
homework | -0.031 |
chores | -0.030 |
laptop | -0.029 |
jobs | -0.028 |
Token | Mia |
Token ID | 32189 |
Feature activation | +2.20e-03 |
Pos logit contributions | |
ever | +0.012 |
swoop | +0.012 |
tow | +0.012 |
free | +0.012 |
aroo | +0.012 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.014 |
laptop | -0.014 |
chores | -0.014 |
means | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +5.36e-03 |
Pos logit contributions | |
tow | +0.003 |
Sue | +0.003 |
ever | +0.003 |
free | +0.003 |
Sally | +0.003 |
Neg logit contributions | |
arre | -0.004 |
homework | -0.004 |
chores | -0.004 |
laptop | -0.003 |
apr | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | +5.61e-03 |
Pos logit contributions | |
tow | +0.022 |
ever | +0.020 |
Sue | +0.019 |
Dove | +0.019 |
aroo | +0.019 |
Neg logit contributions | |
arre | -0.036 |
homework | -0.032 |
chores | -0.031 |
laptop | -0.031 |
jobs | -0.030 |
Token | sandy |
Token ID | 44039 |
Feature activation | +5.84e-03 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.007 |
aroo | +0.006 |
Sue | +0.006 |
free | +0.006 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.010 |
chores | -0.010 |
laptop | -0.010 |
apr | -0.009 |
Token | beach |
Token ID | 10481 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
tow | +0.009 |
ever | +0.009 |
Sue | +0.008 |
free | +0.008 |
aroo | +0.008 |
Neg logit contributions | |
arre | -0.010 |
homework | -0.009 |
chores | -0.008 |
jobs | -0.008 |
apr | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
tow | +0.027 |
ever | +0.023 |
aroo | +0.022 |
free | +0.022 |
Sue | +0.022 |
Neg logit contributions | |
arre | -0.038 |
homework | -0.035 |
laptop | -0.033 |
chores | -0.033 |
jobs | -0.032 |
Token | se |
Token ID | 384 |
Feature activation | -2.04e-02 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.013 |
aroo | +0.012 |
free | +0.012 |
oe | +0.012 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.022 |
chores | -0.021 |
laptop | -0.021 |
apr | -0.020 |
Token | ag |
Token ID | 363 |
Feature activation | +5.52e-02 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.031 |
chores | +0.030 |
apr | +0.029 |
laptop | +0.028 |
Neg logit contributions | |
tow | -0.032 |
ever | -0.031 |
Sue | -0.030 |
free | -0.030 |
aroo | -0.028 |
Token | ull |
Token ID | 724 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
tow | +0.054 |
Dove | +0.045 |
ever | +0.041 |
Sue | +0.040 |
pet | +0.040 |
Neg logit contributions | |
arre | -0.130 |
homework | -0.105 |
laptops | -0.104 |
tant | -0.104 |
apr | -0.103 |
Token | s |
Token ID | 82 |
Feature activation | +1.58e-02 |
Pos logit contributions | |
tow | +0.043 |
Sue | +0.039 |
ever | +0.039 |
Sally | +0.038 |
Dove | +0.037 |
Neg logit contributions | |
arre | -0.018 |
laptop | -0.010 |
homework | -0.010 |
chores | -0.008 |
ambul | -0.008 |
Token | in |
Token ID | 287 |
Feature activation | +2.88e-02 |
Pos logit contributions | |
tow | +0.021 |
aroo | +0.019 |
Sue | +0.019 |
Dove | +0.019 |
Sally | +0.018 |
Neg logit contributions | |
arre | -0.030 |
homework | -0.024 |
laptop | -0.024 |
chores | -0.023 |
apr | -0.023 |
Token | the |
Token ID | 262 |
Feature activation | -6.40e-03 |
Pos logit contributions | |
aroo | +0.042 |
oot | +0.039 |
iki | +0.037 |
Tweet | +0.037 |
Dove | +0.037 |
Neg logit contributions | |
arre | -0.048 |
movies | -0.044 |
chores | -0.043 |
homework | -0.042 |
matt | -0.042 |
Token | sky |
Token ID | 6766 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.010 |
apr | +0.010 |
laptop | +0.010 |
Neg logit contributions | |
Sue | -0.009 |
ever | -0.009 |
tow | -0.009 |
aroo | -0.009 |
Dove | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
tow | +0.044 |
pet | +0.041 |
swoop | +0.041 |
Sue | +0.041 |
free | +0.040 |
Neg logit contributions | |
arre | -0.064 |
homework | -0.057 |
chores | -0.056 |
laptop | -0.050 |
means | -0.048 |
Token | wait |
Token ID | 4043 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
tow | +0.035 |
Sue | +0.035 |
Dove | +0.033 |
oe | +0.032 |
Sally | +0.032 |
Neg logit contributions | |
chores | -0.020 |
homework | -0.020 |
arre | -0.019 |
laptop | -0.017 |
jobs | -0.016 |
Token | ! |
Token ID | 0 |
Feature activation | +5.77e-03 |
Pos logit contributions | |
tow | +0.022 |
aroo | +0.021 |
Dove | +0.020 |
Sue | +0.019 |
Tweet | +0.019 |
Neg logit contributions | |
arre | -0.025 |
homework | -0.024 |
chores | -0.024 |
apr | -0.022 |
laptop | -0.021 |
Token | Where |
Token ID | 6350 |
Feature activation | +9.69e-03 |
Pos logit contributions | |
ever | +0.008 |
swoop | +0.008 |
tow | +0.007 |
aroo | +0.007 |
free | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.010 |
chores | -0.009 |
laptop | -0.009 |
idents | -0.009 |
Token | ver |
Token ID | 332 |
Feature activation | +3.42e-02 |
Pos logit contributions | |
tow | +0.016 |
free | +0.014 |
ever | +0.014 |
pet | +0.014 |
Dove | +0.014 |
Neg logit contributions | |
arre | -0.016 |
homework | -0.015 |
chores | -0.014 |
laptop | -0.013 |
jobs | -0.013 |
Token | she |
Token ID | 673 |
Feature activation | +5.47e-02 |
Pos logit contributions | |
tow | +0.046 |
free | +0.043 |
ull | +0.040 |
aroo | +0.040 |
ever | +0.039 |
Neg logit contributions | |
arre | -0.060 |
homework | -0.058 |
chores | -0.058 |
nurses | -0.054 |
jobs | -0.054 |
Token | was |
Token ID | 373 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
tow | +0.075 |
Sue | +0.069 |
free | +0.066 |
aroo | +0.066 |
Dove | +0.066 |
Neg logit contributions | |
arre | -0.103 |
homework | -0.092 |
chores | -0.085 |
means | -0.084 |
jobs | -0.083 |
Token | going |
Token ID | 1016 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
tow | +0.023 |
aroo | +0.020 |
Tweet | +0.020 |
Sue | +0.020 |
Zip | +0.019 |
Neg logit contributions | |
arre | -0.029 |
homework | -0.029 |
chores | -0.027 |
laptop | -0.026 |
jobs | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | +1.54e-03 |
Pos logit contributions | |
tow | +0.032 |
Sue | +0.029 |
aroo | +0.028 |
ever | +0.028 |
free | +0.027 |
Neg logit contributions | |
arre | -0.041 |
homework | -0.038 |
chores | -0.037 |
laptop | -0.033 |
jobs | -0.033 |
Token | she |
Token ID | 673 |
Feature activation | +2.72e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.002 |
aroo | +0.002 |
Sue | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
chores | -0.003 |
laptop | -0.003 |
jobs | -0.003 |
Token | knew |
Token ID | 2993 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
tow | +0.041 |
Sue | +0.039 |
aroo | +0.038 |
Dove | +0.036 |
free | +0.036 |
Neg logit contributions | |
arre | -0.048 |
homework | -0.042 |
chores | -0.039 |
laptop | -0.038 |
means | -0.037 |
Token | brown |
Token ID | 7586 |
Feature activation | +6.46e-03 |
Pos logit contributions | |
tow | +0.003 |
ever | +0.003 |
aroo | +0.002 |
free | +0.002 |
Sue | +0.002 |
Neg logit contributions | |
arre | -0.005 |
homework | -0.005 |
chores | -0.005 |
laptop | -0.005 |
apr | -0.004 |
Token | dog |
Token ID | 3290 |
Feature activation | +8.22e-03 |
Pos logit contributions | |
ever | +0.008 |
tow | +0.008 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.007 |
Neg logit contributions | |
arre | -0.014 |
homework | -0.012 |
laptop | -0.012 |
chores | -0.012 |
apr | -0.011 |
Token | with |
Token ID | 351 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.007 |
free | +0.007 |
Sue | +0.006 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.018 |
laptop | -0.017 |
chores | -0.016 |
ambul | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
oe | +0.032 |
tow | +0.031 |
aroo | +0.030 |
ever | +0.030 |
Abby | +0.027 |
Neg logit contributions | |
arre | -0.041 |
chores | -0.038 |
homework | -0.037 |
laptops | -0.035 |
computers | -0.035 |
Token | w |
Token ID | 266 |
Feature activation | -4.47e-03 |
Pos logit contributions | |
ever | +0.026 |
tow | +0.024 |
Sue | +0.022 |
aroo | +0.022 |
free | +0.021 |
Neg logit contributions | |
arre | -0.053 |
homework | -0.047 |
laptop | -0.045 |
chores | -0.045 |
apr | -0.042 |
Token | ag |
Token ID | 363 |
Feature activation | +5.47e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
affles | +0.007 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.007 |
Sue | -0.007 |
free | -0.007 |
swoop | -0.007 |
Token | gy |
Token ID | 1360 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
ever | +0.067 |
tow | +0.066 |
I | +0.060 |
Abby | +0.059 |
free | +0.058 |
Neg logit contributions | |
arre | -0.108 |
tant | -0.088 |
laptop | -0.088 |
homework | -0.085 |
organ | -0.082 |
Token | tail |
Token ID | 7894 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
tow | +0.012 |
ever | +0.012 |
free | +0.010 |
Sue | +0.010 |
aroo | +0.010 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.022 |
laptop | -0.021 |
chores | -0.021 |
apr | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
tow | +0.036 |
Sue | +0.035 |
ever | +0.034 |
Abby | +0.033 |
Jen | +0.033 |
Neg logit contributions | |
arre | -0.054 |
laptop | -0.045 |
homework | -0.044 |
chores | -0.043 |
sheets | -0.039 |
Token | Tim |
Token ID | 5045 |
Feature activation | +2.82e-04 |
Pos logit contributions | |
ever | +0.013 |
tow | +0.012 |
free | +0.012 |
aroo | +0.011 |
swoop | +0.010 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.023 |
chores | -0.022 |
laptop | -0.022 |
apr | -0.022 |
Token | my |
Token ID | 1820 |
Feature activation | +9.47e-03 |
Pos logit contributions | |
ever | +0.000 |
tow | +0.000 |
Sue | +0.000 |
free | +0.000 |
pet | +0.000 |
Neg logit contributions | |
arre | -0.001 |
homework | -0.001 |
chores | -0.001 |
laptop | -0.001 |
apr | -0.000 |
Token | play |
Token ID | 711 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
tow | +0.040 |
Sue | +0.039 |
aroo | +0.038 |
Dove | +0.038 |
swoop | +0.037 |
Neg logit contributions | |
arre | -0.054 |
chores | -0.049 |
homework | -0.048 |
laptop | -0.043 |
jobs | -0.042 |
Token | in |
Token ID | 287 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
tow | +0.015 |
ever | +0.015 |
free | +0.014 |
Sue | +0.014 |
aroo | +0.013 |
Neg logit contributions | |
arre | -0.034 |
homework | -0.031 |
chores | -0.029 |
laptop | -0.029 |
apr | -0.029 |
Token | the |
Token ID | 262 |
Feature activation | -2.80e-03 |
Pos logit contributions | |
tow | +0.023 |
ever | +0.022 |
aroo | +0.020 |
Sue | +0.020 |
free | +0.019 |
Neg logit contributions | |
arre | -0.048 |
homework | -0.044 |
chores | -0.042 |
laptop | -0.041 |
apr | -0.041 |
Token | ocean |
Token ID | 9151 |
Feature activation | -6.23e-03 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.004 |
Neg logit contributions | |
ever | -0.004 |
tow | -0.004 |
aroo | -0.004 |
Sue | -0.004 |
free | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -9.52e-03 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.013 |
chores | +0.012 |
laptop | +0.012 |
apr | +0.012 |
Neg logit contributions | |
tow | -0.006 |
ever | -0.006 |
Sue | -0.006 |
free | -0.006 |
aroo | -0.005 |
Token | shall |
Token ID | 2236 |
Feature activation | +5.46e-02 |
Pos logit contributions | |
arre | +0.021 |
homework | +0.017 |
chores | +0.017 |
idents | +0.017 |
apr | +0.016 |
Neg logit contributions | |
tow | -0.012 |
aroo | -0.011 |
ever | -0.010 |
free | -0.010 |
Zip | -0.010 |
Token | we |
Token ID | 356 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
tow | +0.091 |
ever | +0.080 |
free | +0.076 |
swoop | +0.075 |
Zip | +0.075 |
Neg logit contributions | |
arre | -0.081 |
homework | -0.075 |
chores | -0.074 |
idents | -0.071 |
ambul | -0.068 |
Token | ?" |
Token ID | 1701 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
tow | +0.016 |
Sue | +0.015 |
aroo | +0.015 |
ever | +0.014 |
Dove | +0.014 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.022 |
chores | -0.022 |
jobs | -0.020 |
laptop | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
ever | +0.002 |
tow | +0.001 |
aroo | +0.001 |
free | +0.001 |
swoop | +0.001 |
Neg logit contributions | |
arre | -0.003 |
chores | -0.002 |
homework | -0.002 |
apr | -0.002 |
idents | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | +1.42e-03 |
Pos logit contributions | |
ever | +0.005 |
tow | +0.005 |
aroo | +0.005 |
free | +0.004 |
Sue | +0.004 |
Neg logit contributions | |
arre | -0.010 |
chores | -0.008 |
homework | -0.008 |
apr | -0.007 |
laptop | -0.007 |
Token | And |
Token ID | 1870 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.002 |
Sue | +0.002 |
pet | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
laptop | -0.003 |
chores | -0.003 |
apr | -0.003 |
Token | walked |
Token ID | 6807 |
Feature activation | +5.13e-03 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
idents | +0.007 |
Neg logit contributions | |
tow | -0.008 |
Sue | -0.007 |
Dove | -0.006 |
aroo | -0.006 |
ever | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | -1.83e-03 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
Sue | +0.006 |
aroo | +0.006 |
free | +0.006 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.009 |
chores | -0.009 |
laptop | -0.008 |
jobs | -0.008 |
Token | on |
Token ID | 319 |
Feature activation | -3.69e-03 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.003 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
aroo | -0.002 |
Sue | -0.002 |
free | -0.002 |
Token | us |
Token ID | 514 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
apr | +0.007 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
aroo | -0.004 |
Sue | -0.004 |
free | -0.004 |
Token | qu |
Token ID | 627 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
arre | +0.041 |
homework | +0.036 |
chores | +0.035 |
laptop | +0.034 |
jobs | +0.034 |
Neg logit contributions | |
tow | -0.018 |
ever | -0.015 |
Sue | -0.015 |
aroo | -0.015 |
Dove | -0.015 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.80e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.006 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.002 |
Neg logit contributions | |
tow | -0.072 |
ever | -0.071 |
free | -0.071 |
Sue | -0.069 |
pet | -0.068 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
homework | +0.157 |
laptop | +0.153 |
apr | +0.152 |
arre | +0.150 |
chores | +0.150 |
Neg logit contributions | |
ever | -0.087 |
free | -0.086 |
p | -0.071 |
of | -0.069 |
fast | -0.067 |
Token | and |
Token ID | 290 |
Feature activation | +2.21e-03 |
Pos logit contributions | |
arre | +0.031 |
homework | +0.028 |
chores | +0.027 |
laptop | +0.026 |
apr | +0.026 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.012 |
Sue | -0.011 |
free | -0.011 |
aroo | -0.010 |
Token | heard |
Token ID | 2982 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
tow | +0.003 |
aroo | +0.003 |
ever | +0.003 |
Dove | +0.003 |
Sue | +0.003 |
Neg logit contributions | |
arre | -0.004 |
homework | -0.004 |
chores | -0.003 |
laptop | -0.003 |
idents | -0.003 |
Token | us |
Token ID | 514 |
Feature activation | +5.45e-04 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.009 |
jobs | +0.008 |
ambul | +0.008 |
Neg logit contributions | |
tow | -0.006 |
ever | -0.005 |
aroo | -0.005 |
free | -0.005 |
Sue | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
tow | +0.001 |
Sue | +0.001 |
Dove | +0.001 |
aroo | +0.000 |
ever | +0.000 |
Neg logit contributions | |
arre | -0.001 |
homework | -0.001 |
chores | -0.001 |
laptop | -0.001 |
jobs | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -2.85e-03 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.008 |
laptop | +0.008 |
apr | +0.008 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
aroo | -0.007 |
Sue | -0.007 |
free | -0.007 |
Token | They |
Token ID | 2990 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
laptop | +0.005 |
apr | +0.005 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.003 |
Sue | -0.003 |
aroo | -0.003 |
Token | learn |
Token ID | 2193 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
arre | +0.038 |
homework | +0.033 |
chores | +0.032 |
laptop | +0.031 |
apr | +0.030 |
Neg logit contributions | |
tow | -0.025 |
ever | -0.024 |
Sue | -0.023 |
free | -0.023 |
aroo | -0.022 |
Token | that |
Token ID | 326 |
Feature activation | -3.58e-02 |
Pos logit contributions | |
arre | +0.027 |
homework | +0.023 |
apr | +0.023 |
laptop | +0.023 |
chores | +0.022 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
Sue | -0.007 |
free | -0.007 |
pet | -0.006 |
Token | qu |
Token ID | 627 |
Feature activation | -2.91e-02 |
Pos logit contributions | |
arre | +0.085 |
apr | +0.071 |
homework | +0.069 |
laptop | +0.069 |
riger | +0.068 |
Neg logit contributions | |
ever | -0.041 |
tow | -0.037 |
Sue | -0.035 |
free | -0.034 |
its | -0.033 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.77e-02 |
Pos logit contributions | |
arre | +0.027 |
homework | +0.024 |
laptop | +0.021 |
chores | +0.020 |
apr | +0.020 |
Neg logit contributions | |
tow | -0.066 |
ever | -0.066 |
free | -0.065 |
Sue | -0.063 |
Dove | -0.060 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
laptop | +0.146 |
arre | +0.145 |
homework | +0.144 |
dining | +0.141 |
apr | +0.141 |
Neg logit contributions | |
ever | -0.100 |
free | -0.095 |
of | -0.086 |
itself | -0.082 |
p | -0.081 |
Token | is |
Token ID | 318 |
Feature activation | -9.31e-03 |
Pos logit contributions | |
arre | +0.050 |
homework | +0.043 |
chores | +0.041 |
laptop | +0.041 |
apr | +0.040 |
Neg logit contributions | |
ever | -0.037 |
tow | -0.037 |
free | -0.035 |
Sue | -0.035 |
aroo | -0.033 |
Token | bad |
Token ID | 2089 |
Feature activation | -3.51e-02 |
Pos logit contributions | |
arre | +0.020 |
homework | +0.017 |
laptop | +0.016 |
apr | +0.016 |
chores | +0.016 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.012 |
free | -0.011 |
Sue | -0.011 |
pet | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | -1.11e-03 |
Pos logit contributions | |
arre | +0.083 |
homework | +0.072 |
apr | +0.071 |
chores | +0.070 |
laptop | +0.069 |
Neg logit contributions | |
ever | -0.039 |
tow | -0.034 |
Sue | -0.033 |
free | -0.032 |
pet | -0.029 |
Token | sharing |
Token ID | 7373 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
arre | +0.002 |
homework | +0.002 |
chores | +0.002 |
laptop | +0.002 |
apr | +0.002 |
Neg logit contributions | |
tow | -0.001 |
ever | -0.001 |
Sue | -0.001 |
free | -0.001 |
aroo | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
tow | +0.005 |
ever | +0.005 |
free | +0.005 |
aroo | +0.005 |
Sue | +0.005 |
Neg logit contributions | |
arre | -0.007 |
homework | -0.006 |
laptop | -0.006 |
chores | -0.006 |
apr | -0.005 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
arre | +0.028 |
homework | +0.024 |
laptop | +0.023 |
chores | +0.023 |
apr | +0.023 |
Neg logit contributions | |
ever | -0.008 |
Sue | -0.008 |
tow | -0.008 |
free | -0.007 |
pet | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
arre | +0.041 |
homework | +0.034 |
chores | +0.033 |
laptop | +0.032 |
jobs | +0.031 |
Neg logit contributions | |
tow | -0.028 |
ever | -0.025 |
aroo | -0.025 |
free | -0.023 |
Sue | -0.023 |
Token | stop |
Token ID | 2245 |
Feature activation | -5.75e-03 |
Pos logit contributions | |
arre | +0.025 |
homework | +0.021 |
chores | +0.021 |
laptop | +0.020 |
apr | +0.020 |
Neg logit contributions | |
ever | -0.015 |
tow | -0.015 |
Sue | -0.014 |
free | -0.014 |
aroo | -0.013 |
Token | qu |
Token ID | 627 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.010 |
laptop | +0.009 |
chores | +0.009 |
apr | +0.009 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.008 |
aroo | -0.007 |
Sue | -0.007 |
Dove | -0.007 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.52e-02 |
Pos logit contributions | |
homework | +0.024 |
apr | +0.021 |
chores | +0.020 |
ambul | +0.020 |
laptop | +0.020 |
Neg logit contributions | |
free | -0.072 |
tow | -0.070 |
ever | -0.069 |
Sue | -0.069 |
ak | -0.068 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
apr | +0.162 |
homework | +0.160 |
chores | +0.156 |
laptop | +0.153 |
arre | +0.150 |
Neg logit contributions | |
ever | -0.078 |
free | -0.078 |
p | -0.072 |
of | -0.067 |
fast | -0.066 |
Token | right |
Token ID | 826 |
Feature activation | -2.97e-03 |
Pos logit contributions | |
arre | +0.038 |
homework | +0.035 |
chores | +0.033 |
laptop | +0.033 |
apr | +0.033 |
Neg logit contributions | |
ever | -0.013 |
tow | -0.013 |
free | -0.012 |
Sue | -0.012 |
aroo | -0.010 |
Token | now |
Token ID | 783 |
Feature activation | -9.26e-03 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.002 |
Token | ! |
Token ID | 0 |
Feature activation | -9.23e-03 |
Pos logit contributions | |
arre | +0.022 |
homework | +0.020 |
chores | +0.019 |
laptop | +0.019 |
apr | +0.018 |
Neg logit contributions | |
tow | -0.010 |
ever | -0.009 |
Sue | -0.008 |
free | -0.008 |
aroo | -0.008 |
Token | Look |
Token ID | 6803 |
Feature activation | -6.94e-03 |
Pos logit contributions | |
arre | +0.018 |
laptop | +0.014 |
homework | +0.014 |
idents | +0.013 |
ambul | +0.013 |
Neg logit contributions | |
ever | -0.014 |
tow | -0.014 |
free | -0.014 |
swoop | -0.013 |
pet | -0.012 |
Token | other |
Token ID | 584 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.008 |
Dove | +0.007 |
Sue | +0.007 |
free | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.011 |
chores | -0.011 |
laptop | -0.010 |
tasks | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.042 |
chores | +0.041 |
laptop | +0.041 |
jobs | +0.039 |
Neg logit contributions | |
tow | -0.021 |
ever | -0.019 |
free | -0.018 |
Sue | -0.017 |
aroo | -0.017 |
Token | They |
Token ID | 1119 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
arre | +0.031 |
homework | +0.026 |
laptop | +0.025 |
idents | +0.025 |
apr | +0.024 |
Neg logit contributions | |
ever | -0.019 |
tow | -0.018 |
free | -0.017 |
swoop | -0.017 |
aroo | -0.016 |
Token | starting |
Token ID | 3599 |
Feature activation | -8.35e-03 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.043 |
chores | +0.041 |
laptop | +0.041 |
apr | +0.040 |
Neg logit contributions | |
ever | -0.026 |
tow | -0.025 |
free | -0.024 |
Sue | -0.023 |
pet | -0.022 |
Token | qu |
Token ID | 627 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.017 |
chores | +0.017 |
laptop | +0.016 |
apr | +0.016 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.009 |
free | -0.008 |
Sue | -0.008 |
pet | -0.007 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.49e-02 |
Pos logit contributions | |
homework | +0.007 |
laptop | +0.005 |
chores | +0.004 |
ambul | +0.002 |
arre | +0.002 |
Neg logit contributions | |
free | -0.075 |
tow | -0.073 |
ever | -0.073 |
Sue | -0.072 |
Sally | -0.070 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
homework | +0.160 |
laptop | +0.156 |
chores | +0.152 |
dining | +0.150 |
apr | +0.149 |
Neg logit contributions | |
ever | -0.082 |
free | -0.080 |
p | -0.067 |
of | -0.067 |
fast | -0.063 |
Token | again |
Token ID | 757 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.042 |
laptop | +0.041 |
chores | +0.040 |
apr | +0.040 |
Neg logit contributions | |
ever | -0.019 |
tow | -0.018 |
free | -0.017 |
Sue | -0.017 |
pet | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.032 |
chores | +0.031 |
laptop | +0.031 |
apr | +0.030 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.018 |
Sue | -0.017 |
aroo | -0.017 |
free | -0.016 |
Token | their |
Token ID | 511 |
Feature activation | -4.84e-03 |
Pos logit contributions | |
arre | +0.027 |
homework | +0.023 |
chores | +0.022 |
laptop | +0.022 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.016 |
ever | -0.016 |
Sue | -0.015 |
free | -0.015 |
aroo | -0.014 |
Token | voices |
Token ID | 10839 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.008 |
chores | +0.008 |
laptop | +0.008 |
apr | +0.008 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
Sally | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
arre | +0.061 |
homework | +0.054 |
chores | +0.052 |
laptop | +0.051 |
apr | +0.050 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.018 |
Sue | -0.018 |
free | -0.016 |
pet | -0.015 |
Token | mess |
Token ID | 2085 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
cuts | +0.003 |
ambul | +0.003 |
laptops | +0.003 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
free | -0.005 |
pet | -0.005 |
Sue | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -5.60e-03 |
Pos logit contributions | |
arre | +0.079 |
homework | +0.071 |
chores | +0.068 |
laptop | +0.068 |
apr | +0.066 |
Neg logit contributions | |
tow | -0.033 |
ever | -0.032 |
Sue | -0.029 |
free | -0.029 |
aroo | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
apr | +0.011 |
laptop | +0.011 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
pet | -0.004 |
Token | qu |
Token ID | 627 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
arre | +0.017 |
homework | +0.013 |
chores | +0.012 |
cuts | +0.012 |
ambul | +0.012 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.019 |
free | -0.018 |
Sue | -0.018 |
pet | -0.018 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.48e-02 |
Pos logit contributions | |
arre | +0.051 |
homework | +0.047 |
chores | +0.044 |
laptop | +0.043 |
apr | +0.042 |
Neg logit contributions | |
ever | -0.057 |
tow | -0.057 |
free | -0.055 |
Sue | -0.054 |
aroo | -0.051 |
Token | ling |
Token ID | 1359 |
Feature activation | -5.87e-03 |
Pos logit contributions | |
arre | +0.144 |
homework | +0.139 |
apr | +0.133 |
chores | +0.129 |
aj | +0.129 |
Neg logit contributions | |
ever | -0.096 |
free | -0.093 |
of | -0.088 |
p | -0.079 |
tow | -0.078 |
Token | twins |
Token ID | 20345 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
free | -0.008 |
Sue | -0.008 |
Dove | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +7.80e-04 |
Pos logit contributions | |
arre | +0.052 |
homework | +0.047 |
laptop | +0.046 |
chores | +0.046 |
apr | +0.042 |
Neg logit contributions | |
tow | -0.020 |
Sue | -0.018 |
ever | -0.018 |
aroo | -0.018 |
Dove | -0.017 |
Token | She |
Token ID | 1375 |
Feature activation | -4.75e-03 |
Pos logit contributions | |
tow | +0.001 |
Sue | +0.001 |
ever | +0.001 |
free | +0.000 |
Sally | +0.000 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.002 |
apr | -0.002 |
Token | is |
Token ID | 318 |
Feature activation | +1.08e-03 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.008 |
chores | +0.008 |
apr | +0.008 |
laptop | +0.007 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
pet | -0.006 |
Token | Why |
Token ID | 5195 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
ambul | +0.003 |
chores | +0.003 |
apr | +0.003 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.003 |
Sue | -0.003 |
aroo | -0.003 |
Token | are |
Token ID | 389 |
Feature activation | +8.90e-03 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.031 |
apr | +0.030 |
laptop | +0.029 |
chores | +0.029 |
Neg logit contributions | |
ever | -0.031 |
tow | -0.030 |
Sue | -0.029 |
free | -0.028 |
Sally | -0.027 |
Token | you |
Token ID | 345 |
Feature activation | -4.81e-03 |
Pos logit contributions | |
tow | +0.011 |
ever | +0.010 |
free | +0.009 |
Sue | +0.009 |
aroo | +0.009 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.018 |
chores | -0.017 |
laptop | -0.016 |
jobs | -0.016 |
Token | two |
Token ID | 734 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
ambul | +0.006 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.008 |
aroo | -0.007 |
Sue | -0.007 |
free | -0.007 |
Token | qu |
Token ID | 627 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.042 |
chores | +0.041 |
laptop | +0.038 |
jobs | +0.038 |
Neg logit contributions | |
tow | -0.036 |
aroo | -0.033 |
Sue | -0.032 |
ever | -0.032 |
Dove | -0.031 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.46e-02 |
Pos logit contributions | |
arre | +0.001 |
homework | -0.002 |
chores | -0.004 |
laptop | -0.005 |
apr | -0.006 |
Neg logit contributions | |
ever | -0.102 |
tow | -0.101 |
free | -0.100 |
Sue | -0.099 |
Sally | -0.097 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
homework | +0.130 |
arre | +0.129 |
apr | +0.129 |
laptop | +0.126 |
chores | +0.124 |
Neg logit contributions | |
ever | -0.102 |
free | -0.095 |
of | -0.084 |
p | -0.079 |
aroo | -0.078 |
Token | ? |
Token ID | 30 |
Feature activation | -7.71e-03 |
Pos logit contributions | |
arre | +0.045 |
homework | +0.039 |
chores | +0.038 |
laptop | +0.037 |
apr | +0.036 |
Neg logit contributions | |
tow | -0.031 |
ever | -0.030 |
free | -0.028 |
Sue | -0.028 |
aroo | -0.027 |
Token | There |
Token ID | 1318 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.011 |
laptop | +0.011 |
cuts | +0.010 |
means | +0.010 |
Neg logit contributions | |
ever | -0.012 |
tow | -0.012 |
free | -0.012 |
swoop | -0.012 |
Sue | -0.011 |
Token | are |
Token ID | 389 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
arre | +0.054 |
homework | +0.046 |
chores | +0.043 |
laptop | +0.042 |
jobs | +0.040 |
Neg logit contributions | |
tow | -0.054 |
ever | -0.053 |
free | -0.050 |
Sue | -0.050 |
aroo | -0.048 |
Token | plenty |
Token ID | 6088 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
jobs | +0.005 |
laptop | +0.005 |
Neg logit contributions | |
tow | -0.004 |
aroo | -0.004 |
ever | -0.004 |
Sue | -0.004 |
free | -0.004 |
Token | says |
Token ID | 1139 |
Feature activation | +3.21e-03 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.004 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
pet | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ever | +0.003 |
Sue | +0.003 |
tow | +0.002 |
free | +0.002 |
Sally | +0.002 |
Neg logit contributions | |
arre | -0.008 |
homework | -0.007 |
laptop | -0.007 |
apr | -0.007 |
chores | -0.007 |
Token | " |
Token ID | 366 |
Feature activation | -4.01e-04 |
Pos logit contributions | |
arre | +0.026 |
homework | +0.023 |
chores | +0.022 |
laptop | +0.022 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.011 |
ever | -0.011 |
Sue | -0.010 |
free | -0.010 |
aroo | -0.009 |
Token | Stop |
Token ID | 19485 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
arre | +0.001 |
homework | +0.001 |
chores | +0.001 |
laptop | +0.001 |
apr | +0.001 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
Sue | -0.000 |
free | -0.000 |
Dove | -0.000 |
Token | qu |
Token ID | 627 |
Feature activation | -2.56e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
laptop | +0.005 |
chores | +0.005 |
idents | +0.005 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.003 |
Sue | -0.003 |
aroo | -0.003 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.42e-02 |
Pos logit contributions | |
homework | +0.024 |
apr | +0.022 |
chores | +0.022 |
matt | +0.021 |
ambul | +0.021 |
Neg logit contributions | |
tow | -0.053 |
free | -0.053 |
Sue | -0.052 |
ever | -0.052 |
pet | -0.050 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
apr | +0.149 |
homework | +0.143 |
chores | +0.142 |
laptop | +0.141 |
arre | +0.139 |
Neg logit contributions | |
ever | -0.087 |
free | -0.083 |
p | -0.074 |
of | -0.070 |
fast | -0.068 |
Token | , |
Token ID | 11 |
Feature activation | -2.63e-03 |
Pos logit contributions | |
arre | +0.040 |
homework | +0.036 |
chores | +0.034 |
laptop | +0.034 |
apr | +0.034 |
Neg logit contributions | |
tow | -0.013 |
ever | -0.013 |
free | -0.011 |
Sue | -0.011 |
aroo | -0.010 |
Token | Tom |
Token ID | 4186 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
idents | +0.004 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.003 |
free | -0.003 |
aroo | -0.003 |
ull | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +5.94e-03 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.013 |
free | +0.012 |
aroo | +0.012 |
Sue | +0.012 |
Neg logit contributions | |
arre | -0.022 |
homework | -0.018 |
laptop | -0.018 |
chores | -0.018 |
obe | -0.017 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
tow | +0.005 |
ever | +0.005 |
free | +0.004 |
Sue | +0.004 |
aroo | +0.004 |
Neg logit contributions | |
arre | -0.015 |
homework | -0.014 |
chores | -0.013 |
laptop | -0.013 |
apr | -0.013 |
Token | said |
Token ID | 531 |
Feature activation | -4.47e-03 |
Pos logit contributions | |
tow | +0.021 |
ever | +0.021 |
free | +0.020 |
aroo | +0.019 |
Sue | +0.019 |
Neg logit contributions | |
arre | -0.027 |
homework | -0.022 |
laptop | -0.021 |
apr | -0.021 |
chores | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.010 |
laptop | +0.010 |
chores | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.004 |
Sue | -0.004 |
tow | -0.004 |
free | -0.003 |
Sally | -0.003 |
Token | " |
Token ID | 366 |
Feature activation | -6.17e-03 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.043 |
chores | +0.041 |
laptop | +0.041 |
apr | +0.040 |
Neg logit contributions | |
tow | -0.023 |
ever | -0.023 |
free | -0.021 |
Sue | -0.021 |
aroo | -0.019 |
Token | Stop |
Token ID | 19485 |
Feature activation | -6.52e-03 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.010 |
laptop | +0.010 |
apr | +0.009 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.009 |
free | -0.008 |
Sue | -0.008 |
aroo | -0.008 |
Token | qu |
Token ID | 627 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
laptop | +0.009 |
chores | +0.009 |
idents | +0.009 |
Neg logit contributions | |
tow | -0.011 |
ever | -0.010 |
Sue | -0.009 |
free | -0.009 |
aroo | -0.009 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.31e-02 |
Pos logit contributions | |
homework | +0.004 |
arre | +0.002 |
laptop | +0.002 |
chores | +0.002 |
apr | +0.001 |
Neg logit contributions | |
tow | -0.068 |
free | -0.067 |
ever | -0.067 |
Sue | -0.066 |
Sally | -0.065 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
homework | +0.139 |
apr | +0.138 |
laptop | +0.135 |
chores | +0.134 |
dining | +0.133 |
Neg logit contributions | |
ever | -0.087 |
free | -0.086 |
p | -0.074 |
of | -0.072 |
fast | -0.069 |
Token | , |
Token ID | 11 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.043 |
chores | +0.042 |
laptop | +0.041 |
apr | +0.041 |
Neg logit contributions | |
ever | -0.018 |
tow | -0.018 |
free | -0.017 |
Sue | -0.017 |
aroo | -0.015 |
Token | boys |
Token ID | 6510 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
arre | +0.046 |
homework | +0.040 |
chores | +0.039 |
laptop | +0.038 |
idents | +0.037 |
Neg logit contributions | |
tow | -0.022 |
ever | -0.021 |
free | -0.019 |
aroo | -0.018 |
Sue | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +5.38e-03 |
Pos logit contributions | |
arre | +0.059 |
homework | +0.051 |
laptop | +0.049 |
chores | +0.049 |
jobs | +0.047 |
Neg logit contributions | |
tow | -0.030 |
ever | -0.026 |
aroo | -0.026 |
free | -0.025 |
Dove | -0.025 |
Token | You |
Token ID | 921 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
ever | +0.008 |
tow | +0.008 |
free | +0.008 |
swoop | +0.007 |
Sue | +0.007 |
Neg logit contributions | |
arre | -0.010 |
homework | -0.008 |
laptop | -0.008 |
chores | -0.008 |
cuts | -0.008 |
Token | " |
Token ID | 366 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
tow | +0.008 |
free | +0.007 |
ever | +0.007 |
pet | +0.007 |
swoop | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.011 |
chores | -0.011 |
ambul | -0.010 |
laptop | -0.010 |
Token | Why |
Token ID | 5195 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.006 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
aroo | -0.005 |
Token | are |
Token ID | 389 |
Feature activation | +7.20e-03 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.027 |
apr | +0.027 |
laptop | +0.026 |
chores | +0.026 |
Neg logit contributions | |
ever | -0.027 |
tow | -0.026 |
Sue | -0.025 |
free | -0.024 |
Sally | -0.023 |
Token | you |
Token ID | 345 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.007 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.015 |
chores | -0.014 |
laptop | -0.014 |
apr | -0.014 |
Token | qu |
Token ID | 627 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
aroo | -0.006 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.29e-02 |
Pos logit contributions | |
homework | +0.005 |
arre | +0.004 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.002 |
Neg logit contributions | |
ever | -0.067 |
free | -0.066 |
tow | -0.066 |
Sue | -0.066 |
Sally | -0.064 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
apr | +0.135 |
arre | +0.134 |
homework | +0.134 |
laptop | +0.133 |
chores | +0.131 |
Neg logit contributions | |
ever | -0.090 |
free | -0.085 |
p | -0.074 |
of | -0.073 |
fast | -0.069 |
Token | ? |
Token ID | 30 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.041 |
chores | +0.039 |
laptop | +0.039 |
apr | +0.038 |
Neg logit contributions | |
ever | -0.030 |
tow | -0.030 |
Sue | -0.029 |
free | -0.028 |
aroo | -0.026 |
Token | You |
Token ID | 921 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
ever | +0.002 |
free | +0.002 |
tow | +0.002 |
swoop | +0.002 |
pet | +0.002 |
Neg logit contributions | |
arre | -0.002 |
laptop | -0.002 |
homework | -0.002 |
means | -0.002 |
cuts | -0.002 |
Token | can |
Token ID | 460 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.032 |
chores | +0.030 |
laptop | +0.030 |
jobs | +0.029 |
Neg logit contributions | |
tow | -0.030 |
ever | -0.028 |
Sue | -0.027 |
free | -0.026 |
aroo | -0.026 |
Token | share |
Token ID | 2648 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ull | +0.015 |
tow | +0.015 |
itself | +0.014 |
Sage | +0.014 |
Frank | +0.014 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.017 |
chores | -0.017 |
laptop | -0.014 |
argue | -0.014 |
Token | ? |
Token ID | 30 |
Feature activation | -9.71e-03 |
Pos logit contributions | |
arre | +0.017 |
homework | +0.014 |
chores | +0.013 |
laptop | +0.013 |
apr | +0.013 |
Neg logit contributions | |
tow | -0.018 |
ever | -0.017 |
free | -0.017 |
Sue | -0.017 |
aroo | -0.016 |
Token | Why |
Token ID | 4162 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
arre | +0.018 |
homework | +0.015 |
chores | +0.015 |
laptop | +0.014 |
apr | +0.014 |
Neg logit contributions | |
tow | -0.015 |
ever | -0.015 |
Sue | -0.014 |
free | -0.014 |
aroo | -0.013 |
Token | are |
Token ID | 389 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
arre | +0.037 |
apr | +0.032 |
homework | +0.031 |
laptop | +0.031 |
laptops | +0.030 |
Neg logit contributions | |
ever | -0.022 |
Sue | -0.021 |
tow | -0.020 |
Sally | -0.018 |
free | -0.018 |
Token | you |
Token ID | 345 |
Feature activation | -7.40e-04 |
Pos logit contributions | |
ever | +0.008 |
tow | +0.008 |
Sue | +0.007 |
free | +0.007 |
aroo | +0.007 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.017 |
chores | -0.016 |
laptop | -0.016 |
apr | -0.016 |
Token | qu |
Token ID | 627 |
Feature activation | -2.92e-02 |
Pos logit contributions | |
arre | +0.001 |
homework | +0.001 |
chores | +0.001 |
laptop | +0.001 |
apr | +0.001 |
Neg logit contributions | |
ever | -0.001 |
tow | -0.001 |
free | -0.001 |
Sue | -0.001 |
pet | -0.001 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.28e-02 |
Pos logit contributions | |
homework | +0.008 |
ambul | +0.006 |
chores | +0.006 |
nurses | +0.006 |
matt | +0.005 |
Neg logit contributions | |
free | -0.077 |
ever | -0.077 |
tow | -0.077 |
ak | -0.075 |
Sue | -0.075 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
apr | +0.135 |
homework | +0.134 |
chores | +0.131 |
laptop | +0.130 |
arre | +0.130 |
Neg logit contributions | |
ever | -0.088 |
free | -0.085 |
of | -0.077 |
p | -0.073 |
ull | -0.069 |
Token | with |
Token ID | 351 |
Feature activation | -5.23e-03 |
Pos logit contributions | |
arre | +0.036 |
homework | +0.032 |
chores | +0.030 |
apr | +0.030 |
laptop | +0.029 |
Neg logit contributions | |
ever | -0.025 |
tow | -0.024 |
Sue | -0.023 |
free | -0.023 |
Sally | -0.021 |
Token | your |
Token ID | 534 |
Feature activation | -6.14e-03 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.009 |
apr | +0.009 |
laptop | +0.008 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
aroo | -0.007 |
Zip | -0.007 |
free | -0.006 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.009 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.008 |
Neg logit contributions | |
tow | -0.010 |
ever | -0.010 |
free | -0.009 |
Sue | -0.009 |
pet | -0.009 |
Token | ? |
Token ID | 30 |
Feature activation | -5.78e-03 |
Pos logit contributions | |
arre | +0.025 |
homework | +0.022 |
chores | +0.021 |
apr | +0.021 |
laptop | +0.021 |
Neg logit contributions | |
ever | -0.015 |
tow | -0.014 |
Sue | -0.013 |
free | -0.013 |
pet | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
arre | +0.066 |
homework | +0.058 |
chores | +0.056 |
laptop | +0.056 |
apr | +0.055 |
Neg logit contributions | |
ever | -0.021 |
tow | -0.021 |
Sue | -0.018 |
free | -0.018 |
aroo | -0.016 |
Token | story |
Token ID | 1621 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
arre | +0.035 |
apr | +0.029 |
homework | +0.028 |
laptop | +0.027 |
tant | +0.027 |
Neg logit contributions | |
ever | -0.031 |
tow | -0.031 |
free | -0.028 |
squirrel | -0.028 |
Sue | -0.028 |
Token | is |
Token ID | 318 |
Feature activation | -2.88e-03 |
Pos logit contributions | |
arre | +0.060 |
apr | +0.058 |
chores | +0.053 |
homework | +0.052 |
laptop | +0.051 |
Neg logit contributions | |
ever | -0.038 |
Sue | -0.032 |
tow | -0.032 |
of | -0.029 |
free | -0.028 |
Token | : |
Token ID | 25 |
Feature activation | -2.76e-02 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
jobs | +0.006 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.002 |
Token | Qu |
Token ID | 2264 |
Feature activation | -9.93e-03 |
Pos logit contributions | |
arre | +0.053 |
homework | +0.046 |
chores | +0.044 |
laptop | +0.042 |
jobs | +0.041 |
Neg logit contributions | |
tow | -0.039 |
ever | -0.038 |
Sue | -0.037 |
free | -0.037 |
aroo | -0.035 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.24e-02 |
Pos logit contributions | |
arre | +0.016 |
homework | +0.014 |
chores | +0.013 |
laptop | +0.013 |
apr | +0.013 |
Neg logit contributions | |
tow | -0.017 |
ever | -0.017 |
free | -0.016 |
Sue | -0.016 |
aroo | -0.015 |
Token | lling |
Token ID | 2680 |
Feature activation | -4.13e-02 |
Pos logit contributions | |
laptop | +0.133 |
homework | +0.132 |
apr | +0.131 |
arre | +0.131 |
chores | +0.126 |
Neg logit contributions | |
ever | -0.099 |
free | -0.090 |
of | -0.087 |
ull | -0.080 |
its | -0.079 |
Token | over |
Token ID | 625 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
arre | +0.071 |
homework | +0.060 |
chores | +0.057 |
laptop | +0.056 |
apr | +0.054 |
Neg logit contributions | |
tow | -0.068 |
ever | -0.067 |
Sue | -0.063 |
free | -0.063 |
aroo | -0.060 |
Token | small |
Token ID | 1402 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
arre | +0.032 |
homework | +0.028 |
chores | +0.027 |
laptop | +0.026 |
jobs | +0.026 |
Neg logit contributions | |
tow | -0.023 |
ever | -0.021 |
Sue | -0.020 |
aroo | -0.020 |
free | -0.020 |
Token | things |
Token ID | 1243 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.028 |
chores | +0.026 |
apr | +0.026 |
laptop | +0.026 |
Neg logit contributions | |
ever | -0.033 |
tow | -0.032 |
free | -0.031 |
Sue | -0.030 |
pet | -0.029 |
Token | is |
Token ID | 318 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
arre | +0.054 |
homework | +0.047 |
chores | +0.045 |
laptop | +0.043 |
jobs | +0.042 |
Neg logit contributions | |
tow | -0.039 |
Sue | -0.036 |
ever | -0.036 |
free | -0.034 |
aroo | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
tow | +0.003 |
free | +0.002 |
aroo | +0.002 |
Dove | +0.002 |
ever | +0.002 |
Neg logit contributions | |
arre | -0.005 |
homework | -0.005 |
chores | -0.004 |
laptop | -0.004 |
jobs | -0.004 |
Token | They |
Token ID | 1119 |
Feature activation | +1.31e-04 |
Pos logit contributions | |
ever | +0.019 |
free | +0.017 |
tow | +0.017 |
swoop | +0.016 |
aroo | +0.016 |
Neg logit contributions | |
arre | -0.027 |
homework | -0.022 |
laptop | -0.022 |
apr | -0.021 |
ambul | -0.021 |
Token | had |
Token ID | 550 |
Feature activation | +9.89e-05 |
Pos logit contributions | |
tow | +0.000 |
ever | +0.000 |
aroo | +0.000 |
free | +0.000 |
Sue | +0.000 |
Neg logit contributions | |
arre | -0.000 |
homework | -0.000 |
chores | -0.000 |
apr | -0.000 |
laptop | -0.000 |
Token | stopped |
Token ID | 5025 |
Feature activation | +2.20e-04 |
Pos logit contributions | |
tow | +0.000 |
aroo | +0.000 |
ever | +0.000 |
Sue | +0.000 |
free | +0.000 |
Neg logit contributions | |
arre | -0.000 |
homework | -0.000 |
chores | -0.000 |
apr | -0.000 |
laptop | -0.000 |
Token | qu |
Token ID | 627 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
tow | +0.000 |
ever | +0.000 |
free | +0.000 |
Sue | +0.000 |
aroo | +0.000 |
Neg logit contributions | |
arre | -0.000 |
homework | -0.000 |
chores | -0.000 |
laptop | -0.000 |
apr | -0.000 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.14e-02 |
Pos logit contributions | |
arre | +0.003 |
homework | +0.002 |
chores | +0.001 |
laptop | +0.001 |
apr | +0.000 |
Neg logit contributions | |
tow | -0.035 |
ever | -0.035 |
free | -0.035 |
Sue | -0.034 |
pet | -0.033 |
Token | ling |
Token ID | 1359 |
Feature activation | -7.47e-03 |
Pos logit contributions | |
homework | +0.142 |
laptop | +0.138 |
chores | +0.136 |
apr | +0.135 |
arre | +0.132 |
Neg logit contributions | |
ever | -0.085 |
free | -0.080 |
p | -0.065 |
fast | -0.065 |
of | -0.065 |
Token | . |
Token ID | 13 |
Feature activation | +5.83e-03 |
Pos logit contributions | |
arre | +0.018 |
homework | +0.016 |
chores | +0.015 |
laptop | +0.015 |
apr | +0.015 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
free | -0.006 |
Sue | -0.006 |
aroo | -0.006 |
Token | To |
Token ID | 1675 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
ever | +0.008 |
swoop | +0.007 |
free | +0.007 |
aroo | +0.007 |
tow | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.010 |
laptop | -0.010 |
apr | -0.010 |
laptops | -0.009 |
Token | celebrate |
Token ID | 10648 |
Feature activation | -7.04e-03 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
aroo | +0.002 |
free | +0.002 |
Dove | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.002 |
apr | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | -2.18e-04 |
Pos logit contributions | |
arre | +0.017 |
homework | +0.015 |
chores | +0.014 |
laptop | +0.014 |
apr | +0.014 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.006 |
Sue | -0.006 |
free | -0.006 |
Sally | -0.005 |
Token | Please |
Token ID | 5492 |
Feature activation | +1.30e-04 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.011 |
apr | +0.011 |
ambul | +0.011 |
chores | +0.011 |
Neg logit contributions | |
tow | -0.011 |
Sue | -0.010 |
ever | -0.010 |
free | -0.010 |
Sally | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -6.44e-03 |
Pos logit contributions | |
tow | +0.000 |
ever | +0.000 |
Sue | +0.000 |
aroo | +0.000 |
free | +0.000 |
Neg logit contributions | |
arre | -0.000 |
homework | -0.000 |
chores | -0.000 |
laptop | -0.000 |
jobs | -0.000 |
Token | no |
Token ID | 645 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.012 |
chores | +0.012 |
laptop | +0.012 |
ambul | +0.011 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.007 |
free | -0.007 |
Sue | -0.007 |
Dove | -0.007 |
Token | more |
Token ID | 517 |
Feature activation | +2.61e-03 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.022 |
chores | +0.022 |
jobs | +0.021 |
ambul | +0.021 |
Neg logit contributions | |
tow | -0.013 |
ever | -0.012 |
free | -0.012 |
Sue | -0.012 |
aroo | -0.011 |
Token | qu |
Token ID | 627 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
tow | +0.003 |
ever | +0.003 |
Sue | +0.003 |
Dove | +0.003 |
Zip | +0.003 |
Neg logit contributions | |
arre | -0.005 |
homework | -0.005 |
chores | -0.005 |
laptop | -0.005 |
jobs | -0.005 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.05e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.008 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.005 |
Neg logit contributions | |
ever | -0.069 |
tow | -0.069 |
free | -0.067 |
Sue | -0.066 |
aroo | -0.064 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
arre | +0.121 |
homework | +0.112 |
apr | +0.109 |
laptop | +0.107 |
chores | +0.105 |
Neg logit contributions | |
ever | -0.112 |
free | -0.104 |
aroo | -0.095 |
tow | -0.095 |
swoop | -0.092 |
Token | ! |
Token ID | 0 |
Feature activation | -3.57e-03 |
Pos logit contributions | |
arre | +0.046 |
homework | +0.040 |
chores | +0.039 |
laptop | +0.038 |
jobs | +0.037 |
Neg logit contributions | |
tow | -0.020 |
ever | -0.018 |
Sue | -0.017 |
free | -0.017 |
aroo | -0.016 |
Token | Let |
Token ID | 3914 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
arre | +0.007 |
laptop | +0.006 |
homework | +0.006 |
ambul | +0.006 |
cuts | +0.006 |
Neg logit contributions | |
ever | -0.005 |
free | -0.004 |
tow | -0.004 |
swoop | -0.004 |
Sue | -0.004 |
Token | 's |
Token ID | 338 |
Feature activation | -5.57e-03 |
Pos logit contributions | |
arre | +0.035 |
homework | +0.030 |
laptop | +0.029 |
apr | +0.028 |
chores | +0.028 |
Neg logit contributions | |
ever | -0.032 |
tow | -0.032 |
free | -0.031 |
Sue | -0.031 |
pet | -0.029 |
Token | find |
Token ID | 1064 |
Feature activation | -3.35e-04 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.010 |
chores | +0.010 |
jobs | +0.009 |
laptop | +0.009 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.007 |
aroo | -0.007 |
free | -0.006 |
Token | They |
Token ID | 2990 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
ever | +0.005 |
tow | +0.005 |
Sue | +0.004 |
free | +0.004 |
Sally | +0.004 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.005 |
laptop | -0.005 |
chores | -0.005 |
apr | -0.005 |
Token | are |
Token ID | 389 |
Feature activation | -2.59e-03 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.041 |
chores | +0.039 |
laptop | +0.039 |
apr | +0.038 |
Neg logit contributions | |
tow | -0.025 |
ever | -0.024 |
free | -0.023 |
Sue | -0.022 |
pet | -0.021 |
Token | tired |
Token ID | 10032 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.004 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.003 |
aroo | -0.003 |
swoop | -0.003 |
Sue | -0.003 |
Token | from |
Token ID | 422 |
Feature activation | -2.85e-04 |
Pos logit contributions | |
arre | +0.036 |
homework | +0.032 |
chores | +0.031 |
laptop | +0.031 |
apr | +0.030 |
Neg logit contributions | |
tow | -0.017 |
ever | -0.016 |
Sue | -0.015 |
free | -0.015 |
aroo | -0.015 |
Token | qu |
Token ID | 627 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
arre | +0.001 |
homework | +0.001 |
chores | +0.000 |
laptop | +0.000 |
apr | +0.000 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
aroo | -0.000 |
free | -0.000 |
swoop | -0.000 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.04e-02 |
Pos logit contributions | |
homework | +0.031 |
arre | +0.030 |
laptop | +0.029 |
apr | +0.028 |
ambul | +0.028 |
Neg logit contributions | |
tow | -0.042 |
free | -0.042 |
ever | -0.041 |
Sue | -0.040 |
pet | -0.039 |
Token | ling |
Token ID | 1359 |
Feature activation | -3.58e-03 |
Pos logit contributions | |
apr | +0.150 |
arre | +0.149 |
homework | +0.147 |
laptop | +0.145 |
riger | +0.143 |
Neg logit contributions | |
ever | -0.072 |
free | -0.069 |
p | -0.063 |
of | -0.062 |
fast | -0.058 |
Token | . |
Token ID | 13 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.008 |
laptop | +0.008 |
apr | +0.008 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.002 |
Token | They |
Token ID | 1119 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
ever | +0.013 |
tow | +0.012 |
free | +0.012 |
aroo | +0.011 |
swoop | +0.011 |
Neg logit contributions | |
arre | -0.022 |
homework | -0.019 |
laptop | -0.019 |
chores | -0.019 |
apr | -0.018 |
Token | sit |
Token ID | 1650 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
arre | +0.049 |
homework | +0.043 |
laptop | +0.041 |
chores | +0.041 |
apr | +0.040 |
Neg logit contributions | |
tow | -0.029 |
ever | -0.029 |
free | -0.027 |
Sue | -0.027 |
pet | -0.025 |
Token | in |
Token ID | 287 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
tow | +0.003 |
ever | +0.003 |
free | +0.002 |
Sue | +0.002 |
aroo | +0.002 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.005 |
chores | -0.005 |
laptop | -0.005 |
apr | -0.005 |
Token | listen |
Token ID | 6004 |
Feature activation | -3.42e-03 |
Pos logit contributions | |
arre | +0.028 |
homework | +0.024 |
chores | +0.023 |
laptop | +0.022 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.022 |
ever | -0.021 |
free | -0.020 |
Sue | -0.020 |
aroo | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +2.36e-03 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
laptop | +0.008 |
chores | +0.008 |
apr | +0.008 |
Neg logit contributions | |
ever | -0.002 |
tow | -0.002 |
Sue | -0.002 |
free | -0.002 |
pet | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | +6.25e-03 |
Pos logit contributions | |
tow | +0.002 |
Sue | +0.002 |
ever | +0.001 |
free | +0.001 |
Sally | +0.001 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.006 |
chores | -0.005 |
laptop | -0.005 |
apr | -0.005 |
Token | kept |
Token ID | 4030 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
tow | +0.010 |
ever | +0.009 |
free | +0.009 |
aroo | +0.009 |
Sue | +0.009 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.009 |
chores | -0.009 |
apr | -0.009 |
laptop | -0.009 |
Token | qu |
Token ID | 627 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
arre | +0.020 |
homework | +0.018 |
chores | +0.017 |
laptop | +0.017 |
apr | +0.016 |
Neg logit contributions | |
tow | -0.014 |
ever | -0.014 |
free | -0.013 |
Sue | -0.013 |
aroo | -0.013 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.03e-02 |
Pos logit contributions | |
homework | +0.010 |
laptop | +0.008 |
ambul | +0.008 |
chores | +0.007 |
nurses | +0.007 |
Neg logit contributions | |
free | -0.054 |
tow | -0.053 |
ever | -0.053 |
Sue | -0.052 |
ak | -0.052 |
Token | ling |
Token ID | 1359 |
Feature activation | -8.31e-03 |
Pos logit contributions | |
homework | +0.148 |
apr | +0.146 |
dining | +0.145 |
arre | +0.144 |
laptop | +0.144 |
Neg logit contributions | |
free | -0.072 |
ever | -0.070 |
p | -0.065 |
fast | -0.062 |
of | -0.061 |
Token | with |
Token ID | 351 |
Feature activation | -9.91e-03 |
Pos logit contributions | |
arre | +0.021 |
homework | +0.019 |
laptop | +0.018 |
chores | +0.018 |
apr | +0.018 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.007 |
free | -0.006 |
Sue | -0.006 |
pet | -0.006 |
Token | their |
Token ID | 511 |
Feature activation | +1.40e-03 |
Pos logit contributions | |
arre | +0.020 |
homework | +0.018 |
chores | +0.018 |
apr | +0.017 |
laptop | +0.017 |
Neg logit contributions | |
ever | -0.013 |
tow | -0.013 |
Sue | -0.011 |
free | -0.011 |
aroo | -0.011 |
Token | mom |
Token ID | 1995 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.001 |
Sue | +0.001 |
aroo | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
chores | -0.003 |
laptop | -0.003 |
apr | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -2.82e-03 |
Pos logit contributions | |
tow | +0.003 |
ever | +0.003 |
free | +0.002 |
Sue | +0.002 |
aroo | +0.002 |
Neg logit contributions | |
arre | -0.010 |
homework | -0.009 |
chores | -0.009 |
laptop | -0.009 |
apr | -0.008 |
Token | bad |
Token ID | 2089 |
Feature activation | -2.63e-02 |
Pos logit contributions | |
arre | +0.036 |
homework | +0.031 |
chores | +0.030 |
laptop | +0.029 |
apr | +0.029 |
Neg logit contributions | |
tow | -0.025 |
ever | -0.025 |
free | -0.024 |
Sue | -0.024 |
aroo | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | +7.54e-03 |
Pos logit contributions | |
arre | +0.063 |
apr | +0.058 |
homework | +0.057 |
chores | +0.056 |
laptops | +0.055 |
Neg logit contributions | |
ever | -0.027 |
Sue | -0.023 |
free | -0.022 |
tow | -0.021 |
Sally | -0.020 |
Token | apologized |
Token ID | 22893 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
tow | +0.011 |
ever | +0.011 |
aroo | +0.010 |
free | +0.010 |
Sue | +0.009 |
Neg logit contributions | |
arre | -0.014 |
homework | -0.012 |
chores | -0.011 |
laptop | -0.011 |
nurses | -0.011 |
Token | for |
Token ID | 329 |
Feature activation | -9.97e-03 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.029 |
laptop | +0.029 |
apr | +0.029 |
laptops | +0.029 |
Neg logit contributions | |
ever | -0.008 |
Sue | -0.007 |
free | -0.007 |
Sally | -0.006 |
pet | -0.006 |
Token | qu |
Token ID | 627 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.015 |
chores | +0.014 |
ambul | +0.013 |
laptop | +0.013 |
Neg logit contributions | |
tow | -0.017 |
ever | -0.016 |
aroo | -0.016 |
oe | -0.015 |
Dove | -0.015 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.03e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.008 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.005 |
Neg logit contributions | |
tow | -0.064 |
ever | -0.063 |
free | -0.062 |
Sue | -0.062 |
aroo | -0.060 |
Token | ling |
Token ID | 1359 |
Feature activation | -5.60e-03 |
Pos logit contributions | |
apr | +0.143 |
homework | +0.141 |
laptop | +0.140 |
arre | +0.139 |
chores | +0.138 |
Neg logit contributions | |
ever | -0.082 |
free | -0.076 |
p | -0.070 |
of | -0.068 |
its | -0.063 |
Token | . |
Token ID | 13 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.013 |
chores | +0.013 |
laptop | +0.013 |
apr | +0.012 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
free | -0.004 |
Sue | -0.003 |
aroo | -0.003 |
Token | " |
Token ID | 366 |
Feature activation | -1.07e-03 |
Pos logit contributions | |
arre | +0.028 |
idents | +0.023 |
homework | +0.022 |
chores | +0.021 |
laptop | +0.021 |
Neg logit contributions | |
tow | -0.020 |
ever | -0.019 |
aroo | -0.017 |
free | -0.017 |
swoop | -0.017 |
Token | I |
Token ID | 40 |
Feature activation | -7.16e-03 |
Pos logit contributions | |
arre | +0.002 |
homework | +0.002 |
chores | +0.002 |
apr | +0.002 |
narrative | +0.002 |
Neg logit contributions | |
tow | -0.001 |
free | -0.001 |
ever | -0.001 |
Sue | -0.001 |
pet | -0.001 |
Token | 'm |
Token ID | 1101 |
Feature activation | +5.26e-03 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.013 |
laptop | +0.013 |
apr | +0.013 |
chores | +0.013 |
Neg logit contributions | |
ever | -0.010 |
tow | -0.009 |
free | -0.008 |
Sue | -0.008 |
pet | -0.008 |
Token | told |
Token ID | 1297 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
arre | +0.003 |
homework | +0.002 |
chores | +0.002 |
laptop | +0.002 |
apr | +0.002 |
Neg logit contributions | |
tow | -0.001 |
ever | -0.001 |
Sue | -0.001 |
free | -0.001 |
pet | -0.001 |
Token | them |
Token ID | 606 |
Feature activation | -1.78e-03 |
Pos logit contributions | |
arre | +0.038 |
homework | +0.034 |
chores | +0.032 |
laptop | +0.032 |
apr | +0.032 |
Neg logit contributions | |
tow | -0.014 |
ever | -0.014 |
Sue | -0.013 |
free | -0.013 |
aroo | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | -6.59e-03 |
Pos logit contributions | |
arre | +0.004 |
apr | +0.004 |
laptop | +0.004 |
homework | +0.004 |
laptops | +0.004 |
Neg logit contributions | |
ever | -0.002 |
Sue | -0.002 |
tow | -0.001 |
Sally | -0.001 |
free | -0.001 |
Token | stop |
Token ID | 2245 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.012 |
chores | +0.011 |
jobs | +0.011 |
laptop | +0.011 |
Neg logit contributions | |
tow | -0.009 |
aroo | -0.008 |
ever | -0.008 |
Dove | -0.008 |
free | -0.008 |
Token | qu |
Token ID | 627 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
arre | +0.029 |
homework | +0.025 |
chores | +0.024 |
laptop | +0.023 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.023 |
ever | -0.021 |
aroo | -0.020 |
Dove | -0.020 |
free | -0.020 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.02e-02 |
Pos logit contributions | |
homework | +0.011 |
laptop | +0.009 |
chores | +0.009 |
arre | +0.008 |
ambul | +0.008 |
Neg logit contributions | |
free | -0.059 |
tow | -0.059 |
Sue | -0.059 |
ever | -0.058 |
pet | -0.057 |
Token | lling |
Token ID | 2680 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
homework | +0.148 |
apr | +0.148 |
laptop | +0.147 |
dining | +0.146 |
aj | +0.146 |
Neg logit contributions | |
free | -0.065 |
ever | -0.063 |
p | -0.059 |
fast | -0.053 |
of | -0.050 |
Token | and |
Token ID | 290 |
Feature activation | -9.79e-03 |
Pos logit contributions | |
arre | +0.065 |
homework | +0.059 |
chores | +0.057 |
laptop | +0.056 |
apr | +0.056 |
Neg logit contributions | |
ever | -0.017 |
tow | -0.017 |
free | -0.015 |
Sue | -0.015 |
aroo | -0.013 |
Token | to |
Token ID | 284 |
Feature activation | -6.27e-03 |
Pos logit contributions | |
arre | +0.020 |
homework | +0.018 |
chores | +0.017 |
laptop | +0.017 |
jobs | +0.016 |
Neg logit contributions | |
tow | -0.013 |
ever | -0.012 |
aroo | -0.011 |
free | -0.011 |
Sue | -0.011 |
Token | share |
Token ID | 2648 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.011 |
chores | +0.011 |
jobs | +0.010 |
apr | +0.010 |
Neg logit contributions | |
tow | -0.009 |
aroo | -0.009 |
ever | -0.008 |
Dove | -0.008 |
free | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +3.83e-03 |
Pos logit contributions | |
tow | +0.016 |
ever | +0.015 |
aroo | +0.014 |
free | +0.013 |
swoop | +0.013 |
Neg logit contributions | |
arre | -0.030 |
homework | -0.028 |
chores | -0.027 |
apr | -0.026 |
laptop | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
arre | +0.091 |
homework | +0.080 |
chores | +0.077 |
laptop | +0.077 |
apr | +0.075 |
Neg logit contributions | |
tow | -0.043 |
ever | -0.042 |
free | -0.039 |
Sue | -0.039 |
aroo | -0.036 |
Token | you |
Token ID | 345 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
arre | +0.022 |
homework | +0.020 |
chores | +0.019 |
tasks | +0.019 |
jobs | +0.019 |
Neg logit contributions | |
tow | -0.014 |
aroo | -0.012 |
ever | -0.012 |
free | -0.012 |
Sue | -0.012 |
Token | can |
Token ID | 460 |
Feature activation | +9.46e-04 |
Pos logit contributions | |
arre | +0.032 |
homework | +0.027 |
chores | +0.026 |
laptop | +0.026 |
apr | +0.025 |
Neg logit contributions | |
tow | -0.028 |
ever | -0.028 |
free | -0.026 |
Sue | -0.026 |
aroo | -0.025 |
Token | help |
Token ID | 1037 |
Feature activation | -3.31e-02 |
Pos logit contributions | |
tow | +0.001 |
Sue | +0.001 |
ever | +0.001 |
aroo | +0.001 |
free | +0.001 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.001 |
jobs | -0.001 |
Token | prevent |
Token ID | 2948 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
arre | +0.064 |
homework | +0.058 |
chores | +0.057 |
tasks | +0.054 |
jobs | +0.054 |
Neg logit contributions | |
tow | -0.049 |
aroo | -0.044 |
Sue | -0.043 |
ever | -0.043 |
Zip | -0.040 |
Token | wasteful |
Token ID | 45393 |
Feature activation | -6.99e-02 |
Pos logit contributions | |
arre | +0.070 |
homework | +0.063 |
chores | +0.063 |
jobs | +0.059 |
tasks | +0.058 |
Neg logit contributions | |
tow | -0.050 |
ever | -0.043 |
aroo | -0.042 |
Sue | -0.041 |
Zip | -0.039 |
Token | things |
Token ID | 1243 |
Feature activation | -2.87e-02 |
Pos logit contributions | |
arre | +0.188 |
apr | +0.168 |
homework | +0.168 |
laptops | +0.166 |
laptop | +0.164 |
Neg logit contributions | |
ever | -0.042 |
free | -0.038 |
Sue | -0.031 |
itself | -0.030 |
it | -0.028 |
Token | from |
Token ID | 422 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
arre | +0.062 |
homework | +0.055 |
chores | +0.053 |
laptop | +0.052 |
apr | +0.052 |
Neg logit contributions | |
ever | -0.034 |
tow | -0.033 |
free | -0.032 |
Sue | -0.031 |
aroo | -0.028 |
Token | happening |
Token ID | 5836 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
arre | +0.040 |
homework | +0.035 |
chores | +0.034 |
jobs | +0.031 |
laptop | +0.031 |
Neg logit contributions | |
tow | -0.044 |
ever | -0.040 |
Sue | -0.040 |
aroo | -0.039 |
Zip | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | +5.46e-03 |
Pos logit contributions | |
arre | +0.052 |
homework | +0.045 |
chores | +0.044 |
laptop | +0.043 |
jobs | +0.042 |
Neg logit contributions | |
tow | -0.025 |
Sue | -0.021 |
ever | -0.021 |
aroo | -0.021 |
Dove | -0.019 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
free | +0.006 |
ever | +0.006 |
tow | +0.006 |
swoop | +0.005 |
aroo | +0.005 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.010 |
chores | -0.010 |
laptop | -0.010 |
ambul | -0.010 |
Token | walking |
Token ID | 6155 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.008 |
laptop | +0.008 |
chores | +0.008 |
laptops | +0.007 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.007 |
aroo | -0.007 |
Dove | -0.007 |
free | -0.007 |
Token | by |
Token ID | 416 |
Feature activation | -2.49e-03 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.013 |
free | +0.012 |
Sue | +0.012 |
aroo | +0.012 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.021 |
chores | -0.020 |
laptop | -0.020 |
apr | -0.019 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.005 |
laptop | +0.004 |
chores | +0.004 |
jobs | +0.004 |
Neg logit contributions | |
tow | -0.003 |
aroo | -0.003 |
Dove | -0.003 |
ever | -0.003 |
free | -0.003 |
Token | them |
Token ID | 606 |
Feature activation | -2.47e-04 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.030 |
chores | +0.029 |
apr | +0.028 |
ambul | +0.028 |
Neg logit contributions | |
ever | -0.022 |
tow | -0.022 |
free | -0.020 |
aroo | -0.019 |
Dove | -0.018 |
Token | qu |
Token ID | 627 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
arre | +0.001 |
homework | +0.000 |
chores | +0.000 |
laptop | +0.000 |
jobs | +0.000 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
Sue | -0.000 |
free | -0.000 |
aroo | -0.000 |
Token | arre |
Token ID | 9624 |
Feature activation | -6.90e-02 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.007 |
laptop | +0.007 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.053 |
ever | -0.052 |
free | -0.052 |
Sue | -0.051 |
pet | -0.049 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.11e-03 |
Pos logit contributions | |
homework | +0.146 |
apr | +0.145 |
arre | +0.143 |
idents | +0.141 |
chores | +0.140 |
Neg logit contributions | |
ever | -0.070 |
free | -0.067 |
p | -0.064 |
of | -0.059 |
fast | -0.056 |
Token | . |
Token ID | 13 |
Feature activation | +7.92e-03 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.005 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.004 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.002 |
Token | She |
Token ID | 1375 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
ever | +0.010 |
tow | +0.009 |
aroo | +0.009 |
free | +0.009 |
swoop | +0.008 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.015 |
laptop | -0.014 |
chores | -0.014 |
laptops | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | -1.37e-04 |
Pos logit contributions | |
tow | +0.015 |
ever | +0.015 |
free | +0.014 |
aroo | +0.014 |
Dove | +0.014 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.016 |
nurses | -0.015 |
ambul | -0.015 |
laptop | -0.015 |
Token | very |
Token ID | 845 |
Feature activation | -2.12e-03 |
Pos logit contributions | |
arre | +0.000 |
homework | +0.000 |
laptop | +0.000 |
chores | +0.000 |
laptops | +0.000 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
aroo | -0.000 |
Dove | -0.000 |
swoop | -0.000 |
Token | sharing |
Token ID | 7373 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.042 |
chores | +0.040 |
laptop | +0.040 |
apr | +0.039 |
Neg logit contributions | |
tow | -0.025 |
ever | -0.025 |
Sue | -0.023 |
free | -0.023 |
aroo | -0.021 |
Token | is |
Token ID | 318 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
arre | +0.043 |
homework | +0.037 |
chores | +0.036 |
laptop | +0.035 |
apr | +0.035 |
Neg logit contributions | |
ever | -0.030 |
tow | -0.029 |
Sue | -0.028 |
free | -0.028 |
pet | -0.025 |
Token | important |
Token ID | 1593 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
arre | +0.023 |
homework | +0.020 |
laptop | +0.019 |
apr | +0.019 |
chores | +0.019 |
Neg logit contributions | |
ever | -0.016 |
tow | -0.016 |
free | -0.015 |
Sue | -0.015 |
Sally | -0.014 |
Token | and |
Token ID | 290 |
Feature activation | -1.52e-03 |
Pos logit contributions | |
arre | +0.050 |
homework | +0.044 |
chores | +0.043 |
laptop | +0.043 |
apr | +0.042 |
Neg logit contributions | |
ever | -0.020 |
tow | -0.017 |
Sue | -0.016 |
free | -0.016 |
Sally | -0.014 |
Token | qu |
Token ID | 627 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
arre | +0.003 |
homework | +0.003 |
chores | +0.003 |
jobs | +0.002 |
tasks | +0.002 |
Neg logit contributions | |
tow | -0.002 |
aroo | -0.002 |
ever | -0.002 |
Sue | -0.002 |
swoop | -0.002 |
Token | arre |
Token ID | 9624 |
Feature activation | -6.90e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.004 |
chores | +0.002 |
laptop | +0.002 |
apr | +0.001 |
Neg logit contributions | |
tow | -0.063 |
ever | -0.062 |
free | -0.061 |
Sue | -0.060 |
aroo | -0.059 |
Token | lling |
Token ID | 2680 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
homework | +0.122 |
arre | +0.122 |
laptop | +0.121 |
apr | +0.118 |
chores | +0.114 |
Neg logit contributions | |
ever | -0.096 |
free | -0.092 |
of | -0.079 |
fast | -0.075 |
itself | -0.074 |
Token | is |
Token ID | 318 |
Feature activation | -8.46e-03 |
Pos logit contributions | |
arre | +0.046 |
homework | +0.041 |
chores | +0.039 |
laptop | +0.038 |
jobs | +0.037 |
Neg logit contributions | |
tow | -0.027 |
ever | -0.025 |
Sue | -0.025 |
free | -0.024 |
aroo | -0.024 |
Token | not |
Token ID | 407 |
Feature activation | -2.81e-02 |
Pos logit contributions | |
arre | +0.015 |
homework | +0.014 |
chores | +0.013 |
jobs | +0.012 |
tasks | +0.012 |
Neg logit contributions | |
tow | -0.013 |
ever | -0.012 |
aroo | -0.012 |
Sue | -0.012 |
free | -0.011 |
Token | good |
Token ID | 922 |
Feature activation | -5.26e-03 |
Pos logit contributions | |
arre | +0.053 |
homework | +0.046 |
chores | +0.045 |
jobs | +0.043 |
tasks | +0.041 |
Neg logit contributions | |
tow | -0.043 |
aroo | -0.040 |
ever | -0.039 |
Sue | -0.036 |
free | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | +7.09e-03 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.011 |
chores | +0.011 |
laptop | +0.011 |
apr | +0.010 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
free | -0.005 |
Sue | -0.005 |
aroo | -0.004 |
Token | eat |
Token ID | 4483 |
Feature activation | +1.71e-03 |
Pos logit contributions | |
tow | +0.008 |
aroo | +0.008 |
ever | +0.008 |
oe | +0.008 |
Dove | +0.008 |
Neg logit contributions | |
homework | -0.008 |
chores | -0.007 |
arre | -0.007 |
jobs | -0.006 |
laptop | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -6.81e-03 |
Pos logit contributions | |
tow | +0.002 |
aroo | +0.002 |
ever | +0.002 |
free | +0.001 |
Sue | +0.001 |
Neg logit contributions | |
arre | -0.004 |
homework | -0.004 |
chores | -0.004 |
jobs | -0.003 |
tasks | -0.003 |
Token | but |
Token ID | 475 |
Feature activation | +1.62e-03 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
laptop | +0.010 |
chores | +0.010 |
apr | +0.009 |
Neg logit contributions | |
tow | -0.011 |
ever | -0.010 |
aroo | -0.010 |
Sue | -0.009 |
oe | -0.009 |
Token | he |
Token ID | 339 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.001 |
pet | +0.001 |
Sue | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
chores | -0.003 |
laptop | -0.003 |
jobs | -0.003 |
Token | just |
Token ID | 655 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
tow | +0.018 |
free | +0.016 |
Sue | +0.016 |
Dove | +0.016 |
aroo | +0.015 |
Neg logit contributions | |
arre | -0.016 |
homework | -0.014 |
chores | -0.013 |
laptop | -0.012 |
jobs | -0.012 |
Token | couldn |
Token ID | 3521 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
tow | +0.046 |
oe | +0.038 |
aroo | +0.037 |
Dove | +0.037 |
Twe | +0.036 |
Neg logit contributions | |
arre | -0.025 |
homework | -0.019 |
doesn | -0.019 |
nurses | -0.019 |
idents | -0.019 |
Token | 't |
Token ID | 470 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
tow | +0.032 |
pet | +0.030 |
free | +0.029 |
swoop | +0.029 |
ever | +0.028 |
Neg logit contributions | |
arre | -0.048 |
homework | -0.043 |
chores | -0.042 |
laptop | -0.038 |
tasks | -0.037 |
Token | find |
Token ID | 1064 |
Feature activation | +2.70e-02 |
Pos logit contributions | |
tow | +0.032 |
Sue | +0.028 |
aroo | +0.028 |
Dove | +0.028 |
Bill | +0.027 |
Neg logit contributions | |
arre | -0.033 |
chores | -0.031 |
homework | -0.030 |
jobs | -0.028 |
laptop | -0.027 |
Token | anything |
Token ID | 1997 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
oe | +0.045 |
tted | +0.045 |
ary | +0.045 |
oot | +0.045 |
iki | +0.045 |
Neg logit contributions | |
chores | -0.034 |
homework | -0.033 |
jobs | -0.031 |
problems | -0.030 |
pills | -0.029 |
Token | else |
Token ID | 2073 |
Feature activation | +2.40e-02 |
Pos logit contributions | |
tow | +0.015 |
aroo | +0.013 |
Dove | +0.012 |
Sue | +0.012 |
ever | +0.012 |
Neg logit contributions | |
arre | -0.027 |
homework | -0.025 |
chores | -0.024 |
jobs | -0.023 |
laptop | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +1.21e-03 |
Pos logit contributions | |
tow | +0.033 |
aroo | +0.026 |
Dove | +0.026 |
Zip | +0.024 |
Tweet | +0.024 |
Neg logit contributions | |
homework | -0.046 |
arre | -0.046 |
chores | -0.044 |
jobs | -0.042 |
tasks | -0.041 |
Token | agreement |
Token ID | 4381 |
Feature activation | +8.41e-03 |
Pos logit contributions | |
aroo | +0.048 |
ever | +0.047 |
Dove | +0.045 |
Sue | +0.044 |
tow | +0.044 |
Neg logit contributions | |
arre | -0.051 |
chores | -0.044 |
homework | -0.042 |
apr | -0.041 |
jobs | -0.040 |
Token | - |
Token ID | 532 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
tow | +0.010 |
aroo | +0.008 |
swoop | +0.008 |
Dove | +0.008 |
free | +0.008 |
Neg logit contributions | |
arre | -0.018 |
homework | -0.017 |
chores | -0.016 |
laptop | -0.016 |
jobs | -0.015 |
Token | it |
Token ID | 340 |
Feature activation | -1.68e-04 |
Pos logit contributions | |
arre | +0.026 |
homework | +0.023 |
chores | +0.023 |
ambul | +0.021 |
laptop | +0.021 |
Neg logit contributions | |
tow | -0.016 |
aroo | -0.016 |
ever | -0.015 |
free | -0.015 |
swoop | -0.015 |
Token | was |
Token ID | 373 |
Feature activation | +9.59e-03 |
Pos logit contributions | |
arre | +0.000 |
homework | +0.000 |
chores | +0.000 |
laptop | +0.000 |
apr | +0.000 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
Sue | -0.000 |
free | -0.000 |
aroo | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
aroo | +0.012 |
tow | +0.012 |
ever | +0.011 |
Zip | +0.011 |
squirrel | +0.011 |
Neg logit contributions | |
arre | -0.019 |
chores | -0.017 |
homework | -0.017 |
jobs | -0.015 |
apr | -0.015 |
Token | perfect |
Token ID | 2818 |
Feature activation | +3.71e-02 |
Pos logit contributions | |
tow | +0.036 |
ever | +0.036 |
Sue | +0.036 |
free | +0.035 |
aroo | +0.034 |
Neg logit contributions | |
arre | -0.031 |
homework | -0.028 |
chores | -0.028 |
laptop | -0.025 |
jobs | -0.024 |
Token | view |
Token ID | 1570 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
free | +0.052 |
tow | +0.052 |
aroo | +0.051 |
Dove | +0.050 |
ary | +0.050 |
Neg logit contributions | |
arre | -0.060 |
homework | -0.058 |
chores | -0.055 |
tasks | -0.053 |
jobs | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +2.86e-03 |
Pos logit contributions | |
tow | +0.024 |
Dove | +0.021 |
Tweet | +0.021 |
aroo | +0.020 |
pet | +0.020 |
Neg logit contributions | |
arre | -0.045 |
homework | -0.041 |
chores | -0.038 |
laptop | -0.037 |
idents | -0.037 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -3.07e-03 |
Pos logit contributions | |
ever | +0.004 |
swoop | +0.004 |
free | +0.004 |
tow | +0.004 |
aroo | +0.004 |
Neg logit contributions | |
arre | -0.005 |
homework | -0.004 |
apr | -0.004 |
laptop | -0.004 |
means | -0.004 |
Token | One |
Token ID | 3198 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
means | +0.003 |
matt | +0.003 |
chores | +0.003 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
free | -0.005 |
swoop | -0.005 |
aroo | -0.005 |
Token | day |
Token ID | 1110 |
Feature activation | -9.96e-03 |
Pos logit contributions | |
tow | +0.017 |
Dove | +0.016 |
ever | +0.016 |
free | +0.015 |
aroo | +0.015 |
Neg logit contributions | |
arre | -0.018 |
homework | -0.016 |
chores | -0.015 |
laptop | -0.014 |
jobs | -0.014 |
Token | sandwiches |
Token ID | 29777 |
Feature activation | -1.03e-04 |
Pos logit contributions | |
arre | +0.012 |
obe | +0.009 |
riger | +0.009 |
narrative | +0.008 |
cuts | +0.008 |
Neg logit contributions | |
pet | -0.007 |
free | -0.007 |
ever | -0.006 |
Sue | -0.006 |
tow | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
arre | +0.000 |
homework | +0.000 |
chores | +0.000 |
laptop | +0.000 |
apr | +0.000 |
Neg logit contributions | |
tow | -0.000 |
ever | -0.000 |
free | -0.000 |
Sue | -0.000 |
aroo | -0.000 |
Token | They |
Token ID | 1119 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
ever | +0.027 |
aroo | +0.026 |
swoop | +0.025 |
free | +0.025 |
tow | +0.024 |
Neg logit contributions | |
arre | -0.030 |
apr | -0.028 |
homework | -0.028 |
chores | -0.028 |
laptop | -0.026 |
Token | are |
Token ID | 389 |
Feature activation | +1.49e-03 |
Pos logit contributions | |
arre | +0.035 |
homework | +0.030 |
chores | +0.029 |
laptop | +0.029 |
apr | +0.028 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.019 |
free | -0.017 |
Sue | -0.017 |
pet | -0.016 |
Token | happy |
Token ID | 3772 |
Feature activation | +8.12e-03 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
Sue | +0.002 |
free | +0.002 |
aroo | +0.002 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
chores | -0.003 |
laptop | -0.003 |
apr | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
free | +0.005 |
Sue | +0.005 |
aroo | +0.005 |
Neg logit contributions | |
arre | -0.021 |
homework | -0.019 |
chores | -0.018 |
laptop | -0.018 |
apr | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | +2.11e-03 |
Pos logit contributions | |
ever | +0.032 |
free | +0.030 |
swoop | +0.030 |
tow | +0.030 |
aroo | +0.030 |
Neg logit contributions | |
arre | -0.053 |
homework | -0.047 |
chores | -0.046 |
apr | -0.046 |
laptop | -0.045 |
Token |
|
Token ID | 198 |
Feature activation | +6.19e-03 |
Pos logit contributions | |
ever | +0.002 |
tow | +0.002 |
aroo | +0.002 |
Dove | +0.002 |
swoop | +0.002 |
Neg logit contributions | |
arre | -0.004 |
homework | -0.004 |
chores | -0.004 |
laptop | -0.004 |
apr | -0.004 |
Token | They |
Token ID | 2990 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.007 |
free | +0.006 |
Sue | +0.006 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.014 |
homework | -0.012 |
chores | -0.012 |
laptop | -0.012 |
apr | -0.011 |
Token | say |
Token ID | 910 |
Feature activation | +8.56e-03 |
Pos logit contributions | |
arre | +0.035 |
homework | +0.031 |
chores | +0.030 |
laptop | +0.030 |
apr | +0.029 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.019 |
Sue | -0.017 |
free | -0.017 |
aroo | -0.016 |
Token | thank |
Token ID | 5875 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
ever | +0.009 |
tow | +0.009 |
Sue | +0.009 |
free | +0.008 |
pet | +0.008 |
Neg logit contributions | |
arre | -0.020 |
homework | -0.017 |
laptop | -0.017 |
chores | -0.017 |
apr | -0.016 |
Token | saw |
Token ID | 2497 |
Feature activation | +5.14e-03 |
Pos logit contributions | |
tow | +0.004 |
ever | +0.003 |
Sue | +0.003 |
aroo | +0.003 |
free | +0.003 |
Neg logit contributions | |
arre | -0.006 |
homework | -0.005 |
chores | -0.005 |
apr | -0.005 |
laptop | -0.005 |
Token | many |
Token ID | 867 |
Feature activation | +9.84e-03 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.007 |
oe | +0.006 |
free | +0.006 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.009 |
chores | -0.008 |
homework | -0.008 |
ambul | -0.008 |
jobs | -0.008 |
Token | other |
Token ID | 584 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
tow | +0.012 |
ever | +0.012 |
Sue | +0.011 |
free | +0.011 |
aroo | +0.010 |
Neg logit contributions | |
arre | -0.020 |
homework | -0.018 |
chores | -0.018 |
jobs | -0.017 |
laptop | -0.017 |
Token | animals |
Token ID | 4695 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
tow | +0.028 |
ever | +0.025 |
aroo | +0.025 |
Sue | +0.024 |
free | +0.024 |
Neg logit contributions | |
arre | -0.032 |
jobs | -0.027 |
ambul | -0.027 |
chores | -0.027 |
matt | -0.026 |
Token | playing |
Token ID | 2712 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
tow | +0.008 |
aroo | +0.006 |
Sue | +0.006 |
Zip | +0.006 |
Dove | +0.006 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.011 |
chores | -0.011 |
laptop | -0.010 |
jobs | -0.010 |
Token | around |
Token ID | 1088 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
tow | +0.020 |
ever | +0.017 |
Sue | +0.016 |
free | +0.015 |
aroo | +0.015 |
Neg logit contributions | |
arre | -0.045 |
homework | -0.040 |
chores | -0.039 |
laptop | -0.038 |
jobs | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
tow | +0.035 |
hy | +0.028 |
aroo | +0.028 |
inger | +0.027 |
Dove | +0.027 |
Neg logit contributions | |
arre | -0.046 |
chores | -0.041 |
jobs | -0.041 |
tasks | -0.041 |
homework | -0.040 |
Token | lake |
Token ID | 13546 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
apr | +0.005 |
laptop | +0.005 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
aroo | -0.004 |
Sally | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -6.25e-03 |
Pos logit contributions | |
tow | +0.024 |
aroo | +0.021 |
Zip | +0.020 |
Dove | +0.019 |
ever | +0.019 |
Neg logit contributions | |
arre | -0.035 |
homework | -0.031 |
chores | -0.030 |
jobs | -0.029 |
laptop | -0.029 |
Token | The |
Token ID | 383 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.011 |
chores | +0.011 |
laptop | +0.011 |
jobs | +0.011 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
free | -0.007 |
aroo | -0.007 |
swoop | -0.007 |
Token | sw |
Token ID | 1509 |
Feature activation | -7.73e-04 |
Pos logit contributions | |
ever | +0.030 |
tow | +0.029 |
Sue | +0.028 |
Jerry | +0.026 |
Sally | +0.025 |
Neg logit contributions | |
arre | -0.039 |
chores | -0.034 |
ambul | -0.032 |
jobs | -0.032 |
nurses | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | -3.42e-03 |
Pos logit contributions | |
arre | +0.045 |
homework | +0.040 |
chores | +0.038 |
laptop | +0.038 |
jobs | +0.036 |
Neg logit contributions | |
tow | -0.024 |
ever | -0.021 |
free | -0.021 |
Sue | -0.021 |
aroo | -0.020 |
Token | wanted |
Token ID | 2227 |
Feature activation | +5.62e-03 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.006 |
chores | +0.005 |
laptop | +0.005 |
jobs | +0.005 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
free | -0.004 |
aroo | -0.004 |
Sue | -0.004 |
Token | things |
Token ID | 1243 |
Feature activation | +8.33e-03 |
Pos logit contributions | |
tow | +0.008 |
aroo | +0.008 |
swoop | +0.007 |
ever | +0.007 |
free | +0.007 |
Neg logit contributions | |
homework | -0.010 |
arre | -0.010 |
chores | -0.010 |
jobs | -0.009 |
tasks | -0.009 |
Token | her |
Token ID | 607 |
Feature activation | +1.15e-03 |
Pos logit contributions | |
tow | +0.010 |
ever | +0.009 |
Sue | +0.009 |
free | +0.009 |
aroo | +0.008 |
Neg logit contributions | |
arre | -0.018 |
homework | -0.016 |
chores | -0.016 |
laptop | -0.015 |
jobs | -0.015 |
Token | own |
Token ID | 898 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
Sue | +0.002 |
free | +0.002 |
swoop | +0.002 |
Neg logit contributions | |
homework | -0.002 |
arre | -0.002 |
chores | -0.002 |
laptop | -0.002 |
jobs | -0.002 |
Token | way |
Token ID | 835 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
tow | +0.013 |
aroo | +0.011 |
free | +0.011 |
Dove | +0.011 |
swoop | +0.011 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.025 |
chores | -0.024 |
laptop | -0.023 |
jobs | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -6.58e-03 |
Pos logit contributions | |
tow | +0.038 |
swoop | +0.034 |
aroo | +0.033 |
Zip | +0.033 |
Tweet | +0.031 |
Neg logit contributions | |
arre | -0.046 |
chores | -0.045 |
homework | -0.043 |
laptop | -0.039 |
tasks | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | -3.89e-04 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
apr | +0.011 |
laptop | +0.011 |
Neg logit contributions | |
ever | -0.009 |
tow | -0.008 |
aroo | -0.008 |
free | -0.008 |
swoop | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -3.19e-03 |
Pos logit contributions | |
arre | +0.001 |
chores | +0.001 |
homework | +0.001 |
apr | +0.001 |
matt | +0.001 |
Neg logit contributions | |
ever | -0.000 |
tow | -0.000 |
swoop | -0.000 |
aroo | -0.000 |
free | -0.000 |
Token | As |
Token ID | 1722 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
laptop | +0.005 |
apr | +0.005 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
free | -0.004 |
Sue | -0.004 |
aroo | -0.004 |
Token | she |
Token ID | 673 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
arre | +0.032 |
chores | +0.029 |
homework | +0.028 |
nurses | +0.026 |
apr | +0.026 |
Neg logit contributions | |
tow | -0.024 |
aroo | -0.022 |
ever | -0.021 |
free | -0.021 |
Sue | -0.021 |
Token | watched |
Token ID | 7342 |
Feature activation | +1.96e-03 |
Pos logit contributions | |
tow | +0.041 |
Sue | +0.039 |
ever | +0.038 |
Dove | +0.038 |
aroo | +0.037 |
Neg logit contributions | |
arre | -0.043 |
apr | -0.034 |
homework | -0.032 |
laptops | -0.031 |
laptop | -0.030 |
Token | him |
Token ID | 683 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
tow | +0.003 |
Dove | +0.003 |
Zip | +0.003 |
Sue | +0.002 |
ever | +0.002 |
Neg logit contributions | |
arre | -0.003 |
chores | -0.003 |
homework | -0.003 |
apr | -0.003 |
tasks | -0.003 |
Token | explore |
Token ID | 7301 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
tow | +0.009 |
Sue | +0.008 |
ever | +0.008 |
aroo | +0.008 |
Dove | +0.008 |
Neg logit contributions | |
arre | -0.014 |
homework | -0.013 |
chores | -0.013 |
laptop | -0.012 |
tasks | -0.011 |
Token | with |
Token ID | 351 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
tow | +0.016 |
ever | +0.015 |
aroo | +0.014 |
Sue | +0.014 |
Dove | +0.014 |
Neg logit contributions | |
arre | -0.029 |
chores | -0.027 |
homework | -0.027 |
tasks | -0.026 |
jobs | -0.025 |
Token | such |
Token ID | 884 |
Feature activation | +3.00e-02 |
Pos logit contributions | |
aroo | +0.036 |
oe | +0.035 |
Twe | +0.034 |
Tweet | +0.034 |
Dove | +0.034 |
Neg logit contributions | |
chores | -0.043 |
homework | -0.039 |
arre | -0.038 |
apr | -0.038 |
jobs | -0.037 |
Token | enthusiasm |
Token ID | 17131 |
Feature activation | +8.62e-03 |
Pos logit contributions | |
tow | +0.035 |
ever | +0.034 |
aroo | +0.032 |
oe | +0.032 |
Sue | +0.030 |
Neg logit contributions | |
arre | -0.061 |
chores | -0.056 |
homework | -0.055 |
jobs | -0.054 |
tasks | -0.053 |
Token | . |
Token ID | 13 |
Feature activation | -9.86e-03 |
Pos logit contributions | |
tow | +0.010 |
Dove | +0.010 |
Tweet | +0.010 |
aroo | +0.009 |
Sue | +0.009 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.016 |
chores | -0.016 |
laptop | -0.015 |
tasks | -0.015 |
Token | |
Token ID | 220 |
Feature activation | +8.88e-03 |
Pos logit contributions | |
arre | +0.020 |
chores | +0.015 |
matt | +0.015 |
homework | +0.015 |
apr | +0.015 |
Neg logit contributions | |
ever | -0.014 |
tow | -0.013 |
free | -0.012 |
aroo | -0.012 |
swoop | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -7.84e-03 |
Pos logit contributions | |
ever | +0.012 |
tow | +0.011 |
aroo | +0.011 |
swoop | +0.011 |
pet | +0.011 |
Neg logit contributions | |
arre | -0.019 |
chores | -0.014 |
homework | -0.014 |
laptop | -0.014 |
idents | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -7.46e-03 |
Pos logit contributions | |
arre | +0.018 |
homework | +0.015 |
chores | +0.015 |
apr | +0.015 |
laptop | +0.015 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
Sue | -0.007 |
Dove | -0.007 |
pet | -0.006 |
Token | M |
Token ID | 44 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
arre | +0.016 |
homework | +0.015 |
laptop | +0.015 |
chores | +0.014 |
idents | +0.014 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.008 |
free | -0.008 |
aroo | -0.008 |
Sue | -0.008 |
Token | were |
Token ID | 547 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.021 |
chores | +0.020 |
laptop | +0.020 |
apr | +0.019 |
Neg logit contributions | |
ever | -0.013 |
tow | -0.013 |
free | -0.012 |
Sue | -0.012 |
pet | -0.011 |
Token | sad |
Token ID | 6507 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.021 |
chores | +0.020 |
laptop | +0.019 |
jobs | +0.018 |
Neg logit contributions | |
tow | -0.018 |
ever | -0.017 |
aroo | -0.016 |
Sue | -0.015 |
Dove | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
arre | +0.057 |
homework | +0.051 |
chores | +0.049 |
laptop | +0.049 |
apr | +0.049 |
Neg logit contributions | |
ever | -0.017 |
tow | -0.016 |
Sue | -0.014 |
free | -0.014 |
pet | -0.012 |
Token | angry |
Token ID | 7954 |
Feature activation | -3.95e-03 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.017 |
chores | +0.016 |
laptop | +0.016 |
apr | +0.015 |
Neg logit contributions | |
tow | -0.016 |
ever | -0.015 |
free | -0.014 |
Sue | -0.014 |
aroo | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -5.62e-03 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.008 |
laptop | +0.008 |
jobs | +0.008 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.003 |
free | -0.003 |
aroo | -0.003 |
Sue | -0.003 |
Token | They |
Token ID | 1119 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
laptop | +0.010 |
chores | +0.010 |
idents | +0.010 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.007 |
free | -0.007 |
aroo | -0.006 |
swoop | -0.006 |
Token | wanted |
Token ID | 2227 |
Feature activation | -3.77e-03 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.032 |
chores | +0.030 |
laptop | +0.030 |
apr | +0.029 |
Neg logit contributions | |
tow | -0.027 |
ever | -0.026 |
Sue | -0.024 |
free | -0.024 |
aroo | -0.024 |
Token | their |
Token ID | 511 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
homework | +0.007 |
arre | +0.007 |
chores | +0.007 |
jobs | +0.006 |
apr | +0.006 |
Neg logit contributions | |
aroo | -0.005 |
tow | -0.005 |
free | -0.005 |
ever | -0.005 |
swoop | -0.005 |
Token | bricks |
Token ID | 28902 |
Feature activation | -1.89e-02 |
Pos logit contributions | |
tow | +0.002 |
ever | +0.002 |
free | +0.002 |
Sue | +0.002 |
aroo | +0.002 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.002 |
apr | -0.002 |
Token | back |
Token ID | 736 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
arre | +0.045 |
homework | +0.040 |
chores | +0.039 |
laptop | +0.038 |
apr | +0.037 |
Neg logit contributions | |
tow | -0.018 |
ever | -0.017 |
Sue | -0.016 |
free | -0.016 |
aroo | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +3.39e-03 |
Pos logit contributions | |
tow | +0.018 |
aroo | +0.016 |
swoop | +0.015 |
Dove | +0.015 |
Tweet | +0.014 |
Neg logit contributions | |
arre | -0.029 |
homework | -0.025 |
chores | -0.024 |
jobs | -0.023 |
idents | -0.023 |
Token | had |
Token ID | 550 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
tow | +0.008 |
aroo | +0.007 |
free | +0.007 |
Dove | +0.007 |
Sue | +0.007 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.010 |
laptop | -0.010 |
chores | -0.010 |
laptops | -0.009 |
Token | songs |
Token ID | 7259 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
aroo | +0.027 |
tow | +0.025 |
free | +0.023 |
Sally | +0.023 |
Pam | +0.023 |
Neg logit contributions | |
homework | -0.021 |
arre | -0.021 |
chores | -0.020 |
laptop | -0.019 |
laptops | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | -8.41e-03 |
Pos logit contributions | |
tow | +0.021 |
aroo | +0.020 |
ever | +0.019 |
free | +0.019 |
Sue | +0.018 |
Neg logit contributions | |
arre | -0.033 |
homework | -0.030 |
chores | -0.029 |
laptop | -0.029 |
jobs | -0.027 |
Token | rh |
Token ID | 9529 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
tow | -0.016 |
ever | -0.016 |
free | -0.015 |
Sue | -0.015 |
aroo | -0.015 |
Token | ymes |
Token ID | 22009 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.014 |
chores | +0.013 |
laptop | +0.012 |
jobs | +0.012 |
Neg logit contributions | |
tow | -0.038 |
Sue | -0.036 |
ever | -0.036 |
free | -0.036 |
Sally | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
tow | +0.009 |
ever | +0.009 |
aroo | +0.008 |
Sue | +0.008 |
free | +0.008 |
Neg logit contributions | |
arre | -0.024 |
homework | -0.022 |
laptop | -0.021 |
chores | -0.021 |
jobs | -0.020 |
Token | Lily |
Token ID | 20037 |
Feature activation | -5.50e-03 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.006 |
tow | -0.005 |
free | -0.005 |
aroo | -0.005 |
swoop | -0.005 |
Token | loved |
Token ID | 6151 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
laptop | +0.011 |
tasks | +0.011 |
Neg logit contributions | |
ever | -0.005 |
pet | -0.005 |
Sue | -0.004 |
tow | -0.004 |
free | -0.004 |
Token | all |
Token ID | 477 |
Feature activation | -1.84e-03 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.021 |
chores | +0.021 |
laptop | +0.020 |
apr | +0.020 |
Neg logit contributions | |
tow | -0.014 |
ever | -0.013 |
free | -0.012 |
Sue | -0.012 |
aroo | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -7.37e-03 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.004 |
idents | +0.004 |
laptop | +0.004 |
apr | +0.004 |
Neg logit contributions | |
Sue | -0.001 |
tow | -0.001 |
ever | -0.001 |
free | -0.001 |
Sally | -0.001 |
Token | books |
Token ID | 3835 |
Feature activation | -7.15e-04 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.009 |
chores | +0.008 |
laptop | +0.008 |
apr | +0.008 |
Neg logit contributions | |
tow | -0.014 |
ever | -0.014 |
free | -0.013 |
Sue | -0.013 |
aroo | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | +4.15e-03 |
Pos logit contributions | |
arre | +0.022 |
homework | +0.019 |
laptop | +0.019 |
chores | +0.019 |
apr | +0.018 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.007 |
Sue | -0.006 |
free | -0.006 |
Sally | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | -6.06e-03 |
Pos logit contributions | |
ever | +0.004 |
free | +0.003 |
tow | +0.003 |
pet | +0.003 |
Sue | +0.003 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.010 |
laptop | -0.010 |
chores | -0.010 |
apr | -0.009 |
Token | more |
Token ID | 517 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
laptop | +0.011 |
apr | +0.011 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
free | -0.006 |
Sue | -0.006 |
aroo | -0.006 |
Token | dazzling |
Token ID | 41535 |
Feature activation | +3.54e-03 |
Pos logit contributions | |
arre | +0.024 |
homework | +0.021 |
chores | +0.021 |
laptop | +0.020 |
apr | +0.020 |
Neg logit contributions | |
ever | -0.012 |
tow | -0.012 |
free | -0.011 |
Sue | -0.011 |
pet | -0.010 |
Token | than |
Token ID | 621 |
Feature activation | -7.06e-03 |
Pos logit contributions | |
tow | +0.003 |
ever | +0.003 |
Sue | +0.003 |
free | +0.003 |
aroo | +0.003 |
Neg logit contributions | |
arre | -0.008 |
homework | -0.008 |
chores | -0.007 |
laptop | -0.007 |
apr | -0.007 |
Token | she |
Token ID | 673 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
homework | +0.012 |
chores | +0.011 |
arre | +0.010 |
nurses | +0.010 |
ambul | +0.010 |
Neg logit contributions | |
tow | -0.011 |
aroo | -0.010 |
Zip | -0.009 |
swoop | -0.009 |
Tweet | -0.008 |
Token | imagined |
Token ID | 15758 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
tow | +0.021 |
Sue | +0.019 |
aroo | +0.018 |
Sally | +0.017 |
Dove | +0.017 |
Neg logit contributions | |
arre | -0.027 |
homework | -0.024 |
laptop | -0.022 |
chores | -0.022 |
laptops | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | -8.70e-03 |
Pos logit contributions | |
tow | +0.022 |
aroo | +0.017 |
Sue | +0.017 |
Dove | +0.017 |
Zip | +0.017 |
Neg logit contributions | |
arre | -0.034 |
homework | -0.034 |
chores | -0.033 |
tasks | -0.031 |
jobs | -0.030 |
Token | The |
Token ID | 383 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
arre | +0.020 |
homework | +0.018 |
chores | +0.017 |
laptop | +0.017 |
apr | +0.017 |
Neg logit contributions | |
ever | -0.009 |
tow | -0.009 |
free | -0.008 |
aroo | -0.008 |
Sue | -0.007 |
Token | flowers |
Token ID | 12734 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
tow | +0.009 |
ever | +0.009 |
free | +0.008 |
Sue | +0.008 |
pet | +0.008 |
Neg logit contributions | |
arre | -0.016 |
homework | -0.014 |
chores | -0.013 |
laptop | -0.013 |
apr | -0.013 |
Token | were |
Token ID | 547 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
tow | +0.018 |
ever | +0.017 |
Sue | +0.017 |
free | +0.016 |
aroo | +0.015 |
Neg logit contributions | |
arre | -0.027 |
homework | -0.023 |
chores | -0.022 |
laptop | -0.021 |
apr | -0.021 |
Token | to |
Token ID | 284 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.011 |
chores | +0.010 |
laptop | +0.010 |
apr | +0.010 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
pet | -0.004 |
Token | cross |
Token ID | 3272 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
aroo | +0.021 |
tow | +0.021 |
ever | +0.021 |
ull | +0.020 |
Dove | +0.020 |
Neg logit contributions | |
homework | -0.030 |
chores | -0.030 |
arre | -0.029 |
jobs | -0.027 |
laptop | -0.026 |
Token | the |
Token ID | 262 |
Feature activation | -9.71e-03 |
Pos logit contributions | |
tow | +0.012 |
ever | +0.012 |
aroo | +0.010 |
free | +0.010 |
Sue | +0.010 |
Neg logit contributions | |
arre | -0.026 |
homework | -0.024 |
chores | -0.023 |
laptop | -0.022 |
jobs | -0.022 |
Token | road |
Token ID | 2975 |
Feature activation | -1.46e-03 |
Pos logit contributions | |
arre | +0.021 |
homework | +0.018 |
chores | +0.018 |
apr | +0.017 |
laptop | +0.017 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.011 |
free | -0.011 |
Sue | -0.011 |
pet | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +9.83e-03 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
chores | +0.003 |
laptop | +0.003 |
jobs | +0.003 |
Neg logit contributions | |
tow | -0.001 |
ever | -0.001 |
Sue | -0.001 |
free | -0.001 |
aroo | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
ever | +0.011 |
tow | +0.011 |
free | +0.010 |
aroo | +0.009 |
Sue | +0.009 |
Neg logit contributions | |
arre | -0.022 |
homework | -0.019 |
chores | -0.019 |
laptop | -0.019 |
apr | -0.018 |
Token | wait |
Token ID | 4043 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
arre | +0.051 |
homework | +0.045 |
chores | +0.043 |
laptop | +0.042 |
apr | +0.041 |
Neg logit contributions | |
tow | -0.030 |
ever | -0.030 |
free | -0.027 |
Sue | -0.027 |
aroo | -0.026 |
Token | for |
Token ID | 329 |
Feature activation | +7.46e-03 |
Pos logit contributions | |
arre | +0.039 |
homework | +0.034 |
chores | +0.032 |
laptop | +0.032 |
apr | +0.031 |
Neg logit contributions | |
tow | -0.022 |
ever | -0.022 |
free | -0.020 |
Sue | -0.020 |
aroo | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | +6.82e-03 |
Pos logit contributions | |
aroo | +0.010 |
ever | +0.010 |
swoop | +0.010 |
tow | +0.009 |
Zip | +0.009 |
Neg logit contributions | |
chores | -0.014 |
homework | -0.013 |
apr | -0.013 |
jobs | -0.012 |
arre | -0.012 |
Token | gap |
Token ID | 7625 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
ever | +0.009 |
Sue | +0.008 |
itself | +0.008 |
tow | +0.008 |
aroo | +0.008 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.012 |
chores | -0.012 |
laptop | -0.012 |
tant | -0.011 |
Token | in |
Token ID | 287 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
tow | +0.023 |
Dove | +0.021 |
Twe | +0.020 |
Tweet | +0.020 |
squirrel | +0.020 |
Neg logit contributions | |
arre | -0.031 |
homework | -0.030 |
chores | -0.029 |
laptop | -0.029 |
jobs | -0.028 |
Token | felt |
Token ID | 2936 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
arre | +0.026 |
homework | +0.023 |
chores | +0.022 |
laptop | +0.021 |
apr | +0.021 |
Neg logit contributions | |
ever | -0.017 |
tow | -0.016 |
free | -0.015 |
Sue | -0.015 |
pet | -0.014 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.41e-03 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.029 |
chores | +0.028 |
laptop | +0.027 |
apr | +0.027 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.019 |
Sue | -0.018 |
aroo | -0.017 |
free | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | -2.05e-02 |
Pos logit contributions | |
tow | +0.001 |
ever | +0.001 |
free | +0.001 |
Sue | +0.001 |
aroo | +0.001 |
Neg logit contributions | |
arre | -0.003 |
homework | -0.003 |
chores | -0.003 |
laptop | -0.003 |
apr | -0.003 |
Token | She |
Token ID | 1375 |
Feature activation | -8.12e-03 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.043 |
chores | +0.041 |
laptop | +0.041 |
apr | +0.040 |
Neg logit contributions | |
tow | -0.021 |
ever | -0.020 |
free | -0.019 |
aroo | -0.018 |
Sue | -0.018 |
Token | knew |
Token ID | 2993 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
arre | +0.018 |
homework | +0.016 |
chores | +0.015 |
laptop | +0.015 |
apr | +0.014 |
Neg logit contributions | |
ever | -0.010 |
tow | -0.009 |
free | -0.009 |
Sue | -0.009 |
pet | -0.008 |
Token | that |
Token ID | 326 |
Feature activation | -2.96e-02 |
Pos logit contributions | |
tow | +0.016 |
swoop | +0.014 |
Zip | +0.014 |
free | +0.014 |
ever | +0.013 |
Neg logit contributions | |
homework | -0.021 |
arre | -0.021 |
chores | -0.020 |
nurses | -0.019 |
tasks | -0.019 |
Token | she |
Token ID | 673 |
Feature activation | -5.86e-03 |
Pos logit contributions | |
arre | +0.070 |
homework | +0.060 |
laptop | +0.058 |
apr | +0.057 |
chores | +0.057 |
Neg logit contributions | |
ever | -0.033 |
tow | -0.031 |
Sue | -0.029 |
free | -0.029 |
Sally | -0.027 |
Token | had |
Token ID | 550 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.010 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
tow | -0.008 |
Sue | -0.007 |
free | -0.007 |
ever | -0.007 |
aroo | -0.007 |
Token | found |
Token ID | 1043 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
arre | +0.043 |
homework | +0.038 |
chores | +0.036 |
laptop | +0.035 |
apr | +0.035 |
Neg logit contributions | |
tow | -0.025 |
ever | -0.024 |
Sue | -0.023 |
free | -0.023 |
aroo | -0.022 |
Token | something |
Token ID | 1223 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
chores | +0.003 |
arre | +0.003 |
homework | +0.003 |
jobs | +0.003 |
tasks | +0.003 |
Neg logit contributions | |
tow | -0.003 |
aroo | -0.003 |
Zip | -0.003 |
ever | -0.003 |
oe | -0.003 |
Token | special |
Token ID | 2041 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.008 |
chores | +0.007 |
laptop | +0.007 |
jobs | +0.007 |
Neg logit contributions | |
tow | -0.006 |
aroo | -0.005 |
ever | -0.005 |
Sue | -0.005 |
swoop | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
arre | +0.042 |
homework | +0.038 |
laptop | +0.036 |
chores | +0.035 |
apr | +0.035 |
Neg logit contributions | |
ever | -0.028 |
free | -0.027 |
tow | -0.027 |
Sue | -0.026 |
pet | -0.025 |
Token | surprises |
Token ID | 24072 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
tow | +0.022 |
ever | +0.022 |
aroo | +0.020 |
Sue | +0.020 |
free | +0.019 |
Neg logit contributions | |
arre | -0.028 |
homework | -0.025 |
chores | -0.024 |
jobs | -0.023 |
apr | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -5.42e-03 |
Pos logit contributions | |
tow | +0.014 |
ever | +0.012 |
Sue | +0.012 |
free | +0.012 |
aroo | +0.011 |
Neg logit contributions | |
arre | -0.037 |
homework | -0.035 |
chores | -0.034 |
laptop | -0.033 |
jobs | -0.033 |
Token | One |
Token ID | 1881 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.010 |
chores | +0.010 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.007 |
tow | -0.007 |
free | -0.006 |
aroo | -0.006 |
Sue | -0.006 |
Token | day |
Token ID | 1110 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
tow | +0.017 |
ever | +0.016 |
free | +0.015 |
Sue | +0.015 |
aroo | +0.015 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.016 |
chores | -0.016 |
laptop | -0.015 |
jobs | -0.015 |
Token | , |
Token ID | 11 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
arre | +0.062 |
homework | +0.054 |
laptop | +0.053 |
chores | +0.051 |
apr | +0.051 |
Neg logit contributions | |
ever | -0.019 |
tow | -0.017 |
Sue | -0.017 |
free | -0.016 |
aroo | -0.015 |
Token | he |
Token ID | 339 |
Feature activation | +8.11e-03 |
Pos logit contributions | |
arre | +0.062 |
homework | +0.053 |
laptop | +0.052 |
chores | +0.051 |
apr | +0.050 |
Neg logit contributions | |
ever | -0.024 |
tow | -0.023 |
Sue | -0.022 |
free | -0.022 |
aroo | -0.019 |
Token | saw |
Token ID | 2497 |
Feature activation | -2.60e-03 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.008 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.017 |
chores | -0.017 |
laptop | -0.016 |
apr | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | +5.74e-03 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
apr | +0.005 |
jobs | +0.005 |
Neg logit contributions | |
ever | -0.003 |
tow | -0.003 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.002 |
Token | shiny |
Token ID | 22441 |
Feature activation | +4.40e-03 |
Pos logit contributions | |
ever | +0.006 |
tow | +0.006 |
Sue | +0.006 |
free | +0.005 |
aroo | +0.005 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.011 |
chores | -0.011 |
laptop | -0.011 |
apr | -0.010 |
Token | tunnel |
Token ID | 13275 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
ever | +0.006 |
tow | +0.005 |
Sue | +0.005 |
free | +0.005 |
Jen | +0.004 |
Neg logit contributions | |
arre | -0.009 |
homework | -0.008 |
chores | -0.008 |
laptop | -0.008 |
tasks | -0.007 |
Token | One |
Token ID | 1881 |
Feature activation | +3.12e-03 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.017 |
chores | +0.017 |
laptop | +0.016 |
apr | +0.016 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.008 |
free | -0.007 |
Sue | -0.007 |
aroo | -0.007 |
Token | day |
Token ID | 1110 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
tow | +0.004 |
ever | +0.004 |
Sue | +0.004 |
free | +0.004 |
aroo | +0.003 |
Neg logit contributions | |
arre | -0.007 |
homework | -0.006 |
chores | -0.006 |
laptop | -0.005 |
apr | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
arre | +0.025 |
homework | +0.022 |
chores | +0.021 |
laptop | +0.021 |
apr | +0.021 |
Neg logit contributions | |
tow | -0.011 |
ever | -0.011 |
Sue | -0.010 |
free | -0.010 |
aroo | -0.009 |
Token | it |
Token ID | 340 |
Feature activation | +3.69e-03 |
Pos logit contributions | |
arre | +0.030 |
homework | +0.027 |
chores | +0.027 |
laptop | +0.026 |
apr | +0.026 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.011 |
free | -0.010 |
Sue | -0.010 |
aroo | -0.009 |
Token | decided |
Token ID | 3066 |
Feature activation | +6.27e-04 |
Pos logit contributions | |
ever | +0.004 |
pet | +0.003 |
tow | +0.003 |
free | +0.003 |
Sue | +0.003 |
Neg logit contributions | |
arre | -0.009 |
homework | -0.009 |
laptop | -0.008 |
chores | -0.008 |
apr | -0.008 |
Token | that |
Token ID | 326 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
tow | +0.001 |
ever | +0.001 |
free | +0.001 |
Sue | +0.001 |
aroo | +0.001 |
Neg logit contributions | |
arre | -0.001 |
homework | -0.001 |
chores | -0.001 |
laptop | -0.001 |
jobs | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -5.55e-03 |
Pos logit contributions | |
arre | +0.067 |
homework | +0.059 |
laptop | +0.058 |
apr | +0.057 |
chores | +0.057 |
Neg logit contributions | |
ever | -0.021 |
tow | -0.019 |
Sue | -0.018 |
free | -0.017 |
Sally | -0.015 |
Token | wanted |
Token ID | 2227 |
Feature activation | -7.22e-03 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.011 |
laptop | +0.011 |
chores | +0.011 |
apr | +0.011 |
Neg logit contributions | |
ever | -0.006 |
tow | -0.006 |
free | -0.006 |
Sue | -0.005 |
pet | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
arre | +0.016 |
homework | +0.014 |
chores | +0.014 |
laptop | +0.013 |
jobs | +0.013 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.008 |
free | -0.007 |
aroo | -0.007 |
Sue | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +5.10e-03 |
Pos logit contributions | |
arre | +0.021 |
homework | +0.020 |
chores | +0.020 |
jobs | +0.018 |
laptop | +0.018 |
Neg logit contributions | |
tow | -0.014 |
aroo | -0.013 |
ever | -0.013 |
Sue | -0.012 |
Dove | -0.012 |
Token | used |
Token ID | 973 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
tow | +0.006 |
aroo | +0.006 |
ever | +0.006 |
Sue | +0.005 |
Dove | +0.005 |
Neg logit contributions | |
arre | -0.010 |
homework | -0.010 |
chores | -0.009 |
jobs | -0.009 |
apr | -0.009 |
Token | day |
Token ID | 1110 |
Feature activation | -3.89e-03 |
Pos logit contributions | |
arre | +0.079 |
homework | +0.069 |
apr | +0.068 |
laptop | +0.068 |
laptops | +0.068 |
Neg logit contributions | |
ever | -0.030 |
tow | -0.026 |
free | -0.024 |
Sue | -0.023 |
aroo | -0.021 |
Token | on |
Token ID | 319 |
Feature activation | +2.75e-03 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
free | -0.004 |
pet | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
tow | +0.004 |
ever | +0.004 |
free | +0.004 |
pet | +0.004 |
swoop | +0.003 |
Neg logit contributions | |
arre | -0.005 |
homework | -0.005 |
chores | -0.004 |
tasks | -0.004 |
laptop | -0.004 |
Token | Tim |
Token ID | 5045 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
arre | +0.031 |
homework | +0.028 |
chores | +0.028 |
jobs | +0.027 |
tasks | +0.026 |
Neg logit contributions | |
tow | -0.013 |
ever | -0.011 |
aroo | -0.011 |
free | -0.011 |
pet | -0.010 |
Token | knew |
Token ID | 2993 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
arre | +0.044 |
homework | +0.040 |
chores | +0.038 |
laptop | +0.038 |
apr | +0.037 |
Neg logit contributions | |
ever | -0.023 |
tow | -0.022 |
free | -0.021 |
Sue | -0.020 |
pet | -0.019 |
Token | that |
Token ID | 326 |
Feature activation | -2.97e-02 |
Pos logit contributions | |
tow | +0.014 |
free | +0.012 |
ever | +0.012 |
oe | +0.012 |
swoop | +0.012 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.019 |
chores | -0.018 |
jobs | -0.017 |
ambul | -0.017 |
Token | it |
Token ID | 340 |
Feature activation | -8.86e-03 |
Pos logit contributions | |
arre | +0.068 |
homework | +0.059 |
laptop | +0.057 |
apr | +0.057 |
chores | +0.057 |
Neg logit contributions | |
ever | -0.033 |
tow | -0.032 |
Sue | -0.030 |
free | -0.030 |
Sally | -0.027 |
Token | was |
Token ID | 373 |
Feature activation | -8.06e-03 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.016 |
apr | +0.016 |
laptop | +0.016 |
chores | +0.016 |
Neg logit contributions | |
ever | -0.012 |
tow | -0.011 |
free | -0.010 |
Sue | -0.010 |
pet | -0.010 |
Token | important |
Token ID | 1593 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
arre | +0.013 |
homework | +0.012 |
chores | +0.012 |
jobs | +0.011 |
tasks | +0.010 |
Neg logit contributions | |
tow | -0.013 |
aroo | -0.013 |
ever | -0.013 |
Sue | -0.012 |
oe | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
arre | +0.028 |
homework | +0.024 |
chores | +0.023 |
laptop | +0.023 |
apr | +0.023 |
Neg logit contributions | |
ever | -0.011 |
tow | -0.011 |
Sue | -0.010 |
free | -0.010 |
aroo | -0.009 |
Token | be |
Token ID | 307 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
arre | +0.032 |
homework | +0.031 |
chores | +0.031 |
jobs | +0.028 |
tasks | +0.027 |
Neg logit contributions | |
aroo | -0.028 |
oe | -0.026 |
tow | -0.026 |
Sue | -0.025 |
ever | -0.025 |
Token | says |
Token ID | 1139 |
Feature activation | -1.59e-03 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.027 |
aghetti | +0.025 |
chores | +0.025 |
narrative | +0.025 |
Neg logit contributions | |
Sue | -0.021 |
pet | -0.021 |
tow | -0.020 |
free | -0.020 |
ever | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.003 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
free | -0.002 |
Sue | -0.002 |
aroo | -0.001 |
Token | " |
Token ID | 366 |
Feature activation | -5.22e-03 |
Pos logit contributions | |
arre | +0.027 |
homework | +0.024 |
laptop | +0.023 |
chores | +0.023 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.017 |
ever | -0.017 |
free | -0.015 |
Sue | -0.015 |
aroo | -0.015 |
Token | Mom |
Token ID | 29252 |
Feature activation | -1.92e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
laptop | +0.012 |
jobs | +0.012 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
Sue | -0.004 |
pet | -0.004 |
free | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -4.32e-03 |
Pos logit contributions | |
arre | +0.035 |
homework | +0.029 |
chores | +0.027 |
laptop | +0.027 |
idents | +0.026 |
Neg logit contributions | |
aroo | -0.030 |
tow | -0.029 |
free | -0.027 |
ever | -0.027 |
Dove | -0.027 |
Token | there |
Token ID | 612 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
arre | +0.011 |
homework | +0.010 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.004 |
tow | -0.004 |
Sue | -0.004 |
free | -0.003 |
pet | -0.003 |
Token | is |
Token ID | 318 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
arre | +0.046 |
homework | +0.039 |
apr | +0.038 |
laptop | +0.037 |
chores | +0.037 |
Neg logit contributions | |
tow | -0.038 |
ever | -0.038 |
Sue | -0.037 |
free | -0.036 |
pet | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | +6.18e-03 |
Pos logit contributions | |
ever | +0.017 |
tow | +0.017 |
Sue | +0.015 |
free | +0.015 |
aroo | +0.013 |
Neg logit contributions | |
arre | -0.047 |
homework | -0.042 |
chores | -0.040 |
laptop | -0.040 |
apr | -0.039 |
Token | big |
Token ID | 1263 |
Feature activation | -3.14e-03 |
Pos logit contributions | |
ever | +0.008 |
tow | +0.007 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.007 |
Neg logit contributions | |
arre | -0.013 |
homework | -0.012 |
laptop | -0.011 |
chores | -0.011 |
ambul | -0.010 |
Token | dog |
Token ID | 3290 |
Feature activation | -2.24e-03 |
Pos logit contributions | |
arre | +0.007 |
homework | +0.006 |
laptop | +0.006 |
chores | +0.006 |
apr | +0.006 |
Neg logit contributions | |
ever | -0.004 |
tow | -0.004 |
free | -0.003 |
Sue | -0.003 |
aroo | -0.003 |
Token | outside |
Token ID | 2354 |
Feature activation | +9.41e-04 |
Pos logit contributions | |
arre | +0.005 |
homework | +0.005 |
laptop | +0.004 |
chores | +0.004 |
ambul | +0.004 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
Sue | -0.002 |
free | -0.002 |
Bill | -0.002 |
Token | other |
Token ID | 584 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.008 |
Dove | +0.007 |
Sue | +0.007 |
free | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.011 |
chores | -0.011 |
laptop | -0.010 |
tasks | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.042 |
chores | +0.041 |
laptop | +0.041 |
jobs | +0.039 |
Neg logit contributions | |
tow | -0.021 |
ever | -0.019 |
free | -0.018 |
Sue | -0.017 |
aroo | -0.017 |
Token | They |
Token ID | 1119 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
arre | +0.031 |
homework | +0.026 |
laptop | +0.025 |
idents | +0.025 |
apr | +0.024 |
Neg logit contributions | |
ever | -0.019 |
tow | -0.018 |
free | -0.017 |
swoop | -0.017 |
aroo | -0.016 |
Token | starting |
Token ID | 3599 |
Feature activation | -8.35e-03 |
Pos logit contributions | |
arre | +0.048 |
homework | +0.043 |
chores | +0.041 |
laptop | +0.041 |
apr | +0.040 |
Neg logit contributions | |
ever | -0.026 |
tow | -0.025 |
free | -0.024 |
Sue | -0.023 |
pet | -0.022 |
Token | qu |
Token ID | 627 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
arre | +0.019 |
homework | +0.017 |
chores | +0.017 |
laptop | +0.016 |
apr | +0.016 |
Neg logit contributions | |
tow | -0.009 |
ever | -0.009 |
free | -0.008 |
Sue | -0.008 |
pet | -0.007 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.49e-02 |
Pos logit contributions | |
homework | +0.007 |
laptop | +0.005 |
chores | +0.004 |
ambul | +0.002 |
arre | +0.002 |
Neg logit contributions | |
free | -0.075 |
tow | -0.073 |
ever | -0.073 |
Sue | -0.072 |
Sally | -0.070 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
homework | +0.160 |
laptop | +0.156 |
chores | +0.152 |
dining | +0.150 |
apr | +0.149 |
Neg logit contributions | |
ever | -0.082 |
free | -0.080 |
p | -0.067 |
of | -0.067 |
fast | -0.063 |
Token | again |
Token ID | 757 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.042 |
laptop | +0.041 |
chores | +0.040 |
apr | +0.040 |
Neg logit contributions | |
ever | -0.019 |
tow | -0.018 |
free | -0.017 |
Sue | -0.017 |
pet | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.032 |
chores | +0.031 |
laptop | +0.031 |
apr | +0.030 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.018 |
Sue | -0.017 |
aroo | -0.017 |
free | -0.016 |
Token | their |
Token ID | 511 |
Feature activation | -4.84e-03 |
Pos logit contributions | |
arre | +0.027 |
homework | +0.023 |
chores | +0.022 |
laptop | +0.022 |
apr | +0.022 |
Neg logit contributions | |
tow | -0.016 |
ever | -0.016 |
Sue | -0.015 |
free | -0.015 |
aroo | -0.014 |
Token | voices |
Token ID | 10839 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.008 |
chores | +0.008 |
laptop | +0.008 |
apr | +0.008 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
Sally | -0.006 |
Token | " |
Token ID | 366 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
tow | +0.008 |
free | +0.007 |
ever | +0.007 |
pet | +0.007 |
swoop | +0.007 |
Neg logit contributions | |
arre | -0.012 |
homework | -0.011 |
chores | -0.011 |
ambul | -0.010 |
laptop | -0.010 |
Token | Why |
Token ID | 5195 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.006 |
chores | +0.006 |
laptop | +0.006 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.006 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
aroo | -0.005 |
Token | are |
Token ID | 389 |
Feature activation | +7.20e-03 |
Pos logit contributions | |
arre | +0.033 |
homework | +0.027 |
apr | +0.027 |
laptop | +0.026 |
chores | +0.026 |
Neg logit contributions | |
ever | -0.027 |
tow | -0.026 |
Sue | -0.025 |
free | -0.024 |
Sally | -0.023 |
Token | you |
Token ID | 345 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
tow | +0.008 |
ever | +0.007 |
free | +0.007 |
Sue | +0.007 |
aroo | +0.006 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.015 |
chores | -0.014 |
laptop | -0.014 |
apr | -0.014 |
Token | qu |
Token ID | 627 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
apr | +0.006 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
aroo | -0.006 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.29e-02 |
Pos logit contributions | |
homework | +0.005 |
arre | +0.004 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.002 |
Neg logit contributions | |
ever | -0.067 |
free | -0.066 |
tow | -0.066 |
Sue | -0.066 |
Sally | -0.064 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
apr | +0.135 |
arre | +0.134 |
homework | +0.134 |
laptop | +0.133 |
chores | +0.131 |
Neg logit contributions | |
ever | -0.090 |
free | -0.085 |
p | -0.074 |
of | -0.073 |
fast | -0.069 |
Token | ? |
Token ID | 30 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.041 |
chores | +0.039 |
laptop | +0.039 |
apr | +0.038 |
Neg logit contributions | |
ever | -0.030 |
tow | -0.030 |
Sue | -0.029 |
free | -0.028 |
aroo | -0.026 |
Token | You |
Token ID | 921 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
ever | +0.002 |
free | +0.002 |
tow | +0.002 |
swoop | +0.002 |
pet | +0.002 |
Neg logit contributions | |
arre | -0.002 |
laptop | -0.002 |
homework | -0.002 |
means | -0.002 |
cuts | -0.002 |
Token | can |
Token ID | 460 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.032 |
chores | +0.030 |
laptop | +0.030 |
jobs | +0.029 |
Neg logit contributions | |
tow | -0.030 |
ever | -0.028 |
Sue | -0.027 |
free | -0.026 |
aroo | -0.026 |
Token | share |
Token ID | 2648 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ull | +0.015 |
tow | +0.015 |
itself | +0.014 |
Sage | +0.014 |
Frank | +0.014 |
Neg logit contributions | |
arre | -0.017 |
homework | -0.017 |
chores | -0.017 |
laptop | -0.014 |
argue | -0.014 |
Token | walked |
Token ID | 6807 |
Feature activation | +5.13e-03 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
idents | +0.007 |
Neg logit contributions | |
tow | -0.008 |
Sue | -0.007 |
Dove | -0.006 |
aroo | -0.006 |
ever | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | -1.83e-03 |
Pos logit contributions | |
tow | +0.007 |
ever | +0.006 |
Sue | +0.006 |
aroo | +0.006 |
free | +0.006 |
Neg logit contributions | |
arre | -0.011 |
homework | -0.009 |
chores | -0.009 |
laptop | -0.008 |
jobs | -0.008 |
Token | on |
Token ID | 319 |
Feature activation | -3.69e-03 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.004 |
chores | +0.004 |
laptop | +0.004 |
apr | +0.003 |
Neg logit contributions | |
tow | -0.002 |
ever | -0.002 |
aroo | -0.002 |
Sue | -0.002 |
free | -0.002 |
Token | us |
Token ID | 514 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
arre | +0.008 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
apr | +0.007 |
Neg logit contributions | |
tow | -0.004 |
ever | -0.004 |
aroo | -0.004 |
Sue | -0.004 |
free | -0.004 |
Token | qu |
Token ID | 627 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
arre | +0.041 |
homework | +0.036 |
chores | +0.035 |
laptop | +0.034 |
jobs | +0.034 |
Neg logit contributions | |
tow | -0.018 |
ever | -0.015 |
Sue | -0.015 |
aroo | -0.015 |
Dove | -0.015 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.80e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.006 |
chores | +0.003 |
laptop | +0.003 |
apr | +0.002 |
Neg logit contributions | |
tow | -0.072 |
ever | -0.071 |
free | -0.071 |
Sue | -0.069 |
pet | -0.068 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
homework | +0.157 |
laptop | +0.153 |
apr | +0.152 |
arre | +0.150 |
chores | +0.150 |
Neg logit contributions | |
ever | -0.087 |
free | -0.086 |
p | -0.071 |
of | -0.069 |
fast | -0.067 |
Token | and |
Token ID | 290 |
Feature activation | +2.21e-03 |
Pos logit contributions | |
arre | +0.031 |
homework | +0.028 |
chores | +0.027 |
laptop | +0.026 |
apr | +0.026 |
Neg logit contributions | |
tow | -0.012 |
ever | -0.012 |
Sue | -0.011 |
free | -0.011 |
aroo | -0.010 |
Token | heard |
Token ID | 2982 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
tow | +0.003 |
aroo | +0.003 |
ever | +0.003 |
Dove | +0.003 |
Sue | +0.003 |
Neg logit contributions | |
arre | -0.004 |
homework | -0.004 |
chores | -0.003 |
laptop | -0.003 |
idents | -0.003 |
Token | us |
Token ID | 514 |
Feature activation | +5.45e-04 |
Pos logit contributions | |
arre | +0.010 |
homework | +0.009 |
chores | +0.009 |
jobs | +0.008 |
ambul | +0.008 |
Neg logit contributions | |
tow | -0.006 |
ever | -0.005 |
aroo | -0.005 |
free | -0.005 |
Sue | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
tow | +0.001 |
Sue | +0.001 |
Dove | +0.001 |
aroo | +0.000 |
ever | +0.000 |
Neg logit contributions | |
arre | -0.001 |
homework | -0.001 |
chores | -0.001 |
laptop | -0.001 |
jobs | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
arre | +0.061 |
homework | +0.054 |
chores | +0.052 |
laptop | +0.051 |
apr | +0.050 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.018 |
Sue | -0.018 |
free | -0.016 |
pet | -0.015 |
Token | mess |
Token ID | 2085 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
cuts | +0.003 |
ambul | +0.003 |
laptops | +0.003 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
free | -0.005 |
pet | -0.005 |
Sue | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -5.60e-03 |
Pos logit contributions | |
arre | +0.079 |
homework | +0.071 |
chores | +0.068 |
laptop | +0.068 |
apr | +0.066 |
Neg logit contributions | |
tow | -0.033 |
ever | -0.032 |
Sue | -0.029 |
free | -0.029 |
aroo | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.012 |
chores | +0.012 |
apr | +0.011 |
laptop | +0.011 |
Neg logit contributions | |
tow | -0.005 |
ever | -0.005 |
Sue | -0.005 |
free | -0.005 |
pet | -0.004 |
Token | qu |
Token ID | 627 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
arre | +0.017 |
homework | +0.013 |
chores | +0.012 |
cuts | +0.012 |
ambul | +0.012 |
Neg logit contributions | |
tow | -0.019 |
ever | -0.019 |
free | -0.018 |
Sue | -0.018 |
pet | -0.018 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.48e-02 |
Pos logit contributions | |
arre | +0.051 |
homework | +0.047 |
chores | +0.044 |
laptop | +0.043 |
apr | +0.042 |
Neg logit contributions | |
ever | -0.057 |
tow | -0.057 |
free | -0.055 |
Sue | -0.054 |
aroo | -0.051 |
Token | ling |
Token ID | 1359 |
Feature activation | -5.87e-03 |
Pos logit contributions | |
arre | +0.144 |
homework | +0.139 |
apr | +0.133 |
chores | +0.129 |
aj | +0.129 |
Neg logit contributions | |
ever | -0.096 |
free | -0.093 |
of | -0.088 |
p | -0.079 |
tow | -0.078 |
Token | twins |
Token ID | 20345 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
arre | +0.012 |
homework | +0.010 |
chores | +0.009 |
laptop | +0.009 |
apr | +0.009 |
Neg logit contributions | |
ever | -0.008 |
tow | -0.008 |
free | -0.008 |
Sue | -0.008 |
Dove | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +7.80e-04 |
Pos logit contributions | |
arre | +0.052 |
homework | +0.047 |
laptop | +0.046 |
chores | +0.046 |
apr | +0.042 |
Neg logit contributions | |
tow | -0.020 |
Sue | -0.018 |
ever | -0.018 |
aroo | -0.018 |
Dove | -0.017 |
Token | She |
Token ID | 1375 |
Feature activation | -4.75e-03 |
Pos logit contributions | |
tow | +0.001 |
Sue | +0.001 |
ever | +0.001 |
free | +0.000 |
Sally | +0.000 |
Neg logit contributions | |
arre | -0.002 |
homework | -0.002 |
chores | -0.002 |
laptop | -0.002 |
apr | -0.002 |
Token | is |
Token ID | 318 |
Feature activation | +1.08e-03 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.008 |
chores | +0.008 |
apr | +0.008 |
laptop | +0.007 |
Neg logit contributions | |
tow | -0.007 |
ever | -0.007 |
Sue | -0.006 |
free | -0.006 |
pet | -0.006 |
Token | Why |
Token ID | 5195 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
arre | +0.004 |
homework | +0.003 |
ambul | +0.003 |
chores | +0.003 |
apr | +0.003 |
Neg logit contributions | |
tow | -0.003 |
ever | -0.003 |
free | -0.003 |
Sue | -0.003 |
aroo | -0.003 |
Token | are |
Token ID | 389 |
Feature activation | +8.90e-03 |
Pos logit contributions | |
arre | +0.037 |
homework | +0.031 |
apr | +0.030 |
laptop | +0.029 |
chores | +0.029 |
Neg logit contributions | |
ever | -0.031 |
tow | -0.030 |
Sue | -0.029 |
free | -0.028 |
Sally | -0.027 |
Token | you |
Token ID | 345 |
Feature activation | -4.81e-03 |
Pos logit contributions | |
tow | +0.011 |
ever | +0.010 |
free | +0.009 |
Sue | +0.009 |
aroo | +0.009 |
Neg logit contributions | |
arre | -0.019 |
homework | -0.018 |
chores | -0.017 |
laptop | -0.016 |
jobs | -0.016 |
Token | two |
Token ID | 734 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
arre | +0.009 |
homework | +0.007 |
chores | +0.007 |
laptop | +0.007 |
ambul | +0.006 |
Neg logit contributions | |
tow | -0.008 |
ever | -0.008 |
aroo | -0.007 |
Sue | -0.007 |
free | -0.007 |
Token | qu |
Token ID | 627 |
Feature activation | -3.28e-02 |
Pos logit contributions | |
arre | +0.047 |
homework | +0.042 |
chores | +0.041 |
laptop | +0.038 |
jobs | +0.038 |
Neg logit contributions | |
tow | -0.036 |
aroo | -0.033 |
Sue | -0.032 |
ever | -0.032 |
Dove | -0.031 |
Token | arre |
Token ID | 9624 |
Feature activation | -7.46e-02 |
Pos logit contributions | |
arre | +0.001 |
homework | -0.002 |
chores | -0.004 |
laptop | -0.005 |
apr | -0.006 |
Neg logit contributions | |
ever | -0.102 |
tow | -0.101 |
free | -0.100 |
Sue | -0.099 |
Sally | -0.097 |
Token | ling |
Token ID | 1359 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
homework | +0.130 |
arre | +0.129 |
apr | +0.129 |
laptop | +0.126 |
chores | +0.124 |
Neg logit contributions | |
ever | -0.102 |
free | -0.095 |
of | -0.084 |
p | -0.079 |
aroo | -0.078 |
Token | ? |
Token ID | 30 |
Feature activation | -7.71e-03 |
Pos logit contributions | |
arre | +0.045 |
homework | +0.039 |
chores | +0.038 |
laptop | +0.037 |
apr | +0.036 |
Neg logit contributions | |
tow | -0.031 |
ever | -0.030 |
free | -0.028 |
Sue | -0.028 |
aroo | -0.027 |
Token | There |
Token ID | 1318 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
arre | +0.014 |
homework | +0.011 |
laptop | +0.011 |
cuts | +0.010 |
means | +0.010 |
Neg logit contributions | |
ever | -0.012 |
tow | -0.012 |
free | -0.012 |
swoop | -0.012 |
Sue | -0.011 |
Token | are |
Token ID | 389 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
arre | +0.054 |
homework | +0.046 |
chores | +0.043 |
laptop | +0.042 |
jobs | +0.040 |
Neg logit contributions | |
tow | -0.054 |
ever | -0.053 |
free | -0.050 |
Sue | -0.050 |
aroo | -0.048 |
Token | plenty |
Token ID | 6088 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
arre | +0.006 |
homework | +0.005 |
chores | +0.005 |
jobs | +0.005 |
laptop | +0.005 |
Neg logit contributions | |
tow | -0.004 |
aroo | -0.004 |
ever | -0.004 |
Sue | -0.004 |
free | -0.004 |