Token | and |
Token ID | 290 |
Feature activation | +3.74e-02 |
Pos logit contributions | |
ays | +0.064 |
ocol | +0.057 |
unks | +0.057 |
rob | +0.056 |
ips | +0.055 |
Neg logit contributions | |
So | -0.034 |
friend | -0.034 |
kindly | -0.034 |
tutor | -0.033 |
forgive | -0.032 |
Token | fell |
Token ID | 3214 |
Feature activation | +3.37e-02 |
Pos logit contributions | |
ays | +0.080 |
ocol | +0.071 |
unks | +0.069 |
ips | +0.068 |
rob | +0.067 |
Neg logit contributions | |
forgive | -0.054 |
So | -0.053 |
friend | -0.052 |
little | -0.052 |
lder | -0.051 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
ays | +0.076 |
rob | +0.065 |
unks | +0.064 |
ips | +0.064 |
ocol | +0.063 |
Neg logit contributions | |
friend | -0.046 |
kindly | -0.045 |
So | -0.045 |
tutor | -0.044 |
lder | -0.044 |
Token | The |
Token ID | 383 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
ays | +0.046 |
rob | +0.042 |
ips | +0.040 |
unks | +0.040 |
ocol | +0.039 |
Neg logit contributions | |
So | -0.018 |
lder | -0.018 |
tutor | -0.018 |
kindly | -0.018 |
forgive | -0.018 |
Token | ash |
Token ID | 12530 |
Feature activation | +6.17e-02 |
Pos logit contributions | |
ays | +0.013 |
ips | +0.010 |
rob | +0.010 |
unks | +0.010 |
ions | +0.010 |
Neg logit contributions | |
lder | -0.009 |
friend | -0.009 |
So | -0.009 |
tutor | -0.009 |
kindly | -0.009 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ays | +0.117 |
rob | +0.098 |
ips | +0.097 |
unks | +0.096 |
ocol | +0.096 |
Neg logit contributions | |
friend | -0.105 |
lder | -0.104 |
So | -0.101 |
song | -0.101 |
kindly | -0.100 |
Token | ay |
Token ID | 323 |
Feature activation | +5.10e-02 |
Pos logit contributions | |
rob | +0.190 |
unks | +0.179 |
ocol | +0.179 |
ays | +0.176 |
matters | +0.169 |
Neg logit contributions | |
friend | -0.193 |
So | -0.189 |
kindly | -0.179 |
nd | -0.176 |
broken | -0.174 |
Token | flew |
Token ID | 13112 |
Feature activation | +4.44e-02 |
Pos logit contributions | |
ays | +0.088 |
unks | +0.076 |
ocol | +0.075 |
ips | +0.072 |
rob | +0.072 |
Neg logit contributions | |
lder | -0.092 |
friend | -0.087 |
So | -0.087 |
kindly | -0.087 |
nd | -0.086 |
Token | out |
Token ID | 503 |
Feature activation | +7.09e-03 |
Pos logit contributions | |
ays | +0.079 |
rob | +0.067 |
unks | +0.065 |
ips | +0.065 |
ocol | +0.062 |
Neg logit contributions | |
friend | -0.080 |
kindly | -0.080 |
So | -0.079 |
lder | -0.078 |
tutor | -0.078 |
Token | of |
Token ID | 286 |
Feature activation | +2.53e-02 |
Pos logit contributions | |
ays | +0.015 |
ips | +0.013 |
rob | +0.013 |
unks | +0.013 |
ions | +0.012 |
Neg logit contributions | |
lder | -0.010 |
friend | -0.010 |
tutor | -0.010 |
So | -0.010 |
kindly | -0.010 |
Token | her |
Token ID | 607 |
Feature activation | +1.61e-03 |
Pos logit contributions | |
ays | +0.053 |
rob | +0.045 |
ips | +0.044 |
unks | +0.044 |
plets | +0.043 |
Neg logit contributions | |
friend | -0.038 |
tutor | -0.038 |
kindly | -0.037 |
lder | -0.037 |
forgive | -0.037 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ays | +0.094 |
ips | +0.078 |
unks | +0.077 |
rob | +0.076 |
ions | +0.075 |
Neg logit contributions | |
lder | -0.061 |
So | -0.060 |
kindly | -0.059 |
tutor | -0.059 |
forgive | -0.059 |
Token | ay |
Token ID | 323 |
Feature activation | +2.86e-02 |
Pos logit contributions | |
ays | +0.161 |
rob | +0.157 |
unks | +0.147 |
ocol | +0.146 |
matters | +0.141 |
Neg logit contributions | |
friend | -0.196 |
So | -0.187 |
kindly | -0.183 |
keeper | -0.180 |
tutor | -0.179 |
Token | . |
Token ID | 13 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
ays | +0.073 |
ips | +0.064 |
rob | +0.063 |
unks | +0.063 |
ocol | +0.061 |
Neg logit contributions | |
lder | -0.030 |
friend | -0.029 |
kindly | -0.029 |
So | -0.029 |
tutor | -0.029 |
Token | The |
Token ID | 383 |
Feature activation | -3.04e-03 |
Pos logit contributions | |
ays | +0.031 |
ips | +0.026 |
unks | +0.026 |
rob | +0.025 |
ions | +0.025 |
Neg logit contributions | |
lder | -0.020 |
friend | -0.020 |
tutor | -0.020 |
So | -0.020 |
kindly | -0.020 |
Token | ash |
Token ID | 12530 |
Feature activation | +6.28e-02 |
Pos logit contributions | |
lder | +0.004 |
So | +0.004 |
kindly | +0.004 |
tutor | +0.004 |
hospitality | +0.004 |
Neg logit contributions | |
ays | -0.006 |
ocol | -0.005 |
ips | -0.005 |
rob | -0.005 |
unks | -0.005 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ays | +0.141 |
ips | +0.120 |
rob | +0.119 |
unks | +0.118 |
ions | +0.114 |
Neg logit contributions | |
lder | -0.086 |
friend | -0.085 |
So | -0.084 |
kindly | -0.083 |
tutor | -0.083 |
Token | ay |
Token ID | 323 |
Feature activation | +4.74e-02 |
Pos logit contributions | |
rob | +0.193 |
ays | +0.186 |
unks | +0.183 |
ocol | +0.173 |
matters | +0.169 |
Neg logit contributions | |
friend | -0.187 |
So | -0.181 |
kindly | -0.178 |
forgive | -0.173 |
keeper | -0.172 |
Token | fell |
Token ID | 3214 |
Feature activation | +3.72e-02 |
Pos logit contributions | |
ays | +0.103 |
ips | +0.088 |
unks | +0.087 |
rob | +0.087 |
ocol | +0.085 |
Neg logit contributions | |
lder | -0.069 |
friend | -0.068 |
kindly | -0.066 |
So | -0.065 |
forgive | -0.064 |
Token | down |
Token ID | 866 |
Feature activation | +7.21e-03 |
Pos logit contributions | |
ays | +0.069 |
rob | +0.056 |
ips | +0.056 |
unks | +0.056 |
ocol | +0.053 |
Neg logit contributions | |
friend | -0.065 |
lder | -0.065 |
kindly | -0.065 |
So | -0.064 |
tutor | -0.064 |
Token | and |
Token ID | 290 |
Feature activation | +3.34e-02 |
Pos logit contributions | |
ays | +0.018 |
ips | +0.016 |
rob | +0.015 |
ions | +0.015 |
unks | +0.015 |
Neg logit contributions | |
lder | -0.008 |
friend | -0.008 |
So | -0.008 |
tutor | -0.008 |
hospitality | -0.007 |
Token | broke |
Token ID | 6265 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
ays | +0.073 |
unks | +0.065 |
rob | +0.064 |
ips | +0.063 |
ocol | +0.062 |
Neg logit contributions | |
kindly | -0.050 |
friend | -0.049 |
little | -0.047 |
forgive | -0.047 |
tutor | -0.047 |
Token | . |
Token ID | 13 |
Feature activation | +7.04e-03 |
Pos logit contributions | |
ays | +0.056 |
rob | +0.051 |
unks | +0.050 |
ips | +0.050 |
ocol | +0.050 |
Neg logit contributions | |
kindly | -0.012 |
friend | -0.011 |
song | -0.010 |
So | -0.010 |
keeper | -0.010 |
Token | She |
Token ID | 1375 |
Feature activation | -8.54e-03 |
Pos logit contributions | |
ays | +0.018 |
rob | +0.016 |
ocol | +0.016 |
ips | +0.016 |
unks | +0.015 |
Neg logit contributions | |
So | -0.008 |
friend | -0.008 |
kindly | -0.008 |
tutor | -0.007 |
lder | -0.007 |
Token | put |
Token ID | 1234 |
Feature activation | +6.08e-02 |
Pos logit contributions | |
lder | +0.011 |
friend | +0.011 |
So | +0.011 |
kindly | +0.011 |
tutor | +0.011 |
Neg logit contributions | |
ays | -0.020 |
ips | -0.017 |
rob | -0.017 |
unks | -0.017 |
ions | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | +3.56e-02 |
Pos logit contributions | |
ays | +0.155 |
unks | +0.150 |
rob | +0.142 |
opl | +0.137 |
plets | +0.136 |
Neg logit contributions | |
little | -0.068 |
kindly | -0.062 |
forgive | -0.062 |
understanding | -0.060 |
friend | -0.060 |
Token | ash |
Token ID | 12530 |
Feature activation | +5.88e-02 |
Pos logit contributions | |
ays | +0.073 |
ips | +0.061 |
rob | +0.061 |
unks | +0.060 |
plets | +0.057 |
Neg logit contributions | |
friend | -0.060 |
lder | -0.057 |
forgive | -0.057 |
kindly | -0.056 |
song | -0.056 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
ays | +0.142 |
rob | +0.124 |
ips | +0.123 |
unks | +0.122 |
ocol | +0.120 |
Neg logit contributions | |
friend | -0.071 |
kindly | -0.068 |
So | -0.068 |
lder | -0.068 |
tutor | -0.067 |
Token | ay |
Token ID | 323 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
rob | +0.199 |
ays | +0.189 |
unks | +0.182 |
ocol | +0.177 |
matters | +0.171 |
Neg logit contributions | |
So | -0.183 |
friend | -0.182 |
kindly | -0.174 |
forgive | -0.168 |
keeper | -0.165 |
Token | up |
Token ID | 510 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
ays | +0.096 |
rob | +0.083 |
unks | +0.081 |
ocol | +0.080 |
ips | +0.079 |
Neg logit contributions | |
friend | -0.065 |
kindly | -0.064 |
So | -0.062 |
forgive | -0.062 |
song | -0.060 |
Token | close |
Token ID | 1969 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
ays | +0.028 |
ips | +0.024 |
unks | +0.023 |
rob | +0.023 |
ions | +0.023 |
Neg logit contributions | |
lder | -0.019 |
tutor | -0.018 |
So | -0.018 |
friend | -0.018 |
forgive | -0.017 |
Token | to |
Token ID | 284 |
Feature activation | +6.64e-03 |
Pos logit contributions | |
ays | +0.047 |
ips | +0.041 |
rob | +0.041 |
unks | +0.040 |
ions | +0.039 |
Neg logit contributions | |
lder | -0.016 |
friend | -0.016 |
kindly | -0.016 |
So | -0.016 |
tutor | -0.016 |
Token | her |
Token ID | 607 |
Feature activation | -2.79e-02 |
Pos logit contributions | |
ays | +0.017 |
rob | +0.014 |
ips | +0.014 |
unks | +0.014 |
plets | +0.013 |
Neg logit contributions | |
forgive | -0.009 |
kindly | -0.009 |
understanding | -0.009 |
friend | -0.008 |
lder | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.02e-03 |
Pos logit contributions | |
lder | +0.036 |
So | +0.035 |
tutor | +0.034 |
friend | +0.033 |
forgive | +0.033 |
Neg logit contributions | |
ays | -0.075 |
ips | -0.064 |
unks | -0.062 |
ions | -0.062 |
rob | -0.062 |
Token | He |
Token ID | 679 |
Feature activation | -5.38e-04 |
Pos logit contributions | |
kindly | +0.001 |
lder | +0.001 |
friend | +0.001 |
So | +0.001 |
tutor | +0.001 |
Neg logit contributions | |
ays | -0.003 |
rob | -0.002 |
ips | -0.002 |
unks | -0.002 |
plets | -0.002 |
Token | drops |
Token ID | 10532 |
Feature activation | +3.73e-02 |
Pos logit contributions | |
kindly | +0.001 |
friend | +0.001 |
So | +0.001 |
forgive | +0.001 |
lder | +0.001 |
Neg logit contributions | |
ays | -0.001 |
ips | -0.001 |
ions | -0.001 |
rob | -0.001 |
unks | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
ays | +0.089 |
rob | +0.088 |
unks | +0.082 |
plets | +0.081 |
ips | +0.077 |
Neg logit contributions | |
friend | -0.042 |
forgive | -0.041 |
kindly | -0.041 |
little | -0.040 |
keeper | -0.040 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.29e-02 |
Pos logit contributions | |
ays | +0.035 |
ips | +0.029 |
rob | +0.029 |
unks | +0.029 |
ions | +0.028 |
Neg logit contributions | |
lder | -0.026 |
friend | -0.025 |
tutor | -0.025 |
kindly | -0.025 |
So | -0.025 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
ays | +0.093 |
ips | +0.077 |
rob | +0.076 |
unks | +0.076 |
ions | +0.074 |
Neg logit contributions | |
lder | -0.063 |
friend | -0.062 |
So | -0.062 |
tutor | -0.062 |
kindly | -0.061 |
Token | ay |
Token ID | 323 |
Feature activation | +4.14e-02 |
Pos logit contributions | |
rob | +0.175 |
ays | +0.168 |
unks | +0.160 |
matters | +0.156 |
ocol | +0.153 |
Neg logit contributions | |
friend | -0.198 |
So | -0.192 |
kindly | -0.188 |
forgive | -0.181 |
keeper | -0.180 |
Token | . |
Token ID | 13 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
ays | +0.096 |
unks | +0.085 |
ips | +0.084 |
rob | +0.083 |
ocol | +0.082 |
Neg logit contributions | |
lder | -0.049 |
friend | -0.049 |
kindly | -0.048 |
So | -0.048 |
song | -0.047 |
Token | It |
Token ID | 632 |
Feature activation | +4.15e-02 |
Pos logit contributions | |
ays | +0.054 |
rob | +0.048 |
ips | +0.047 |
unks | +0.047 |
ocol | +0.045 |
Neg logit contributions | |
kindly | -0.023 |
So | -0.023 |
forgive | -0.023 |
lder | -0.022 |
tutor | -0.022 |
Token | breaks |
Token ID | 9457 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
ays | +0.073 |
rob | +0.067 |
unks | +0.066 |
ocol | +0.066 |
ips | +0.065 |
Neg logit contributions | |
friend | -0.071 |
kindly | -0.070 |
song | -0.070 |
So | -0.069 |
keeper | -0.068 |
Token | . |
Token ID | 13 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
ays | +0.067 |
rob | +0.062 |
ips | +0.058 |
unks | +0.058 |
plets | +0.057 |
Neg logit contributions | |
friend | -0.020 |
kindly | -0.020 |
So | -0.018 |
keeper | -0.017 |
tutor | -0.017 |
Token | was |
Token ID | 373 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
ays | +0.033 |
ips | +0.028 |
rob | +0.027 |
ocol | +0.027 |
unks | +0.027 |
Neg logit contributions | |
friend | -0.025 |
kindly | -0.025 |
lder | -0.025 |
forgive | -0.025 |
So | -0.024 |
Token | right |
Token ID | 826 |
Feature activation | -6.89e-03 |
Pos logit contributions | |
ays | +0.097 |
rob | +0.083 |
unks | +0.082 |
plets | +0.082 |
ips | +0.081 |
Neg logit contributions | |
friend | -0.038 |
kindly | -0.038 |
understanding | -0.037 |
forgive | -0.036 |
tutor | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
lder | +0.009 |
So | +0.009 |
Days | +0.009 |
tutor | +0.009 |
tune | +0.009 |
Neg logit contributions | |
ays | -0.016 |
ips | -0.013 |
unks | -0.013 |
ions | -0.013 |
ocol | -0.012 |
Token | The |
Token ID | 383 |
Feature activation | +7.96e-04 |
Pos logit contributions | |
ays | +0.057 |
rob | +0.050 |
ips | +0.048 |
unks | +0.047 |
plets | +0.046 |
Neg logit contributions | |
So | -0.037 |
lder | -0.036 |
forgive | -0.036 |
kindly | -0.036 |
tutor | -0.036 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.76e-02 |
Pos logit contributions | |
ays | +0.002 |
ips | +0.002 |
ocol | +0.002 |
unks | +0.002 |
rob | +0.002 |
Neg logit contributions | |
lder | -0.001 |
So | -0.001 |
kindly | -0.001 |
Days | -0.001 |
broken | -0.001 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
ays | +0.108 |
ips | +0.091 |
rob | +0.090 |
unks | +0.089 |
ions | +0.088 |
Neg logit contributions | |
lder | -0.064 |
So | -0.063 |
tutor | -0.062 |
kindly | -0.062 |
friend | -0.061 |
Token | ay |
Token ID | 323 |
Feature activation | +3.97e-02 |
Pos logit contributions | |
ays | +0.168 |
rob | +0.168 |
unks | +0.165 |
ocol | +0.160 |
matters | +0.153 |
Neg logit contributions | |
friend | -0.197 |
forgive | -0.188 |
So | -0.188 |
kindly | -0.187 |
keeper | -0.185 |
Token | is |
Token ID | 318 |
Feature activation | +4.22e-02 |
Pos logit contributions | |
ays | +0.074 |
unks | +0.061 |
ips | +0.060 |
rob | +0.060 |
ocol | +0.059 |
Neg logit contributions | |
lder | -0.069 |
friend | -0.069 |
kindly | -0.068 |
forgive | -0.067 |
So | -0.066 |
Token | not |
Token ID | 407 |
Feature activation | +3.08e-02 |
Pos logit contributions | |
ays | +0.116 |
rob | +0.103 |
ips | +0.101 |
unks | +0.100 |
plets | +0.097 |
Neg logit contributions | |
friend | -0.041 |
kindly | -0.041 |
forgive | -0.039 |
understanding | -0.039 |
tutor | -0.038 |
Token | for |
Token ID | 329 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
ays | +0.073 |
ips | +0.063 |
rob | +0.062 |
unks | +0.062 |
plets | +0.060 |
Neg logit contributions | |
friend | -0.040 |
kindly | -0.039 |
lder | -0.038 |
tutor | -0.038 |
forgive | -0.038 |
Token | kids |
Token ID | 3988 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
ays | +0.026 |
rob | +0.022 |
ips | +0.022 |
unks | +0.022 |
plets | +0.021 |
Neg logit contributions | |
lder | -0.018 |
friend | -0.018 |
tutor | -0.018 |
kindly | -0.018 |
So | -0.018 |
Token | sun |
Token ID | 4252 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
kindly | +0.003 |
friend | +0.003 |
lder | +0.003 |
song | +0.003 |
forgive | +0.003 |
Neg logit contributions | |
ays | -0.007 |
rob | -0.006 |
ips | -0.006 |
unks | -0.006 |
chairs | -0.006 |
Token | fl |
Token ID | 2704 |
Feature activation | +7.94e-02 |
Pos logit contributions | |
ays | +0.050 |
rob | +0.043 |
ips | +0.042 |
unks | +0.041 |
chairs | +0.041 |
Neg logit contributions | |
friend | -0.033 |
lder | -0.032 |
song | -0.031 |
kindly | -0.031 |
So | -0.030 |
Token | owers |
Token ID | 3618 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
ays | +0.139 |
chairs | +0.119 |
rob | +0.118 |
izz | +0.118 |
plets | +0.116 |
Neg logit contributions | |
lder | -0.132 |
friend | -0.120 |
So | -0.119 |
nd | -0.117 |
birthday | -0.116 |
Token | , |
Token ID | 11 |
Feature activation | -3.04e-03 |
Pos logit contributions | |
ays | +0.077 |
rob | +0.069 |
ips | +0.067 |
unks | +0.065 |
chairs | +0.065 |
Neg logit contributions | |
kindly | -0.029 |
friend | -0.029 |
lder | -0.028 |
forgive | -0.027 |
So | -0.027 |
Token | and |
Token ID | 290 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
kindly | +0.003 |
friend | +0.003 |
lder | +0.003 |
song | +0.003 |
forgive | +0.003 |
Neg logit contributions | |
ays | -0.008 |
rob | -0.007 |
ips | -0.007 |
unks | -0.007 |
chairs | -0.007 |
Token | tul |
Token ID | 48373 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
ays | +0.043 |
rob | +0.038 |
ips | +0.037 |
unks | +0.037 |
izz | +0.035 |
Neg logit contributions | |
kindly | -0.025 |
friend | -0.025 |
understanding | -0.024 |
song | -0.024 |
forgive | -0.024 |
Token | ips |
Token ID | 2419 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
ays | +0.132 |
chairs | +0.130 |
matters | +0.128 |
rob | +0.121 |
involved | +0.120 |
Neg logit contributions | |
lder | -0.214 |
nd | -0.202 |
friend | -0.198 |
kindly | -0.196 |
So | -0.194 |
Token | . |
Token ID | 13 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
ays | +0.097 |
rob | +0.089 |
ips | +0.085 |
unks | +0.084 |
ocol | +0.083 |
Neg logit contributions | |
friend | -0.049 |
kindly | -0.049 |
So | -0.046 |
song | -0.045 |
lder | -0.045 |
Token | They |
Token ID | 1119 |
Feature activation | +8.48e-03 |
Pos logit contributions | |
ays | +0.041 |
rob | +0.036 |
ips | +0.036 |
unks | +0.035 |
plets | +0.034 |
Neg logit contributions | |
So | -0.020 |
kindly | -0.020 |
friend | -0.020 |
lder | -0.020 |
forgive | -0.020 |
Token | see |
Token ID | 766 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
ays | +0.020 |
rob | +0.017 |
ips | +0.017 |
unks | +0.016 |
ions | +0.016 |
Neg logit contributions | |
forgive | -0.012 |
friend | -0.012 |
lder | -0.012 |
kindly | -0.012 |
So | -0.011 |
Token | pine |
Token ID | 20161 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
ays | +0.032 |
ips | +0.029 |
rob | +0.028 |
unks | +0.028 |
plets | +0.027 |
Neg logit contributions | |
friend | -0.021 |
kindly | -0.021 |
little | -0.020 |
So | -0.020 |
song | -0.020 |
Token | no |
Token ID | 645 |
Feature activation | -3.29e-03 |
Pos logit contributions | |
lder | +0.006 |
friend | +0.006 |
So | +0.006 |
tutor | +0.006 |
kindly | +0.006 |
Neg logit contributions | |
ays | -0.017 |
ips | -0.014 |
rob | -0.014 |
unks | -0.014 |
ions | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
lder | +0.004 |
tutor | +0.004 |
So | +0.004 |
kindly | +0.004 |
forgive | +0.004 |
Neg logit contributions | |
ays | -0.008 |
ips | -0.007 |
rob | -0.006 |
chairs | -0.006 |
unks | -0.006 |
Token | because |
Token ID | 780 |
Feature activation | +3.54e-02 |
Pos logit contributions | |
kindly | +0.022 |
understanding | +0.022 |
So | +0.021 |
forgive | +0.020 |
song | +0.020 |
Neg logit contributions | |
ays | -0.067 |
rob | -0.059 |
unks | -0.059 |
ips | -0.058 |
plets | -0.055 |
Token | the |
Token ID | 262 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
ays | +0.085 |
rob | +0.079 |
plets | +0.074 |
unks | +0.074 |
ips | +0.073 |
Neg logit contributions | |
friend | -0.054 |
little | -0.049 |
tutor | -0.049 |
kindly | -0.048 |
understanding | -0.047 |
Token | ash |
Token ID | 12530 |
Feature activation | +5.53e-02 |
Pos logit contributions | |
ays | +0.028 |
ips | +0.023 |
rob | +0.022 |
unks | +0.022 |
plets | +0.021 |
Neg logit contributions | |
friend | -0.024 |
lder | -0.023 |
forgive | -0.022 |
kindly | -0.022 |
tutor | -0.022 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
ays | +0.143 |
ips | +0.126 |
rob | +0.126 |
ocol | +0.125 |
unks | +0.123 |
Neg logit contributions | |
friend | -0.063 |
keeper | -0.059 |
song | -0.057 |
lder | -0.057 |
kindly | -0.056 |
Token | ay |
Token ID | 323 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
rob | +0.188 |
ays | +0.178 |
unks | +0.175 |
ocol | +0.172 |
matters | +0.168 |
Neg logit contributions | |
friend | -0.179 |
So | -0.169 |
kindly | -0.167 |
keeper | -0.166 |
birthday | -0.162 |
Token | was |
Token ID | 373 |
Feature activation | +3.80e-02 |
Pos logit contributions | |
ays | +0.108 |
ips | +0.096 |
unks | +0.095 |
rob | +0.094 |
ocol | +0.094 |
Neg logit contributions | |
friend | -0.052 |
kindly | -0.048 |
lder | -0.048 |
keeper | -0.047 |
forgive | -0.046 |
Token | not |
Token ID | 407 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
ays | +0.098 |
rob | +0.091 |
ips | +0.084 |
unks | +0.084 |
plets | +0.082 |
Neg logit contributions | |
friend | -0.045 |
kindly | -0.045 |
understanding | -0.043 |
forgive | -0.041 |
little | -0.041 |
Token | a |
Token ID | 257 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ays | +0.055 |
rob | +0.047 |
unks | +0.047 |
ips | +0.046 |
plets | +0.045 |
Neg logit contributions | |
friend | -0.030 |
kindly | -0.029 |
understanding | -0.029 |
forgive | -0.028 |
song | -0.028 |
Token | toy |
Token ID | 13373 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
lder | +0.035 |
So | +0.034 |
hospitality | +0.032 |
kindly | +0.032 |
tutor | +0.031 |
Neg logit contributions | |
ays | -0.043 |
ocol | -0.037 |
rob | -0.037 |
lands | -0.036 |
unks | -0.036 |
Token | her |
Token ID | 607 |
Feature activation | +2.85e-03 |
Pos logit contributions | |
ays | +0.008 |
rob | +0.006 |
unks | +0.006 |
ips | +0.006 |
plets | +0.006 |
Neg logit contributions | |
tutor | -0.006 |
friend | -0.006 |
lder | -0.006 |
kindly | -0.005 |
understanding | -0.005 |
Token | house |
Token ID | 2156 |
Feature activation | -4.11e-03 |
Pos logit contributions | |
ays | +0.007 |
ips | +0.006 |
rob | +0.006 |
unks | +0.006 |
ions | +0.005 |
Neg logit contributions | |
lder | -0.004 |
So | -0.004 |
kindly | -0.004 |
forgive | -0.004 |
friend | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
lder | +0.004 |
So | +0.004 |
friend | +0.004 |
tutor | +0.004 |
kindly | +0.004 |
Neg logit contributions | |
ays | -0.011 |
ips | -0.009 |
unks | -0.009 |
rob | -0.009 |
ions | -0.009 |
Token | The |
Token ID | 383 |
Feature activation | +4.81e-03 |
Pos logit contributions | |
ays | +0.043 |
rob | +0.041 |
unks | +0.037 |
ocol | +0.037 |
ips | +0.036 |
Neg logit contributions | |
So | -0.022 |
little | -0.022 |
friend | -0.021 |
kindly | -0.021 |
Her | -0.021 |
Token | light |
Token ID | 1657 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
ays | +0.010 |
ips | +0.008 |
rob | +0.008 |
unks | +0.008 |
ions | +0.008 |
Neg logit contributions | |
So | -0.007 |
lder | -0.007 |
kindly | -0.007 |
forgive | -0.007 |
understanding | -0.006 |
Token | bul |
Token ID | 15065 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ays | +0.085 |
rob | +0.075 |
ips | +0.074 |
unks | +0.073 |
ocol | +0.071 |
Neg logit contributions | |
friend | -0.058 |
song | -0.055 |
tutor | -0.055 |
lder | -0.055 |
kindly | -0.054 |
Token | b |
Token ID | 65 |
Feature activation | +5.63e-02 |
Pos logit contributions | |
ays | +0.159 |
unks | +0.140 |
ips | +0.138 |
ocol | +0.136 |
marsh | +0.131 |
Neg logit contributions | |
broken | -0.222 |
kindly | -0.221 |
friend | -0.220 |
forgive | -0.214 |
understanding | -0.212 |
Token | stopped |
Token ID | 5025 |
Feature activation | +4.95e-03 |
Pos logit contributions | |
ays | +0.090 |
rob | +0.087 |
ocol | +0.083 |
ips | +0.074 |
unks | +0.072 |
Neg logit contributions | |
friend | -0.110 |
lder | -0.107 |
kindly | -0.104 |
broken | -0.101 |
forgive | -0.101 |
Token | working |
Token ID | 1762 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
ays | +0.012 |
rob | +0.011 |
ips | +0.011 |
unks | +0.010 |
plets | +0.010 |
Neg logit contributions | |
friend | -0.006 |
kindly | -0.006 |
lder | -0.005 |
forgive | -0.005 |
So | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
ays | +0.050 |
ips | +0.043 |
unks | +0.043 |
rob | +0.043 |
ocol | +0.042 |
Neg logit contributions | |
kindly | -0.017 |
friend | -0.016 |
lder | -0.016 |
tutor | -0.016 |
So | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | -9.69e-03 |
Pos logit contributions | |
ays | +0.044 |
rob | +0.042 |
ocol | +0.040 |
unks | +0.039 |
ions | +0.038 |
Neg logit contributions | |
So | -0.023 |
little | -0.021 |
friend | -0.021 |
kindly | -0.021 |
forgive | -0.020 |
Token | show |
Token ID | 905 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
friend | +0.038 |
lder | +0.037 |
tutor | +0.037 |
forgive | +0.037 |
So | +0.036 |
Neg logit contributions | |
ays | -0.079 |
ips | -0.067 |
rob | -0.067 |
unks | -0.066 |
plets | -0.065 |
Token | her |
Token ID | 607 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
ays | +0.031 |
rob | +0.027 |
plets | +0.027 |
ips | +0.026 |
unks | +0.026 |
Neg logit contributions | |
friend | -0.018 |
kindly | -0.017 |
forgive | -0.017 |
tutor | -0.017 |
understanding | -0.017 |
Token | an |
Token ID | 281 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
friend | +0.021 |
lder | +0.021 |
tutor | +0.020 |
kindly | +0.020 |
So | +0.020 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.042 |
rob | -0.042 |
unks | -0.042 |
plets | -0.041 |
Token | expensive |
Token ID | 5789 |
Feature activation | +6.94e-03 |
Pos logit contributions | |
lder | +0.005 |
So | +0.005 |
forgive | +0.004 |
kindly | +0.004 |
tutor | +0.004 |
Neg logit contributions | |
ays | -0.007 |
unks | -0.006 |
ions | -0.006 |
ocol | -0.006 |
rob | -0.006 |
Token | ash |
Token ID | 12530 |
Feature activation | +3.41e-02 |
Pos logit contributions | |
ays | +0.016 |
ips | +0.014 |
rob | +0.014 |
unks | +0.014 |
plets | +0.013 |
Neg logit contributions | |
friend | -0.009 |
tutor | -0.009 |
lder | -0.009 |
kindly | -0.009 |
forgive | -0.008 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ays | +0.085 |
ips | +0.074 |
rob | +0.073 |
unks | +0.073 |
ocol | +0.071 |
Neg logit contributions | |
friend | -0.038 |
lder | -0.038 |
tutor | -0.037 |
kindly | -0.037 |
So | -0.037 |
Token | ay |
Token ID | 323 |
Feature activation | +2.63e-02 |
Pos logit contributions | |
rob | +0.182 |
ays | +0.179 |
ocol | +0.167 |
unks | +0.166 |
matters | +0.162 |
Neg logit contributions | |
friend | -0.193 |
keeper | -0.180 |
So | -0.180 |
kindly | -0.177 |
keeper | -0.173 |
Token | he |
Token ID | 339 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
ays | +0.070 |
ips | +0.062 |
rob | +0.061 |
unks | +0.061 |
plets | +0.060 |
Neg logit contributions | |
kindly | -0.025 |
friend | -0.024 |
lder | -0.024 |
tutor | -0.023 |
keeper | -0.023 |
Token | got |
Token ID | 1392 |
Feature activation | +4.49e-02 |
Pos logit contributions | |
ays | +0.029 |
ips | +0.024 |
rob | +0.024 |
unks | +0.024 |
ions | +0.023 |
Neg logit contributions | |
lder | -0.017 |
friend | -0.017 |
kindly | -0.017 |
So | -0.017 |
tutor | -0.016 |
Token | as |
Token ID | 355 |
Feature activation | +3.21e-02 |
Pos logit contributions | |
ays | +0.109 |
rob | +0.100 |
ips | +0.094 |
unks | +0.092 |
plets | +0.089 |
Neg logit contributions | |
kindly | -0.059 |
friend | -0.057 |
understanding | -0.055 |
forgive | -0.055 |
keeper | -0.054 |
Token | a |
Token ID | 257 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
ays | +0.081 |
rob | +0.070 |
ips | +0.069 |
unks | +0.068 |
plets | +0.065 |
Neg logit contributions | |
kindly | -0.043 |
friend | -0.042 |
understanding | -0.041 |
tutor | -0.039 |
little | -0.039 |
Token | Maybe |
Token ID | 6674 |
Feature activation | -1.26e-03 |
Pos logit contributions | |
ays | +0.005 |
rob | +0.004 |
ips | +0.004 |
unks | +0.004 |
plets | +0.004 |
Neg logit contributions | |
lder | -0.003 |
friend | -0.003 |
So | -0.003 |
kindly | -0.003 |
tutor | -0.003 |
Token | we |
Token ID | 356 |
Feature activation | -7.57e-04 |
Pos logit contributions | |
friend | +0.002 |
kindly | +0.002 |
tutor | +0.002 |
So | +0.002 |
lder | +0.002 |
Neg logit contributions | |
ays | -0.003 |
ips | -0.002 |
unks | -0.002 |
rob | -0.002 |
plets | -0.002 |
Token | can |
Token ID | 460 |
Feature activation | -3.74e-02 |
Pos logit contributions | |
lder | +0.001 |
friend | +0.001 |
So | +0.001 |
tutor | +0.001 |
kindly | +0.001 |
Neg logit contributions | |
ays | -0.001 |
ips | -0.001 |
rob | -0.001 |
unks | -0.001 |
ions | -0.001 |
Token | repair |
Token ID | 9185 |
Feature activation | +4.25e-02 |
Pos logit contributions | |
lder | +0.052 |
tutor | +0.051 |
Days | +0.049 |
tune | +0.049 |
hospitality | +0.048 |
Neg logit contributions | |
ays | -0.078 |
ips | -0.067 |
unks | -0.067 |
ions | -0.062 |
rob | -0.062 |
Token | the |
Token ID | 262 |
Feature activation | +4.27e-03 |
Pos logit contributions | |
ays | +0.093 |
rol | +0.088 |
plets | +0.087 |
ips | +0.086 |
izz | +0.084 |
Neg logit contributions | |
friend | -0.057 |
kindly | -0.055 |
who | -0.055 |
little | -0.054 |
tutor | -0.053 |
Token | kay |
Token ID | 34681 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ays | +0.009 |
ips | +0.008 |
rob | +0.008 |
unks | +0.008 |
ions | +0.008 |
Neg logit contributions | |
friend | -0.006 |
tutor | -0.006 |
lder | -0.006 |
kindly | -0.006 |
forgive | -0.006 |
Token | ak |
Token ID | 461 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
ays | +0.215 |
rob | +0.177 |
ocol | +0.177 |
chairs | +0.176 |
spins | +0.175 |
Neg logit contributions | |
friend | -0.178 |
So | -0.175 |
forgive | -0.170 |
kindly | -0.165 |
broken | -0.165 |
Token | ." |
Token ID | 526 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
ays | +0.065 |
rob | +0.058 |
ips | +0.057 |
unks | +0.056 |
ocol | +0.055 |
Neg logit contributions | |
friend | -0.029 |
kindly | -0.028 |
So | -0.028 |
lder | -0.028 |
forgive | -0.027 |
Token |
|
Token ID | 198 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
lder | +0.023 |
Days | +0.022 |
song | +0.022 |
tune | +0.022 |
hospitality | +0.022 |
Neg logit contributions | |
ays | -0.034 |
ips | -0.029 |
unks | -0.028 |
rob | -0.028 |
ions | -0.027 |
Token |
|
Token ID | 198 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
lder | +0.028 |
tutor | +0.027 |
tune | +0.026 |
hospitality | +0.026 |
song | +0.026 |
Neg logit contributions | |
ays | -0.039 |
ips | -0.033 |
unks | -0.033 |
rob | -0.032 |
izz | -0.032 |
Token | They |
Token ID | 2990 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
hospitality | +0.032 |
birthday | +0.031 |
lder | +0.031 |
doorstep | +0.030 |
friend | +0.030 |
Neg logit contributions | |
ays | -0.044 |
izz | -0.042 |
ions | -0.041 |
unks | -0.041 |
ips | -0.040 |
Token | decided |
Token ID | 3066 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
lder | +0.006 |
friend | +0.006 |
So | +0.006 |
kindly | +0.006 |
tutor | +0.006 |
Neg logit contributions | |
ays | -0.014 |
ips | -0.012 |
rob | -0.012 |
unks | -0.012 |
ions | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -4.76e-02 |
Pos logit contributions | |
lder | +0.038 |
tutor | +0.035 |
So | +0.035 |
friend | +0.034 |
forgive | +0.034 |
Neg logit contributions | |
ays | -0.079 |
ips | -0.069 |
rob | -0.068 |
unks | -0.067 |
ions | -0.067 |
Token | put |
Token ID | 1234 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
lder | +0.056 |
friend | +0.055 |
So | +0.054 |
tutor | +0.054 |
kindly | +0.054 |
Neg logit contributions | |
ays | -0.116 |
ips | -0.100 |
rob | -0.099 |
unks | -0.098 |
ions | -0.096 |
Token | the |
Token ID | 262 |
Feature activation | +2.98e-02 |
Pos logit contributions | |
ays | +0.153 |
plets | +0.152 |
unks | +0.137 |
rol | +0.135 |
pill | +0.133 |
Neg logit contributions | |
friend | -0.063 |
little | -0.053 |
kindly | -0.052 |
forgive | -0.051 |
who | -0.050 |
Token | ash |
Token ID | 12530 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
ays | +0.056 |
ips | +0.046 |
rob | +0.045 |
unks | +0.045 |
ions | +0.043 |
Neg logit contributions | |
friend | -0.053 |
lder | -0.052 |
kindly | -0.051 |
So | -0.051 |
tutor | -0.051 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ays | +0.125 |
ips | +0.107 |
rob | +0.107 |
unks | +0.106 |
ocol | +0.103 |
Neg logit contributions | |
friend | -0.065 |
lder | -0.064 |
kindly | -0.063 |
So | -0.063 |
tutor | -0.063 |
Token | ay |
Token ID | 323 |
Feature activation | +4.59e-02 |
Pos logit contributions | |
rob | +0.183 |
ays | +0.181 |
unks | +0.172 |
ocol | +0.166 |
matters | +0.162 |
Neg logit contributions | |
friend | -0.189 |
So | -0.182 |
kindly | -0.177 |
forgive | -0.176 |
keeper | -0.172 |
Token | down |
Token ID | 866 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
ays | +0.096 |
unks | +0.081 |
rob | +0.081 |
ocol | +0.079 |
ips | +0.079 |
Neg logit contributions | |
friend | -0.073 |
kindly | -0.070 |
forgive | -0.069 |
tutor | -0.067 |
So | -0.067 |
Token | and |
Token ID | 290 |
Feature activation | +7.00e-03 |
Pos logit contributions | |
ays | +0.036 |
rob | +0.031 |
ips | +0.030 |
unks | +0.030 |
plets | +0.030 |
Neg logit contributions | |
kindly | -0.018 |
friend | -0.017 |
So | -0.017 |
forgive | -0.017 |
tutor | -0.017 |
Token | go |
Token ID | 467 |
Feature activation | -7.92e-03 |
Pos logit contributions | |
ays | +0.019 |
rob | +0.016 |
ips | +0.016 |
unks | +0.016 |
ocol | +0.016 |
Neg logit contributions | |
friend | -0.009 |
kindly | -0.008 |
forgive | -0.008 |
tutor | -0.008 |
song | -0.008 |
Token | outside |
Token ID | 2354 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
friend | +0.010 |
recommendation | +0.009 |
kindly | +0.009 |
forgive | +0.009 |
tutor | +0.008 |
Neg logit contributions | |
ays | -0.021 |
ocol | -0.018 |
plets | -0.017 |
rob | -0.017 |
unks | -0.017 |
Token | The |
Token ID | 383 |
Feature activation | +4.60e-03 |
Pos logit contributions | |
ays | +0.050 |
ips | +0.041 |
rob | +0.040 |
unks | +0.039 |
lands | +0.038 |
Neg logit contributions | |
broken | -0.039 |
forgive | -0.038 |
understanding | -0.038 |
lder | -0.038 |
Days | -0.037 |
Token | house |
Token ID | 2156 |
Feature activation | +3.18e-02 |
Pos logit contributions | |
ays | +0.005 |
lands | +0.004 |
ained | +0.004 |
ips | +0.004 |
patches | +0.004 |
Neg logit contributions | |
hospitality | -0.010 |
broken | -0.010 |
kindly | -0.010 |
tutor | -0.010 |
lder | -0.010 |
Token | had |
Token ID | 550 |
Feature activation | +3.86e-02 |
Pos logit contributions | |
ays | +0.072 |
ips | +0.061 |
rob | +0.061 |
unks | +0.061 |
ocol | +0.060 |
Neg logit contributions | |
friend | -0.044 |
lder | -0.044 |
kindly | -0.043 |
forgive | -0.042 |
So | -0.042 |
Token | an |
Token ID | 281 |
Feature activation | +6.42e-03 |
Pos logit contributions | |
ays | +0.076 |
ips | +0.063 |
rob | +0.062 |
unks | +0.061 |
ions | +0.060 |
Neg logit contributions | |
lder | -0.062 |
tutor | -0.061 |
kindly | -0.061 |
So | -0.061 |
friend | -0.061 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
ays | +0.013 |
ips | +0.011 |
unks | +0.011 |
rob | +0.011 |
ocol | +0.010 |
Neg logit contributions | |
So | -0.010 |
lder | -0.010 |
forgive | -0.010 |
kindly | -0.010 |
tutor | -0.010 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ays | +0.086 |
ips | +0.071 |
unks | +0.071 |
rob | +0.071 |
plets | +0.069 |
Neg logit contributions | |
So | -0.059 |
lder | -0.059 |
kindly | -0.058 |
tutor | -0.058 |
forgive | -0.058 |
Token | ay |
Token ID | 323 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
rob | +0.183 |
ays | +0.177 |
unks | +0.167 |
ocol | +0.165 |
matters | +0.160 |
Neg logit contributions | |
friend | -0.188 |
So | -0.175 |
kindly | -0.175 |
keeper | -0.171 |
tutor | -0.171 |
Token | outside |
Token ID | 2354 |
Feature activation | +8.84e-03 |
Pos logit contributions | |
ays | +0.067 |
rob | +0.057 |
ips | +0.057 |
unks | +0.056 |
plets | +0.054 |
Neg logit contributions | |
lder | -0.038 |
friend | -0.038 |
kindly | -0.037 |
tutor | -0.037 |
So | -0.037 |
Token | where |
Token ID | 810 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
ays | +0.020 |
rob | +0.018 |
ips | +0.018 |
unks | +0.017 |
plets | +0.017 |
Neg logit contributions | |
friend | -0.012 |
lder | -0.012 |
kindly | -0.012 |
So | -0.011 |
song | -0.011 |
Token | people |
Token ID | 661 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
ays | +0.071 |
ips | +0.061 |
unks | +0.060 |
rob | +0.059 |
ocol | +0.057 |
Neg logit contributions | |
friend | -0.049 |
kindly | -0.048 |
lder | -0.048 |
song | -0.047 |
little | -0.047 |
Token | put |
Token ID | 1234 |
Feature activation | +5.34e-02 |
Pos logit contributions | |
ays | +0.034 |
ips | +0.029 |
rob | +0.029 |
unks | +0.029 |
ocol | +0.027 |
Neg logit contributions | |
forgive | -0.020 |
kindly | -0.020 |
lder | -0.020 |
friend | -0.020 |
So | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
lder | +0.033 |
So | +0.033 |
tutor | +0.032 |
kindly | +0.031 |
recommendation | +0.031 |
Neg logit contributions | |
ays | -0.078 |
rob | -0.068 |
unks | -0.067 |
ips | -0.067 |
ions | -0.066 |
Token | He |
Token ID | 679 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
ays | +0.062 |
ips | +0.051 |
rob | +0.051 |
unks | +0.050 |
ions | +0.049 |
Neg logit contributions | |
lder | -0.044 |
friend | -0.043 |
So | -0.043 |
kindly | -0.043 |
tutor | -0.043 |
Token | had |
Token ID | 550 |
Feature activation | +2.83e-02 |
Pos logit contributions | |
lder | +0.018 |
friend | +0.018 |
tutor | +0.018 |
So | +0.018 |
kindly | +0.018 |
Neg logit contributions | |
ays | -0.029 |
ips | -0.025 |
rob | -0.025 |
unks | -0.024 |
ions | -0.024 |
Token | an |
Token ID | 281 |
Feature activation | +1.88e-03 |
Pos logit contributions | |
ays | +0.074 |
ips | +0.063 |
rob | +0.062 |
unks | +0.062 |
ocol | +0.060 |
Neg logit contributions | |
friend | -0.037 |
understanding | -0.033 |
song | -0.033 |
little | -0.033 |
kindly | -0.033 |
Token | ash |
Token ID | 12530 |
Feature activation | +3.67e-02 |
Pos logit contributions | |
ays | +0.004 |
ips | +0.003 |
rob | +0.003 |
unks | +0.003 |
ions | +0.003 |
Neg logit contributions | |
lder | -0.003 |
friend | -0.003 |
So | -0.003 |
kindly | -0.003 |
tutor | -0.003 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.079 |
rob | +0.066 |
ips | +0.066 |
unks | +0.066 |
ions | +0.064 |
Neg logit contributions | |
lder | -0.053 |
So | -0.052 |
kindly | -0.051 |
understanding | -0.051 |
forgive | -0.051 |
Token | ay |
Token ID | 323 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
rob | +0.200 |
ays | +0.179 |
unks | +0.174 |
matters | +0.171 |
ocol | +0.170 |
Neg logit contributions | |
friend | -0.178 |
tutor | -0.163 |
kindly | -0.163 |
So | -0.161 |
forgive | -0.155 |
Token | that |
Token ID | 326 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
ays | +0.048 |
ips | +0.040 |
rob | +0.040 |
unks | +0.040 |
plets | +0.038 |
Neg logit contributions | |
friend | -0.034 |
lder | -0.034 |
tutor | -0.033 |
kindly | -0.033 |
So | -0.033 |
Token | could |
Token ID | 714 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
ays | +0.145 |
ips | +0.126 |
ocol | +0.123 |
plets | +0.123 |
unks | +0.122 |
Neg logit contributions | |
friend | -0.064 |
forgive | -0.060 |
kindly | -0.060 |
keeper | -0.060 |
kind | -0.058 |
Token | zip |
Token ID | 19974 |
Feature activation | +3.60e-02 |
Pos logit contributions | |
lder | +0.036 |
friend | +0.035 |
So | +0.035 |
tutor | +0.035 |
kindly | +0.035 |
Neg logit contributions | |
ays | -0.063 |
ips | -0.053 |
rob | -0.053 |
unks | -0.053 |
ions | -0.051 |
Token | around |
Token ID | 1088 |
Feature activation | -9.87e-03 |
Pos logit contributions | |
ays | +0.097 |
ips | +0.086 |
rob | +0.083 |
ocol | +0.083 |
unks | +0.083 |
Neg logit contributions | |
kindly | -0.042 |
little | -0.038 |
friend | -0.038 |
politely | -0.036 |
song | -0.035 |
Token | his |
Token ID | 465 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
ays | +0.064 |
rob | +0.056 |
ips | +0.055 |
unks | +0.054 |
ocol | +0.054 |
Neg logit contributions | |
friend | -0.034 |
tutor | -0.031 |
kindly | -0.031 |
understanding | -0.031 |
So | -0.030 |
Token | mom |
Token ID | 1995 |
Feature activation | -3.07e-04 |
Pos logit contributions | |
lder | +0.015 |
So | +0.015 |
kindly | +0.014 |
Days | +0.013 |
tutor | +0.013 |
Neg logit contributions | |
ays | -0.037 |
unks | -0.033 |
ips | -0.032 |
ocol | -0.032 |
chairs | -0.031 |
Token | put |
Token ID | 1234 |
Feature activation | +5.89e-02 |
Pos logit contributions | |
lder | +0.000 |
friend | +0.000 |
tutor | +0.000 |
So | +0.000 |
kindly | +0.000 |
Neg logit contributions | |
ays | -0.001 |
ips | -0.001 |
rob | -0.001 |
unks | -0.001 |
ions | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
ays | +0.140 |
plets | +0.134 |
unks | +0.131 |
rob | +0.121 |
spins | +0.120 |
Neg logit contributions | |
friend | -0.072 |
kindly | -0.068 |
little | -0.066 |
forgive | -0.062 |
tutor | -0.062 |
Token | ash |
Token ID | 12530 |
Feature activation | +5.93e-02 |
Pos logit contributions | |
ays | +0.057 |
ips | +0.046 |
rob | +0.045 |
unks | +0.045 |
ions | +0.043 |
Neg logit contributions | |
lder | -0.057 |
friend | -0.056 |
So | -0.056 |
tutor | -0.056 |
kindly | -0.056 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.136 |
ips | +0.115 |
rob | +0.114 |
unks | +0.113 |
ions | +0.111 |
Neg logit contributions | |
lder | -0.079 |
friend | -0.077 |
So | -0.076 |
tutor | -0.076 |
kindly | -0.076 |
Token | ay |
Token ID | 323 |
Feature activation | +4.92e-02 |
Pos logit contributions | |
ays | +0.182 |
rob | +0.181 |
unks | +0.168 |
ocol | +0.162 |
matters | +0.159 |
Neg logit contributions | |
friend | -0.190 |
So | -0.186 |
kindly | -0.181 |
forgive | -0.175 |
keeper | -0.172 |
Token | away |
Token ID | 1497 |
Feature activation | +2.22e-03 |
Pos logit contributions | |
ays | +0.096 |
rob | +0.080 |
unks | +0.079 |
ips | +0.077 |
ocol | +0.076 |
Neg logit contributions | |
friend | -0.084 |
kindly | -0.082 |
forgive | -0.080 |
So | -0.080 |
tutor | -0.079 |
Token | , |
Token ID | 11 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
ays | +0.006 |
ips | +0.005 |
rob | +0.005 |
unks | +0.005 |
ions | +0.005 |
Neg logit contributions | |
lder | -0.002 |
friend | -0.002 |
tutor | -0.002 |
So | -0.002 |
kindly | -0.002 |
Token | but |
Token ID | 475 |
Feature activation | +4.30e-02 |
Pos logit contributions | |
friend | +0.012 |
kindly | +0.012 |
lder | +0.012 |
So | +0.012 |
forgive | +0.012 |
Neg logit contributions | |
ays | -0.032 |
rob | -0.028 |
ips | -0.028 |
unks | -0.028 |
ions | -0.027 |
Token | Little |
Token ID | 7703 |
Feature activation | +1.87e-02 |
Pos logit contributions | |
ays | +0.104 |
rob | +0.093 |
unks | +0.090 |
ips | +0.089 |
plets | +0.085 |
Neg logit contributions | |
kindly | -0.063 |
friend | -0.061 |
understanding | -0.060 |
forgive | -0.059 |
tutor | -0.057 |
Token | , |
Token ID | 11 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
ays | +0.143 |
ips | +0.124 |
unks | +0.124 |
rob | +0.123 |
izz | +0.117 |
Neg logit contributions | |
kindly | -0.068 |
little | -0.062 |
So | -0.060 |
friend | -0.060 |
keeper | -0.057 |
Token | it |
Token ID | 340 |
Feature activation | +4.96e-02 |
Pos logit contributions | |
ays | +0.113 |
unks | +0.097 |
ips | +0.097 |
rob | +0.095 |
ocol | +0.091 |
Neg logit contributions | |
little | -0.058 |
kindly | -0.056 |
friend | -0.056 |
tutor | -0.053 |
understanding | -0.053 |
Token | caused |
Token ID | 4073 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
ays | +0.115 |
ocol | +0.109 |
rob | +0.105 |
ips | +0.104 |
unks | +0.102 |
Neg logit contributions | |
friend | -0.068 |
song | -0.066 |
kindly | -0.066 |
So | -0.065 |
little | -0.063 |
Token | the |
Token ID | 262 |
Feature activation | +5.33e-03 |
Pos logit contributions | |
ays | +0.053 |
rob | +0.045 |
ips | +0.044 |
unks | +0.044 |
plets | +0.042 |
Neg logit contributions | |
friend | -0.034 |
So | -0.033 |
kindly | -0.033 |
understanding | -0.033 |
song | -0.032 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.60e-02 |
Pos logit contributions | |
ays | +0.011 |
ips | +0.010 |
rob | +0.010 |
unks | +0.009 |
plets | +0.009 |
Neg logit contributions | |
lder | -0.008 |
So | -0.008 |
kindly | -0.007 |
friend | -0.007 |
tutor | -0.007 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.110 |
ips | +0.094 |
rob | +0.093 |
unks | +0.092 |
ions | +0.090 |
Neg logit contributions | |
lder | -0.057 |
friend | -0.055 |
tutor | -0.055 |
So | -0.055 |
kindly | -0.055 |
Token | ay |
Token ID | 323 |
Feature activation | +3.09e-02 |
Pos logit contributions | |
rob | +0.177 |
ays | +0.176 |
unks | +0.160 |
ocol | +0.158 |
matters | +0.154 |
Neg logit contributions | |
friend | -0.192 |
So | -0.192 |
kindly | -0.185 |
keeper | -0.178 |
broken | -0.177 |
Token | to |
Token ID | 284 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
ays | +0.073 |
ips | +0.063 |
rob | +0.063 |
unks | +0.063 |
ocol | +0.061 |
Neg logit contributions | |
lder | -0.038 |
friend | -0.038 |
kindly | -0.037 |
So | -0.037 |
tutor | -0.036 |
Token | scatter |
Token ID | 41058 |
Feature activation | +3.80e-02 |
Pos logit contributions | |
ays | +0.022 |
ips | +0.018 |
rob | +0.018 |
unks | +0.018 |
plets | +0.017 |
Neg logit contributions | |
lder | -0.016 |
friend | -0.016 |
forgive | -0.016 |
kindly | -0.016 |
So | -0.016 |
Token | all |
Token ID | 477 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
ays | +0.092 |
rob | +0.086 |
unks | +0.082 |
ips | +0.081 |
plets | +0.078 |
Neg logit contributions | |
kindly | -0.046 |
friend | -0.045 |
So | -0.043 |
forgive | -0.042 |
keeper | -0.042 |
Token | over |
Token ID | 625 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
ays | +0.072 |
unks | +0.064 |
ocol | +0.062 |
rob | +0.062 |
plets | +0.061 |
Neg logit contributions | |
friend | -0.049 |
keeper | -0.047 |
forgive | -0.046 |
So | -0.046 |
song | -0.046 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
ays | +0.071 |
rob | +0.059 |
unks | +0.059 |
ips | +0.059 |
ions | +0.058 |
Neg logit contributions | |
lder | -0.044 |
So | -0.044 |
kindly | -0.043 |
forgive | -0.043 |
understanding | -0.043 |
Token | ay |
Token ID | 323 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
rob | +0.171 |
ays | +0.167 |
matters | +0.158 |
unks | +0.158 |
ocol | +0.157 |
Neg logit contributions | |
friend | -0.182 |
So | -0.171 |
kindly | -0.169 |
keeper | -0.166 |
tutor | -0.166 |
Token | . |
Token ID | 13 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
ays | +0.052 |
ips | +0.045 |
rob | +0.045 |
unks | +0.044 |
plets | +0.043 |
Neg logit contributions | |
lder | -0.024 |
friend | -0.024 |
kindly | -0.024 |
tutor | -0.024 |
So | -0.024 |
Token | The |
Token ID | 383 |
Feature activation | +7.01e-03 |
Pos logit contributions | |
ays | +0.059 |
rob | +0.050 |
ips | +0.049 |
unks | +0.047 |
plets | +0.044 |
Neg logit contributions | |
lder | -0.058 |
So | -0.058 |
kindly | -0.057 |
tutor | -0.057 |
friend | -0.057 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.79e-02 |
Pos logit contributions | |
ays | +0.012 |
unks | +0.010 |
rob | +0.010 |
ips | +0.009 |
ocol | +0.009 |
Neg logit contributions | |
So | -0.013 |
lder | -0.013 |
tutor | -0.013 |
kindly | -0.013 |
hospitality | -0.012 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.113 |
ips | +0.097 |
rob | +0.096 |
unks | +0.095 |
ions | +0.093 |
Neg logit contributions | |
lder | -0.060 |
friend | -0.060 |
So | -0.058 |
kindly | -0.058 |
tutor | -0.058 |
Token | ay |
Token ID | 323 |
Feature activation | +3.99e-02 |
Pos logit contributions | |
rob | +0.189 |
ays | +0.178 |
unks | +0.176 |
matters | +0.168 |
ocol | +0.168 |
Neg logit contributions | |
friend | -0.175 |
So | -0.166 |
kindly | -0.164 |
keeper | -0.163 |
keeper | -0.159 |
Token | lived |
Token ID | 5615 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
ays | +0.091 |
ips | +0.079 |
rob | +0.076 |
unks | +0.076 |
ocol | +0.074 |
Neg logit contributions | |
lder | -0.055 |
friend | -0.054 |
kindly | -0.052 |
So | -0.051 |
tutor | -0.050 |
Token | in |
Token ID | 287 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
ays | +0.009 |
ips | +0.008 |
unks | +0.007 |
ions | +0.007 |
rob | +0.007 |
Neg logit contributions | |
lder | -0.008 |
tutor | -0.008 |
So | -0.008 |
hospitality | -0.008 |
recommendation | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | -3.08e-03 |
Pos logit contributions | |
ays | +0.059 |
rob | +0.052 |
ips | +0.050 |
plets | +0.049 |
unks | +0.049 |
Neg logit contributions | |
friend | -0.030 |
little | -0.029 |
tutor | -0.029 |
understanding | -0.028 |
lder | -0.028 |
Token | house |
Token ID | 2156 |
Feature activation | +4.97e-03 |
Pos logit contributions | |
lder | +0.004 |
So | +0.004 |
forgive | +0.004 |
kindly | +0.004 |
hospitality | +0.004 |
Neg logit contributions | |
ays | -0.007 |
ips | -0.006 |
unks | -0.006 |
rob | -0.005 |
plets | -0.005 |
Token | putting |
Token ID | 5137 |
Feature activation | +5.31e-02 |
Pos logit contributions | |
ays | +0.005 |
ips | +0.004 |
rob | +0.004 |
unks | +0.004 |
ocol | +0.004 |
Neg logit contributions | |
lder | -0.003 |
friend | -0.003 |
kindly | -0.003 |
understanding | -0.003 |
tutor | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | +4.19e-02 |
Pos logit contributions | |
ays | +0.120 |
rob | +0.115 |
unks | +0.109 |
plets | +0.102 |
ips | +0.101 |
Neg logit contributions | |
little | -0.073 |
friend | -0.071 |
kindly | -0.071 |
understanding | -0.070 |
forgive | -0.067 |
Token | in |
Token ID | 287 |
Feature activation | -5.48e-04 |
Pos logit contributions | |
ays | +0.076 |
ips | +0.061 |
rob | +0.061 |
unks | +0.060 |
ions | +0.057 |
Neg logit contributions | |
lder | -0.076 |
friend | -0.076 |
kindly | -0.075 |
So | -0.075 |
tutor | -0.075 |
Token | the |
Token ID | 262 |
Feature activation | +2.45e-02 |
Pos logit contributions | |
friend | +0.001 |
kindly | +0.001 |
So | +0.001 |
lder | +0.001 |
forgive | +0.001 |
Neg logit contributions | |
ays | -0.001 |
rob | -0.001 |
ips | -0.001 |
unks | -0.001 |
plets | -0.001 |
Token | ash |
Token ID | 12530 |
Feature activation | +2.77e-02 |
Pos logit contributions | |
ays | +0.048 |
ips | +0.039 |
rob | +0.039 |
unks | +0.038 |
ions | +0.037 |
Neg logit contributions | |
lder | -0.041 |
So | -0.040 |
friend | -0.040 |
kindly | -0.040 |
tutor | -0.040 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.062 |
ips | +0.052 |
rob | +0.052 |
unks | +0.051 |
ions | +0.050 |
Neg logit contributions | |
lder | -0.039 |
kindly | -0.038 |
So | -0.038 |
friend | -0.037 |
forgive | -0.037 |
Token | ay |
Token ID | 323 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
rob | +0.153 |
ays | +0.149 |
unks | +0.145 |
ocol | +0.141 |
plets | +0.140 |
Neg logit contributions | |
So | -0.200 |
friend | -0.198 |
kindly | -0.190 |
forgive | -0.189 |
tutor | -0.186 |
Token | . |
Token ID | 13 |
Feature activation | +9.68e-03 |
Pos logit contributions | |
ays | +0.052 |
ips | +0.045 |
rob | +0.045 |
unks | +0.045 |
plets | +0.044 |
Neg logit contributions | |
friend | -0.018 |
lder | -0.018 |
tutor | -0.017 |
So | -0.017 |
kindly | -0.017 |
Token | Lily |
Token ID | 20037 |
Feature activation | -7.55e-03 |
Pos logit contributions | |
ays | +0.022 |
ips | +0.018 |
rob | +0.018 |
unks | +0.018 |
ions | +0.018 |
Neg logit contributions | |
lder | -0.013 |
friend | -0.013 |
So | -0.013 |
tutor | -0.013 |
kindly | -0.013 |
Token | didn |
Token ID | 1422 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
hospitality | +0.015 |
tutor | +0.014 |
recommendation | +0.014 |
birthday | +0.013 |
deed | +0.013 |
Neg logit contributions | |
ays | -0.012 |
unks | -0.010 |
spins | -0.010 |
lands | -0.009 |
izz | -0.009 |
Token | 't |
Token ID | 470 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
So | +0.021 |
tutor | +0.021 |
lder | +0.020 |
forgive | +0.020 |
kindly | +0.020 |
Neg logit contributions | |
ays | -0.045 |
rob | -0.041 |
ocol | -0.039 |
ips | -0.039 |
unks | -0.038 |
Token | Look |
Token ID | 8567 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
lder | +0.005 |
friend | +0.005 |
So | +0.005 |
tutor | +0.005 |
kindly | +0.005 |
Neg logit contributions | |
ays | -0.008 |
ips | -0.007 |
rob | -0.007 |
unks | -0.007 |
ions | -0.007 |
Token | at |
Token ID | 379 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
ays | +0.025 |
rob | +0.022 |
ips | +0.022 |
unks | +0.021 |
plets | +0.021 |
Neg logit contributions | |
friend | -0.012 |
lder | -0.012 |
kindly | -0.012 |
tutor | -0.011 |
So | -0.011 |
Token | this |
Token ID | 428 |
Feature activation | +4.76e-03 |
Pos logit contributions | |
ays | +0.030 |
ips | +0.026 |
rob | +0.026 |
unks | +0.025 |
plets | +0.025 |
Neg logit contributions | |
friend | -0.019 |
lder | -0.018 |
tutor | -0.018 |
kindly | -0.018 |
forgive | -0.018 |
Token | cool |
Token ID | 3608 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
ays | +0.011 |
ips | +0.009 |
rob | +0.009 |
unks | +0.009 |
ions | +0.009 |
Neg logit contributions | |
friend | -0.006 |
lder | -0.006 |
tutor | -0.006 |
kindly | -0.006 |
So | -0.006 |
Token | ash |
Token ID | 12530 |
Feature activation | +4.73e-02 |
Pos logit contributions | |
ays | +0.050 |
ips | +0.044 |
rob | +0.043 |
unks | +0.043 |
plets | +0.041 |
Neg logit contributions | |
friend | -0.031 |
lder | -0.030 |
tutor | -0.029 |
song | -0.029 |
kindly | -0.028 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.119 |
ips | +0.105 |
rob | +0.104 |
unks | +0.103 |
ocol | +0.102 |
Neg logit contributions | |
friend | -0.053 |
lder | -0.052 |
tutor | -0.050 |
song | -0.049 |
kindly | -0.048 |
Token | ay |
Token ID | 323 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
rob | +0.183 |
ays | +0.180 |
ocol | +0.176 |
unks | +0.173 |
matters | +0.172 |
Neg logit contributions | |
friend | -0.173 |
So | -0.164 |
kindly | -0.161 |
lder | -0.158 |
keeper | -0.157 |
Token | ," |
Token ID | 553 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
ays | +0.062 |
unks | +0.054 |
ips | +0.054 |
rob | +0.053 |
ocol | +0.053 |
Neg logit contributions | |
lder | -0.032 |
friend | -0.032 |
kindly | -0.031 |
tutor | -0.030 |
So | -0.030 |
Token | he |
Token ID | 339 |
Feature activation | -2.05e-02 |
Pos logit contributions | |
friend | +0.023 |
kindly | +0.023 |
So | +0.022 |
tutor | +0.022 |
forgive | +0.022 |
Neg logit contributions | |
ays | -0.035 |
ips | -0.030 |
unks | -0.030 |
rob | -0.029 |
plets | -0.029 |
Token | said |
Token ID | 531 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
friend | +0.026 |
kindly | +0.026 |
So | +0.025 |
lder | +0.025 |
tutor | +0.024 |
Neg logit contributions | |
ays | -0.050 |
ips | -0.043 |
rob | -0.043 |
unks | -0.043 |
ocol | -0.042 |
Token | . |
Token ID | 13 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
lder | +0.041 |
So | +0.039 |
tutor | +0.038 |
Days | +0.038 |
friend | +0.037 |
Neg logit contributions | |
ays | -0.078 |
ips | -0.067 |
ions | -0.064 |
unks | -0.063 |
plets | -0.063 |
Token | she |
Token ID | 673 |
Feature activation | -5.16e-03 |
Pos logit contributions | |
ays | +0.001 |
ips | +0.001 |
rob | +0.001 |
unks | +0.001 |
plets | +0.001 |
Neg logit contributions | |
friend | -0.001 |
lder | -0.001 |
kindly | -0.001 |
tutor | -0.001 |
forgive | -0.001 |
Token | could |
Token ID | 714 |
Feature activation | -4.07e-02 |
Pos logit contributions | |
lder | +0.009 |
tutor | +0.009 |
So | +0.009 |
song | +0.009 |
friend | +0.009 |
Neg logit contributions | |
ays | -0.009 |
ips | -0.007 |
rob | -0.007 |
unks | -0.007 |
ions | -0.007 |
Token | have |
Token ID | 423 |
Feature activation | +4.31e-02 |
Pos logit contributions | |
lder | +0.047 |
friend | +0.047 |
So | +0.046 |
kindly | +0.046 |
tutor | +0.046 |
Neg logit contributions | |
ays | -0.100 |
ips | -0.086 |
rob | -0.086 |
unks | -0.085 |
ions | -0.083 |
Token | the |
Token ID | 262 |
Feature activation | +1.58e-02 |
Pos logit contributions | |
ays | +0.101 |
unks | +0.088 |
plets | +0.086 |
ips | +0.084 |
rob | +0.082 |
Neg logit contributions | |
friend | -0.061 |
understanding | -0.057 |
tutor | -0.057 |
forgive | -0.056 |
little | -0.055 |
Token | ash |
Token ID | 12530 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
ays | +0.033 |
ips | +0.028 |
rob | +0.028 |
unks | +0.027 |
ions | +0.027 |
Neg logit contributions | |
lder | -0.024 |
So | -0.023 |
friend | -0.023 |
kindly | -0.023 |
tutor | -0.023 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.083 |
ips | +0.070 |
rob | +0.070 |
unks | +0.069 |
ions | +0.068 |
Neg logit contributions | |
lder | -0.044 |
So | -0.043 |
kindly | -0.042 |
tutor | -0.042 |
friend | -0.042 |
Token | ay |
Token ID | 323 |
Feature activation | +3.04e-02 |
Pos logit contributions | |
ays | +0.165 |
rob | +0.156 |
unks | +0.151 |
ocol | +0.146 |
plets | +0.145 |
Neg logit contributions | |
friend | -0.208 |
So | -0.197 |
kindly | -0.195 |
tutor | -0.194 |
forgive | -0.194 |
Token | to |
Token ID | 284 |
Feature activation | -2.25e-03 |
Pos logit contributions | |
ays | +0.076 |
ips | +0.066 |
unks | +0.066 |
rob | +0.066 |
plets | +0.065 |
Neg logit contributions | |
friend | -0.034 |
kindly | -0.033 |
tutor | -0.033 |
lder | -0.033 |
forgive | -0.033 |
Token | put |
Token ID | 1234 |
Feature activation | +6.14e-02 |
Pos logit contributions | |
lder | +0.003 |
So | +0.003 |
friend | +0.003 |
kindly | +0.003 |
tutor | +0.003 |
Neg logit contributions | |
ays | -0.005 |
ips | -0.004 |
unks | -0.004 |
ions | -0.004 |
rob | -0.004 |
Token | her |
Token ID | 607 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
ays | +0.134 |
rob | +0.123 |
unks | +0.122 |
plets | +0.121 |
ips | +0.114 |
Neg logit contributions | |
kindly | -0.085 |
friend | -0.082 |
forgive | -0.079 |
little | -0.078 |
lady | -0.077 |
Token | rocks |
Token ID | 12586 |
Feature activation | +5.38e-02 |
Pos logit contributions | |
ays | +0.037 |
ips | +0.032 |
rob | +0.031 |
unks | +0.031 |
ions | +0.030 |
Neg logit contributions | |
friend | -0.022 |
lder | -0.022 |
kindly | -0.021 |
tutor | -0.021 |
So | -0.021 |
Token | room |
Token ID | 2119 |
Feature activation | -5.26e-03 |
Pos logit contributions | |
ays | +0.108 |
plets | +0.099 |
rob | +0.099 |
ocol | +0.096 |
unks | +0.095 |
Neg logit contributions | |
friend | -0.045 |
lder | -0.040 |
tutor | -0.040 |
kindly | -0.039 |
recommendation | -0.038 |
Token | and |
Token ID | 290 |
Feature activation | +2.33e-02 |
Pos logit contributions | |
lder | +0.006 |
So | +0.006 |
tutor | +0.006 |
forgive | +0.006 |
kindly | +0.006 |
Neg logit contributions | |
ays | -0.012 |
ips | -0.011 |
unks | -0.010 |
ions | -0.010 |
rob | -0.010 |
Token | spotted |
Token ID | 13489 |
Feature activation | +2.13e-02 |
Pos logit contributions | |
ays | +0.062 |
ips | +0.055 |
rob | +0.054 |
ocol | +0.053 |
unks | +0.052 |
Neg logit contributions | |
friend | -0.027 |
kindly | -0.025 |
little | -0.025 |
lder | -0.025 |
understanding | -0.024 |
Token | an |
Token ID | 281 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
ays | +0.053 |
ips | +0.048 |
plets | +0.045 |
unks | +0.045 |
rob | +0.045 |
Neg logit contributions | |
friend | -0.027 |
little | -0.026 |
kindly | -0.025 |
tutor | -0.024 |
forgive | -0.024 |
Token | ash |
Token ID | 12530 |
Feature activation | +3.31e-02 |
Pos logit contributions | |
ays | +0.022 |
ips | +0.018 |
rob | +0.018 |
unks | +0.018 |
ions | +0.017 |
Neg logit contributions | |
lder | -0.015 |
friend | -0.015 |
tutor | -0.015 |
kindly | -0.015 |
So | -0.015 |
Token | tr |
Token ID | 2213 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ays | +0.077 |
ips | +0.066 |
rob | +0.066 |
unks | +0.065 |
ions | +0.063 |
Neg logit contributions | |
lder | -0.042 |
friend | -0.042 |
tutor | -0.041 |
So | -0.041 |
kindly | -0.041 |
Token | ay |
Token ID | 323 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ays | +0.172 |
rob | +0.168 |
ocol | +0.165 |
unks | +0.163 |
matters | +0.162 |
Neg logit contributions | |
friend | -0.180 |
So | -0.175 |
tutor | -0.170 |
kindly | -0.170 |
keeper | -0.166 |
Token | . |
Token ID | 13 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
ays | +0.031 |
ips | +0.026 |
rob | +0.025 |
unks | +0.025 |
ocol | +0.024 |
Neg logit contributions | |
lder | -0.028 |
friend | -0.028 |
tutor | -0.028 |
kindly | -0.028 |
So | -0.027 |
Token | It |
Token ID | 632 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
ays | +0.058 |
rob | +0.052 |
ips | +0.051 |
unks | +0.048 |
ocol | +0.048 |
Neg logit contributions | |
So | -0.027 |
kindly | -0.025 |
friend | -0.025 |
little | -0.025 |
lder | -0.024 |
Token | had |
Token ID | 550 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
ays | +0.082 |
ips | +0.074 |
ocol | +0.071 |
rob | +0.068 |
unks | +0.068 |
Neg logit contributions | |
So | -0.029 |
kindly | -0.029 |
friend | -0.029 |
keeper | -0.028 |
lder | -0.028 |
Token | lots |
Token ID | 6041 |
Feature activation | +2.13e-02 |
Pos logit contributions | |
ays | +0.093 |
rob | +0.080 |
ips | +0.080 |
unks | +0.078 |
ocol | +0.076 |
Neg logit contributions | |
friend | -0.056 |
So | -0.054 |
lder | -0.054 |
song | -0.054 |
little | -0.053 |
Token | bad |
Token ID | 2089 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
ays | +0.095 |
rob | +0.090 |
ips | +0.083 |
unks | +0.082 |
plets | +0.080 |
Neg logit contributions | |
friend | -0.035 |
kindly | -0.034 |
forgive | -0.032 |
little | -0.032 |
understanding | -0.031 |
Token | ." |
Token ID | 526 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
lder | +0.031 |
friend | +0.030 |
So | +0.030 |
kindly | +0.030 |
tutor | +0.030 |
Neg logit contributions | |
ays | -0.060 |
ips | -0.051 |
rob | -0.051 |
unks | -0.050 |
ions | -0.049 |
Token |
|
Token ID | 198 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
lder | +0.024 |
friend | +0.023 |
tutor | +0.023 |
song | +0.022 |
kindly | +0.022 |
Neg logit contributions | |
ays | -0.045 |
ips | -0.039 |
unks | -0.038 |
rob | -0.038 |
ions | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
lder | +0.023 |
friend | +0.022 |
tutor | +0.022 |
kindly | +0.022 |
So | +0.022 |
Neg logit contributions | |
ays | -0.047 |
ips | -0.041 |
unks | -0.040 |
rob | -0.040 |
ions | -0.039 |
Token | Ben |
Token ID | 11696 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
hospitality | +0.024 |
lder | +0.023 |
tutor | +0.023 |
friend | +0.023 |
tune | +0.023 |
Neg logit contributions | |
ays | -0.052 |
ips | -0.046 |
unks | -0.045 |
ions | -0.043 |
rob | -0.043 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.47e-02 |
Pos logit contributions | |
lder | +0.020 |
friend | +0.020 |
So | +0.020 |
tutor | +0.020 |
kindly | +0.020 |
Neg logit contributions | |
ays | -0.022 |
ips | -0.018 |
rob | -0.018 |
unks | -0.017 |
ions | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
lder | +0.188 |
Mic | +0.167 |
tutor | +0.161 |
Days | +0.159 |
doorstep | +0.157 |
Neg logit contributions | |
ays | -0.107 |
ips | -0.094 |
lands | -0.087 |
ions | -0.086 |
gs | -0.085 |
Token | He |
Token ID | 679 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
lder | +0.017 |
friend | +0.017 |
So | +0.016 |
tutor | +0.016 |
hospitality | +0.016 |
Neg logit contributions | |
ays | -0.022 |
ips | -0.018 |
unks | -0.017 |
ions | -0.017 |
rob | -0.017 |
Token | tries |
Token ID | 8404 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
friend | +0.020 |
kindly | +0.020 |
So | +0.020 |
lder | +0.020 |
forgive | +0.020 |
Neg logit contributions | |
ays | -0.021 |
ips | -0.018 |
rob | -0.018 |
unks | -0.017 |
ions | -0.017 |
Token | to |
Token ID | 284 |
Feature activation | -5.30e-02 |
Pos logit contributions | |
lder | +0.047 |
So | +0.040 |
tutor | +0.040 |
kindly | +0.039 |
hospitality | +0.039 |
Neg logit contributions | |
ays | -0.099 |
ips | -0.087 |
unks | -0.083 |
ions | -0.082 |
rob | -0.081 |
Token | flip |
Token ID | 14283 |
Feature activation | +3.32e-02 |
Pos logit contributions | |
lder | +0.090 |
tutor | +0.081 |
kindly | +0.077 |
hospitality | +0.076 |
So | +0.075 |
Neg logit contributions | |
ays | -0.094 |
izz | -0.086 |
ips | -0.083 |
ions | -0.082 |
unks | -0.081 |
Token | there |
Token ID | 612 |
Feature activation | -5.27e-03 |
Pos logit contributions | |
ays | +0.055 |
rob | +0.048 |
ips | +0.048 |
unks | +0.047 |
plets | +0.047 |
Neg logit contributions | |
friend | -0.029 |
tutor | -0.027 |
kindly | -0.027 |
lder | -0.027 |
So | -0.027 |
Token | were |
Token ID | 547 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
friend | +0.007 |
forgive | +0.006 |
lder | +0.006 |
So | +0.006 |
kindly | +0.006 |
Neg logit contributions | |
ays | -0.013 |
ips | -0.011 |
rob | -0.011 |
unks | -0.011 |
plets | -0.011 |
Token | two |
Token ID | 734 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
ays | +0.051 |
rob | +0.044 |
ips | +0.043 |
unks | +0.043 |
plets | +0.042 |
Neg logit contributions | |
friend | -0.038 |
So | -0.037 |
lder | -0.037 |
tutor | -0.036 |
kindly | -0.036 |
Token | friends |
Token ID | 2460 |
Feature activation | -4.35e-02 |
Pos logit contributions | |
lder | +0.045 |
recommendation | +0.040 |
tune | +0.040 |
tutor | +0.040 |
forgive | +0.040 |
Neg logit contributions | |
ays | -0.057 |
unks | -0.048 |
ips | -0.047 |
ocol | -0.046 |
chairs | -0.046 |
Token | named |
Token ID | 3706 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
lder | +0.074 |
Okay | +0.069 |
tutor | +0.064 |
song | +0.064 |
hospitality | +0.063 |
Neg logit contributions | |
ays | -0.086 |
ions | -0.074 |
unks | -0.073 |
ips | -0.070 |
izz | -0.066 |
Token | Happy |
Token ID | 14628 |
Feature activation | -8.47e-02 |
Pos logit contributions | |
ays | +0.059 |
rob | +0.051 |
ips | +0.051 |
plets | +0.050 |
unks | +0.050 |
Neg logit contributions | |
friend | -0.036 |
tutor | -0.035 |
lder | -0.034 |
So | -0.034 |
kindly | -0.033 |
Token | and |
Token ID | 290 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
Days | +0.153 |
Years | +0.144 |
Mic | +0.142 |
Okay | +0.141 |
vet | +0.134 |
Neg logit contributions | |
ays | -0.127 |
ions | -0.097 |
ink | -0.095 |
dressed | -0.092 |
matters | -0.092 |
Token | Gr |
Token ID | 1902 |
Feature activation | +9.14e-03 |
Pos logit contributions | |
lder | +0.017 |
friend | +0.017 |
tutor | +0.017 |
kindly | +0.017 |
So | +0.017 |
Neg logit contributions | |
ays | -0.023 |
ips | -0.019 |
rob | -0.019 |
unks | -0.019 |
ions | -0.018 |
Token | umpy |
Token ID | 32152 |
Feature activation | -3.83e-02 |
Pos logit contributions | |
ays | +0.017 |
ips | +0.014 |
unks | +0.014 |
izz | +0.013 |
rob | +0.013 |
Neg logit contributions | |
tutor | -0.016 |
lder | -0.016 |
friend | -0.016 |
kindly | -0.016 |
song | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
Days | +0.059 |
So | +0.057 |
Years | +0.053 |
lder | +0.053 |
forgive | +0.052 |
Neg logit contributions | |
ays | -0.080 |
rob | -0.069 |
ions | -0.064 |
chairs | -0.063 |
ips | -0.063 |
Token | They |
Token ID | 1119 |
Feature activation | -2.07e-02 |
Pos logit contributions | |
ays | +0.044 |
ips | +0.038 |
unks | +0.038 |
rob | +0.037 |
ocol | +0.037 |
Neg logit contributions | |
So | -0.026 |
friend | -0.026 |
lder | -0.025 |
kindly | -0.025 |
tutor | -0.025 |
Token | |
Token ID | 220 |
Feature activation | +8.08e-03 |
Pos logit contributions | |
tutor | +0.026 |
Days | +0.025 |
lder | +0.025 |
kindly | +0.025 |
understanding | +0.025 |
Neg logit contributions | |
ays | -0.033 |
rob | -0.027 |
ips | -0.027 |
unks | -0.027 |
ions | -0.026 |
Token |
|
Token ID | 198 |
Feature activation | -3.36e-02 |
Pos logit contributions | |
ays | +0.022 |
rob | +0.019 |
ips | +0.019 |
unks | +0.019 |
ocol | +0.019 |
Neg logit contributions | |
So | -0.008 |
friend | -0.008 |
forgive | -0.007 |
kindly | -0.007 |
lder | -0.007 |
Token | The |
Token ID | 464 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
tutor | +0.057 |
lder | +0.055 |
hospitality | +0.055 |
understanding | +0.053 |
kindly | +0.053 |
Neg logit contributions | |
ays | -0.061 |
rob | -0.054 |
unks | -0.052 |
izz | -0.050 |
ips | -0.050 |
Token | horse |
Token ID | 8223 |
Feature activation | -5.52e-03 |
Pos logit contributions | |
forgive | +0.016 |
broken | +0.015 |
kindly | +0.015 |
So | +0.015 |
understanding | +0.015 |
Neg logit contributions | |
ays | -0.022 |
rob | -0.020 |
ips | -0.018 |
ch | -0.018 |
patches | -0.018 |
Token | said |
Token ID | 531 |
Feature activation | -2.82e-02 |
Pos logit contributions | |
tutor | +0.008 |
lder | +0.007 |
recommendation | +0.007 |
understanding | +0.007 |
Days | +0.007 |
Neg logit contributions | |
ays | -0.012 |
rob | -0.010 |
ips | -0.010 |
unks | -0.010 |
ions | -0.009 |
Token | yes |
Token ID | 3763 |
Feature activation | -8.44e-02 |
Pos logit contributions | |
tutor | +0.044 |
So | +0.044 |
lder | +0.043 |
Days | +0.042 |
Years | +0.042 |
Neg logit contributions | |
ays | -0.053 |
ips | -0.045 |
ions | -0.044 |
spins | -0.043 |
plets | -0.042 |
Token | and |
Token ID | 290 |
Feature activation | -1.07e-03 |
Pos logit contributions | |
Really | +0.174 |
tutor | +0.171 |
hospitality | +0.168 |
forgive | +0.166 |
Mic | +0.165 |
Neg logit contributions | |
ays | -0.077 |
gs | -0.076 |
lands | -0.068 |
ch | -0.064 |
az | -0.061 |
Token | the |
Token ID | 262 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
friend | +0.002 |
kindly | +0.001 |
little | +0.001 |
keeper | +0.001 |
So | +0.001 |
Neg logit contributions | |
ays | -0.003 |
ocol | -0.002 |
unks | -0.002 |
ips | -0.002 |
rob | -0.002 |
Token | two |
Token ID | 734 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
lder | +0.020 |
forgive | +0.020 |
So | +0.019 |
kindly | +0.019 |
broken | +0.019 |
Neg logit contributions | |
ays | -0.036 |
rob | -0.032 |
ips | -0.031 |
unks | -0.030 |
plets | -0.029 |
Token | animals |
Token ID | 4695 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
lder | +0.019 |
tutor | +0.018 |
forgive | +0.018 |
tune | +0.018 |
kindly | +0.017 |
Neg logit contributions | |
ays | -0.022 |
ips | -0.019 |
rob | -0.018 |
ions | -0.018 |
unks | -0.018 |
Token | ran |
Token ID | 4966 |
Feature activation | -6.52e-03 |
Pos logit contributions | |
lder | +0.025 |
tutor | +0.025 |
So | +0.025 |
kindly | +0.024 |
recommendation | +0.024 |
Neg logit contributions | |
ays | -0.033 |
ips | -0.027 |
ions | -0.027 |
rob | -0.026 |
unks | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
lder | +0.037 |
So | +0.035 |
tutor | +0.034 |
forgive | +0.034 |
kindly | +0.033 |
Neg logit contributions | |
ays | -0.060 |
ips | -0.051 |
unks | -0.050 |
ions | -0.050 |
rob | -0.049 |
Token | but |
Token ID | 475 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
lder | +0.059 |
tutor | +0.056 |
friend | +0.055 |
forgive | +0.055 |
So | +0.052 |
Neg logit contributions | |
ays | -0.103 |
rob | -0.091 |
plets | -0.088 |
unks | -0.088 |
ips | -0.088 |
Token | Benny |
Token ID | 44275 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ays | +0.031 |
rob | +0.026 |
ips | +0.025 |
unks | +0.024 |
ions | +0.024 |
Neg logit contributions | |
lder | -0.027 |
tutor | -0.025 |
recommendation | -0.025 |
song | -0.024 |
So | -0.024 |
Token | was |
Token ID | 373 |
Feature activation | +5.04e-03 |
Pos logit contributions | |
tutor | +0.032 |
birthday | +0.031 |
hospitality | +0.030 |
recommendation | +0.030 |
song | +0.029 |
Neg logit contributions | |
ays | -0.032 |
rob | -0.028 |
unks | -0.028 |
lands | -0.027 |
involved | -0.027 |
Token | very |
Token ID | 845 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
ays | +0.012 |
ips | +0.011 |
unks | +0.010 |
rob | +0.010 |
ions | +0.010 |
Neg logit contributions | |
lder | -0.006 |
tutor | -0.006 |
So | -0.006 |
friend | -0.005 |
kindly | -0.005 |
Token | persuasive |
Token ID | 40116 |
Feature activation | -8.37e-02 |
Pos logit contributions | |
ays | +0.033 |
ips | +0.030 |
unks | +0.029 |
izz | +0.028 |
rob | +0.028 |
Neg logit contributions | |
tutor | -0.015 |
lder | -0.015 |
So | -0.015 |
tune | -0.014 |
hospitality | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -3.55e-03 |
Pos logit contributions | |
lder | +0.165 |
Days | +0.154 |
broken | +0.153 |
Years | +0.148 |
Mic | +0.147 |
Neg logit contributions | |
ays | -0.120 |
ips | -0.100 |
ions | -0.099 |
patches | -0.099 |
matters | -0.093 |
Token | He |
Token ID | 679 |
Feature activation | -9.53e-03 |
Pos logit contributions | |
lder | +0.006 |
forgive | +0.006 |
song | +0.005 |
hospitality | +0.005 |
tune | +0.005 |
Neg logit contributions | |
ays | -0.007 |
ips | -0.006 |
unks | -0.006 |
chairs | -0.005 |
rob | -0.005 |
Token | said |
Token ID | 531 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
tutor | +0.015 |
tune | +0.014 |
recommendation | +0.014 |
birthday | +0.014 |
lder | +0.014 |
Neg logit contributions | |
ays | -0.017 |
unks | -0.015 |
rob | -0.015 |
ips | -0.014 |
lands | -0.014 |
Token | that |
Token ID | 326 |
Feature activation | +9.19e-03 |
Pos logit contributions | |
So | +0.024 |
lder | +0.024 |
tune | +0.024 |
tutor | +0.023 |
doorstep | +0.023 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.032 |
ions | -0.031 |
ocol | -0.031 |
rob | -0.031 |
Token | new |
Token ID | 649 |
Feature activation | -9.46e-03 |
Pos logit contributions | |
ays | +0.025 |
ips | +0.021 |
plets | +0.021 |
unks | +0.021 |
ocol | +0.020 |
Neg logit contributions | |
friend | -0.012 |
kindly | -0.012 |
forgive | -0.012 |
tutor | -0.011 |
understanding | -0.011 |
Token | party |
Token ID | 2151 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
lder | +0.009 |
understanding | +0.009 |
So | +0.008 |
kindly | +0.008 |
tutor | +0.008 |
Neg logit contributions | |
ays | -0.025 |
ips | -0.022 |
rob | -0.022 |
ions | -0.021 |
unks | -0.021 |
Token | ." |
Token ID | 526 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
lder | +0.031 |
So | +0.030 |
kindly | +0.030 |
tutor | +0.030 |
friend | +0.029 |
Neg logit contributions | |
ays | -0.053 |
ips | -0.045 |
rob | -0.045 |
unks | -0.044 |
ions | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
lder | +0.026 |
tune | +0.025 |
song | +0.025 |
tutor | +0.024 |
friend | +0.024 |
Neg logit contributions | |
ays | -0.039 |
ips | -0.033 |
unks | -0.032 |
rob | -0.032 |
ions | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
lder | +0.034 |
tutor | +0.033 |
tune | +0.032 |
kindly | +0.032 |
friend | +0.031 |
Neg logit contributions | |
ays | -0.052 |
ips | -0.044 |
rob | -0.043 |
unks | -0.043 |
ions | -0.041 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
lder | +0.042 |
tutor | +0.041 |
hospitality | +0.041 |
tune | +0.039 |
recommendation | +0.039 |
Neg logit contributions | |
ays | -0.052 |
ips | -0.047 |
rob | -0.047 |
unks | -0.043 |
ions | -0.042 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.28e-02 |
Pos logit contributions | |
birthday | +0.027 |
tutor | +0.027 |
lder | +0.026 |
recommendation | +0.026 |
hospitality | +0.026 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.031 |
rob | -0.031 |
spins | -0.030 |
unks | -0.029 |
Token | . |
Token ID | 13 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
lder | +0.200 |
Mic | +0.191 |
Days | +0.184 |
urious | +0.177 |
tutor | +0.174 |
Neg logit contributions | |
it | -0.075 |
ays | -0.074 |
on | -0.070 |
onto | -0.064 |
patches | -0.063 |
Token | They |
Token ID | 1119 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
lder | +0.027 |
tune | +0.025 |
tutor | +0.024 |
song | +0.024 |
So | +0.024 |
Neg logit contributions | |
ays | -0.030 |
ips | -0.025 |
ions | -0.023 |
unks | -0.023 |
rob | -0.022 |
Token | took |
Token ID | 1718 |
Feature activation | +3.41e-02 |
Pos logit contributions | |
lder | +0.045 |
tutor | +0.044 |
tune | +0.043 |
recommendation | +0.042 |
song | +0.042 |
Neg logit contributions | |
ays | -0.051 |
ips | -0.044 |
rob | -0.044 |
ions | -0.042 |
izz | -0.042 |
Token | the |
Token ID | 262 |
Feature activation | +5.75e-03 |
Pos logit contributions | |
ays | +0.078 |
unks | +0.076 |
plets | +0.073 |
rob | +0.071 |
ocol | +0.069 |
Neg logit contributions | |
friend | -0.048 |
little | -0.043 |
tutor | -0.042 |
song | -0.041 |
kindly | -0.040 |
Token | blanket |
Token ID | 18447 |
Feature activation | +3.84e-03 |
Pos logit contributions | |
ays | +0.011 |
ips | +0.009 |
rob | +0.009 |
unks | +0.009 |
ions | +0.009 |
Neg logit contributions | |
friend | -0.010 |
lder | -0.009 |
tutor | -0.009 |
kindly | -0.009 |
So | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
ays | +0.012 |
rob | +0.011 |
ips | +0.010 |
unks | +0.010 |
plets | +0.010 |
Neg logit contributions | |
friend | -0.005 |
kindly | -0.005 |
lder | -0.005 |
tutor | -0.005 |
forgive | -0.005 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
ays | +0.040 |
rob | +0.034 |
unks | +0.034 |
ips | +0.034 |
ocol | +0.033 |
Neg logit contributions | |
friend | -0.022 |
tutor | -0.021 |
kindly | -0.021 |
forgive | -0.021 |
So | -0.021 |
Token | 's |
Token ID | 338 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
hospitality | +0.038 |
tutor | +0.037 |
lder | +0.037 |
recommendation | +0.037 |
forgive | +0.036 |
Neg logit contributions | |
ays | -0.039 |
unks | -0.032 |
ips | -0.031 |
rob | -0.031 |
chairs | -0.030 |
Token | friends |
Token ID | 2460 |
Feature activation | -3.14e-02 |
Pos logit contributions | |
lder | +0.024 |
So | +0.024 |
kindly | +0.021 |
tune | +0.021 |
understanding | +0.020 |
Neg logit contributions | |
ays | -0.051 |
ips | -0.045 |
unks | -0.044 |
lands | -0.042 |
patches | -0.042 |
Token | said |
Token ID | 531 |
Feature activation | -2.06e-02 |
Pos logit contributions | |
tutor | +0.054 |
lder | +0.053 |
hospitality | +0.053 |
recommendation | +0.052 |
Days | +0.052 |
Neg logit contributions | |
ays | -0.055 |
ips | -0.046 |
unks | -0.044 |
izz | -0.044 |
involved | -0.043 |
Token | goodbye |
Token ID | 24829 |
Feature activation | -8.26e-02 |
Pos logit contributions | |
lder | +0.034 |
So | +0.034 |
tutor | +0.033 |
friend | +0.033 |
kindly | +0.033 |
Neg logit contributions | |
ays | -0.039 |
ips | -0.032 |
unks | -0.031 |
rob | -0.031 |
ions | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
tutor | +0.135 |
Days | +0.135 |
lder | +0.134 |
Mic | +0.132 |
So | +0.129 |
Neg logit contributions | |
ays | -0.147 |
ips | -0.117 |
onto | -0.114 |
plets | -0.114 |
ained | -0.112 |
Token | left |
Token ID | 1364 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
ays | +0.005 |
ips | +0.004 |
unks | +0.004 |
rob | +0.004 |
ions | +0.004 |
Neg logit contributions | |
friend | -0.003 |
lder | -0.002 |
kindly | -0.002 |
tutor | -0.002 |
So | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +8.88e-03 |
Pos logit contributions | |
ays | +0.006 |
rob | +0.005 |
ips | +0.005 |
unks | +0.005 |
plets | +0.005 |
Neg logit contributions | |
friend | -0.002 |
kindly | -0.002 |
tutor | -0.002 |
lder | -0.002 |
forgive | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -8.29e-03 |
Pos logit contributions | |
ays | +0.017 |
ips | +0.014 |
unks | +0.013 |
chairs | +0.013 |
ions | +0.013 |
Neg logit contributions | |
lder | -0.015 |
hospitality | -0.015 |
friend | -0.014 |
So | -0.014 |
forgive | -0.014 |
Token | felt |
Token ID | 2936 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
tutor | +0.013 |
lder | +0.013 |
hospitality | +0.013 |
recommendation | +0.013 |
forgive | +0.013 |
Neg logit contributions | |
ays | -0.016 |
rob | -0.013 |
ips | -0.013 |
unks | -0.013 |
lands | -0.012 |
Token | 's |
Token ID | 338 |
Feature activation | -4.01e-02 |
Pos logit contributions | |
friend | +0.012 |
lder | +0.012 |
So | +0.011 |
little | +0.011 |
kindly | +0.010 |
Neg logit contributions | |
ays | -0.025 |
rob | -0.023 |
ips | -0.023 |
ocol | -0.022 |
plets | -0.022 |
Token | do |
Token ID | 466 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
friend | +0.055 |
lder | +0.054 |
So | +0.053 |
kindly | +0.053 |
forgive | +0.053 |
Neg logit contributions | |
ays | -0.092 |
rob | -0.079 |
ips | -0.078 |
unks | -0.076 |
plets | -0.074 |
Token | that |
Token ID | 326 |
Feature activation | +1.59e-03 |
Pos logit contributions | |
friend | +0.029 |
kindly | +0.028 |
lder | +0.028 |
forgive | +0.027 |
So | +0.027 |
Neg logit contributions | |
ays | -0.045 |
rob | -0.040 |
ips | -0.039 |
rol | -0.038 |
ocol | -0.037 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
ays | +0.004 |
ips | +0.004 |
rob | +0.003 |
izz | +0.003 |
unks | +0.003 |
Neg logit contributions | |
friend | -0.002 |
kindly | -0.002 |
song | -0.002 |
lder | -0.002 |
So | -0.002 |
Token | Mia |
Token ID | 32189 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
friend | +0.027 |
So | +0.026 |
kindly | +0.025 |
tutor | +0.025 |
forgive | +0.025 |
Neg logit contributions | |
ays | -0.037 |
rob | -0.032 |
unks | -0.031 |
ips | -0.031 |
ocol | -0.030 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.23e-02 |
Pos logit contributions | |
friend | +0.041 |
So | +0.041 |
lder | +0.041 |
kindly | +0.040 |
tutor | +0.040 |
Neg logit contributions | |
ays | -0.041 |
rob | -0.033 |
ips | -0.033 |
unks | -0.033 |
plets | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | -2.75e-02 |
Pos logit contributions | |
lder | +0.168 |
tutor | +0.148 |
Days | +0.147 |
doorstep | +0.142 |
Okay | +0.142 |
Neg logit contributions | |
ays | -0.116 |
ips | -0.103 |
gs | -0.102 |
ions | -0.098 |
unks | -0.095 |
Token |
|
Token ID | 198 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
lder | +0.037 |
friend | +0.036 |
tutor | +0.035 |
kindly | +0.035 |
forgive | +0.035 |
Neg logit contributions | |
ays | -0.064 |
ips | -0.054 |
unks | -0.053 |
rob | -0.052 |
ions | -0.052 |
Token |
|
Token ID | 198 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
lder | +0.038 |
tutor | +0.037 |
friend | +0.036 |
kindly | +0.036 |
tune | +0.036 |
Neg logit contributions | |
ays | -0.064 |
ips | -0.054 |
unks | -0.054 |
rob | -0.054 |
ions | -0.053 |
Token | They |
Token ID | 2990 |
Feature activation | -3.42e-02 |
Pos logit contributions | |
tutor | +0.050 |
lder | +0.047 |
hospitality | +0.045 |
friend | +0.045 |
birthday | +0.044 |
Neg logit contributions | |
ays | -0.081 |
ions | -0.073 |
unks | -0.072 |
ips | -0.071 |
rob | -0.070 |
Token | start |
Token ID | 923 |
Feature activation | -2.72e-02 |
Pos logit contributions | |
lder | +0.046 |
friend | +0.046 |
tutor | +0.045 |
So | +0.045 |
kindly | +0.045 |
Neg logit contributions | |
ays | -0.077 |
ips | -0.065 |
rob | -0.064 |
unks | -0.064 |
ions | -0.063 |
Token | to |
Token ID | 284 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
lder | +0.008 |
understanding | +0.007 |
So | +0.007 |
tutor | +0.007 |
kindly | +0.007 |
Neg logit contributions | |
ays | -0.011 |
ips | -0.009 |
unks | -0.009 |
ions | -0.009 |
rob | -0.008 |
Token | our |
Token ID | 674 |
Feature activation | -2.92e-02 |
Pos logit contributions | |
friend | +0.038 |
lder | +0.038 |
tutor | +0.037 |
kindly | +0.037 |
So | +0.037 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.035 |
rob | -0.035 |
unks | -0.035 |
plets | -0.033 |
Token | home |
Token ID | 1363 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
lder | +0.042 |
So | +0.039 |
understanding | +0.038 |
kindly | +0.037 |
forgive | +0.037 |
Neg logit contributions | |
ays | -0.063 |
lands | -0.055 |
ips | -0.054 |
unks | -0.054 |
rob | -0.049 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
lder | +0.047 |
tutor | +0.045 |
So | +0.045 |
kindly | +0.044 |
forgive | +0.044 |
Neg logit contributions | |
ays | -0.064 |
ips | -0.054 |
unks | -0.053 |
ions | -0.052 |
rob | -0.051 |
Token | Sam |
Token ID | 3409 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
lder | +0.025 |
tutor | +0.024 |
kindly | +0.024 |
friend | +0.023 |
forgive | +0.023 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.036 |
rob | -0.036 |
unks | -0.036 |
ions | -0.035 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.21e-02 |
Pos logit contributions | |
tutor | +0.034 |
Days | +0.032 |
hospitality | +0.032 |
recommendation | +0.032 |
birthday | +0.032 |
Neg logit contributions | |
ays | -0.032 |
spins | -0.027 |
rob | -0.026 |
unks | -0.026 |
ions | -0.025 |
Token | , |
Token ID | 11 |
Feature activation | -6.19e-02 |
Pos logit contributions | |
lder | +0.174 |
tutor | +0.169 |
urious | +0.168 |
Mic | +0.167 |
Days | +0.166 |
Neg logit contributions | |
it | -0.085 |
ays | -0.081 |
patches | -0.076 |
on | -0.074 |
onto | -0.073 |
Token | but |
Token ID | 475 |
Feature activation | +9.98e-03 |
Pos logit contributions | |
lder | +0.084 |
tutor | +0.079 |
So | +0.076 |
Days | +0.076 |
friend | +0.075 |
Neg logit contributions | |
ays | -0.135 |
ips | -0.116 |
plets | -0.114 |
ions | -0.113 |
unks | -0.113 |
Token | he |
Token ID | 339 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
ays | +0.020 |
ips | +0.017 |
rob | +0.017 |
unks | +0.016 |
ocol | +0.016 |
Neg logit contributions | |
friend | -0.017 |
kindly | -0.017 |
So | -0.017 |
lder | -0.016 |
forgive | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | -6.73e-03 |
Pos logit contributions | |
lder | +0.024 |
tutor | +0.024 |
So | +0.023 |
recommendation | +0.023 |
kindly | +0.023 |
Neg logit contributions | |
ays | -0.036 |
ips | -0.030 |
unks | -0.030 |
rob | -0.030 |
ions | -0.029 |
Token | worried |
Token ID | 7960 |
Feature activation | -5.72e-02 |
Pos logit contributions | |
lder | +0.009 |
friend | +0.009 |
So | +0.009 |
kindly | +0.009 |
tutor | +0.009 |
Neg logit contributions | |
ays | -0.015 |
ips | -0.013 |
rob | -0.013 |
unks | -0.013 |
ions | -0.013 |
Token | home |
Token ID | 1363 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
lder | +0.012 |
So | +0.012 |
understanding | +0.011 |
Days | +0.011 |
kindly | +0.011 |
Neg logit contributions | |
ays | -0.022 |
ips | -0.019 |
ions | -0.018 |
unks | -0.018 |
rob | -0.018 |
Token | for |
Token ID | 329 |
Feature activation | -1.40e-02 |
Pos logit contributions | |
lder | +0.023 |
friend | +0.023 |
kindly | +0.022 |
So | +0.022 |
tutor | +0.022 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.031 |
rob | -0.031 |
unks | -0.031 |
ocol | -0.030 |
Token | lunch |
Token ID | 9965 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
lder | +0.020 |
friend | +0.020 |
tutor | +0.020 |
So | +0.020 |
kindly | +0.020 |
Neg logit contributions | |
ays | -0.031 |
ips | -0.026 |
rob | -0.026 |
unks | -0.025 |
plets | -0.025 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
lder | +0.045 |
kindly | +0.044 |
forgive | +0.044 |
tutor | +0.044 |
So | +0.044 |
Neg logit contributions | |
ays | -0.057 |
ips | -0.048 |
rob | -0.047 |
unks | -0.047 |
ions | -0.046 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
Days | +0.021 |
lder | +0.021 |
tutor | +0.021 |
understanding | +0.020 |
keeper | +0.020 |
Neg logit contributions | |
ays | -0.027 |
ips | -0.022 |
unks | -0.022 |
rob | -0.021 |
ions | -0.021 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.20e-02 |
Pos logit contributions | |
Days | +0.027 |
tutor | +0.026 |
tune | +0.025 |
hospitality | +0.025 |
recommendation | +0.025 |
Neg logit contributions | |
ays | -0.037 |
rob | -0.030 |
ips | -0.030 |
unks | -0.030 |
spins | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
lder | +0.170 |
Days | +0.161 |
Mic | +0.160 |
tutor | +0.160 |
veterinarian | +0.157 |
Neg logit contributions | |
ays | -0.089 |
it | -0.084 |
onto | -0.082 |
on | -0.077 |
ips | -0.076 |
Token | they |
Token ID | 484 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
lder | +0.030 |
tutor | +0.030 |
So | +0.030 |
friend | +0.029 |
forgive | +0.029 |
Neg logit contributions | |
ays | -0.034 |
ips | -0.028 |
rob | -0.028 |
unks | -0.027 |
ions | -0.027 |
Token | both |
Token ID | 1111 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
tutor | +0.056 |
lder | +0.055 |
song | +0.054 |
tune | +0.054 |
recommendation | +0.054 |
Neg logit contributions | |
ays | -0.067 |
ips | -0.056 |
ions | -0.054 |
izz | -0.054 |
rob | -0.054 |
Token | got |
Token ID | 1392 |
Feature activation | +3.06e-02 |
Pos logit contributions | |
lder | +0.027 |
tutor | +0.027 |
friend | +0.027 |
So | +0.027 |
kindly | +0.027 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.037 |
rob | -0.036 |
unks | -0.036 |
ions | -0.035 |
Token | some |
Token ID | 617 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ays | +0.066 |
rob | +0.056 |
unks | +0.055 |
ips | +0.055 |
plets | +0.054 |
Neg logit contributions | |
friend | -0.046 |
kindly | -0.045 |
lder | -0.045 |
tutor | -0.045 |
So | -0.044 |
Token | , |
Token ID | 11 |
Feature activation | -3.14e-02 |
Pos logit contributions | |
tutor | +0.043 |
lder | +0.043 |
So | +0.042 |
tune | +0.041 |
kindly | +0.041 |
Neg logit contributions | |
ays | -0.062 |
ips | -0.050 |
ions | -0.050 |
unks | -0.050 |
ocol | -0.050 |
Token | it |
Token ID | 340 |
Feature activation | +7.34e-03 |
Pos logit contributions | |
friend | +0.057 |
kindly | +0.056 |
little | +0.056 |
forgive | +0.055 |
So | +0.055 |
Neg logit contributions | |
ays | -0.061 |
rob | -0.053 |
ips | -0.052 |
unks | -0.051 |
chairs | -0.048 |
Token | is |
Token ID | 318 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
ays | +0.014 |
ocol | +0.012 |
unks | +0.012 |
ips | +0.012 |
rob | +0.011 |
Neg logit contributions | |
friend | -0.013 |
lder | -0.013 |
So | -0.013 |
kindly | -0.012 |
forgive | -0.012 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
ays | +0.032 |
rob | +0.028 |
ips | +0.028 |
unks | +0.027 |
ocol | +0.026 |
Neg logit contributions | |
friend | -0.017 |
kindly | -0.016 |
So | -0.015 |
lder | -0.015 |
keeper | -0.015 |
Token | Mia |
Token ID | 32189 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
lder | +0.030 |
friend | +0.030 |
So | +0.030 |
tutor | +0.029 |
kindly | +0.029 |
Neg logit contributions | |
ays | -0.031 |
ips | -0.025 |
rob | -0.025 |
unks | -0.025 |
ions | -0.024 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.17e-02 |
Pos logit contributions | |
lder | +0.035 |
friend | +0.035 |
So | +0.034 |
kindly | +0.034 |
tutor | +0.034 |
Neg logit contributions | |
ays | -0.059 |
ips | -0.050 |
rob | -0.050 |
unks | -0.049 |
ions | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
lder | +0.179 |
Days | +0.157 |
Mic | +0.157 |
tutor | +0.155 |
veterinarian | +0.149 |
Neg logit contributions | |
ays | -0.096 |
ips | -0.088 |
ions | -0.084 |
onto | -0.082 |
gs | -0.081 |
Token | " |
Token ID | 366 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
lder | +0.023 |
friend | +0.023 |
tutor | +0.022 |
song | +0.022 |
forgive | +0.022 |
Neg logit contributions | |
ays | -0.041 |
ips | -0.035 |
unks | -0.034 |
ions | -0.033 |
rob | -0.032 |
Token | Let |
Token ID | 5756 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
lder | +0.032 |
friend | +0.032 |
So | +0.031 |
kindly | +0.031 |
tutor | +0.031 |
Neg logit contributions | |
ays | -0.059 |
ips | -0.050 |
rob | -0.049 |
unks | -0.049 |
ions | -0.048 |
Token | 's |
Token ID | 338 |
Feature activation | -4.28e-02 |
Pos logit contributions | |
friend | +0.020 |
So | +0.020 |
lder | +0.020 |
kindly | +0.019 |
forgive | +0.019 |
Neg logit contributions | |
ays | -0.035 |
ips | -0.030 |
rob | -0.030 |
unks | -0.030 |
ions | -0.029 |
Token | show |
Token ID | 905 |
Feature activation | -3.76e-03 |
Pos logit contributions | |
lder | +0.059 |
friend | +0.059 |
So | +0.058 |
kindly | +0.057 |
tutor | +0.057 |
Neg logit contributions | |
ays | -0.096 |
ips | -0.081 |
rob | -0.081 |
unks | -0.080 |
ions | -0.078 |
Token | far |
Token ID | 1290 |
Feature activation | +3.29e-02 |
Pos logit contributions | |
ays | +0.045 |
rob | +0.040 |
unks | +0.038 |
ips | +0.038 |
ocol | +0.038 |
Neg logit contributions | |
friend | -0.029 |
So | -0.028 |
lder | -0.028 |
kindly | -0.028 |
song | -0.028 |
Token | it |
Token ID | 340 |
Feature activation | +4.43e-02 |
Pos logit contributions | |
ays | +0.070 |
unks | +0.063 |
ips | +0.060 |
izz | +0.060 |
rob | +0.059 |
Neg logit contributions | |
friend | -0.049 |
kindly | -0.049 |
song | -0.048 |
forgive | -0.047 |
keeper | -0.047 |
Token | goes |
Token ID | 2925 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
ays | +0.082 |
ocol | +0.080 |
rob | +0.075 |
ions | +0.074 |
izz | +0.073 |
Neg logit contributions | |
friend | -0.073 |
So | -0.071 |
kindly | -0.071 |
lder | -0.070 |
forgive | -0.069 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
ays | +0.055 |
rob | +0.049 |
ocol | +0.049 |
ips | +0.048 |
unks | +0.047 |
Neg logit contributions | |
friend | -0.028 |
kindly | -0.027 |
So | -0.026 |
lder | -0.026 |
keeper | -0.025 |
Token | Sam |
Token ID | 3409 |
Feature activation | -2.19e-02 |
Pos logit contributions | |
lder | +0.033 |
kindly | +0.033 |
tutor | +0.033 |
friend | +0.032 |
forgive | +0.032 |
Neg logit contributions | |
ays | -0.029 |
ips | -0.023 |
rob | -0.023 |
unks | -0.023 |
ions | -0.021 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.15e-02 |
Pos logit contributions | |
tutor | +0.036 |
hospitality | +0.035 |
recommendation | +0.034 |
birthday | +0.034 |
lder | +0.034 |
Neg logit contributions | |
ays | -0.041 |
rob | -0.033 |
ips | -0.033 |
spins | -0.033 |
unks | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
lder | +0.179 |
tutor | +0.166 |
Mic | +0.166 |
urious | +0.163 |
Days | +0.161 |
Neg logit contributions | |
it | -0.081 |
ays | -0.079 |
on | -0.074 |
onto | -0.074 |
gs | -0.073 |
Token | said |
Token ID | 531 |
Feature activation | -2.07e-02 |
Pos logit contributions | |
friend | +0.026 |
kindly | +0.026 |
lder | +0.025 |
So | +0.025 |
tutor | +0.025 |
Neg logit contributions | |
ays | -0.038 |
ips | -0.032 |
unks | -0.032 |
rob | -0.032 |
ocol | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | -6.59e-02 |
Pos logit contributions | |
lder | +0.027 |
tutor | +0.027 |
So | +0.027 |
tune | +0.026 |
friend | +0.026 |
Neg logit contributions | |
ays | -0.046 |
ips | -0.040 |
ions | -0.038 |
rob | -0.038 |
unks | -0.038 |
Token | " |
Token ID | 366 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
hospitality | +0.099 |
tutor | +0.098 |
lder | +0.097 |
So | +0.096 |
friend | +0.096 |
Neg logit contributions | |
ays | -0.126 |
ips | -0.109 |
plets | -0.108 |
unks | -0.105 |
ions | -0.102 |
Token | Yes |
Token ID | 5297 |
Feature activation | -4.03e-02 |
Pos logit contributions | |
tutor | +0.036 |
friend | +0.035 |
kindly | +0.035 |
hospitality | +0.033 |
lder | +0.033 |
Neg logit contributions | |
ays | -0.081 |
rob | -0.074 |
plets | -0.073 |
ips | -0.071 |
unks | -0.070 |
Token | ." |
Token ID | 526 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
lder | +0.001 |
So | +0.001 |
understanding | +0.001 |
tutor | +0.001 |
forgive | +0.001 |
Neg logit contributions | |
ays | -0.002 |
ips | -0.002 |
unks | -0.002 |
rob | -0.002 |
ions | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
lder | +0.013 |
tutor | +0.012 |
friend | +0.012 |
kindly | +0.012 |
So | +0.012 |
Neg logit contributions | |
ays | -0.026 |
ips | -0.022 |
rob | -0.022 |
unks | -0.021 |
ions | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
lder | +0.023 |
tutor | +0.022 |
tune | +0.021 |
kindly | +0.021 |
friend | +0.021 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.031 |
rob | -0.031 |
unks | -0.031 |
izz | -0.029 |
Token | S |
Token ID | 50 |
Feature activation | +3.59e-02 |
Pos logit contributions | |
lder | +0.029 |
tutor | +0.029 |
hospitality | +0.027 |
recommendation | +0.026 |
doorstep | +0.026 |
Neg logit contributions | |
ays | -0.042 |
rob | -0.037 |
ips | -0.037 |
izz | -0.035 |
unks | -0.035 |
Token | ara |
Token ID | 3301 |
Feature activation | +3.27e-04 |
Pos logit contributions | |
ays | +0.078 |
ips | +0.067 |
rob | +0.062 |
ocol | +0.061 |
unks | +0.061 |
Neg logit contributions | |
tutor | -0.055 |
understanding | -0.055 |
kindly | -0.054 |
tune | -0.054 |
friend | -0.054 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.14e-02 |
Pos logit contributions | |
ays | +0.001 |
ips | +0.000 |
rob | +0.000 |
unks | +0.000 |
ions | +0.000 |
Neg logit contributions | |
lder | -0.001 |
friend | -0.001 |
tutor | -0.001 |
So | -0.001 |
kindly | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
lder | +0.171 |
Days | +0.152 |
Mic | +0.151 |
urious | +0.145 |
tutor | +0.145 |
Neg logit contributions | |
ays | -0.103 |
ips | -0.099 |
ions | -0.086 |
on | -0.085 |
gs | -0.085 |
Token | they |
Token ID | 484 |
Feature activation | -2.70e-02 |
Pos logit contributions | |
kindly | +0.030 |
friend | +0.030 |
forgive | +0.029 |
tutor | +0.028 |
So | +0.028 |
Neg logit contributions | |
ays | -0.036 |
ocol | -0.033 |
unks | -0.032 |
rob | -0.032 |
ions | -0.031 |
Token | put |
Token ID | 1234 |
Feature activation | +4.77e-02 |
Pos logit contributions | |
lder | +0.034 |
friend | +0.033 |
tutor | +0.032 |
So | +0.032 |
kindly | +0.032 |
Neg logit contributions | |
ays | -0.064 |
ips | -0.055 |
rob | -0.054 |
unks | -0.053 |
ions | -0.052 |
Token | on |
Token ID | 319 |
Feature activation | +6.69e-03 |
Pos logit contributions | |
plets | +0.112 |
unks | +0.110 |
ays | +0.109 |
ocol | +0.108 |
rol | +0.106 |
Neg logit contributions | |
friend | -0.054 |
lady | -0.047 |
little | -0.046 |
kindly | -0.045 |
forgive | -0.045 |
Token | their |
Token ID | 511 |
Feature activation | -6.46e-03 |
Pos logit contributions | |
ays | +0.015 |
rob | +0.013 |
plets | +0.013 |
unks | +0.013 |
ocol | +0.013 |
Neg logit contributions | |
friend | -0.009 |
So | -0.009 |
kindly | -0.009 |
tutor | -0.009 |
song | -0.009 |
Token | okay |
Token ID | 8788 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
friend | +0.022 |
kindly | +0.021 |
forgive | +0.021 |
So | +0.021 |
tutor | +0.020 |
Neg logit contributions | |
ays | -0.053 |
rob | -0.048 |
ips | -0.046 |
unks | -0.046 |
ocol | -0.044 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
lder | +0.060 |
So | +0.059 |
kindly | +0.059 |
tutor | +0.059 |
forgive | +0.058 |
Neg logit contributions | |
ays | -0.057 |
ips | -0.044 |
unks | -0.044 |
ions | -0.043 |
rob | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
lder | +0.018 |
friend | +0.018 |
tutor | +0.018 |
kindly | +0.018 |
So | +0.018 |
Neg logit contributions | |
ays | -0.038 |
ips | -0.032 |
rob | -0.032 |
unks | -0.032 |
ions | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | -3.38e-02 |
Pos logit contributions | |
tune | +0.039 |
tutor | +0.038 |
hospitality | +0.038 |
lder | +0.038 |
song | +0.038 |
Neg logit contributions | |
ays | -0.051 |
ips | -0.043 |
unks | -0.043 |
rob | -0.042 |
izz | -0.042 |
Token | Tom |
Token ID | 13787 |
Feature activation | -3.05e-02 |
Pos logit contributions | |
tutor | +0.053 |
hospitality | +0.053 |
deed | +0.050 |
friend | +0.049 |
tune | +0.049 |
Neg logit contributions | |
ays | -0.062 |
ips | -0.057 |
unks | -0.055 |
izz | -0.054 |
ions | -0.054 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.12e-02 |
Pos logit contributions | |
hospitality | +0.042 |
birthday | +0.041 |
tutor | +0.041 |
lder | +0.040 |
recommendation | +0.039 |
Neg logit contributions | |
ays | -0.062 |
ips | -0.054 |
gs | -0.052 |
chairs | -0.052 |
spins | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
lder | +0.183 |
Mic | +0.173 |
Days | +0.164 |
tutor | +0.158 |
urious | +0.158 |
Neg logit contributions | |
ays | -0.085 |
onto | -0.078 |
on | -0.073 |
it | -0.070 |
gs | -0.070 |
Token | They |
Token ID | 1119 |
Feature activation | -2.63e-02 |
Pos logit contributions | |
lder | +0.018 |
forgive | +0.018 |
tutor | +0.017 |
tune | +0.017 |
friend | +0.017 |
Neg logit contributions | |
ays | -0.025 |
ips | -0.022 |
unks | -0.020 |
ions | -0.020 |
rob | -0.019 |
Token | made |
Token ID | 925 |
Feature activation | -3.92e-03 |
Pos logit contributions | |
tutor | +0.045 |
lder | +0.045 |
song | +0.045 |
tune | +0.044 |
recommendation | +0.043 |
Neg logit contributions | |
ays | -0.046 |
ips | -0.039 |
ions | -0.038 |
izz | -0.038 |
rob | -0.037 |
Token | a |
Token ID | 257 |
Feature activation | -3.86e-02 |
Pos logit contributions | |
friend | +0.006 |
kindly | +0.005 |
little | +0.005 |
So | +0.005 |
song | +0.005 |
Neg logit contributions | |
ays | -0.009 |
rob | -0.008 |
unks | -0.008 |
ips | -0.008 |
plets | -0.008 |
Token | pink |
Token ID | 11398 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
lder | +0.066 |
hospitality | +0.058 |
So | +0.055 |
tutor | +0.054 |
forgive | +0.053 |
Neg logit contributions | |
ays | -0.062 |
lands | -0.058 |
spins | -0.056 |
patches | -0.054 |
funnel | -0.054 |
Token | , |
Token ID | 11 |
Feature activation | -3.25e-02 |
Pos logit contributions | |
tutor | +0.043 |
So | +0.043 |
lder | +0.043 |
tune | +0.042 |
kindly | +0.041 |
Neg logit contributions | |
ays | -0.061 |
ips | -0.050 |
ions | -0.050 |
unks | -0.049 |
ocol | -0.049 |
Token | it |
Token ID | 340 |
Feature activation | +9.42e-03 |
Pos logit contributions | |
friend | +0.060 |
kindly | +0.059 |
forgive | +0.058 |
little | +0.058 |
song | +0.058 |
Neg logit contributions | |
ays | -0.063 |
rob | -0.054 |
ips | -0.054 |
unks | -0.052 |
chairs | -0.048 |
Token | is |
Token ID | 318 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
ays | +0.018 |
ocol | +0.015 |
ips | +0.015 |
unks | +0.015 |
rob | +0.014 |
Neg logit contributions | |
lder | -0.017 |
friend | -0.017 |
So | -0.016 |
kindly | -0.016 |
forgive | -0.016 |
Token | !" |
Token ID | 2474 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ays | +0.034 |
ips | +0.029 |
rob | +0.029 |
unks | +0.028 |
ocol | +0.028 |
Neg logit contributions | |
friend | -0.018 |
kindly | -0.017 |
lder | -0.017 |
So | -0.017 |
tutor | -0.016 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.15e-02 |
Pos logit contributions | |
lder | +0.034 |
friend | +0.033 |
So | +0.033 |
tutor | +0.033 |
kindly | +0.033 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.041 |
rob | -0.041 |
unks | -0.040 |
ions | -0.039 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.12e-02 |
Pos logit contributions | |
lder | +0.032 |
friend | +0.032 |
tutor | +0.031 |
So | +0.031 |
kindly | +0.031 |
Neg logit contributions | |
ays | -0.046 |
ips | -0.038 |
rob | -0.038 |
unks | -0.037 |
ions | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
lder | +0.178 |
Mic | +0.155 |
Days | +0.155 |
tutor | +0.153 |
doorstep | +0.148 |
Neg logit contributions | |
ays | -0.097 |
ips | -0.089 |
ions | -0.083 |
gs | -0.081 |
on | -0.078 |
Token | " |
Token ID | 366 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
lder | +0.025 |
friend | +0.024 |
forgive | +0.024 |
song | +0.024 |
tutor | +0.024 |
Neg logit contributions | |
ays | -0.045 |
ips | -0.038 |
unks | -0.037 |
ions | -0.036 |
rob | -0.036 |
Token | We |
Token ID | 1135 |
Feature activation | +4.19e-03 |
Pos logit contributions | |
lder | +0.031 |
friend | +0.031 |
tutor | +0.031 |
kindly | +0.031 |
So | +0.030 |
Neg logit contributions | |
ays | -0.058 |
ips | -0.050 |
rob | -0.050 |
unks | -0.049 |
ions | -0.048 |
Token | are |
Token ID | 389 |
Feature activation | +4.20e-05 |
Pos logit contributions | |
ays | +0.009 |
rob | +0.007 |
unks | +0.007 |
ips | +0.007 |
chairs | +0.007 |
Neg logit contributions | |
forgive | -0.007 |
friend | -0.007 |
lder | -0.007 |
So | -0.007 |
agree | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
ays | +0.000 |
rob | +0.000 |
unks | +0.000 |
plets | +0.000 |
chairs | +0.000 |
Neg logit contributions | |
friend | -0.000 |
tutor | -0.000 |
kindly | -0.000 |
understanding | -0.000 |
forgive | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
tutor | +0.021 |
friend | +0.021 |
tune | +0.020 |
lder | +0.020 |
song | +0.020 |
Neg logit contributions | |
ays | -0.030 |
rob | -0.026 |
unks | -0.026 |
ips | -0.026 |
izz | -0.025 |
Token | Carl |
Token ID | 26886 |
Feature activation | -7.94e-03 |
Pos logit contributions | |
tutor | +0.022 |
friend | +0.021 |
hospitality | +0.021 |
birthday | +0.021 |
lder | +0.020 |
Neg logit contributions | |
ays | -0.033 |
ions | -0.030 |
unks | -0.030 |
ips | -0.030 |
rob | -0.030 |
Token | excited |
Token ID | 6568 |
Feature activation | -4.79e-02 |
Pos logit contributions | |
tutor | +0.010 |
lder | +0.010 |
So | +0.010 |
friend | +0.010 |
kindly | +0.010 |
Neg logit contributions | |
ays | -0.018 |
ips | -0.015 |
unks | -0.015 |
rob | -0.015 |
ions | -0.015 |
Token | ly |
Token ID | 306 |
Feature activation | -3.43e-02 |
Pos logit contributions | |
Days | +0.058 |
So | +0.054 |
lder | +0.051 |
Years | +0.051 |
forgive | +0.051 |
Neg logit contributions | |
ays | -0.120 |
ips | -0.101 |
rob | -0.097 |
unks | -0.097 |
ions | -0.097 |
Token | said |
Token ID | 531 |
Feature activation | -2.14e-02 |
Pos logit contributions | |
tutor | +0.046 |
lder | +0.045 |
So | +0.045 |
Days | +0.045 |
song | +0.044 |
Neg logit contributions | |
ays | -0.076 |
ips | -0.064 |
unks | -0.062 |
ions | -0.061 |
plets | -0.061 |
Token | yes |
Token ID | 3763 |
Feature activation | -8.11e-02 |
Pos logit contributions | |
So | +0.028 |
lder | +0.028 |
tutor | +0.027 |
tune | +0.027 |
Days | +0.027 |
Neg logit contributions | |
ays | -0.046 |
ips | -0.040 |
ions | -0.039 |
rob | -0.039 |
ocol | -0.038 |
Token | , |
Token ID | 11 |
Feature activation | -5.26e-02 |
Pos logit contributions | |
Days | +0.149 |
lder | +0.146 |
hospitality | +0.145 |
Years | +0.143 |
tutor | +0.143 |
Neg logit contributions | |
ays | -0.114 |
ips | -0.087 |
gs | -0.086 |
az | -0.083 |
unks | -0.082 |
Token | and |
Token ID | 290 |
Feature activation | -4.97e-03 |
Pos logit contributions | |
lder | +0.058 |
friend | +0.056 |
tutor | +0.055 |
So | +0.055 |
kindly | +0.054 |
Neg logit contributions | |
ays | -0.132 |
ips | -0.114 |
rob | -0.113 |
unks | -0.112 |
ions | -0.110 |
Token | the |
Token ID | 262 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
friend | +0.007 |
kindly | +0.007 |
tutor | +0.006 |
So | +0.006 |
forgive | +0.006 |
Neg logit contributions | |
ays | -0.012 |
unks | -0.011 |
ocol | -0.011 |
rob | -0.010 |
ips | -0.010 |
Token | store |
Token ID | 3650 |
Feature activation | +5.20e-03 |
Pos logit contributions | |
lder | +0.017 |
So | +0.015 |
Days | +0.015 |
kindly | +0.014 |
Years | +0.014 |
Neg logit contributions | |
ays | -0.030 |
ips | -0.027 |
rob | -0.026 |
spins | -0.026 |
matters | -0.025 |
Token | owner |
Token ID | 4870 |
Feature activation | -3.89e-03 |
Pos logit contributions | |
ays | +0.014 |
ips | +0.012 |
ions | +0.012 |
rob | +0.012 |
involved | +0.012 |
Neg logit contributions | |
lder | -0.004 |
tune | -0.004 |
Days | -0.004 |
So | -0.004 |
understanding | -0.004 |
Token | on |
Token ID | 319 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
friend | +0.026 |
kindly | +0.025 |
lder | +0.024 |
forgive | +0.024 |
So | +0.024 |
Neg logit contributions | |
ays | -0.055 |
rob | -0.047 |
ips | -0.047 |
ocol | -0.046 |
unks | -0.046 |
Token | an |
Token ID | 281 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
friend | +0.024 |
tutor | +0.023 |
lder | +0.023 |
kindly | +0.023 |
So | +0.022 |
Neg logit contributions | |
ays | -0.032 |
ips | -0.027 |
rob | -0.027 |
plets | -0.026 |
unks | -0.026 |
Token | adventure |
Token ID | 8855 |
Feature activation | -3.10e-02 |
Pos logit contributions | |
forgive | +0.016 |
lder | +0.016 |
keeper | +0.016 |
kindly | +0.016 |
So | +0.016 |
Neg logit contributions | |
ays | -0.025 |
rob | -0.022 |
ions | -0.021 |
ocol | -0.021 |
ips | -0.021 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
lder | +0.044 |
friend | +0.043 |
So | +0.043 |
tutor | +0.043 |
kindly | +0.043 |
Neg logit contributions | |
ays | -0.067 |
ips | -0.057 |
rob | -0.056 |
unks | -0.056 |
ions | -0.054 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
lder | +0.034 |
friend | +0.034 |
tutor | +0.033 |
So | +0.033 |
kindly | +0.033 |
Neg logit contributions | |
ays | -0.033 |
ips | -0.027 |
rob | -0.027 |
unks | -0.027 |
ions | -0.025 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.10e-02 |
Pos logit contributions | |
lder | +0.042 |
tutor | +0.041 |
Days | +0.041 |
hospitality | +0.040 |
recommendation | +0.040 |
Neg logit contributions | |
ays | -0.044 |
rob | -0.036 |
ips | -0.035 |
unks | -0.034 |
chairs | -0.033 |
Token | . |
Token ID | 13 |
Feature activation | -2.77e-02 |
Pos logit contributions | |
lder | +0.195 |
Days | +0.181 |
Years | +0.171 |
Mic | +0.170 |
urious | +0.169 |
Neg logit contributions | |
ays | -0.084 |
onto | -0.066 |
gs | -0.066 |
on | -0.064 |
izz | -0.064 |
Token |
|
Token ID | 198 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
lder | +0.048 |
tune | +0.045 |
hospitality | +0.044 |
song | +0.043 |
worry | +0.042 |
Neg logit contributions | |
ays | -0.056 |
ips | -0.047 |
ions | -0.044 |
unks | -0.044 |
plets | -0.042 |
Token |
|
Token ID | 198 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
lder | +0.028 |
tutor | +0.026 |
tune | +0.025 |
kindly | +0.025 |
hospitality | +0.025 |
Neg logit contributions | |
ays | -0.042 |
ips | -0.035 |
unks | -0.035 |
rob | -0.034 |
ions | -0.034 |
Token | They |
Token ID | 2990 |
Feature activation | -3.10e-02 |
Pos logit contributions | |
lder | +0.046 |
tutor | +0.044 |
hospitality | +0.042 |
worry | +0.040 |
lawyer | +0.040 |
Neg logit contributions | |
ays | -0.053 |
ips | -0.048 |
ions | -0.046 |
unks | -0.044 |
rob | -0.043 |
Token | climbed |
Token ID | 19952 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
tutor | +0.046 |
lder | +0.046 |
friend | +0.045 |
song | +0.044 |
So | +0.044 |
Neg logit contributions | |
ays | -0.065 |
ips | -0.054 |
rob | -0.054 |
unks | -0.053 |
ions | -0.052 |
Token | it |
Token ID | 340 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
ays | +0.010 |
plets | +0.009 |
ips | +0.009 |
rob | +0.009 |
izz | +0.009 |
Neg logit contributions | |
friend | -0.007 |
tutor | -0.007 |
song | -0.007 |
little | -0.007 |
tune | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | -8.55e-03 |
Pos logit contributions | |
lder | +0.020 |
friend | +0.020 |
So | +0.020 |
kindly | +0.020 |
tutor | +0.020 |
Neg logit contributions | |
ays | -0.032 |
ips | -0.027 |
rob | -0.027 |
unks | -0.027 |
ions | -0.026 |
Token | longest |
Token ID | 14069 |
Feature activation | +1.08e-03 |
Pos logit contributions | |
lder | +0.013 |
kindly | +0.013 |
So | +0.012 |
forgive | +0.012 |
friend | +0.012 |
Neg logit contributions | |
ays | -0.017 |
rob | -0.015 |
ips | -0.015 |
unks | -0.015 |
ions | -0.014 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
ays | +0.003 |
rob | +0.002 |
ips | +0.002 |
unks | +0.002 |
ocol | +0.002 |
Neg logit contributions | |
friend | -0.001 |
tutor | -0.001 |
song | -0.001 |
So | -0.001 |
lder | -0.001 |
Token | Sam |
Token ID | 3409 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
lder | +0.031 |
kindly | +0.030 |
tutor | +0.030 |
friend | +0.030 |
So | +0.030 |
Neg logit contributions | |
ays | -0.027 |
ips | -0.022 |
rob | -0.022 |
unks | -0.021 |
ions | -0.020 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.09e-02 |
Pos logit contributions | |
tutor | +0.027 |
hospitality | +0.026 |
Days | +0.026 |
recommendation | +0.025 |
lder | +0.025 |
Neg logit contributions | |
ays | -0.035 |
rob | -0.029 |
spins | -0.029 |
ips | -0.029 |
unks | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | -6.09e-02 |
Pos logit contributions | |
lder | +0.168 |
Mic | +0.159 |
tutor | +0.158 |
veterinarian | +0.157 |
urious | +0.154 |
Neg logit contributions | |
it | -0.084 |
ays | -0.084 |
onto | -0.082 |
on | -0.078 |
patches | -0.076 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
lder | +0.086 |
tutor | +0.082 |
friend | +0.079 |
hospitality | +0.078 |
Days | +0.078 |
Neg logit contributions | |
ays | -0.125 |
ips | -0.108 |
plets | -0.107 |
ions | -0.105 |
rob | -0.105 |
Token | they |
Token ID | 484 |
Feature activation | -3.56e-02 |
Pos logit contributions | |
friend | +0.023 |
lder | +0.023 |
kindly | +0.022 |
So | +0.022 |
tutor | +0.022 |
Neg logit contributions | |
ays | -0.030 |
ips | -0.025 |
rob | -0.024 |
unks | -0.024 |
ocol | -0.023 |
Token | both |
Token ID | 1111 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
friend | +0.051 |
So | +0.050 |
lder | +0.049 |
kindly | +0.049 |
forgive | +0.048 |
Neg logit contributions | |
ays | -0.080 |
ips | -0.067 |
rob | -0.067 |
unks | -0.067 |
ocol | -0.066 |
Token | climbed |
Token ID | 19952 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
friend | +0.026 |
So | +0.026 |
lder | +0.025 |
forgive | +0.025 |
kindly | +0.025 |
Neg logit contributions | |
ays | -0.044 |
unks | -0.037 |
ocol | -0.037 |
ips | -0.037 |
rob | -0.036 |
Token | okay |
Token ID | 8788 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
ays | +0.032 |
rob | +0.028 |
unks | +0.027 |
ips | +0.027 |
plets | +0.025 |
Neg logit contributions | |
friend | -0.018 |
forgive | -0.018 |
song | -0.017 |
kindly | -0.017 |
So | -0.017 |
Token | ?" |
Token ID | 1701 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
So | +0.053 |
lder | +0.053 |
tutor | +0.052 |
Days | +0.052 |
kindly | +0.052 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.033 |
unks | -0.032 |
ions | -0.032 |
rob | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
lder | +0.017 |
friend | +0.017 |
tutor | +0.016 |
kindly | +0.016 |
So | +0.016 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.032 |
rob | -0.031 |
unks | -0.031 |
ions | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
lder | +0.018 |
friend | +0.018 |
tutor | +0.018 |
kindly | +0.018 |
So | +0.018 |
Neg logit contributions | |
ays | -0.040 |
ips | -0.035 |
rob | -0.034 |
unks | -0.034 |
ions | -0.033 |
Token | Tom |
Token ID | 13787 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
tutor | +0.022 |
lder | +0.021 |
friend | +0.020 |
kindly | +0.020 |
hospitality | +0.020 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.044 |
rob | -0.043 |
unks | -0.043 |
ions | -0.041 |
Token | agrees |
Token ID | 14386 |
Feature activation | -8.09e-02 |
Pos logit contributions | |
lder | +0.019 |
tutor | +0.018 |
friend | +0.018 |
tune | +0.018 |
So | +0.018 |
Neg logit contributions | |
ays | -0.021 |
ips | -0.018 |
rob | -0.017 |
unks | -0.017 |
ions | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
lder | +0.181 |
Days | +0.155 |
tutor | +0.155 |
Mic | +0.153 |
doorstep | +0.150 |
Neg logit contributions | |
ays | -0.098 |
ips | -0.091 |
on | -0.084 |
gs | -0.083 |
onto | -0.080 |
Token | They |
Token ID | 1119 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
friend | +0.013 |
So | +0.013 |
kindly | +0.013 |
tutor | +0.013 |
lder | +0.013 |
Neg logit contributions | |
ays | -0.026 |
rob | -0.022 |
ips | -0.022 |
unks | -0.022 |
ocol | -0.022 |
Token | hold |
Token ID | 1745 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
lder | +0.034 |
tune | +0.032 |
tutor | +0.032 |
song | +0.030 |
kindly | +0.030 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.043 |
rob | -0.042 |
unks | -0.041 |
ions | -0.040 |
Token | hands |
Token ID | 2832 |
Feature activation | -1.00e-03 |
Pos logit contributions | |
plets | +0.055 |
rob | +0.055 |
ays | +0.054 |
unks | +0.051 |
ocol | +0.048 |
Neg logit contributions | |
friend | -0.042 |
So | -0.036 |
forgive | -0.035 |
kindly | -0.035 |
tutor | -0.034 |
Token | and |
Token ID | 290 |
Feature activation | +4.59e-03 |
Pos logit contributions | |
lder | +0.001 |
tutor | +0.001 |
Days | +0.001 |
recommendation | +0.001 |
So | +0.001 |
Neg logit contributions | |
ays | -0.002 |
ips | -0.002 |
unks | -0.002 |
ions | -0.002 |
rob | -0.002 |
Token | " |
Token ID | 1 |
Feature activation | -2.69e-02 |
Pos logit contributions | |
hospitality | +0.047 |
lder | +0.041 |
keeper | +0.041 |
recommendation | +0.041 |
gesture | +0.040 |
Neg logit contributions | |
ays | -0.061 |
ips | -0.054 |
unks | -0.053 |
ions | -0.052 |
matters | -0.050 |
Token | Me |
Token ID | 5308 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
friend | +0.035 |
lder | +0.035 |
kindly | +0.034 |
tutor | +0.034 |
forgive | +0.033 |
Neg logit contributions | |
ays | -0.061 |
ips | -0.053 |
rob | -0.052 |
unks | -0.051 |
plets | -0.051 |
Token | neither |
Token ID | 6159 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
ays | +0.024 |
rob | +0.021 |
ips | +0.020 |
unks | +0.020 |
ocol | +0.020 |
Neg logit contributions | |
friend | -0.019 |
lder | -0.018 |
kindly | -0.018 |
tutor | -0.017 |
So | -0.017 |
Token | !" |
Token ID | 2474 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
lder | +0.026 |
tutor | +0.025 |
kindly | +0.025 |
So | +0.024 |
forgive | +0.024 |
Neg logit contributions | |
ays | -0.041 |
ips | -0.034 |
unks | -0.034 |
rob | -0.034 |
ions | -0.033 |
Token | Max |
Token ID | 5436 |
Feature activation | -3.83e-02 |
Pos logit contributions | |
lder | +0.045 |
hospitality | +0.042 |
recommendation | +0.042 |
Days | +0.041 |
So | +0.041 |
Neg logit contributions | |
ays | -0.044 |
ips | -0.035 |
chairs | -0.035 |
rob | -0.035 |
ions | -0.034 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.05e-02 |
Pos logit contributions | |
lder | +0.071 |
tutor | +0.070 |
hospitality | +0.070 |
birthday | +0.069 |
recommendation | +0.069 |
Neg logit contributions | |
ays | -0.056 |
chairs | -0.046 |
involved | -0.045 |
rob | -0.044 |
ips | -0.043 |
Token | and |
Token ID | 290 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
lder | +0.187 |
Days | +0.167 |
Mic | +0.166 |
urious | +0.164 |
Years | +0.157 |
Neg logit contributions | |
ays | -0.085 |
onto | -0.075 |
on | -0.071 |
chairs | -0.068 |
it | -0.065 |
Token | did |
Token ID | 750 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
lder | +0.030 |
tutor | +0.029 |
friend | +0.029 |
So | +0.029 |
kindly | +0.028 |
Neg logit contributions | |
ays | -0.041 |
ips | -0.034 |
rob | -0.034 |
unks | -0.033 |
ions | -0.033 |
Token | the |
Token ID | 262 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
lder | +0.044 |
tutor | +0.041 |
So | +0.041 |
tune | +0.040 |
hospitality | +0.040 |
Neg logit contributions | |
ays | -0.082 |
ips | -0.071 |
unks | -0.069 |
ions | -0.068 |
matters | -0.068 |
Token | same |
Token ID | 976 |
Feature activation | -4.25e-02 |
Pos logit contributions | |
Days | +0.043 |
kindly | +0.042 |
forgive | +0.041 |
broken | +0.041 |
lder | +0.041 |
Neg logit contributions | |
ays | -0.038 |
rob | -0.030 |
matters | -0.030 |
ips | -0.029 |
lands | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
lder | +0.067 |
So | +0.060 |
hospitality | +0.057 |
Days | +0.055 |
Okay | +0.055 |
Neg logit contributions | |
ays | -0.087 |
ips | -0.077 |
ocol | -0.073 |
matters | -0.071 |
lands | -0.069 |
Token |
|
Token ID | 198 |
Feature activation | -6.35e-03 |
Pos logit contributions | |
ays | +0.023 |
ips | +0.019 |
rob | +0.019 |
unks | +0.019 |
ions | +0.019 |
Neg logit contributions | |
lder | -0.011 |
friend | -0.011 |
So | -0.011 |
kindly | -0.011 |
tutor | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
lder | +0.009 |
tutor | +0.009 |
tune | +0.008 |
friend | +0.008 |
song | +0.008 |
Neg logit contributions | |
ays | -0.014 |
rob | -0.012 |
ips | -0.012 |
unks | -0.012 |
izz | -0.012 |
Token | Tom |
Token ID | 13787 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
lder | +0.015 |
tutor | +0.014 |
tune | +0.014 |
hospitality | +0.014 |
song | +0.014 |
Neg logit contributions | |
ays | -0.022 |
rob | -0.020 |
ips | -0.019 |
izz | -0.019 |
ions | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
Days | +0.036 |
tutor | +0.035 |
lder | +0.035 |
hospitality | +0.035 |
recommendation | +0.035 |
Neg logit contributions | |
ays | -0.044 |
ips | -0.037 |
rob | -0.035 |
unks | -0.035 |
izz | -0.034 |
Token | Mia |
Token ID | 32189 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
lder | +0.030 |
So | +0.029 |
kindly | +0.028 |
tutor | +0.028 |
forgive | +0.028 |
Neg logit contributions | |
ays | -0.024 |
ips | -0.019 |
ions | -0.018 |
rob | -0.018 |
unks | -0.018 |
Token | agreed |
Token ID | 4987 |
Feature activation | -8.04e-02 |
Pos logit contributions | |
tutor | +0.044 |
Days | +0.043 |
Years | +0.042 |
recommendation | +0.041 |
birthday | +0.040 |
Neg logit contributions | |
ays | -0.028 |
ips | -0.022 |
plets | -0.021 |
izz | -0.021 |
involved | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
Mic | +0.166 |
lder | +0.166 |
urious | +0.158 |
Days | +0.153 |
tutor | +0.150 |
Neg logit contributions | |
it | -0.091 |
ays | -0.090 |
patches | -0.083 |
matters | -0.083 |
on | -0.082 |
Token | They |
Token ID | 1119 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
isy | +0.019 |
lder | +0.019 |
friend | +0.018 |
tune | +0.018 |
tutor | +0.018 |
Neg logit contributions | |
ays | -0.019 |
ips | -0.015 |
unks | -0.013 |
ions | -0.013 |
chairs | -0.013 |
Token | worked |
Token ID | 3111 |
Feature activation | -3.40e-03 |
Pos logit contributions | |
tune | +0.038 |
tutor | +0.037 |
lder | +0.037 |
song | +0.036 |
recommendation | +0.036 |
Neg logit contributions | |
ays | -0.040 |
rob | -0.035 |
ips | -0.033 |
izz | -0.033 |
chairs | -0.032 |
Token | in |
Token ID | 287 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
lder | +0.006 |
tutor | +0.006 |
friend | +0.006 |
hospitality | +0.006 |
forgive | +0.006 |
Neg logit contributions | |
ays | -0.006 |
ips | -0.005 |
rob | -0.005 |
unks | -0.005 |
ions | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
lder | +0.042 |
So | +0.040 |
tutor | +0.039 |
kindly | +0.039 |
friend | +0.039 |
Neg logit contributions | |
ays | -0.035 |
ips | -0.029 |
rob | -0.027 |
ions | -0.027 |
unks | -0.027 |
Token | , |
Token ID | 11 |
Feature activation | +4.29e-02 |
Pos logit contributions | |
ays | +0.053 |
ocol | +0.049 |
plets | +0.049 |
rob | +0.047 |
unks | +0.046 |
Neg logit contributions | |
friend | -0.026 |
little | -0.023 |
So | -0.023 |
keeper | -0.022 |
lder | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
ays | +0.110 |
rob | +0.098 |
unks | +0.098 |
ips | +0.095 |
opl | +0.092 |
Neg logit contributions | |
friend | -0.052 |
little | -0.050 |
kindly | -0.050 |
tutor | -0.049 |
forgive | -0.047 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
ays | +0.031 |
ips | +0.025 |
rob | +0.024 |
unks | +0.024 |
ions | +0.024 |
Neg logit contributions | |
lder | -0.026 |
So | -0.025 |
forgive | -0.024 |
tutor | -0.024 |
kindly | -0.024 |
Token | found |
Token ID | 1043 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
ays | +0.041 |
rob | +0.037 |
ips | +0.036 |
ocol | +0.035 |
plets | +0.035 |
Neg logit contributions | |
friend | -0.020 |
lder | -0.019 |
kindly | -0.019 |
So | -0.018 |
forgive | -0.017 |
Token | some |
Token ID | 617 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
ays | +0.081 |
rob | +0.074 |
ips | +0.073 |
unks | +0.073 |
plets | +0.071 |
Neg logit contributions | |
friend | -0.036 |
little | -0.034 |
kindly | -0.034 |
forgive | -0.031 |
understanding | -0.030 |
Token | che |
Token ID | 1125 |
Feature activation | +7.19e-02 |
Pos logit contributions | |
ays | +0.028 |
ips | +0.025 |
rob | +0.024 |
unks | +0.024 |
plets | +0.023 |
Neg logit contributions | |
friend | -0.016 |
kindly | -0.015 |
little | -0.015 |
So | -0.015 |
tutor | -0.015 |
Token | wy |
Token ID | 21768 |
Feature activation | +6.09e-03 |
Pos logit contributions | |
ays | +0.146 |
chairs | +0.125 |
plets | +0.120 |
rob | +0.117 |
unks | +0.116 |
Neg logit contributions | |
lder | -0.103 |
friend | -0.101 |
isy | -0.101 |
nd | -0.100 |
Days | -0.096 |
Token | things |
Token ID | 1243 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
ays | +0.013 |
ips | +0.011 |
rob | +0.011 |
unks | +0.011 |
ions | +0.011 |
Neg logit contributions | |
friend | -0.009 |
lder | -0.009 |
So | -0.009 |
kindly | -0.008 |
tutor | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
ays | +0.067 |
rob | +0.061 |
unks | +0.059 |
ips | +0.059 |
ocol | +0.057 |
Neg logit contributions | |
kindly | -0.024 |
forgive | -0.022 |
friend | -0.022 |
keeper | -0.021 |
tutor | -0.021 |
Token | She |
Token ID | 1375 |
Feature activation | +3.42e-03 |
Pos logit contributions | |
ays | +0.041 |
rob | +0.037 |
ips | +0.035 |
unks | +0.035 |
ocol | +0.035 |
Neg logit contributions | |
So | -0.018 |
lder | -0.018 |
friend | -0.018 |
tutor | -0.018 |
kindly | -0.018 |
Token | was |
Token ID | 373 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ays | +0.008 |
ips | +0.007 |
rob | +0.007 |
unks | +0.007 |
ions | +0.006 |
Neg logit contributions | |
lder | -0.005 |
friend | -0.004 |
kindly | -0.004 |
So | -0.004 |
tutor | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ays | +0.028 |
ips | +0.024 |
rob | +0.024 |
unks | +0.024 |
ions | +0.023 |
Neg logit contributions | |
lder | -0.013 |
friend | -0.013 |
So | -0.013 |
tutor | -0.013 |
kindly | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
lder | +0.016 |
tutor | +0.016 |
friend | +0.016 |
kindly | +0.016 |
hospitality | +0.016 |
Neg logit contributions | |
ays | -0.027 |
unks | -0.023 |
ips | -0.023 |
rob | -0.023 |
ions | -0.022 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
hospitality | +0.025 |
tutor | +0.025 |
friend | +0.024 |
kindly | +0.023 |
lder | +0.023 |
Neg logit contributions | |
ays | -0.042 |
ions | -0.039 |
izz | -0.037 |
unks | -0.037 |
spins | -0.037 |
Token | , |
Token ID | 11 |
Feature activation | +2.65e-02 |
Pos logit contributions | |
ays | +0.112 |
rob | +0.103 |
unks | +0.099 |
ips | +0.098 |
ocol | +0.095 |
Neg logit contributions | |
friend | -0.035 |
kindly | -0.033 |
little | -0.029 |
understanding | -0.029 |
tutor | -0.029 |
Token | the |
Token ID | 262 |
Feature activation | +2.01e-03 |
Pos logit contributions | |
ays | +0.057 |
rob | +0.049 |
ips | +0.048 |
unks | +0.048 |
ocol | +0.046 |
Neg logit contributions | |
friend | -0.041 |
kindly | -0.040 |
tutor | -0.040 |
lder | -0.039 |
So | -0.039 |
Token | k |
Token ID | 479 |
Feature activation | +7.21e-02 |
Pos logit contributions | |
ays | +0.004 |
ips | +0.003 |
rob | +0.003 |
unks | +0.003 |
ions | +0.003 |
Neg logit contributions | |
lder | -0.003 |
friend | -0.003 |
kindly | -0.003 |
So | -0.003 |
tutor | -0.003 |
Token | ite |
Token ID | 578 |
Feature activation | +3.22e-02 |
Pos logit contributions | |
ays | +0.107 |
rob | +0.087 |
unks | +0.084 |
ocol | +0.083 |
ips | +0.080 |
Neg logit contributions | |
friend | -0.152 |
So | -0.147 |
kindly | -0.144 |
lder | -0.144 |
tutor | -0.143 |
Token | got |
Token ID | 1392 |
Feature activation | +3.42e-02 |
Pos logit contributions | |
ays | +0.060 |
ips | +0.049 |
rob | +0.049 |
unks | +0.048 |
ions | +0.046 |
Neg logit contributions | |
lder | -0.056 |
friend | -0.056 |
kindly | -0.055 |
So | -0.055 |
tutor | -0.055 |
Token | stuck |
Token ID | 7819 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ays | +0.069 |
rob | +0.064 |
ips | +0.058 |
unks | +0.057 |
ocol | +0.056 |
Neg logit contributions | |
kindly | -0.058 |
friend | -0.057 |
So | -0.055 |
understanding | -0.054 |
forgive | -0.053 |
Token | in |
Token ID | 287 |
Feature activation | -9.51e-03 |
Pos logit contributions | |
ays | +0.026 |
rob | +0.022 |
ips | +0.022 |
unks | +0.022 |
ocol | +0.021 |
Neg logit contributions | |
friend | -0.015 |
lder | -0.015 |
kindly | -0.015 |
So | -0.015 |
tutor | -0.015 |
Token | a |
Token ID | 257 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
lder | +0.017 |
tutor | +0.017 |
friend | +0.017 |
kindly | +0.017 |
So | +0.017 |
Neg logit contributions | |
ays | -0.017 |
ips | -0.014 |
ions | -0.014 |
unks | -0.014 |
rob | -0.013 |
Token | she |
Token ID | 673 |
Feature activation | -2.46e-03 |
Pos logit contributions | |
friend | +0.008 |
kindly | +0.008 |
who | +0.008 |
forgive | +0.008 |
understanding | +0.008 |
Neg logit contributions | |
ays | -0.018 |
rob | -0.016 |
ips | -0.016 |
plets | -0.016 |
unks | -0.016 |
Token | was |
Token ID | 373 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
friend | +0.003 |
lder | +0.003 |
kindly | +0.003 |
So | +0.003 |
forgive | +0.003 |
Neg logit contributions | |
ays | -0.006 |
rob | -0.005 |
ips | -0.005 |
ocol | -0.005 |
ions | -0.005 |
Token | still |
Token ID | 991 |
Feature activation | -4.59e-03 |
Pos logit contributions | |
ays | +0.028 |
rob | +0.024 |
unks | +0.023 |
ips | +0.023 |
plets | +0.023 |
Neg logit contributions | |
friend | -0.012 |
kindly | -0.012 |
understanding | -0.012 |
tutor | -0.012 |
forgive | -0.012 |
Token | wearing |
Token ID | 5762 |
Feature activation | +3.15e-02 |
Pos logit contributions | |
friend | +0.006 |
kindly | +0.006 |
tutor | +0.006 |
understanding | +0.006 |
forgive | +0.006 |
Neg logit contributions | |
ays | -0.011 |
rob | -0.010 |
ips | -0.009 |
unks | -0.009 |
plets | -0.009 |
Token | her |
Token ID | 607 |
Feature activation | +1.46e-02 |
Pos logit contributions | |
ays | +0.078 |
rob | +0.068 |
unks | +0.066 |
ips | +0.065 |
plets | +0.064 |
Neg logit contributions | |
friend | -0.043 |
song | -0.041 |
kindly | -0.041 |
forgive | -0.041 |
tutor | -0.040 |
Token | p |
Token ID | 279 |
Feature activation | +7.24e-02 |
Pos logit contributions | |
ays | +0.033 |
rob | +0.028 |
ips | +0.028 |
unks | +0.027 |
ions | +0.027 |
Neg logit contributions | |
friend | -0.021 |
tutor | -0.020 |
lder | -0.020 |
kindly | -0.020 |
forgive | -0.020 |
Token | aj |
Token ID | 1228 |
Feature activation | +1.45e-03 |
Pos logit contributions | |
ays | +0.153 |
rob | +0.137 |
ions | +0.129 |
plets | +0.128 |
ips | +0.127 |
Neg logit contributions | |
friend | -0.108 |
lder | -0.102 |
kindly | -0.098 |
So | -0.098 |
tutor | -0.098 |
Token | amas |
Token ID | 17485 |
Feature activation | -1.97e-03 |
Pos logit contributions | |
ays | +0.003 |
ips | +0.002 |
unks | +0.002 |
rob | +0.002 |
plets | +0.002 |
Neg logit contributions | |
friend | -0.003 |
lder | -0.003 |
tutor | -0.003 |
forgive | -0.003 |
kindly | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -1.35e-03 |
Pos logit contributions | |
lder | +0.002 |
friend | +0.002 |
So | +0.002 |
tutor | +0.002 |
kindly | +0.002 |
Neg logit contributions | |
ays | -0.005 |
ips | -0.004 |
rob | -0.004 |
unks | -0.004 |
ions | -0.004 |
Token | |
Token ID | 220 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
lder | +0.002 |
friend | +0.002 |
tutor | +0.002 |
So | +0.002 |
forgive | +0.002 |
Neg logit contributions | |
ays | -0.003 |
ips | -0.003 |
unks | -0.003 |
rob | -0.003 |
ions | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
ays | +0.050 |
rob | +0.043 |
ips | +0.043 |
unks | +0.042 |
ocol | +0.042 |
Neg logit contributions | |
So | -0.019 |
friend | -0.018 |
lder | -0.018 |
kindly | -0.018 |
forgive | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | +7.06e-03 |
Pos logit contributions | |
ays | +0.034 |
ips | +0.029 |
rob | +0.028 |
unks | +0.028 |
ions | +0.028 |
Neg logit contributions | |
lder | -0.019 |
So | -0.018 |
tutor | -0.018 |
friend | -0.018 |
kindly | -0.018 |
Token | tragedy |
Token ID | 13574 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ays | +0.013 |
ips | +0.011 |
rob | +0.011 |
ions | +0.011 |
unks | +0.011 |
Neg logit contributions | |
lder | -0.012 |
So | -0.012 |
tutor | -0.011 |
friend | -0.011 |
kindly | -0.011 |
Token | struck |
Token ID | 7425 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
ays | +0.027 |
ips | +0.022 |
unks | +0.022 |
rob | +0.022 |
ocol | +0.021 |
Neg logit contributions | |
kindly | -0.019 |
lder | -0.019 |
friend | -0.019 |
So | -0.019 |
tutor | -0.019 |
Token | ! |
Token ID | 0 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
ays | +0.036 |
rob | +0.031 |
ips | +0.030 |
unks | +0.030 |
plets | +0.029 |
Neg logit contributions | |
friend | -0.024 |
kindly | -0.023 |
lder | -0.023 |
So | -0.023 |
tutor | -0.023 |
Token | The |
Token ID | 383 |
Feature activation | -7.17e-03 |
Pos logit contributions | |
ays | +0.031 |
ips | +0.026 |
unks | +0.025 |
ions | +0.025 |
rob | +0.025 |
Neg logit contributions | |
friend | -0.025 |
lder | -0.025 |
So | -0.025 |
forgive | -0.024 |
kindly | -0.024 |
Token | ribbon |
Token ID | 29092 |
Feature activation | +7.19e-02 |
Pos logit contributions | |
lder | +0.007 |
So | +0.006 |
hospitality | +0.006 |
kindly | +0.005 |
agree | +0.005 |
Neg logit contributions | |
ays | -0.018 |
spins | -0.016 |
ips | -0.016 |
ocol | -0.016 |
chairs | -0.016 |
Token | broke |
Token ID | 6265 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
ays | +0.149 |
rob | +0.140 |
ocol | +0.135 |
unks | +0.131 |
ips | +0.127 |
Neg logit contributions | |
friend | -0.107 |
kindly | -0.105 |
So | -0.102 |
song | -0.100 |
keeper | -0.099 |
Token | , |
Token ID | 11 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
ays | +0.057 |
rob | +0.053 |
unks | +0.049 |
ips | +0.049 |
ocol | +0.048 |
Neg logit contributions | |
friend | -0.032 |
kindly | -0.032 |
So | -0.029 |
little | -0.029 |
keeper | -0.029 |
Token | and |
Token ID | 290 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
ays | +0.002 |
rob | +0.001 |
ips | +0.001 |
unks | +0.001 |
ocol | +0.001 |
Neg logit contributions | |
kindly | -0.001 |
friend | -0.001 |
lder | -0.001 |
So | -0.001 |
understanding | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -9.08e-03 |
Pos logit contributions | |
ays | +0.071 |
rob | +0.063 |
unks | +0.063 |
ips | +0.061 |
ocol | +0.057 |
Neg logit contributions | |
kindly | -0.045 |
friend | -0.045 |
little | -0.045 |
understanding | -0.043 |
song | -0.043 |
Token | pink |
Token ID | 11398 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
lder | +0.008 |
So | +0.007 |
hospitality | +0.006 |
kindly | +0.006 |
forgive | +0.006 |
Neg logit contributions | |
ays | -0.024 |
ips | -0.021 |
spins | -0.021 |
ocol | -0.021 |
chairs | -0.021 |
Token | I |
Token ID | 40 |
Feature activation | +3.16e-02 |
Pos logit contributions | |
So | +0.005 |
friend | +0.005 |
lder | +0.005 |
forgive | +0.004 |
kindly | +0.004 |
Neg logit contributions | |
ays | -0.010 |
ips | -0.008 |
unks | -0.008 |
rob | -0.008 |
ocol | -0.008 |
Token | told |
Token ID | 1297 |
Feature activation | +5.03e-03 |
Pos logit contributions | |
ays | +0.071 |
ips | +0.059 |
unks | +0.059 |
rob | +0.059 |
ions | +0.057 |
Neg logit contributions | |
forgive | -0.050 |
friend | -0.048 |
So | -0.048 |
kindly | -0.047 |
lder | -0.046 |
Token | you |
Token ID | 345 |
Feature activation | -6.06e-03 |
Pos logit contributions | |
ays | +0.012 |
ips | +0.010 |
rob | +0.010 |
unks | +0.010 |
plets | +0.009 |
Neg logit contributions | |
friend | -0.007 |
So | -0.007 |
kindly | -0.007 |
lder | -0.007 |
forgive | -0.007 |
Token | not |
Token ID | 407 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
friend | +0.008 |
lder | +0.008 |
kindly | +0.008 |
So | +0.008 |
tutor | +0.008 |
Neg logit contributions | |
ays | -0.014 |
rob | -0.012 |
ips | -0.012 |
unks | -0.012 |
plets | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
lder | +0.018 |
friend | +0.018 |
So | +0.018 |
tutor | +0.018 |
kindly | +0.018 |
Neg logit contributions | |
ays | -0.054 |
ips | -0.047 |
rob | -0.047 |
unks | -0.047 |
ions | -0.046 |
Token | pick |
Token ID | 2298 |
Feature activation | +7.22e-02 |
Pos logit contributions | |
tutor | +0.031 |
lder | +0.030 |
Days | +0.029 |
kindly | +0.029 |
So | +0.028 |
Neg logit contributions | |
ays | -0.052 |
ips | -0.046 |
unks | -0.046 |
matters | -0.046 |
rob | -0.045 |
Token | my |
Token ID | 616 |
Feature activation | +4.53e-03 |
Pos logit contributions | |
plets | +0.162 |
ays | +0.161 |
unks | +0.158 |
ips | +0.153 |
izz | +0.150 |
Neg logit contributions | |
little | -0.092 |
friend | -0.088 |
kindly | -0.080 |
puppy | -0.075 |
stranger | -0.073 |
Token | flowers |
Token ID | 12734 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
ays | +0.010 |
ips | +0.009 |
rob | +0.009 |
plets | +0.009 |
unks | +0.009 |
Neg logit contributions | |
friend | -0.006 |
tutor | -0.006 |
lder | -0.006 |
kindly | -0.006 |
forgive | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
ays | +0.073 |
rob | +0.064 |
ips | +0.064 |
unks | +0.063 |
plets | +0.062 |
Neg logit contributions | |
friend | -0.031 |
kindly | -0.030 |
So | -0.030 |
lder | -0.030 |
tutor | -0.030 |
Token | Now |
Token ID | 2735 |
Feature activation | +8.26e-03 |
Pos logit contributions | |
ays | +0.061 |
rob | +0.053 |
ips | +0.052 |
unks | +0.051 |
ocol | +0.049 |
Neg logit contributions | |
So | -0.041 |
kindly | -0.040 |
forgive | -0.039 |
friend | -0.039 |
tutor | -0.038 |
Token | I |
Token ID | 314 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
ays | +0.019 |
rob | +0.016 |
ips | +0.016 |
unks | +0.016 |
plets | +0.016 |
Neg logit contributions | |
friend | -0.011 |
kindly | -0.011 |
So | -0.011 |
lder | -0.011 |
tutor | -0.011 |
Token | 't |
Token ID | 470 |
Feature activation | -4.16e-02 |
Pos logit contributions | |
So | +0.044 |
tutor | +0.043 |
lder | +0.043 |
kindly | +0.042 |
friend | +0.041 |
Neg logit contributions | |
ays | -0.080 |
rob | -0.070 |
ocol | -0.068 |
ips | -0.068 |
unks | -0.066 |
Token | want |
Token ID | 765 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
lder | +0.067 |
tutor | +0.064 |
So | +0.063 |
keeper | +0.063 |
kindly | +0.062 |
Neg logit contributions | |
ays | -0.079 |
ips | -0.068 |
izz | -0.066 |
matters | -0.065 |
rob | -0.064 |
Token | to |
Token ID | 284 |
Feature activation | -4.94e-02 |
Pos logit contributions | |
friend | +0.014 |
forgive | +0.012 |
tutor | +0.012 |
So | +0.011 |
kindly | +0.011 |
Neg logit contributions | |
ays | -0.085 |
rob | -0.076 |
plets | -0.076 |
ips | -0.076 |
unks | -0.074 |
Token | clean |
Token ID | 3424 |
Feature activation | +6.94e-03 |
Pos logit contributions | |
lder | +0.067 |
tutor | +0.065 |
kindly | +0.062 |
keeper | +0.062 |
friend | +0.061 |
Neg logit contributions | |
ays | -0.105 |
ips | -0.093 |
izz | -0.092 |
unks | -0.090 |
ions | -0.090 |
Token | up |
Token ID | 510 |
Feature activation | -9.65e-03 |
Pos logit contributions | |
ays | +0.017 |
plets | +0.016 |
ips | +0.015 |
unks | +0.015 |
ocol | +0.015 |
Neg logit contributions | |
kindly | -0.008 |
friend | -0.008 |
little | -0.008 |
tutor | -0.007 |
mistake | -0.007 |
Token | because |
Token ID | 780 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
kindly | +0.011 |
friend | +0.011 |
tutor | +0.010 |
understanding | +0.010 |
forgive | +0.010 |
Neg logit contributions | |
ays | -0.025 |
rob | -0.022 |
ips | -0.021 |
unks | -0.021 |
plets | -0.021 |
Token | he |
Token ID | 339 |
Feature activation | -4.70e-03 |
Pos logit contributions | |
ays | +0.055 |
rob | +0.051 |
plets | +0.050 |
ips | +0.049 |
unks | +0.047 |
Neg logit contributions | |
friend | -0.025 |
little | -0.023 |
tutor | -0.022 |
understanding | -0.022 |
kindly | -0.021 |
Token | loved |
Token ID | 6151 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
lder | +0.006 |
friend | +0.005 |
tutor | +0.005 |
So | +0.005 |
kindly | +0.005 |
Neg logit contributions | |
ays | -0.011 |
ips | -0.010 |
rob | -0.010 |
unks | -0.010 |
ions | -0.009 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
friend | +0.031 |
tutor | +0.030 |
understanding | +0.030 |
kindly | +0.029 |
song | +0.029 |
Neg logit contributions | |
ays | -0.066 |
plets | -0.057 |
rob | -0.056 |
ips | -0.056 |
unks | -0.055 |
Token | in |
Token ID | 287 |
Feature activation | +1.53e-03 |
Pos logit contributions | |
friend | +0.018 |
kindly | +0.018 |
tutor | +0.018 |
forgive | +0.018 |
So | +0.018 |
Neg logit contributions | |
ays | -0.041 |
unks | -0.035 |
ips | -0.035 |
rob | -0.035 |
plets | -0.034 |
Token | the |
Token ID | 262 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
ays | +0.004 |
plets | +0.003 |
rob | +0.003 |
unks | +0.003 |
ips | +0.003 |
Neg logit contributions | |
little | -0.002 |
friend | -0.002 |
tutor | -0.002 |
understanding | -0.002 |
forgive | -0.002 |
Token | happy |
Token ID | 3772 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
ays | +0.067 |
rob | +0.058 |
ips | +0.057 |
unks | +0.057 |
ocol | +0.054 |
Neg logit contributions | |
friend | -0.039 |
understanding | -0.039 |
kindly | -0.038 |
song | -0.038 |
little | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
lder | +0.036 |
So | +0.034 |
tutor | +0.034 |
kindly | +0.033 |
forgive | +0.033 |
Neg logit contributions | |
ays | -0.073 |
ips | -0.063 |
rob | -0.061 |
unks | -0.061 |
ions | -0.061 |
Token |
|
Token ID | 198 |
Feature activation | -4.88e-03 |
Pos logit contributions | |
ays | +0.052 |
rob | +0.047 |
ips | +0.045 |
unks | +0.045 |
ocol | +0.045 |
Neg logit contributions | |
So | -0.021 |
friend | -0.020 |
kindly | -0.020 |
tutor | -0.020 |
lder | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
lder | +0.006 |
tutor | +0.006 |
friend | +0.006 |
kindly | +0.006 |
song | +0.006 |
Neg logit contributions | |
ays | -0.012 |
ips | -0.010 |
unks | -0.010 |
rob | -0.010 |
ions | -0.010 |
Token | The |
Token ID | 464 |
Feature activation | -5.46e-03 |
Pos logit contributions | |
friend | +0.013 |
lder | +0.013 |
tutor | +0.013 |
hospitality | +0.013 |
birthday | +0.012 |
Neg logit contributions | |
ays | -0.026 |
izz | -0.023 |
ips | -0.023 |
ions | -0.023 |
plets | -0.023 |
Token | little |
Token ID | 1310 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
lder | +0.006 |
So | +0.005 |
ously | +0.005 |
hospitality | +0.005 |
cess | +0.004 |
Neg logit contributions | |
ays | -0.012 |
spins | -0.011 |
ips | -0.011 |
izz | -0.011 |
ocol | -0.011 |
Token | girl |
Token ID | 2576 |
Feature activation | -2.37e-03 |
Pos logit contributions | |
ays | +0.049 |
ips | +0.043 |
ions | +0.041 |
rob | +0.041 |
spins | +0.041 |
Neg logit contributions | |
lder | -0.025 |
So | -0.023 |
Days | -0.023 |
Years | -0.022 |
hospitality | -0.021 |
Token | was |
Token ID | 373 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
lder | +0.003 |
tutor | +0.003 |
So | +0.003 |
friend | +0.003 |
kindly | +0.003 |
Neg logit contributions | |
ays | -0.005 |
ips | -0.004 |
unks | -0.004 |
rob | -0.004 |
ions | -0.004 |
Token | very |
Token ID | 845 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
ays | +0.047 |
rob | +0.042 |
unks | +0.040 |
ocol | +0.039 |
ips | +0.039 |
Neg logit contributions | |
friend | -0.021 |
understanding | -0.020 |
kindly | -0.020 |
forgive | -0.019 |
tutor | -0.018 |
Token | pleased |
Token ID | 10607 |
Feature activation | -5.20e-02 |
Pos logit contributions | |
ays | +0.054 |
rob | +0.048 |
ips | +0.047 |
unks | +0.047 |
ions | +0.046 |
Neg logit contributions | |
friend | -0.019 |
kindly | -0.019 |
lder | -0.019 |
understanding | -0.018 |
forgive | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
lder | +0.084 |
Days | +0.076 |
So | +0.074 |
tutor | +0.073 |
hospitality | +0.073 |
Neg logit contributions | |
ays | -0.107 |
ions | -0.090 |
ips | -0.090 |
unks | -0.085 |
chairs | -0.081 |
Token | , |
Token ID | 11 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
lder | +0.015 |
friend | +0.015 |
kindly | +0.015 |
So | +0.015 |
tutor | +0.015 |
Neg logit contributions | |
ays | -0.044 |
ips | -0.038 |
rob | -0.038 |
unks | -0.038 |
ions | -0.037 |
Token | and |
Token ID | 290 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
kindly | +0.025 |
friend | +0.025 |
So | +0.025 |
understanding | +0.024 |
lder | +0.024 |
Neg logit contributions | |
ays | -0.073 |
rob | -0.063 |
ips | -0.063 |
unks | -0.063 |
ions | -0.061 |
Token | she |
Token ID | 673 |
Feature activation | +7.75e-04 |
Pos logit contributions | |
ays | +0.046 |
unks | +0.041 |
ips | +0.040 |
rob | +0.039 |
ocol | +0.038 |
Neg logit contributions | |
kindly | -0.021 |
friend | -0.021 |
understanding | -0.021 |
So | -0.020 |
forgive | -0.020 |
Token | felt |
Token ID | 2936 |
Feature activation | +2.90e-02 |
Pos logit contributions | |
ays | +0.002 |
ips | +0.002 |
rob | +0.002 |
unks | +0.002 |
ocol | +0.002 |
Neg logit contributions | |
friend | -0.001 |
kindly | -0.001 |
So | -0.001 |
lder | -0.001 |
forgive | -0.001 |
Token | brave |
Token ID | 14802 |
Feature activation | -3.14e-02 |
Pos logit contributions | |
ays | +0.077 |
rob | +0.070 |
unks | +0.068 |
ips | +0.066 |
plets | +0.064 |
Neg logit contributions | |
kindly | -0.036 |
forgive | -0.036 |
understanding | -0.035 |
So | -0.033 |
friend | -0.032 |
Token | and |
Token ID | 290 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
lder | +0.040 |
So | +0.038 |
friend | +0.037 |
tutor | +0.037 |
kindly | +0.036 |
Neg logit contributions | |
ays | -0.074 |
ips | -0.064 |
rob | -0.062 |
ions | -0.060 |
unks | -0.060 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.40e-02 |
Pos logit contributions | |
ays | +0.073 |
unks | +0.064 |
rob | +0.063 |
ips | +0.063 |
ions | +0.061 |
Neg logit contributions | |
kindly | -0.024 |
understanding | -0.024 |
friend | -0.023 |
forgive | -0.023 |
song | -0.022 |
Token | again |
Token ID | 757 |
Feature activation | -2.96e-02 |
Pos logit contributions | |
lder | +0.060 |
So | +0.057 |
Days | +0.054 |
tutor | +0.053 |
kindly | +0.053 |
Neg logit contributions | |
ays | -0.100 |
ips | -0.086 |
ions | -0.083 |
rob | -0.080 |
unks | -0.080 |
Token | . |
Token ID | 13 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
lder | +0.032 |
tutor | +0.030 |
friend | +0.030 |
So | +0.030 |
kindly | +0.029 |
Neg logit contributions | |
ays | -0.075 |
ips | -0.065 |
unks | -0.064 |
rob | -0.064 |
ions | -0.063 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +3.26e-02 |
Pos logit contributions | |
ays | +0.056 |
rob | +0.050 |
unks | +0.048 |
ips | +0.048 |
ocol | +0.046 |
Neg logit contributions | |
So | -0.028 |
lder | -0.027 |
kindly | -0.027 |
friend | -0.027 |
forgive | -0.027 |
Token | Jack |
Token ID | 14295 |
Feature activation | -2.24e-02 |
Pos logit contributions | |
ays | +0.067 |
ocol | +0.061 |
plets | +0.057 |
unks | +0.055 |
ips | +0.054 |
Neg logit contributions | |
So | -0.048 |
friend | -0.047 |
forgive | -0.044 |
lder | -0.044 |
little | -0.043 |
Token | it |
Token ID | 340 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
friend | +0.002 |
kindly | +0.002 |
tutor | +0.002 |
lder | +0.002 |
forgive | +0.002 |
Neg logit contributions | |
ays | -0.003 |
rob | -0.003 |
ips | -0.003 |
unks | -0.003 |
plets | -0.002 |
Token | grow |
Token ID | 1663 |
Feature activation | +4.05e-02 |
Pos logit contributions | |
friend | +0.017 |
kindly | +0.016 |
lder | +0.016 |
So | +0.016 |
tutor | +0.016 |
Neg logit contributions | |
ays | -0.029 |
rob | -0.025 |
ips | -0.024 |
unks | -0.024 |
plets | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
ays | +0.109 |
rob | +0.104 |
ips | +0.099 |
unks | +0.097 |
chairs | +0.096 |
Neg logit contributions | |
kindly | -0.040 |
friend | -0.035 |
little | -0.034 |
So | -0.034 |
politely | -0.032 |
Token | They |
Token ID | 1119 |
Feature activation | -5.57e-03 |
Pos logit contributions | |
ays | +0.033 |
rob | +0.029 |
ips | +0.028 |
unks | +0.028 |
ocol | +0.027 |
Neg logit contributions | |
So | -0.019 |
kindly | -0.018 |
friend | -0.018 |
tutor | -0.018 |
lder | -0.018 |
Token | were |
Token ID | 547 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
lder | +0.008 |
friend | +0.008 |
So | +0.008 |
kindly | +0.008 |
tutor | +0.008 |
Neg logit contributions | |
ays | -0.012 |
ips | -0.010 |
rob | -0.010 |
unks | -0.010 |
ions | -0.010 |
Token | very |
Token ID | 845 |
Feature activation | +2.98e-02 |
Pos logit contributions | |
ays | +0.042 |
rob | +0.038 |
plets | +0.036 |
ips | +0.036 |
unks | +0.035 |
Neg logit contributions | |
friend | -0.021 |
kindly | -0.020 |
understanding | -0.020 |
tutor | -0.019 |
lder | -0.019 |
Token | excited |
Token ID | 6568 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
ays | +0.085 |
rob | +0.077 |
ips | +0.073 |
unks | +0.072 |
ions | +0.071 |
Neg logit contributions | |
kindly | -0.028 |
friend | -0.027 |
lder | -0.026 |
understanding | -0.026 |
So | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
lder | +0.063 |
Days | +0.061 |
forgive | +0.060 |
So | +0.060 |
tutor | +0.058 |
Neg logit contributions | |
ays | -0.103 |
ions | -0.085 |
ips | -0.084 |
unks | -0.083 |
chairs | -0.082 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.02e-02 |
Pos logit contributions | |
ays | +0.047 |
rob | +0.041 |
ips | +0.040 |
unks | +0.039 |
ions | +0.038 |
Neg logit contributions | |
kindly | -0.022 |
lder | -0.022 |
friend | -0.022 |
understanding | -0.021 |
forgive | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
lder | +0.055 |
So | +0.054 |
Days | +0.054 |
forgive | +0.050 |
tutor | +0.050 |
Neg logit contributions | |
ays | -0.090 |
ions | -0.076 |
ips | -0.076 |
unks | -0.074 |
rob | -0.072 |
Token |
|
Token ID | 198 |
Feature activation | -5.50e-03 |
Pos logit contributions | |
ays | +0.028 |
rob | +0.025 |
ips | +0.025 |
ocol | +0.024 |
unks | +0.024 |
Neg logit contributions | |
So | -0.012 |
friend | -0.012 |
kindly | -0.011 |
tutor | -0.011 |
forgive | -0.011 |
Token | Let |
Token ID | 3914 |
Feature activation | -2.95e-03 |
Pos logit contributions | |
ays | +0.072 |
rob | +0.065 |
ips | +0.062 |
unks | +0.061 |
plets | +0.059 |
Neg logit contributions | |
lder | -0.050 |
who | -0.047 |
forgive | -0.047 |
tutor | -0.046 |
lawyer | -0.046 |
Token | go |
Token ID | 467 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
friend | +0.004 |
lder | +0.003 |
So | +0.003 |
tutor | +0.003 |
kindly | +0.003 |
Neg logit contributions | |
ays | -0.007 |
ips | -0.006 |
rob | -0.006 |
unks | -0.006 |
ocol | -0.006 |
Token | of |
Token ID | 286 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
friend | +0.024 |
lder | +0.024 |
So | +0.024 |
kindly | +0.024 |
tutor | +0.024 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.042 |
rob | -0.042 |
unks | -0.042 |
plets | -0.041 |
Token | my |
Token ID | 616 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
ays | +0.029 |
rob | +0.024 |
plets | +0.024 |
ips | +0.024 |
unks | +0.023 |
Neg logit contributions | |
friend | -0.022 |
forgive | -0.021 |
tutor | -0.021 |
kindly | -0.021 |
understanding | -0.021 |
Token | dress |
Token ID | 6576 |
Feature activation | +4.27e-03 |
Pos logit contributions | |
friend | +0.024 |
tutor | +0.023 |
lder | +0.022 |
kindly | +0.022 |
So | +0.022 |
Neg logit contributions | |
ays | -0.042 |
rob | -0.036 |
ips | -0.036 |
unks | -0.035 |
ions | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | +2.34e-02 |
Pos logit contributions | |
ays | +0.011 |
rob | +0.010 |
ips | +0.010 |
unks | +0.010 |
ocol | +0.010 |
Neg logit contributions | |
friend | -0.004 |
lder | -0.004 |
kindly | -0.004 |
tutor | -0.004 |
So | -0.004 |
Token | That |
Token ID | 1320 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
ays | +0.047 |
rob | +0.043 |
unks | +0.041 |
ips | +0.040 |
plets | +0.038 |
Neg logit contributions | |
forgive | -0.038 |
kindly | -0.037 |
tutor | -0.036 |
So | -0.035 |
friend | -0.035 |
Token | 's |
Token ID | 338 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
ays | +0.056 |
ocol | +0.055 |
ips | +0.051 |
unks | +0.051 |
plets | +0.050 |
Neg logit contributions | |
friend | -0.039 |
song | -0.035 |
So | -0.034 |
little | -0.033 |
tutor | -0.032 |
Token | not |
Token ID | 407 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
ays | +0.042 |
rob | +0.037 |
plets | +0.036 |
ips | +0.036 |
unks | +0.036 |
Neg logit contributions | |
friend | -0.019 |
kindly | -0.018 |
forgive | -0.017 |
tutor | -0.017 |
understanding | -0.017 |
Token | yours |
Token ID | 12431 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
ays | +0.028 |
ips | +0.024 |
rob | +0.023 |
ions | +0.023 |
unks | +0.023 |
Neg logit contributions | |
lder | -0.019 |
So | -0.019 |
tutor | -0.018 |
kindly | -0.018 |
forgive | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
lder | +0.019 |
friend | +0.018 |
So | +0.018 |
tutor | +0.018 |
kindly | +0.018 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.037 |
rob | -0.037 |
unks | -0.037 |
ions | -0.036 |
Token | to |
Token ID | 284 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
lder | +0.080 |
tutor | +0.073 |
Days | +0.073 |
So | +0.069 |
doorstep | +0.068 |
Neg logit contributions | |
ays | -0.126 |
spins | -0.104 |
ips | -0.104 |
lands | -0.103 |
happens | -0.100 |
Token | the |
Token ID | 262 |
Feature activation | -3.01e-02 |
Pos logit contributions | |
friend | +0.040 |
lder | +0.040 |
tutor | +0.040 |
kindly | +0.040 |
forgive | +0.039 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.035 |
rob | -0.035 |
unks | -0.034 |
plets | -0.033 |
Token | dolphin |
Token ID | 44136 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
So | +0.037 |
lder | +0.037 |
Days | +0.034 |
kindly | +0.034 |
Years | +0.032 |
Neg logit contributions | |
ays | -0.067 |
rob | -0.058 |
ips | -0.058 |
unks | -0.057 |
ocol | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | -9.30e-04 |
Pos logit contributions | |
lder | +0.043 |
Days | +0.041 |
Years | +0.039 |
Mic | +0.038 |
tutor | +0.038 |
Neg logit contributions | |
ays | -0.052 |
ips | -0.043 |
ions | -0.040 |
lands | -0.039 |
spins | -0.038 |
Token | The |
Token ID | 383 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
lder | +0.001 |
friend | +0.001 |
tutor | +0.001 |
So | +0.001 |
kindly | +0.001 |
Neg logit contributions | |
ays | -0.002 |
ips | -0.002 |
unks | -0.002 |
rob | -0.002 |
ions | -0.002 |
Token | dolphin |
Token ID | 44136 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
lder | +0.027 |
So | +0.026 |
friend | +0.026 |
kindly | +0.026 |
tutor | +0.026 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.036 |
rob | -0.036 |
unks | -0.036 |
ions | -0.035 |
Token | nodded |
Token ID | 14464 |
Feature activation | -2.82e-02 |
Pos logit contributions | |
ays | +0.020 |
ips | +0.016 |
rob | +0.016 |
lands | +0.016 |
spins | +0.016 |
Neg logit contributions | |
lder | -0.019 |
tutor | -0.019 |
Days | -0.018 |
recommendation | -0.018 |
hospitality | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -5.37e-03 |
Pos logit contributions | |
lder | +0.047 |
tutor | +0.042 |
Days | +0.042 |
doorstep | +0.042 |
resa | +0.039 |
Neg logit contributions | |
ays | -0.059 |
ips | -0.049 |
lands | -0.045 |
spins | -0.044 |
ions | -0.044 |
Token | made |
Token ID | 925 |
Feature activation | +1.21e-03 |
Pos logit contributions | |
lder | +0.008 |
tutor | +0.008 |
So | +0.008 |
friend | +0.007 |
Days | +0.007 |
Neg logit contributions | |
ays | -0.012 |
ips | -0.010 |
rob | -0.010 |
unks | -0.009 |
ions | -0.009 |
Token | a |
Token ID | 257 |
Feature activation | -3.38e-02 |
Pos logit contributions | |
ays | +0.003 |
rob | +0.002 |
unks | +0.002 |
ips | +0.002 |
plets | +0.002 |
Neg logit contributions | |
friend | -0.002 |
kindly | -0.002 |
forgive | -0.002 |
song | -0.002 |
tutor | -0.002 |
Token | funny |
Token ID | 8258 |
Feature activation | -4.51e-02 |
Pos logit contributions | |
lder | +0.055 |
hospitality | +0.047 |
Days | +0.047 |
So | +0.046 |
tutor | +0.046 |
Neg logit contributions | |
ays | -0.063 |
lands | -0.059 |
spins | -0.053 |
patches | -0.051 |
matters | -0.051 |
Token | with |
Token ID | 351 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
lder | +0.024 |
So | +0.023 |
tutor | +0.023 |
friend | +0.023 |
kindly | +0.022 |
Neg logit contributions | |
ays | -0.038 |
ips | -0.033 |
rob | -0.033 |
unks | -0.032 |
ions | -0.032 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
ays | +0.036 |
rob | +0.031 |
plets | +0.031 |
ips | +0.031 |
unks | +0.030 |
Neg logit contributions | |
friend | -0.023 |
forgive | -0.021 |
kindly | -0.021 |
little | -0.021 |
tutor | -0.020 |
Token | string |
Token ID | 4731 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
ays | +0.029 |
ips | +0.024 |
rob | +0.024 |
unks | +0.023 |
ions | +0.023 |
Neg logit contributions | |
lder | -0.021 |
kindly | -0.020 |
So | -0.019 |
tutor | -0.019 |
forgive | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | +7.13e-03 |
Pos logit contributions | |
ays | +0.053 |
ips | +0.046 |
ions | +0.045 |
unks | +0.045 |
rob | +0.044 |
Neg logit contributions | |
lder | -0.029 |
So | -0.026 |
tutor | -0.026 |
forgive | -0.025 |
kindly | -0.025 |
Token | had |
Token ID | 550 |
Feature activation | +2.40e-02 |
Pos logit contributions | |
ays | +0.018 |
unks | +0.014 |
ips | +0.014 |
ocol | +0.014 |
plets | +0.014 |
Neg logit contributions | |
friend | -0.010 |
forgive | -0.010 |
understanding | -0.010 |
kindly | -0.010 |
song | -0.009 |
Token | a |
Token ID | 257 |
Feature activation | -2.90e-02 |
Pos logit contributions | |
ays | +0.047 |
ips | +0.039 |
rob | +0.038 |
unks | +0.038 |
ions | +0.037 |
Neg logit contributions | |
lder | -0.040 |
friend | -0.040 |
So | -0.039 |
kindly | -0.039 |
tutor | -0.039 |
Token | great |
Token ID | 1049 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
lder | +0.063 |
edly | +0.060 |
cess | +0.056 |
keeper | +0.056 |
doorstep | +0.055 |
Neg logit contributions | |
ays | -0.030 |
rob | -0.029 |
spins | -0.028 |
marsh | -0.028 |
matters | -0.028 |
Token | time |
Token ID | 640 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
kindly | +0.041 |
keeper | +0.039 |
lder | +0.039 |
politely | +0.039 |
keeper | +0.039 |
Neg logit contributions | |
ays | -0.019 |
ips | -0.016 |
ained | -0.016 |
rob | -0.016 |
matters | -0.016 |
Token | together |
Token ID | 1978 |
Feature activation | -3.59e-02 |
Pos logit contributions | |
friend | +0.018 |
kindly | +0.018 |
forgive | +0.017 |
So | +0.017 |
lder | +0.017 |
Neg logit contributions | |
ays | -0.034 |
rob | -0.029 |
ips | -0.028 |
unks | -0.028 |
plets | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
lder | +0.049 |
tutor | +0.047 |
So | +0.046 |
kindly | +0.045 |
Days | +0.044 |
Neg logit contributions | |
ays | -0.083 |
ips | -0.072 |
ions | -0.069 |
unks | -0.069 |
rob | -0.066 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
ays | +0.049 |
rob | +0.043 |
ips | +0.043 |
unks | +0.043 |
ocol | +0.042 |
Neg logit contributions | |
friend | -0.019 |
So | -0.019 |
forgive | -0.019 |
kindly | -0.018 |
lder | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
lder | +0.017 |
friend | +0.016 |
kindly | +0.016 |
So | +0.016 |
tutor | +0.015 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.033 |
rob | -0.032 |
ocol | -0.032 |
unks | -0.032 |
Token | M |
Token ID | 337 |
Feature activation | +7.16e-03 |
Pos logit contributions | |
lder | +0.053 |
So | +0.052 |
tutor | +0.052 |
kindly | +0.052 |
friend | +0.052 |
Neg logit contributions | |
ays | -0.068 |
rob | -0.057 |
ips | -0.056 |
unks | -0.055 |
ions | -0.055 |
Token | ummy |
Token ID | 13513 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
ays | +0.015 |
unks | +0.012 |
izz | +0.012 |
ips | +0.012 |
ions | +0.011 |
Neg logit contributions | |
kindly | -0.012 |
tune | -0.012 |
understanding | -0.012 |
song | -0.012 |
respectful | -0.012 |
Token | were |
Token ID | 547 |
Feature activation | +8.38e-03 |
Pos logit contributions | |
So | +0.045 |
lder | +0.045 |
tutor | +0.045 |
Days | +0.045 |
tune | +0.045 |
Neg logit contributions | |
ays | -0.064 |
rob | -0.053 |
ips | -0.052 |
unks | -0.051 |
ions | -0.051 |
Token | in |
Token ID | 287 |
Feature activation | -7.11e-03 |
Pos logit contributions | |
ays | +0.018 |
rob | +0.016 |
plets | +0.015 |
unks | +0.015 |
ips | +0.015 |
Neg logit contributions | |
friend | -0.013 |
tutor | -0.012 |
kindly | -0.012 |
lder | -0.012 |
So | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | +9.11e-03 |
Pos logit contributions | |
lder | +0.013 |
So | +0.012 |
friend | +0.012 |
kindly | +0.012 |
tutor | +0.012 |
Neg logit contributions | |
ays | -0.013 |
ips | -0.011 |
rob | -0.010 |
unks | -0.010 |
ions | -0.010 |
Token | backyard |
Token ID | 24296 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
ays | +0.021 |
ips | +0.018 |
rob | +0.018 |
unks | +0.018 |
ions | +0.018 |
Neg logit contributions | |
friend | -0.012 |
lder | -0.012 |
tutor | -0.011 |
So | -0.011 |
kindly | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
lder | +0.032 |
tutor | +0.032 |
Days | +0.030 |
hospitality | +0.029 |
So | +0.029 |
Neg logit contributions | |
ays | -0.051 |
ips | -0.043 |
unks | -0.043 |
ions | -0.042 |
ained | -0.039 |
Token | Sammy |
Token ID | 44067 |
Feature activation | -9.49e-03 |
Pos logit contributions | |
ays | +0.068 |
rob | +0.065 |
ips | +0.062 |
unks | +0.058 |
ocol | +0.058 |
Neg logit contributions | |
friend | -0.028 |
So | -0.027 |
little | -0.026 |
kindly | -0.026 |
recommendation | -0.025 |
Token | loved |
Token ID | 6151 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
lder | +0.012 |
friend | +0.011 |
kindly | +0.011 |
So | +0.011 |
tutor | +0.011 |
Neg logit contributions | |
ays | -0.023 |
ips | -0.020 |
rob | -0.020 |
unks | -0.019 |
ocol | -0.019 |
Token | being |
Token ID | 852 |
Feature activation | +3.88e-02 |
Pos logit contributions | |
friend | +0.022 |
tutor | +0.021 |
lder | +0.021 |
kindly | +0.020 |
song | +0.020 |
Neg logit contributions | |
ays | -0.067 |
ips | -0.058 |
rob | -0.058 |
plets | -0.057 |
unks | -0.057 |
Token | good |
Token ID | 922 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
So | +0.040 |
lder | +0.039 |
tune | +0.036 |
As | +0.035 |
broken | +0.035 |
Neg logit contributions | |
ays | -0.060 |
ips | -0.054 |
spins | -0.051 |
unks | -0.050 |
lands | -0.049 |
Token | by |
Token ID | 1525 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
lder | +0.025 |
So | +0.024 |
Days | +0.022 |
kindly | +0.022 |
forgive | +0.021 |
Neg logit contributions | |
ays | -0.062 |
ips | -0.054 |
unks | -0.052 |
ocol | -0.051 |
ions | -0.051 |
Token | es |
Token ID | 274 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
lder | +0.051 |
So | +0.050 |
tutor | +0.050 |
forgive | +0.049 |
tune | +0.049 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.030 |
ions | -0.028 |
unks | -0.028 |
rob | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | +6.24e-03 |
Pos logit contributions | |
lder | +0.031 |
tutor | +0.028 |
Days | +0.027 |
So | +0.027 |
friend | +0.026 |
Neg logit contributions | |
ays | -0.045 |
ions | -0.039 |
ips | -0.039 |
rob | -0.037 |
chairs | -0.036 |
Token | She |
Token ID | 1375 |
Feature activation | -1.55e-03 |
Pos logit contributions | |
ays | +0.012 |
ips | +0.010 |
ions | +0.010 |
unks | +0.009 |
chairs | +0.009 |
Neg logit contributions | |
tune | -0.010 |
forgive | -0.010 |
friend | -0.010 |
song | -0.010 |
lder | -0.010 |
Token | quickly |
Token ID | 2952 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
lder | +0.002 |
friend | +0.002 |
tutor | +0.002 |
So | +0.002 |
kindly | +0.002 |
Neg logit contributions | |
ays | -0.004 |
ips | -0.003 |
rob | -0.003 |
unks | -0.003 |
ions | -0.003 |
Token | grabbed |
Token ID | 13176 |
Feature activation | +3.64e-02 |
Pos logit contributions | |
lder | +0.022 |
friend | +0.022 |
So | +0.021 |
kindly | +0.021 |
tutor | +0.021 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.031 |
rob | -0.031 |
unks | -0.031 |
ions | -0.030 |
Token | her |
Token ID | 607 |
Feature activation | +2.08e-03 |
Pos logit contributions | |
ays | +0.087 |
unks | +0.078 |
rob | +0.076 |
plets | +0.075 |
ips | +0.074 |
Neg logit contributions | |
friend | -0.047 |
tutor | -0.047 |
kindly | -0.046 |
little | -0.044 |
understanding | -0.044 |
Token | toy |
Token ID | 13373 |
Feature activation | +9.52e-03 |
Pos logit contributions | |
ays | +0.005 |
ips | +0.004 |
unks | +0.004 |
rob | +0.004 |
ocol | +0.004 |
Neg logit contributions | |
lder | -0.003 |
So | -0.003 |
kindly | -0.003 |
forgive | -0.003 |
Days | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
ays | +0.021 |
ips | +0.018 |
ions | +0.018 |
unks | +0.017 |
rob | +0.017 |
Neg logit contributions | |
lder | -0.014 |
So | -0.013 |
Days | -0.013 |
forgive | -0.013 |
understanding | -0.013 |
Token | ran |
Token ID | 4966 |
Feature activation | -2.25e-03 |
Pos logit contributions | |
ays | +0.048 |
unks | +0.042 |
ips | +0.042 |
ocol | +0.041 |
rob | +0.041 |
Neg logit contributions | |
friend | -0.022 |
kindly | -0.022 |
So | -0.020 |
understanding | -0.020 |
lder | -0.020 |
Token | right |
Token ID | 826 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
ays | +0.034 |
rob | +0.029 |
unks | +0.029 |
ips | +0.028 |
plets | +0.028 |
Neg logit contributions | |
friend | -0.016 |
kindly | -0.015 |
forgive | -0.015 |
understanding | -0.015 |
tutor | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
lder | +0.017 |
So | +0.017 |
hospitality | +0.016 |
Days | +0.016 |
tune | +0.016 |
Neg logit contributions | |
ays | -0.028 |
ips | -0.023 |
unks | -0.023 |
ions | -0.022 |
ocol | -0.022 |
Token | We |
Token ID | 775 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
ays | +0.046 |
rob | +0.043 |
unks | +0.040 |
ips | +0.040 |
izz | +0.038 |
Neg logit contributions | |
forgive | -0.027 |
friend | -0.026 |
lder | -0.025 |
tutor | -0.025 |
kindly | -0.025 |
Token | learned |
Token ID | 4499 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
ays | +0.034 |
ips | +0.029 |
rob | +0.029 |
unks | +0.028 |
ions | +0.027 |
Neg logit contributions | |
friend | -0.018 |
lder | -0.018 |
forgive | -0.018 |
So | -0.018 |
kindly | -0.017 |
Token | our |
Token ID | 674 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
lder | +0.016 |
friend | +0.016 |
So | +0.016 |
tutor | +0.016 |
kindly | +0.016 |
Neg logit contributions | |
ays | -0.024 |
ips | -0.020 |
rob | -0.020 |
unks | -0.020 |
ions | -0.019 |
Token | lesson |
Token ID | 11483 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
kindly | +0.032 |
lder | +0.031 |
So | +0.031 |
broken | +0.031 |
Her | +0.030 |
Neg logit contributions | |
ays | -0.045 |
matters | -0.041 |
lands | -0.040 |
ips | -0.039 |
unks | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
lder | +0.016 |
friend | +0.016 |
kindly | +0.016 |
So | +0.015 |
tutor | +0.015 |
Neg logit contributions | |
ays | -0.037 |
ips | -0.032 |
rob | -0.032 |
unks | -0.031 |
ocol | -0.031 |
Token | We |
Token ID | 775 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
ays | +0.030 |
rob | +0.027 |
ips | +0.026 |
unks | +0.026 |
ocol | +0.025 |
Neg logit contributions | |
forgive | -0.021 |
So | -0.020 |
friend | -0.020 |
lder | -0.020 |
kindly | -0.020 |
Token | will |
Token ID | 481 |
Feature activation | -5.56e-02 |
Pos logit contributions | |
ays | +0.023 |
ips | +0.020 |
rob | +0.019 |
unks | +0.019 |
ions | +0.019 |
Neg logit contributions | |
lder | -0.017 |
tutor | -0.016 |
friend | -0.016 |
kindly | -0.016 |
So | -0.016 |
Token | listen |
Token ID | 6004 |
Feature activation | -3.42e-02 |
Pos logit contributions | |
tutor | +0.073 |
lder | +0.072 |
tune | +0.068 |
broken | +0.067 |
hospitality | +0.067 |
Neg logit contributions | |
ays | -0.103 |
matters | -0.096 |
ips | -0.094 |
unks | -0.094 |
lands | -0.090 |
Token | to |
Token ID | 284 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
lder | +0.038 |
So | +0.036 |
tutor | +0.036 |
Days | +0.034 |
friend | +0.034 |
Neg logit contributions | |
ays | -0.084 |
ips | -0.071 |
ions | -0.070 |
unks | -0.069 |
plets | -0.067 |
Token | the |
Token ID | 262 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
lder | +0.010 |
friend | +0.009 |
tutor | +0.009 |
kindly | +0.009 |
So | +0.009 |
Neg logit contributions | |
ays | -0.010 |
ips | -0.008 |
rob | -0.008 |
unks | -0.008 |
ions | -0.008 |
Token | distance |
Token ID | 5253 |
Feature activation | -2.90e-02 |
Pos logit contributions | |
ays | +0.022 |
ips | +0.018 |
rob | +0.018 |
unks | +0.018 |
plets | +0.017 |
Neg logit contributions | |
lder | -0.021 |
tutor | -0.020 |
kindly | -0.020 |
friend | -0.020 |
So | -0.020 |
Token | and |
Token ID | 290 |
Feature activation | -2.68e-03 |
Pos logit contributions | |
lder | +0.029 |
friend | +0.028 |
tutor | +0.028 |
So | +0.028 |
kindly | +0.028 |
Neg logit contributions | |
ays | -0.076 |
ips | -0.066 |
rob | -0.065 |
unks | -0.065 |
ions | -0.064 |
Token | decided |
Token ID | 3066 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
kindly | +0.003 |
friend | +0.003 |
lder | +0.003 |
So | +0.003 |
tutor | +0.003 |
Neg logit contributions | |
ays | -0.007 |
ips | -0.006 |
rob | -0.006 |
unks | -0.006 |
ocol | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | -3.46e-03 |
Pos logit contributions | |
lder | +0.038 |
tutor | +0.037 |
friend | +0.036 |
So | +0.036 |
forgive | +0.035 |
Neg logit contributions | |
ays | -0.083 |
ips | -0.072 |
unks | -0.071 |
rob | -0.070 |
lands | -0.070 |
Token | would |
Token ID | 561 |
Feature activation | -5.78e-02 |
Pos logit contributions | |
friend | +0.004 |
kindly | +0.004 |
So | +0.004 |
lder | +0.004 |
keeper | +0.004 |
Neg logit contributions | |
ays | -0.009 |
rob | -0.008 |
ocol | -0.008 |
ips | -0.007 |
unks | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
lder | +0.077 |
tutor | +0.075 |
So | +0.072 |
kindly | +0.072 |
friend | +0.072 |
Neg logit contributions | |
ays | -0.127 |
ips | -0.110 |
unks | -0.109 |
ions | -0.107 |
rob | -0.105 |
Token | her |
Token ID | 607 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
ays | +0.052 |
plets | +0.044 |
ips | +0.043 |
rob | +0.043 |
unks | +0.042 |
Neg logit contributions | |
friend | -0.026 |
kindly | -0.024 |
understanding | -0.023 |
So | -0.023 |
song | -0.022 |
Token | goal |
Token ID | 3061 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
lder | +0.038 |
Days | +0.034 |
So | +0.034 |
broken | +0.033 |
Her | +0.032 |
Neg logit contributions | |
ays | -0.055 |
ips | -0.047 |
unks | -0.047 |
lands | -0.046 |
spins | -0.045 |
Token | . |
Token ID | 13 |
Feature activation | +8.87e-03 |
Pos logit contributions | |
friend | +0.016 |
So | +0.015 |
kindly | +0.015 |
tutor | +0.015 |
forgive | +0.014 |
Neg logit contributions | |
ays | -0.052 |
rob | -0.046 |
ips | -0.045 |
ocol | -0.045 |
unks | -0.045 |
Token |
|
Token ID | 198 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
ays | +0.018 |
ips | +0.015 |
unks | +0.013 |
lands | +0.013 |
rob | +0.013 |
Neg logit contributions | |
broken | -0.014 |
friend | -0.014 |
forgive | -0.014 |
tune | -0.014 |
Days | -0.014 |
Token | , |
Token ID | 11 |
Feature activation | +3.72e-02 |
Pos logit contributions | |
ays | +0.058 |
rob | +0.050 |
ips | +0.050 |
unks | +0.049 |
ions | +0.048 |
Neg logit contributions | |
friend | -0.026 |
kindly | -0.025 |
lder | -0.025 |
tutor | -0.025 |
So | -0.025 |
Token | she |
Token ID | 673 |
Feature activation | -3.94e-03 |
Pos logit contributions | |
ays | +0.105 |
rob | +0.093 |
ips | +0.090 |
unks | +0.090 |
plets | +0.087 |
Neg logit contributions | |
friend | -0.041 |
tutor | -0.038 |
little | -0.038 |
kindly | -0.037 |
understanding | -0.034 |
Token | asked |
Token ID | 1965 |
Feature activation | -2.04e-02 |
Pos logit contributions | |
lder | +0.005 |
friend | +0.005 |
So | +0.005 |
tutor | +0.005 |
kindly | +0.005 |
Neg logit contributions | |
ays | -0.009 |
ips | -0.008 |
rob | -0.007 |
unks | -0.007 |
ions | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | -4.43e-02 |
Pos logit contributions | |
lder | +0.030 |
So | +0.029 |
friend | +0.028 |
tune | +0.028 |
song | +0.027 |
Neg logit contributions | |
ays | -0.044 |
ips | -0.038 |
ions | -0.036 |
rob | -0.036 |
unks | -0.036 |
Token | mom |
Token ID | 1995 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
lder | +0.055 |
tune | +0.053 |
So | +0.052 |
Okay | +0.050 |
Days | +0.048 |
Neg logit contributions | |
ays | -0.100 |
patches | -0.087 |
ocol | -0.086 |
ions | -0.086 |
ips | -0.085 |
Token | my |
Token ID | 1820 |
Feature activation | -4.01e-02 |
Pos logit contributions | |
lder | +0.040 |
So | +0.037 |
tune | +0.037 |
Days | +0.036 |
song | +0.036 |
Neg logit contributions | |
ays | -0.056 |
ips | -0.047 |
ions | -0.045 |
unks | -0.045 |
rob | -0.044 |
Token | to |
Token ID | 284 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
lder | +0.057 |
So | +0.055 |
tune | +0.053 |
song | +0.053 |
friend | +0.053 |
Neg logit contributions | |
ays | -0.089 |
ips | -0.075 |
ions | -0.073 |
unks | -0.072 |
rob | -0.071 |
Token | help |
Token ID | 1037 |
Feature activation | -2.35e-02 |
Pos logit contributions | |
lder | +0.043 |
Days | +0.041 |
tutor | +0.040 |
broken | +0.040 |
So | +0.039 |
Neg logit contributions | |
ays | -0.063 |
ions | -0.056 |
ips | -0.056 |
izz | -0.056 |
ocol | -0.056 |
Token | her |
Token ID | 607 |
Feature activation | -4.45e-02 |
Pos logit contributions | |
lder | +0.034 |
So | +0.034 |
tutor | +0.033 |
friend | +0.033 |
keeper | +0.032 |
Neg logit contributions | |
ays | -0.049 |
ips | -0.042 |
ions | -0.041 |
ocol | -0.041 |
unks | -0.041 |
Token | open |
Token ID | 1280 |
Feature activation | +9.12e-03 |
Pos logit contributions | |
lder | +0.058 |
So | +0.054 |
tutor | +0.054 |
kindly | +0.053 |
song | +0.052 |
Neg logit contributions | |
ays | -0.104 |
ips | -0.089 |
unks | -0.088 |
ions | -0.085 |
rob | -0.085 |
Token | the |
Token ID | 262 |
Feature activation | +3.66e-03 |
Pos logit contributions | |
ays | +0.020 |
plets | +0.019 |
rob | +0.019 |
ips | +0.018 |
unks | +0.017 |
Neg logit contributions | |
friend | -0.013 |
kindly | -0.012 |
tutor | -0.012 |
little | -0.012 |
keeper | -0.012 |
Token | Uh |
Token ID | 34653 |
Feature activation | +5.23e-03 |
Pos logit contributions | |
So | +0.008 |
lder | +0.008 |
friend | +0.008 |
tutor | +0.008 |
forgive | +0.008 |
Neg logit contributions | |
ays | -0.014 |
ips | -0.012 |
unks | -0.012 |
rob | -0.011 |
ocol | -0.011 |
Token | - |
Token ID | 12 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
ays | +0.011 |
ips | +0.010 |
rob | +0.009 |
unks | +0.009 |
ions | +0.009 |
Neg logit contributions | |
lder | -0.008 |
friend | -0.008 |
So | -0.007 |
tutor | -0.007 |
kindly | -0.007 |
Token | oh |
Token ID | 1219 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ays | +0.059 |
ips | +0.047 |
rob | +0.046 |
unks | +0.046 |
ions | +0.044 |
Neg logit contributions | |
lder | -0.067 |
friend | -0.066 |
So | -0.066 |
kindly | -0.065 |
tutor | -0.065 |
Token | ," |
Token ID | 553 |
Feature activation | +5.26e-05 |
Pos logit contributions | |
So | +0.019 |
tutor | +0.018 |
lder | +0.018 |
kindly | +0.018 |
friend | +0.018 |
Neg logit contributions | |
ays | -0.029 |
rob | -0.025 |
ips | -0.025 |
unks | -0.024 |
plets | -0.024 |
Token | Anna |
Token ID | 11735 |
Feature activation | -2.44e-02 |
Pos logit contributions | |
ays | +0.000 |
rob | +0.000 |
ips | +0.000 |
unks | +0.000 |
plets | +0.000 |
Neg logit contributions | |
kindly | -0.000 |
tutor | -0.000 |
friend | -0.000 |
So | -0.000 |
forgive | -0.000 |
Token | says |
Token ID | 1139 |
Feature activation | -4.06e-02 |
Pos logit contributions | |
lder | +0.040 |
friend | +0.040 |
So | +0.040 |
kindly | +0.040 |
tutor | +0.040 |
Neg logit contributions | |
ays | -0.048 |
rob | -0.040 |
ips | -0.040 |
unks | -0.039 |
ions | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | -3.12e-02 |
Pos logit contributions | |
lder | +0.052 |
Days | +0.048 |
So | +0.048 |
tutor | +0.046 |
friend | +0.046 |
Neg logit contributions | |
ays | -0.099 |
ips | -0.085 |
unks | -0.081 |
ions | -0.079 |
plets | -0.078 |
Token | " |
Token ID | 366 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
hospitality | +0.041 |
lder | +0.041 |
friend | +0.040 |
forgive | +0.040 |
So | +0.040 |
Neg logit contributions | |
ays | -0.071 |
ips | -0.061 |
unks | -0.058 |
plets | -0.057 |
ions | -0.056 |
Token | We |
Token ID | 1135 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
lder | +0.025 |
So | +0.025 |
friend | +0.025 |
kindly | +0.024 |
tutor | +0.024 |
Neg logit contributions | |
ays | -0.048 |
ips | -0.041 |
rob | -0.041 |
unks | -0.040 |
ions | -0.039 |
Token | should |
Token ID | 815 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
ays | +0.030 |
rob | +0.026 |
ips | +0.025 |
unks | +0.025 |
ocol | +0.024 |
Neg logit contributions | |
forgive | -0.020 |
friend | -0.020 |
lder | -0.019 |
So | -0.019 |
kindly | -0.019 |
Token | stop |
Token ID | 2245 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
tutor | +0.050 |
So | +0.050 |
lder | +0.050 |
kindly | +0.050 |
friend | +0.049 |
Neg logit contributions | |
ays | -0.097 |
ips | -0.084 |
unks | -0.083 |
ions | -0.082 |
ocol | -0.081 |
Token | oy |
Token ID | 35104 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
lder | +0.023 |
So | +0.022 |
tutor | +0.022 |
kindly | +0.022 |
friend | +0.022 |
Neg logit contributions | |
ays | -0.026 |
ips | -0.021 |
rob | -0.021 |
unks | -0.021 |
ocol | -0.020 |
Token | ster |
Token ID | 1706 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
ays | +0.056 |
ips | +0.050 |
rob | +0.049 |
ions | +0.049 |
unks | +0.048 |
Neg logit contributions | |
friend | -0.020 |
lder | -0.019 |
kindly | -0.019 |
So | -0.018 |
forgive | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +8.40e-03 |
Pos logit contributions | |
lder | +0.021 |
tutor | +0.020 |
So | +0.019 |
understanding | +0.018 |
kindly | +0.018 |
Neg logit contributions | |
ays | -0.043 |
ips | -0.037 |
unks | -0.036 |
ions | -0.036 |
rob | -0.035 |
Token | Tim |
Token ID | 5045 |
Feature activation | -1.24e-03 |
Pos logit contributions | |
ays | +0.019 |
ips | +0.016 |
rob | +0.016 |
unks | +0.015 |
ions | +0.015 |
Neg logit contributions | |
lder | -0.012 |
friend | -0.012 |
So | -0.012 |
kindly | -0.012 |
tutor | -0.012 |
Token | said |
Token ID | 531 |
Feature activation | -9.29e-03 |
Pos logit contributions | |
tutor | +0.002 |
lder | +0.002 |
hospitality | +0.002 |
recommendation | +0.002 |
birthday | +0.002 |
Neg logit contributions | |
ays | -0.002 |
unks | -0.002 |
ips | -0.002 |
rob | -0.002 |
ions | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | -4.98e-02 |
Pos logit contributions | |
lder | +0.010 |
friend | +0.010 |
kindly | +0.010 |
tutor | +0.010 |
So | +0.010 |
Neg logit contributions | |
ays | -0.024 |
rob | -0.020 |
ips | -0.020 |
unks | -0.020 |
ions | -0.020 |
Token | " |
Token ID | 366 |
Feature activation | -9.90e-03 |
Pos logit contributions | |
lder | +0.059 |
friend | +0.058 |
So | +0.057 |
tutor | +0.057 |
kindly | +0.055 |
Neg logit contributions | |
ays | -0.118 |
ips | -0.102 |
rob | -0.100 |
unks | -0.100 |
plets | -0.099 |
Token | Put |
Token ID | 11588 |
Feature activation | +3.90e-02 |
Pos logit contributions | |
tutor | +0.014 |
friend | +0.014 |
lder | +0.014 |
kindly | +0.014 |
forgive | +0.013 |
Neg logit contributions | |
ays | -0.022 |
rob | -0.018 |
ips | -0.018 |
unks | -0.018 |
plets | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
ays | +0.088 |
plets | +0.084 |
chairs | +0.081 |
rol | +0.080 |
unks | +0.080 |
Neg logit contributions | |
little | -0.046 |
nd | -0.041 |
friend | -0.041 |
and | -0.040 |
lady | -0.039 |
Token | rock |
Token ID | 3881 |
Feature activation | +5.03e-02 |
Pos logit contributions | |
ays | +0.084 |
ips | +0.071 |
rob | +0.071 |
unks | +0.068 |
ions | +0.068 |
Neg logit contributions | |
friend | -0.048 |
little | -0.045 |
forgive | -0.044 |
kindly | -0.043 |
song | -0.043 |
Token | in |
Token ID | 287 |
Feature activation | +7.31e-03 |
Pos logit contributions | |
ays | +0.112 |
rob | +0.099 |
unks | +0.094 |
ips | +0.094 |
ocol | +0.093 |
Neg logit contributions | |
friend | -0.072 |
kindly | -0.070 |
So | -0.068 |
forgive | -0.067 |
lder | -0.066 |
Token | want |
Token ID | 765 |
Feature activation | +2.02e-03 |
Pos logit contributions | |
lder | +0.034 |
tutor | +0.034 |
friend | +0.034 |
So | +0.033 |
kindly | +0.033 |
Neg logit contributions | |
ays | -0.051 |
ips | -0.043 |
rob | -0.043 |
unks | -0.043 |
ions | -0.041 |
Token | to |
Token ID | 284 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
ays | +0.006 |
rob | +0.005 |
ips | +0.005 |
unks | +0.005 |
plets | +0.005 |
Neg logit contributions | |
friend | -0.002 |
forgive | -0.002 |
tutor | -0.002 |
kindly | -0.002 |
song | -0.002 |
Token | play |
Token ID | 711 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
lder | +0.045 |
tutor | +0.044 |
kindly | +0.044 |
So | +0.044 |
friend | +0.042 |
Neg logit contributions | |
ays | -0.075 |
ips | -0.064 |
unks | -0.063 |
rob | -0.063 |
ocol | -0.061 |
Token | with |
Token ID | 351 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
friend | +0.004 |
forgive | +0.004 |
kindly | +0.004 |
lder | +0.004 |
tutor | +0.004 |
Neg logit contributions | |
ays | -0.010 |
ips | -0.009 |
unks | -0.009 |
rob | -0.009 |
plets | -0.009 |
Token | you |
Token ID | 345 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
ays | +0.043 |
rob | +0.038 |
ips | +0.037 |
plets | +0.035 |
unks | +0.035 |
Neg logit contributions | |
friend | -0.034 |
kindly | -0.032 |
forgive | -0.032 |
lder | -0.032 |
little | -0.032 |
Token | anymore |
Token ID | 7471 |
Feature activation | -4.17e-02 |
Pos logit contributions | |
lder | +0.024 |
tutor | +0.023 |
hospitality | +0.023 |
Days | +0.023 |
So | +0.023 |
Neg logit contributions | |
ays | -0.026 |
ips | -0.021 |
unks | -0.020 |
ions | -0.020 |
rob | -0.019 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
lder | +0.063 |
tutor | +0.061 |
So | +0.061 |
kindly | +0.061 |
friend | +0.061 |
Neg logit contributions | |
ays | -0.088 |
ips | -0.073 |
unks | -0.072 |
rob | -0.072 |
ions | -0.071 |
Token |
|
Token ID | 198 |
Feature activation | -1.50e-02 |
Pos logit contributions | |
lder | +0.019 |
tutor | +0.018 |
friend | +0.018 |
song | +0.018 |
hospitality | +0.018 |
Neg logit contributions | |
ays | -0.032 |
ips | -0.027 |
unks | -0.027 |
rob | -0.027 |
ions | -0.026 |
Token |
|
Token ID | 198 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
lder | +0.022 |
tutor | +0.021 |
hospitality | +0.021 |
tune | +0.021 |
song | +0.021 |
Neg logit contributions | |
ays | -0.032 |
unks | -0.027 |
ips | -0.027 |
rob | -0.027 |
izz | -0.026 |
Token | Tim |
Token ID | 14967 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
tutor | +0.027 |
hospitality | +0.027 |
lder | +0.026 |
birthday | +0.025 |
recommendation | +0.025 |
Neg logit contributions | |
ays | -0.039 |
izz | -0.037 |
unks | -0.037 |
ions | -0.036 |
rob | -0.036 |
Token | was |
Token ID | 373 |
Feature activation | +8.39e-03 |
Pos logit contributions | |
birthday | +0.025 |
hospitality | +0.025 |
tutor | +0.024 |
recommendation | +0.024 |
Days | +0.023 |
Neg logit contributions | |
ays | -0.019 |
spins | -0.015 |
ips | -0.015 |
lands | -0.015 |
rob | -0.014 |