Token | garden |
Token ID | 11376 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
its | +0.057 |
ters | +0.053 |
ade | +0.050 |
ying | +0.050 |
aches | +0.050 |
Neg logit contributions | |
joy | -0.071 |
Bye | -0.063 |
Sure | -0.061 |
icol | -0.058 |
goodbye | -0.057 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
joy | +0.015 |
Bye | +0.014 |
Sure | +0.013 |
icol | +0.013 |
carriage | +0.013 |
Neg logit contributions | |
its | -0.011 |
ters | -0.010 |
ade | -0.010 |
ying | -0.010 |
aches | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
its | +0.239 |
ters | +0.222 |
ying | +0.213 |
ade | +0.212 |
aches | +0.210 |
Neg logit contributions | |
joy | -0.241 |
Bye | -0.212 |
Sure | -0.200 |
carriage | -0.191 |
icol | -0.190 |
Token |
|
Token ID | 198 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
joy | +0.019 |
Bye | +0.016 |
Sure | +0.016 |
carriage | +0.015 |
goodbye | +0.015 |
Neg logit contributions | |
its | -0.017 |
ters | -0.016 |
ying | -0.015 |
ade | -0.015 |
aches | -0.015 |
Token | The |
Token ID | 464 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
joy | +0.013 |
Bye | +0.012 |
Sure | +0.012 |
carriage | +0.011 |
goodbye | +0.011 |
Neg logit contributions | |
its | -0.010 |
ters | -0.010 |
ying | -0.009 |
ade | -0.009 |
aches | -0.009 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
its | +0.032 |
ters | +0.030 |
ying | +0.028 |
ade | +0.028 |
aches | +0.028 |
Neg logit contributions | |
joy | -0.041 |
Bye | -0.037 |
Sure | -0.035 |
icol | -0.033 |
goodbye | -0.033 |
Token | was |
Token ID | 373 |
Feature activation | +8.82e-01 |
Pos logit contributions | |
its | +0.774 |
ters | +0.717 |
ying | +0.691 |
ade | +0.672 |
aches | +0.665 |
Neg logit contributions | |
joy | -0.926 |
Bye | -0.829 |
Sure | -0.790 |
goodbye | -0.762 |
carriage | -0.758 |
Token | so |
Token ID | 523 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
its | +0.067 |
ters | +0.062 |
ying | +0.062 |
idy | +0.059 |
ade | +0.059 |
Neg logit contributions | |
joy | -0.079 |
Bye | -0.068 |
goodbye | -0.065 |
carriage | -0.064 |
Sure | -0.064 |
Token | happy |
Token ID | 3772 |
Feature activation | -7.64e-01 |
Pos logit contributions | |
ters | +0.224 |
its | +0.211 |
ying | +0.207 |
idy | +0.195 |
have | +0.192 |
Neg logit contributions | |
joy | -0.237 |
Bye | -0.219 |
Sure | -0.208 |
goodbye | -0.202 |
Thank | -0.187 |
Token | that |
Token ID | 326 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
joy | +0.072 |
Bye | +0.065 |
Sure | +0.060 |
carriage | +0.060 |
icol | +0.059 |
Neg logit contributions | |
its | -0.053 |
ters | -0.052 |
ade | -0.048 |
ying | -0.048 |
aches | -0.046 |
Token | it |
Token ID | 340 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
joy | +0.065 |
Bye | +0.057 |
icol | +0.055 |
Sure | +0.055 |
carriage | +0.054 |
Neg logit contributions | |
its | -0.038 |
ters | -0.036 |
ying | -0.034 |
aches | -0.034 |
ade | -0.033 |
Token | Lily |
Token ID | 20037 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
its | +0.088 |
ters | +0.083 |
ying | +0.078 |
ade | +0.078 |
aches | +0.077 |
Neg logit contributions | |
joy | -0.097 |
Bye | -0.085 |
Sure | -0.080 |
carriage | -0.077 |
icol | -0.077 |
Token | said |
Token ID | 531 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
joy | +0.003 |
Bye | +0.003 |
Sure | +0.003 |
goodbye | +0.003 |
icol | +0.003 |
Neg logit contributions | |
its | -0.003 |
ying | -0.002 |
ters | -0.002 |
aches | -0.002 |
idy | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -8.63e-01 |
Pos logit contributions | |
its | +0.129 |
ters | +0.117 |
ade | +0.114 |
ying | +0.113 |
aches | +0.113 |
Neg logit contributions | |
joy | -0.137 |
Bye | -0.119 |
Sure | -0.114 |
goodbye | -0.113 |
carriage | -0.107 |
Token | She |
Token ID | 1375 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
joy | +0.074 |
Bye | +0.065 |
Sure | +0.062 |
carriage | +0.059 |
icol | +0.059 |
Neg logit contributions | |
its | -0.070 |
ters | -0.066 |
ying | -0.063 |
ade | -0.062 |
aches | -0.061 |
Token | liked |
Token ID | 8288 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
its | +0.036 |
ters | +0.033 |
ade | +0.031 |
aches | +0.031 |
ying | +0.030 |
Neg logit contributions | |
joy | -0.051 |
Bye | -0.046 |
Sure | -0.044 |
carriage | -0.042 |
goodbye | -0.042 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
joy | +0.171 |
Bye | +0.148 |
Sure | +0.139 |
goodbye | +0.137 |
carriage | +0.133 |
Neg logit contributions | |
its | -0.171 |
ters | -0.159 |
ying | -0.153 |
ade | -0.148 |
idy | -0.147 |
Token | . |
Token ID | 13 |
Feature activation | -7.85e-01 |
Pos logit contributions | |
its | +0.941 |
ying | +0.831 |
idy | +0.804 |
have | +0.802 |
ters | +0.793 |
Neg logit contributions | |
joy | -0.762 |
goodbye | -0.602 |
Bye | -0.602 |
carriage | -0.578 |
arium | -0.571 |
Token | It |
Token ID | 632 |
Feature activation | -8.61e-01 |
Pos logit contributions | |
joy | +0.068 |
Bye | +0.060 |
Sure | +0.057 |
goodbye | +0.054 |
icol | +0.053 |
Neg logit contributions | |
its | -0.064 |
ters | -0.060 |
ying | -0.057 |
ade | -0.057 |
aches | -0.057 |
Token | was |
Token ID | 373 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
joy | +0.070 |
Bye | +0.063 |
Sure | +0.062 |
carriage | +0.055 |
arium | +0.055 |
Neg logit contributions | |
its | -0.070 |
ying | -0.066 |
ters | -0.065 |
idy | -0.062 |
aches | -0.060 |
Token | orange |
Token ID | 10912 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
its | +0.036 |
ying | +0.034 |
ters | +0.033 |
idy | +0.032 |
ade | +0.031 |
Neg logit contributions | |
joy | -0.042 |
Bye | -0.036 |
goodbye | -0.035 |
Sure | -0.035 |
icol | -0.033 |
Token | and |
Token ID | 290 |
Feature activation | -7.78e-01 |
Pos logit contributions | |
its | +0.148 |
ters | +0.137 |
ying | +0.131 |
ade | +0.130 |
aches | +0.129 |
Neg logit contributions | |
joy | -0.162 |
Bye | -0.143 |
Sure | -0.136 |
carriage | -0.130 |
goodbye | -0.130 |
Token | anything |
Token ID | 1997 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
its | +0.183 |
ters | +0.170 |
ying | +0.161 |
aches | +0.158 |
ade | +0.158 |
Neg logit contributions | |
joy | -0.259 |
Bye | -0.234 |
Sure | -0.226 |
icol | -0.218 |
carriage | -0.216 |
Token | because |
Token ID | 780 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
joy | +0.023 |
Bye | +0.021 |
Sure | +0.019 |
goodbye | +0.019 |
carriage | +0.018 |
Neg logit contributions | |
its | -0.022 |
ters | -0.020 |
ade | -0.019 |
aches | -0.019 |
ying | -0.019 |
Token | it |
Token ID | 340 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
joy | +0.190 |
Bye | +0.171 |
Sure | +0.163 |
icol | +0.158 |
carriage | +0.157 |
Neg logit contributions | |
its | -0.125 |
ters | -0.115 |
ying | -0.109 |
ade | -0.108 |
aches | -0.107 |
Token | was |
Token ID | 373 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
joy | +0.013 |
Bye | +0.012 |
Sure | +0.012 |
arium | +0.011 |
carriage | +0.011 |
Neg logit contributions | |
its | -0.014 |
ters | -0.013 |
ying | -0.013 |
aches | -0.012 |
ade | -0.012 |
Token | a |
Token ID | 257 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
its | +0.100 |
ters | +0.089 |
ying | +0.088 |
ade | +0.087 |
idy | +0.084 |
Neg logit contributions | |
joy | -0.127 |
Bye | -0.111 |
goodbye | -0.105 |
Sure | -0.103 |
carriage | -0.101 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
its | +0.001 |
ters | +0.001 |
ade | +0.001 |
ying | +0.001 |
aches | +0.001 |
Neg logit contributions | |
joy | -0.001 |
Bye | -0.001 |
Sure | -0.001 |
icol | -0.001 |
carriage | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
its | +0.670 |
ters | +0.657 |
ade | +0.609 |
ying | +0.595 |
aches | +0.577 |
Neg logit contributions | |
joy | -1.011 |
Bye | -0.903 |
Sure | -0.881 |
icol | -0.851 |
carriage | -0.821 |
Token | not |
Token ID | 407 |
Feature activation | +3.31e-01 |
Pos logit contributions | |
its | +0.021 |
ters | +0.019 |
ying | +0.018 |
ade | +0.018 |
aches | +0.018 |
Neg logit contributions | |
joy | -0.034 |
Bye | -0.031 |
Sure | -0.029 |
carriage | -0.028 |
goodbye | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +1.58e-03 |
Pos logit contributions | |
its | +0.023 |
ters | +0.021 |
aches | +0.020 |
ying | +0.020 |
ade | +0.020 |
Neg logit contributions | |
joy | -0.033 |
Bye | -0.029 |
Sure | -0.028 |
icol | -0.027 |
carriage | -0.027 |
Token | ball |
Token ID | 2613 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
its | +0.000 |
ters | +0.000 |
ying | +0.000 |
aches | +0.000 |
idy | +0.000 |
Neg logit contributions | |
joy | -0.000 |
Bye | -0.000 |
Sure | -0.000 |
goodbye | -0.000 |
carriage | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
its | +0.272 |
ters | +0.251 |
ying | +0.240 |
ade | +0.238 |
aches | +0.236 |
Neg logit contributions | |
joy | -0.323 |
Bye | -0.288 |
Sure | -0.273 |
goodbye | -0.261 |
carriage | -0.261 |
Token | how |
Token ID | 703 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
joy | +0.191 |
Bye | +0.170 |
Sure | +0.162 |
goodbye | +0.157 |
carriage | +0.156 |
Neg logit contributions | |
its | -0.150 |
ters | -0.137 |
ying | -0.130 |
ade | -0.129 |
aches | -0.128 |
Token | to |
Token ID | 284 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
its | +0.138 |
ters | +0.128 |
ade | +0.125 |
ying | +0.124 |
idy | +0.121 |
Neg logit contributions | |
joy | -0.136 |
Bye | -0.116 |
Sure | -0.113 |
icol | -0.111 |
carriage | -0.110 |
Token | fly |
Token ID | 6129 |
Feature activation | +7.22e-01 |
Pos logit contributions | |
joy | +0.013 |
Bye | +0.013 |
Sure | +0.011 |
carriage | +0.011 |
arium | +0.011 |
Neg logit contributions | |
its | -0.014 |
ying | -0.014 |
ters | -0.013 |
idy | -0.012 |
ade | -0.012 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
its | +0.051 |
ters | +0.047 |
ade | +0.045 |
ying | +0.044 |
aches | +0.044 |
Neg logit contributions | |
joy | -0.070 |
Bye | -0.063 |
Sure | -0.060 |
icol | -0.058 |
carriage | -0.058 |
Token | The |
Token ID | 383 |
Feature activation | -3.15e+00 |
Pos logit contributions | |
its | +0.319 |
ters | +0.308 |
ade | +0.294 |
aches | +0.294 |
ying | +0.284 |
Neg logit contributions | |
joy | -0.241 |
Bye | -0.197 |
icol | -0.187 |
carriage | -0.182 |
Sure | -0.174 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
joy | +0.243 |
Bye | +0.197 |
carriage | +0.184 |
goodbye | +0.183 |
Sure | +0.176 |
Neg logit contributions | |
its | -0.294 |
ying | -0.270 |
idy | -0.261 |
ters | -0.258 |
aches | -0.252 |
Token | did |
Token ID | 750 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
its | +0.739 |
ters | +0.680 |
ying | +0.649 |
ade | +0.644 |
aches | +0.636 |
Neg logit contributions | |
joy | -0.960 |
Bye | -0.857 |
Sure | -0.817 |
carriage | -0.782 |
goodbye | -0.780 |
Token | not |
Token ID | 407 |
Feature activation | +3.38e-01 |
Pos logit contributions | |
its | +0.014 |
ters | +0.013 |
ying | +0.013 |
ade | +0.013 |
idy | +0.012 |
Neg logit contributions | |
joy | -0.017 |
Bye | -0.015 |
goodbye | -0.015 |
Sure | -0.015 |
carriage | -0.014 |
Token | say |
Token ID | 910 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
its | +0.025 |
ying | +0.022 |
ade | +0.022 |
idy | +0.022 |
oving | +0.022 |
Neg logit contributions | |
joy | -0.028 |
Bye | -0.026 |
goodbye | -0.026 |
bye | -0.025 |
carriage | -0.025 |
Token | anything |
Token ID | 1997 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
its | +0.183 |
ters | +0.170 |
ying | +0.161 |
aches | +0.158 |
ade | +0.158 |
Neg logit contributions | |
joy | -0.259 |
Bye | -0.234 |
Sure | -0.226 |
icol | -0.218 |
carriage | -0.216 |
Token | because |
Token ID | 780 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
joy | +0.023 |
Bye | +0.021 |
Sure | +0.019 |
goodbye | +0.019 |
carriage | +0.018 |
Neg logit contributions | |
its | -0.022 |
ters | -0.020 |
ade | -0.019 |
aches | -0.019 |
ying | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
joy | +0.088 |
Bye | +0.079 |
Sure | +0.075 |
carriage | +0.072 |
icol | +0.072 |
Neg logit contributions | |
its | -0.063 |
ters | -0.058 |
ade | -0.055 |
ying | -0.055 |
aches | -0.054 |
Token | about |
Token ID | 546 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
its | +0.095 |
ters | +0.086 |
ade | +0.085 |
ying | +0.083 |
idy | +0.081 |
Neg logit contributions | |
joy | -0.132 |
Bye | -0.118 |
goodbye | -0.110 |
Sure | -0.108 |
carriage | -0.105 |
Token | to |
Token ID | 284 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
its | +0.137 |
ters | +0.129 |
ying | +0.124 |
ade | +0.124 |
aches | +0.123 |
Neg logit contributions | |
joy | -0.122 |
Bye | -0.110 |
Sure | -0.102 |
carriage | -0.099 |
icol | -0.098 |
Token | touch |
Token ID | 3638 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
joy | +0.017 |
Bye | +0.016 |
goodbye | +0.015 |
Sure | +0.015 |
icol | +0.014 |
Neg logit contributions | |
its | -0.013 |
ters | -0.012 |
ying | -0.012 |
idy | -0.011 |
ade | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
joy | +0.046 |
Bye | +0.040 |
Sure | +0.038 |
goodbye | +0.037 |
carriage | +0.037 |
Neg logit contributions | |
its | -0.034 |
ters | -0.031 |
ying | -0.030 |
ade | -0.029 |
aches | -0.029 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.018 |
aches | +0.017 |
have | +0.017 |
ying | +0.017 |
affles | +0.016 |
Neg logit contributions | |
joy | -0.036 |
Bye | -0.030 |
Sure | -0.030 |
reminder | -0.029 |
goodbye | -0.029 |
Token | when |
Token ID | 618 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
its | +0.883 |
ters | +0.781 |
ying | +0.770 |
ade | +0.761 |
aches | +0.760 |
Neg logit contributions | |
joy | -0.806 |
Bye | -0.693 |
Sure | -0.670 |
goodbye | -0.662 |
carriage | -0.638 |
Token | it |
Token ID | 340 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
its | +0.076 |
ters | +0.069 |
aches | +0.065 |
ying | +0.065 |
ade | +0.064 |
Neg logit contributions | |
joy | -0.138 |
Bye | -0.128 |
Sure | -0.123 |
icol | -0.123 |
carriage | -0.121 |
Token | moved |
Token ID | 3888 |
Feature activation | +5.63e-01 |
Pos logit contributions | |
joy | +0.015 |
Bye | +0.013 |
Sure | +0.013 |
carriage | +0.012 |
goodbye | +0.012 |
Neg logit contributions | |
its | -0.013 |
ters | -0.012 |
ying | -0.012 |
aches | -0.011 |
idy | -0.011 |
Token | ! |
Token ID | 0 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
its | +0.045 |
ters | +0.040 |
ying | +0.039 |
aches | +0.039 |
ade | +0.039 |
Neg logit contributions | |
joy | -0.051 |
Bye | -0.044 |
Sure | -0.042 |
goodbye | -0.041 |
carriage | -0.040 |
Token | It |
Token ID | 632 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
joy | +0.112 |
Bye | +0.099 |
carriage | +0.094 |
Sure | +0.092 |
icol | +0.092 |
Neg logit contributions | |
its | -0.087 |
ters | -0.080 |
ying | -0.076 |
ade | -0.076 |
aches | -0.073 |
Token | That |
Token ID | 1320 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
joy | +0.114 |
carriage | +0.097 |
lair | +0.093 |
Bye | +0.092 |
goodbye | +0.091 |
Neg logit contributions | |
ters | -0.097 |
its | -0.094 |
ying | -0.089 |
idy | -0.084 |
ade | -0.084 |
Token | 's |
Token ID | 338 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
its | +0.093 |
aches | +0.081 |
ters | +0.080 |
ying | +0.079 |
affles | +0.075 |
Neg logit contributions | |
joy | -0.098 |
Bye | -0.094 |
Sure | -0.087 |
arium | -0.086 |
icol | -0.084 |
Token | a |
Token ID | 257 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
its | +0.206 |
ters | +0.184 |
ying | +0.177 |
ade | +0.175 |
aches | +0.170 |
Neg logit contributions | |
joy | -0.303 |
Bye | -0.278 |
Sure | -0.263 |
goodbye | -0.254 |
icol | -0.253 |
Token | really |
Token ID | 1107 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
joy | +0.005 |
Bye | +0.004 |
Sure | +0.004 |
icol | +0.004 |
carriage | +0.004 |
Neg logit contributions | |
its | -0.002 |
ters | -0.002 |
ying | -0.002 |
aches | -0.002 |
idy | -0.002 |
Token | big |
Token ID | 1263 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
its | +0.199 |
ters | +0.182 |
ying | +0.171 |
ade | +0.163 |
idy | +0.162 |
Neg logit contributions | |
joy | -0.365 |
Bye | -0.334 |
Sure | -0.321 |
goodbye | -0.308 |
carriage | -0.307 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.070 |
ters | +0.060 |
ying | +0.057 |
aches | +0.056 |
idy | +0.053 |
Neg logit contributions | |
joy | -0.189 |
Bye | -0.169 |
Sure | -0.163 |
goodbye | -0.161 |
icol | -0.160 |
Token | . |
Token ID | 13 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
its | +0.787 |
ters | +0.709 |
ying | +0.689 |
ade | +0.675 |
aches | +0.673 |
Neg logit contributions | |
joy | -0.908 |
Bye | -0.812 |
Sure | -0.767 |
carriage | -0.742 |
goodbye | -0.737 |
Token | Maybe |
Token ID | 6674 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
ters | +0.042 |
its | +0.039 |
ying | +0.036 |
idy | +0.034 |
organ | +0.034 |
Neg logit contributions | |
joy | -0.046 |
carriage | -0.037 |
lair | -0.035 |
goodbye | -0.035 |
spine | -0.034 |
Token | we |
Token ID | 356 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
joy | +0.354 |
Bye | +0.316 |
Sure | +0.302 |
goodbye | +0.289 |
carriage | +0.287 |
Neg logit contributions | |
its | -0.267 |
ters | -0.243 |
ying | -0.233 |
ade | -0.231 |
aches | -0.227 |
Token | can |
Token ID | 460 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
joy | +0.158 |
Bye | +0.140 |
Sure | +0.132 |
carriage | +0.129 |
goodbye | +0.128 |
Neg logit contributions | |
its | -0.164 |
ters | -0.150 |
ying | -0.146 |
ade | -0.144 |
aches | -0.143 |
Token | make |
Token ID | 787 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
ying | +0.024 |
its | +0.023 |
ters | +0.022 |
ins | +0.022 |
have | +0.021 |
Neg logit contributions | |
Bye | -0.019 |
joy | -0.019 |
carriage | -0.019 |
Sure | -0.018 |
icol | -0.017 |
Token | Tom |
Token ID | 13787 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
its | +0.051 |
ters | +0.049 |
ying | +0.047 |
idy | +0.045 |
aches | +0.045 |
Neg logit contributions | |
joy | -0.053 |
Bye | -0.049 |
Sure | -0.046 |
goodbye | -0.043 |
carriage | -0.042 |
Token | smiled |
Token ID | 13541 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
its | +0.011 |
ters | +0.010 |
ying | +0.010 |
ade | +0.009 |
aches | +0.009 |
Neg logit contributions | |
joy | -0.014 |
Bye | -0.013 |
Sure | -0.012 |
carriage | -0.012 |
goodbye | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +5.18e-01 |
Pos logit contributions | |
joy | +0.419 |
Bye | +0.417 |
Sure | +0.389 |
habitats | +0.384 |
lifetime | +0.374 |
Neg logit contributions | |
ters | -0.219 |
its | -0.209 |
ble | -0.193 |
ade | -0.190 |
ying | -0.190 |
Token | took |
Token ID | 1718 |
Feature activation | +9.80e-01 |
Pos logit contributions | |
its | +0.031 |
ters | +0.031 |
aches | +0.029 |
ying | +0.028 |
ade | +0.027 |
Neg logit contributions | |
joy | -0.050 |
Bye | -0.046 |
habitats | -0.044 |
icol | -0.044 |
lair | -0.044 |
Token | the |
Token ID | 262 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
its | +0.077 |
ters | +0.071 |
ying | +0.068 |
idy | +0.066 |
ade | +0.066 |
Neg logit contributions | |
joy | -0.087 |
Bye | -0.076 |
Sure | -0.074 |
goodbye | -0.073 |
carriage | -0.070 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.027 |
affles | +0.024 |
aches | +0.024 |
have | +0.024 |
oving | +0.023 |
Neg logit contributions | |
joy | -0.045 |
Sure | -0.038 |
goodbye | -0.037 |
reminder | -0.036 |
Bye | -0.035 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
its | +0.879 |
ters | +0.797 |
ying | +0.774 |
aches | +0.761 |
ade | +0.756 |
Neg logit contributions | |
joy | -0.819 |
Bye | -0.706 |
Sure | -0.686 |
goodbye | -0.656 |
carriage | -0.650 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
its | +0.007 |
ters | +0.007 |
ade | +0.007 |
aches | +0.007 |
ying | +0.006 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.010 |
Sure | -0.009 |
carriage | -0.009 |
icol | -0.009 |
Token | off |
Token ID | 572 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
its | +0.011 |
ters | +0.010 |
ade | +0.010 |
ying | +0.009 |
aches | +0.009 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.010 |
Sure | -0.009 |
carriage | -0.009 |
icol | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
its | +0.314 |
ters | +0.302 |
ade | +0.290 |
aches | +0.286 |
ying | +0.285 |
Neg logit contributions | |
joy | -0.354 |
Bye | -0.332 |
icol | -0.298 |
Sure | -0.297 |
habitats | -0.294 |
Token | the |
Token ID | 262 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
joy | +0.014 |
Bye | +0.013 |
Sure | +0.012 |
goodbye | +0.012 |
carriage | +0.011 |
Neg logit contributions | |
its | -0.010 |
ters | -0.009 |
ying | -0.009 |
ade | -0.008 |
idy | -0.008 |
Token | help |
Token ID | 1037 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
joy | +0.093 |
Bye | +0.085 |
Sure | +0.081 |
goodbye | +0.079 |
carriage | +0.078 |
Neg logit contributions | |
its | -0.060 |
ters | -0.055 |
ying | -0.052 |
ade | -0.051 |
aches | -0.050 |
Token | ?" |
Token ID | 1701 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
its | +0.088 |
ters | +0.078 |
ying | +0.075 |
ade | +0.072 |
idy | +0.072 |
Neg logit contributions | |
joy | -0.089 |
Bye | -0.080 |
carriage | -0.076 |
Sure | -0.075 |
goodbye | -0.075 |
Token |
|
Token ID | 198 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
its | +0.168 |
ters | +0.157 |
ying | +0.144 |
ade | +0.144 |
she | +0.144 |
Neg logit contributions | |
joy | -0.406 |
Bye | -0.378 |
habitats | -0.359 |
icol | -0.355 |
lair | -0.346 |
Token |
|
Token ID | 198 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
its | +0.053 |
ters | +0.049 |
ying | +0.047 |
ade | +0.047 |
aches | +0.046 |
Neg logit contributions | |
joy | -0.061 |
Bye | -0.054 |
Sure | -0.051 |
carriage | -0.049 |
icol | -0.049 |
Token | The |
Token ID | 464 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
its | +0.046 |
ters | +0.042 |
ying | +0.040 |
ade | +0.039 |
aches | +0.039 |
Neg logit contributions | |
joy | -0.069 |
Bye | -0.063 |
Sure | -0.060 |
carriage | -0.058 |
goodbye | -0.057 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.034 |
aches | +0.029 |
ters | +0.028 |
ying | +0.026 |
oving | +0.026 |
Neg logit contributions | |
joy | -0.072 |
Sure | -0.060 |
Bye | -0.059 |
goodbye | -0.058 |
arium | -0.056 |
Token | wondered |
Token ID | 14028 |
Feature activation | +8.48e-02 |
Pos logit contributions | |
its | +0.850 |
ters | +0.794 |
ying | +0.762 |
ade | +0.760 |
aches | +0.752 |
Neg logit contributions | |
joy | -0.837 |
Bye | -0.737 |
Sure | -0.694 |
icol | -0.661 |
carriage | -0.658 |
Token | . |
Token ID | 13 |
Feature activation | +4.64e-01 |
Pos logit contributions | |
its | +0.005 |
ters | +0.005 |
ying | +0.005 |
aches | +0.005 |
ade | +0.005 |
Neg logit contributions | |
joy | -0.008 |
Bye | -0.008 |
Sure | -0.007 |
icol | -0.007 |
carriage | -0.007 |
Token | Then |
Token ID | 3244 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
ters | +0.027 |
its | +0.024 |
she | +0.024 |
ying | +0.024 |
ade | +0.022 |
Neg logit contributions | |
joy | -0.044 |
Bye | -0.041 |
habitats | -0.041 |
carriage | -0.040 |
lair | -0.040 |
Token | she |
Token ID | 673 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
habitats | +0.258 |
joy | +0.256 |
lair | +0.250 |
Bye | +0.247 |
spine | +0.242 |
Neg logit contributions | |
ters | -0.077 |
sure | -0.069 |
she | -0.066 |
do | -0.063 |
idea | -0.061 |
Token | said |
Token ID | 531 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
its | +0.074 |
ade | +0.070 |
ters | +0.069 |
aches | +0.066 |
idy | +0.064 |
Neg logit contributions | |
joy | -0.117 |
Bye | -0.107 |
Sure | -0.098 |
icol | -0.095 |
habitats | -0.095 |
Token | The |
Token ID | 383 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
its | +0.019 |
ters | +0.019 |
ade | +0.017 |
ying | +0.017 |
aches | +0.017 |
Neg logit contributions | |
joy | -0.016 |
Bye | -0.013 |
carriage | -0.012 |
icol | -0.012 |
Sure | -0.012 |
Token | goat |
Token ID | 26917 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
joy | +0.220 |
Bye | +0.182 |
carriage | +0.165 |
goodbye | +0.163 |
Sure | +0.159 |
Neg logit contributions | |
its | -0.334 |
ying | -0.310 |
ters | -0.297 |
aches | -0.296 |
ade | -0.293 |
Token | went |
Token ID | 1816 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
its | +0.128 |
ters | +0.117 |
ade | +0.113 |
aches | +0.111 |
ying | +0.111 |
Neg logit contributions | |
joy | -0.183 |
Bye | -0.163 |
Sure | -0.156 |
icol | -0.150 |
carriage | -0.149 |
Token | to |
Token ID | 284 |
Feature activation | -7.90e-02 |
Pos logit contributions | |
joy | +0.039 |
Bye | +0.035 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.031 |
Neg logit contributions | |
its | -0.033 |
ters | -0.031 |
ade | -0.030 |
ying | -0.030 |
aches | -0.030 |
Token | the |
Token ID | 262 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
joy | +0.008 |
Bye | +0.007 |
Sure | +0.007 |
goodbye | +0.006 |
carriage | +0.006 |
Neg logit contributions | |
its | -0.006 |
ters | -0.005 |
ying | -0.005 |
ade | -0.005 |
idy | -0.005 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.031 |
ying | +0.028 |
ters | +0.026 |
idy | +0.026 |
aches | +0.026 |
Neg logit contributions | |
joy | -0.030 |
Bye | -0.027 |
Sure | -0.025 |
carriage | -0.025 |
goodbye | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | +9.26e-03 |
Pos logit contributions | |
ters | +0.606 |
its | +0.594 |
ade | +0.589 |
ying | +0.565 |
aches | +0.546 |
Neg logit contributions | |
joy | -1.019 |
Bye | -0.949 |
icol | -0.896 |
Sure | -0.862 |
habitats | -0.846 |
Token | started |
Token ID | 2067 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
its | +0.001 |
aches | +0.000 |
ters | +0.000 |
ade | +0.000 |
ying | +0.000 |
Neg logit contributions | |
joy | -0.001 |
Bye | -0.001 |
icol | -0.001 |
habitats | -0.001 |
carriage | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -6.87e-02 |
Pos logit contributions | |
its | +0.163 |
ters | +0.152 |
ade | +0.147 |
ying | +0.146 |
aches | +0.146 |
Neg logit contributions | |
joy | -0.143 |
Bye | -0.126 |
Sure | -0.118 |
carriage | -0.113 |
icol | -0.112 |
Token | chew |
Token ID | 34722 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
joy | +0.006 |
Bye | +0.005 |
Sure | +0.005 |
goodbye | +0.005 |
icol | +0.005 |
Neg logit contributions | |
its | -0.006 |
ters | -0.005 |
ying | -0.005 |
idy | -0.005 |
ade | -0.005 |
Token | on |
Token ID | 319 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
its | +0.118 |
ying | +0.106 |
ics | +0.106 |
ters | +0.104 |
aches | +0.104 |
Neg logit contributions | |
joy | -0.123 |
Bye | -0.102 |
goodbye | -0.101 |
Sure | -0.098 |
icol | -0.088 |
Token | that |
Token ID | 326 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
its | +0.224 |
ters | +0.210 |
ying | +0.201 |
ade | +0.196 |
idy | +0.193 |
Neg logit contributions | |
joy | -0.269 |
Bye | -0.242 |
Sure | -0.230 |
icol | -0.222 |
carriage | -0.221 |
Token | he |
Token ID | 339 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
joy | +0.045 |
icol | +0.040 |
Bye | +0.040 |
Sure | +0.038 |
carriage | +0.037 |
Neg logit contributions | |
its | -0.030 |
ying | -0.026 |
ters | -0.026 |
aches | -0.025 |
ade | -0.024 |
Token | dropped |
Token ID | 5710 |
Feature activation | +2.58e+00 |
Pos logit contributions | |
joy | +0.014 |
Bye | +0.013 |
Sure | +0.012 |
goodbye | +0.012 |
carriage | +0.012 |
Neg logit contributions | |
its | -0.012 |
ters | -0.011 |
ying | -0.010 |
ade | -0.010 |
aches | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
its | +0.171 |
ters | +0.158 |
ying | +0.148 |
ade | +0.145 |
aches | +0.144 |
Neg logit contributions | |
joy | -0.259 |
Bye | -0.236 |
Sure | -0.224 |
icol | -0.219 |
carriage | -0.217 |
Token | purple |
Token ID | 14032 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
its | +0.015 |
oving | +0.012 |
affles | +0.012 |
organ | +0.012 |
have | +0.012 |
Neg logit contributions | |
joy | -0.027 |
goodbye | -0.022 |
reminder | -0.020 |
Sure | -0.020 |
arium | -0.020 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.036 |
have | +0.030 |
ying | +0.029 |
aches | +0.028 |
organ | +0.027 |
Neg logit contributions | |
joy | -0.096 |
Sure | -0.080 |
goodbye | -0.080 |
arium | -0.077 |
carriage | -0.077 |
Token | and |
Token ID | 290 |
Feature activation | -5.14e-03 |
Pos logit contributions | |
its | +0.761 |
ters | +0.707 |
ying | +0.674 |
ade | +0.671 |
aches | +0.660 |
Neg logit contributions | |
joy | -0.925 |
Bye | -0.824 |
Sure | -0.783 |
carriage | -0.748 |
icol | -0.747 |
Token | ran |
Token ID | 4966 |
Feature activation | +3.24e-02 |
Pos logit contributions | |
joy | +0.001 |
Bye | +0.000 |
Sure | +0.000 |
icol | +0.000 |
carriage | +0.000 |
Neg logit contributions | |
its | -0.000 |
ters | -0.000 |
aches | -0.000 |
ade | -0.000 |
ying | -0.000 |
Token | away |
Token ID | 1497 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
its | +0.002 |
ters | +0.002 |
ade | +0.002 |
ying | +0.002 |
aches | +0.002 |
Neg logit contributions | |
joy | -0.003 |
Bye | -0.003 |
Sure | -0.003 |
icol | -0.003 |
lifetime | -0.003 |
Token | as |
Token ID | 355 |
Feature activation | -7.97e-01 |
Pos logit contributions | |
joy | +0.132 |
Bye | +0.120 |
Sure | +0.114 |
carriage | +0.109 |
icol | +0.109 |
Neg logit contributions | |
its | -0.100 |
ters | -0.093 |
ying | -0.088 |
ade | -0.087 |
aches | -0.086 |
Token | fast |
Token ID | 3049 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
joy | +0.084 |
icol | +0.078 |
Bye | +0.078 |
carriage | +0.073 |
Sure | +0.071 |
Neg logit contributions | |
its | -0.048 |
ters | -0.042 |
aches | -0.039 |
ying | -0.039 |
idy | -0.038 |
Token | We |
Token ID | 775 |
Feature activation | -4.64e+00 |
Pos logit contributions | |
ters | +0.010 |
its | +0.010 |
ying | +0.009 |
have | +0.009 |
First | +0.009 |
Neg logit contributions | |
joy | -0.012 |
carriage | -0.009 |
lifetime | -0.009 |
lair | -0.009 |
icol | -0.009 |
Token | need |
Token ID | 761 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
joy | +0.427 |
Bye | +0.390 |
Sure | +0.368 |
carriage | +0.358 |
goodbye | +0.356 |
Neg logit contributions | |
its | -0.337 |
ters | -0.312 |
ying | -0.301 |
ade | -0.295 |
idy | -0.290 |
Token | to |
Token ID | 284 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
joy | +0.097 |
Bye | +0.083 |
icol | +0.081 |
Sure | +0.079 |
carriage | +0.077 |
Neg logit contributions | |
its | -0.071 |
ters | -0.067 |
aches | -0.065 |
ade | -0.065 |
idy | -0.062 |
Token | buy |
Token ID | 2822 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
joy | +0.028 |
Bye | +0.027 |
goodbye | +0.025 |
carriage | +0.025 |
Sure | +0.025 |
Neg logit contributions | |
its | -0.022 |
ters | -0.021 |
ying | -0.020 |
ade | -0.020 |
idy | -0.019 |
Token | some |
Token ID | 617 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
its | +0.127 |
ters | +0.119 |
aches | +0.110 |
ade | +0.110 |
ying | +0.109 |
Neg logit contributions | |
joy | -0.219 |
Bye | -0.195 |
Sure | -0.189 |
icol | -0.183 |
carriage | -0.182 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.030 |
ters | +0.027 |
ying | +0.026 |
ade | +0.025 |
aches | +0.024 |
Neg logit contributions | |
joy | -0.043 |
Bye | -0.040 |
Sure | -0.038 |
goodbye | -0.038 |
carriage | -0.037 |
Token | for |
Token ID | 329 |
Feature activation | -3.46e+00 |
Pos logit contributions | |
its | +0.882 |
ying | +0.744 |
ters | +0.741 |
idy | +0.724 |
ade | +0.712 |
Neg logit contributions | |
joy | -0.796 |
Bye | -0.707 |
goodbye | -0.679 |
Sure | -0.678 |
carriage | -0.667 |
Token | dinner |
Token ID | 8073 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
joy | +0.329 |
Bye | +0.295 |
Sure | +0.280 |
goodbye | +0.269 |
carriage | +0.269 |
Neg logit contributions | |
its | -0.250 |
ters | -0.229 |
ying | -0.220 |
ade | -0.218 |
aches | -0.213 |
Token | . |
Token ID | 13 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
joy | +0.004 |
Bye | +0.003 |
Sure | +0.003 |
goodbye | +0.003 |
carriage | +0.003 |
Neg logit contributions | |
its | -0.003 |
ters | -0.002 |
ying | -0.002 |
ade | -0.002 |
aches | -0.002 |
Token | Do |
Token ID | 2141 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
ters | +0.013 |
its | +0.012 |
ying | +0.011 |
have | +0.011 |
First | +0.011 |
Neg logit contributions | |
joy | -0.013 |
carriage | -0.011 |
lifetime | -0.010 |
icol | -0.010 |
lair | -0.010 |
Token | you |
Token ID | 345 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
joy | +0.190 |
Bye | +0.177 |
Sure | +0.164 |
goodbye | +0.160 |
carriage | +0.156 |
Neg logit contributions | |
its | -0.146 |
ters | -0.133 |
ying | -0.127 |
ade | -0.126 |
idy | -0.121 |
Token | became |
Token ID | 2627 |
Feature activation | -3.25e-01 |
Pos logit contributions | |
joy | +0.023 |
carriage | +0.020 |
Bye | +0.020 |
icol | +0.020 |
Sure | +0.020 |
Neg logit contributions | |
ters | -0.014 |
aches | -0.014 |
its | -0.014 |
ade | -0.013 |
squash | -0.013 |
Token | good |
Token ID | 922 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
joy | +0.034 |
Bye | +0.030 |
Sure | +0.028 |
goodbye | +0.028 |
carriage | +0.027 |
Neg logit contributions | |
its | -0.021 |
ying | -0.019 |
ters | -0.018 |
idy | -0.018 |
ade | -0.017 |
Token | friends |
Token ID | 2460 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
its | +0.079 |
ters | +0.071 |
ying | +0.066 |
ade | +0.066 |
aches | +0.064 |
Neg logit contributions | |
joy | -0.153 |
Bye | -0.139 |
Sure | -0.134 |
carriage | -0.129 |
icol | -0.129 |
Token | . |
Token ID | 13 |
Feature activation | +5.30e-02 |
Pos logit contributions | |
ters | +0.076 |
its | +0.052 |
ching | +0.045 |
ying | +0.045 |
ade | +0.043 |
Neg logit contributions | |
icol | -0.291 |
Sure | -0.281 |
joy | -0.279 |
carriage | -0.269 |
spine | -0.268 |
Token | The |
Token ID | 383 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
its | +0.004 |
ade | +0.004 |
ters | +0.004 |
ying | +0.004 |
aches | +0.004 |
Neg logit contributions | |
joy | -0.005 |
carriage | -0.004 |
icol | -0.004 |
lair | -0.004 |
lifetime | -0.004 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
joy | +0.326 |
Bye | +0.274 |
goodbye | +0.261 |
Sure | +0.253 |
bye | +0.247 |
Neg logit contributions | |
its | -0.235 |
ters | -0.217 |
aches | -0.205 |
ying | -0.205 |
idy | -0.203 |
Token | was |
Token ID | 373 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
its | +0.699 |
ade | +0.644 |
ters | +0.639 |
aches | +0.620 |
ying | +0.614 |
Neg logit contributions | |
joy | -1.001 |
Bye | -0.891 |
Sure | -0.853 |
icol | -0.841 |
carriage | -0.801 |
Token | glad |
Token ID | 9675 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
its | +0.067 |
ters | +0.061 |
aches | +0.058 |
ade | +0.058 |
ying | +0.058 |
Neg logit contributions | |
joy | -0.113 |
Bye | -0.102 |
Sure | -0.099 |
icol | -0.095 |
carriage | -0.094 |
Token | to |
Token ID | 284 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
joy | +0.422 |
carriage | +0.397 |
icol | +0.394 |
Bye | +0.393 |
spine | +0.378 |
Neg logit contributions | |
ters | -0.227 |
its | -0.219 |
ade | -0.206 |
ying | -0.204 |
aches | -0.194 |
Token | have |
Token ID | 423 |
Feature activation | +8.01e-01 |
Pos logit contributions | |
joy | +0.022 |
Bye | +0.019 |
Sure | +0.019 |
icol | +0.018 |
carriage | +0.018 |
Neg logit contributions | |
its | -0.012 |
ters | -0.011 |
aches | -0.011 |
ade | -0.010 |
ying | -0.010 |
Token | friends |
Token ID | 2460 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
its | +0.045 |
ters | +0.045 |
ade | +0.043 |
aches | +0.041 |
idy | +0.037 |
Neg logit contributions | |
joy | -0.084 |
Bye | -0.078 |
Sure | -0.077 |
icol | -0.075 |
spine | -0.075 |
Token | wanted |
Token ID | 2227 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
joy | +0.054 |
Bye | +0.049 |
Sure | +0.047 |
goodbye | +0.044 |
carriage | +0.044 |
Neg logit contributions | |
its | -0.051 |
ters | -0.048 |
ying | -0.047 |
idy | -0.044 |
aches | -0.043 |
Token | to |
Token ID | 284 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
its | +0.092 |
ters | +0.088 |
ade | +0.086 |
aches | +0.084 |
ying | +0.082 |
Neg logit contributions | |
joy | -0.099 |
Bye | -0.087 |
icol | -0.082 |
Sure | -0.082 |
carriage | -0.081 |
Token | chew |
Token ID | 34722 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
joy | +0.011 |
Bye | +0.010 |
Sure | +0.009 |
goodbye | +0.009 |
carriage | +0.009 |
Neg logit contributions | |
its | -0.009 |
ters | -0.009 |
ying | -0.008 |
idy | -0.008 |
ade | -0.007 |
Token | on |
Token ID | 319 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
its | +0.111 |
ying | +0.098 |
ters | +0.097 |
idy | +0.095 |
aches | +0.094 |
Neg logit contributions | |
joy | -0.125 |
Bye | -0.110 |
goodbye | -0.104 |
Sure | -0.104 |
icol | -0.095 |
Token | the |
Token ID | 262 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
its | +0.131 |
ters | +0.119 |
ying | +0.117 |
ade | +0.113 |
aches | +0.110 |
Neg logit contributions | |
joy | -0.165 |
Bye | -0.147 |
Sure | -0.140 |
goodbye | -0.135 |
icol | -0.133 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.020 |
ying | +0.018 |
aches | +0.016 |
ters | +0.015 |
have | +0.015 |
Neg logit contributions | |
joy | -0.038 |
Bye | -0.034 |
goodbye | -0.033 |
Sure | -0.032 |
carriage | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
its | +0.870 |
ters | +0.769 |
ying | +0.755 |
aches | +0.739 |
idy | +0.736 |
Neg logit contributions | |
joy | -0.827 |
Bye | -0.719 |
Sure | -0.693 |
goodbye | -0.672 |
carriage | -0.659 |
Token | The |
Token ID | 383 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
its | +0.019 |
ters | +0.019 |
ade | +0.017 |
ying | +0.017 |
aches | +0.017 |
Neg logit contributions | |
joy | -0.016 |
Bye | -0.013 |
carriage | -0.012 |
icol | -0.012 |
Sure | -0.012 |
Token | goat |
Token ID | 26917 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
joy | +0.220 |
Bye | +0.182 |
carriage | +0.165 |
goodbye | +0.163 |
Sure | +0.159 |
Neg logit contributions | |
its | -0.334 |
ying | -0.310 |
ters | -0.297 |
aches | -0.296 |
ade | -0.293 |
Token | went |
Token ID | 1816 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
its | +0.128 |
ters | +0.117 |
ade | +0.113 |
aches | +0.111 |
ying | +0.111 |
Neg logit contributions | |
joy | -0.183 |
Bye | -0.163 |
Sure | -0.156 |
icol | -0.150 |
carriage | -0.149 |
Token | to |
Token ID | 284 |
Feature activation | -7.90e-02 |
Pos logit contributions | |
joy | +0.039 |
Bye | +0.035 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.031 |
Neg logit contributions | |
its | -0.033 |
ters | -0.031 |
ade | -0.030 |
ying | -0.030 |
aches | -0.030 |
Token | the |
Token ID | 262 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
joy | +0.010 |
Sure | +0.008 |
Bye | +0.008 |
carriage | +0.008 |
goodbye | +0.008 |
Neg logit contributions | |
its | -0.011 |
ters | -0.011 |
ying | -0.010 |
ade | -0.010 |
idy | -0.009 |
Token | garden |
Token ID | 11376 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
its | +0.032 |
ters | +0.029 |
ying | +0.029 |
aches | +0.028 |
idy | +0.028 |
Neg logit contributions | |
joy | -0.023 |
Bye | -0.020 |
Sure | -0.019 |
carriage | -0.018 |
icol | -0.018 |
Token | to |
Token ID | 284 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
joy | +0.056 |
Bye | +0.052 |
icol | +0.048 |
Sure | +0.048 |
carriage | +0.047 |
Neg logit contributions | |
its | -0.038 |
ters | -0.038 |
ade | -0.035 |
ying | -0.035 |
aches | -0.033 |
Token | find |
Token ID | 1064 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
joy | +0.011 |
Bye | +0.011 |
Sure | +0.010 |
goodbye | +0.010 |
arium | +0.010 |
Neg logit contributions | |
its | -0.011 |
ters | -0.011 |
ying | -0.010 |
idy | -0.010 |
ins | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
its | +0.055 |
ters | +0.047 |
ying | +0.047 |
oving | +0.045 |
aches | +0.045 |
Neg logit contributions | |
joy | -0.059 |
Bye | -0.050 |
Sure | -0.049 |
goodbye | -0.049 |
carriage | -0.047 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
joy | +0.011 |
Bye | +0.009 |
Sure | +0.009 |
carriage | +0.009 |
goodbye | +0.009 |
Neg logit contributions | |
its | -0.008 |
ters | -0.007 |
ying | -0.007 |
idy | -0.007 |
aches | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
its | +0.891 |
ying | +0.769 |
ters | +0.767 |
aches | +0.752 |
idy | +0.744 |
Neg logit contributions | |
joy | -0.809 |
Bye | -0.704 |
Sure | -0.673 |
carriage | -0.656 |
goodbye | -0.653 |
Token | She |
Token ID | 1375 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
its | +0.012 |
ters | +0.011 |
ying | +0.010 |
aches | +0.010 |
ade | +0.010 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.010 |
Sure | -0.010 |
goodbye | -0.009 |
icol | -0.008 |
Token | spotted |
Token ID | 13489 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
its | +0.085 |
ters | +0.079 |
ying | +0.076 |
ade | +0.074 |
aches | +0.074 |
Neg logit contributions | |
joy | -0.097 |
Bye | -0.086 |
Sure | -0.082 |
carriage | -0.078 |
goodbye | -0.078 |
Token | one |
Token ID | 530 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
joy | +0.197 |
Bye | +0.159 |
Sure | +0.158 |
goodbye | +0.157 |
carriage | +0.146 |
Neg logit contributions | |
its | -0.206 |
ying | -0.183 |
ters | -0.175 |
aches | -0.171 |
ade | -0.171 |
Token | that |
Token ID | 326 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
joy | +0.163 |
Sure | +0.142 |
Bye | +0.140 |
goodbye | +0.137 |
carriage | +0.132 |
Neg logit contributions | |
its | -0.151 |
ters | -0.134 |
aches | -0.128 |
ying | -0.128 |
have | -0.126 |
Token |
|
Token ID | 198 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
its | +0.030 |
ters | +0.028 |
ade | +0.027 |
ying | +0.026 |
aches | +0.026 |
Neg logit contributions | |
joy | -0.035 |
Bye | -0.031 |
Sure | -0.029 |
carriage | -0.029 |
goodbye | -0.028 |
Token |
|
Token ID | 198 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
ters | +0.041 |
its | +0.041 |
aches | +0.038 |
ying | +0.038 |
idy | +0.036 |
Neg logit contributions | |
joy | -0.028 |
Sure | -0.025 |
Bye | -0.024 |
arium | -0.022 |
goodbye | -0.021 |
Token | After |
Token ID | 3260 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
its | +0.040 |
ying | +0.037 |
ters | +0.036 |
aches | +0.036 |
ics | +0.034 |
Neg logit contributions | |
joy | -0.033 |
Sure | -0.031 |
Bye | -0.030 |
lifetime | -0.028 |
arium | -0.027 |
Token | eating |
Token ID | 6600 |
Feature activation | +6.83e-01 |
Pos logit contributions | |
its | +0.187 |
ters | +0.173 |
ying | +0.165 |
ade | +0.165 |
aches | +0.163 |
Neg logit contributions | |
joy | -0.232 |
Bye | -0.207 |
Sure | -0.196 |
carriage | -0.189 |
icol | -0.188 |
Token | the |
Token ID | 262 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
its | +0.059 |
ters | +0.054 |
idy | +0.051 |
ying | +0.050 |
ade | +0.049 |
Neg logit contributions | |
joy | -0.058 |
Bye | -0.049 |
Sure | -0.049 |
goodbye | -0.048 |
arium | -0.043 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.021 |
ters | +0.020 |
ba | +0.020 |
ying | +0.019 |
idy | +0.019 |
Neg logit contributions | |
joy | -0.031 |
Sure | -0.025 |
reminder | -0.025 |
goodbye | -0.025 |
sight | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | +3.93e-01 |
Pos logit contributions | |
its | +0.868 |
ters | +0.791 |
ying | +0.760 |
aches | +0.748 |
ade | +0.746 |
Neg logit contributions | |
joy | -0.832 |
Bye | -0.722 |
Sure | -0.698 |
goodbye | -0.661 |
carriage | -0.649 |
Token | Benny |
Token ID | 44275 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
its | +0.031 |
ters | +0.028 |
ying | +0.027 |
aches | +0.027 |
ade | +0.027 |
Neg logit contributions | |
joy | -0.036 |
Bye | -0.032 |
Sure | -0.031 |
goodbye | -0.029 |
icol | -0.029 |
Token | felt |
Token ID | 2936 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
its | +0.228 |
ters | +0.210 |
ying | +0.201 |
ade | +0.199 |
aches | +0.197 |
Neg logit contributions | |
joy | -0.275 |
Bye | -0.244 |
Sure | -0.233 |
carriage | -0.222 |
goodbye | -0.222 |
Token | very |
Token ID | 845 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
joy | +0.015 |
Bye | +0.013 |
goodbye | +0.013 |
Sure | +0.012 |
carriage | +0.011 |
Neg logit contributions | |
its | -0.012 |
ters | -0.012 |
ying | -0.011 |
idy | -0.011 |
ade | -0.011 |
Token | sleepy |
Token ID | 42023 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
joy | +0.020 |
Bye | +0.018 |
goodbye | +0.017 |
Sure | +0.016 |
bye | +0.015 |
Neg logit contributions | |
ters | -0.018 |
its | -0.018 |
ying | -0.016 |
idy | -0.016 |
ade | -0.016 |
Token | , |
Token ID | 11 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
joy | +0.042 |
Bye | +0.039 |
Sure | +0.036 |
icol | +0.035 |
carriage | +0.035 |
Neg logit contributions | |
its | -0.032 |
ters | -0.031 |
ade | -0.029 |
ying | -0.029 |
aches | -0.028 |
Token | she |
Token ID | 673 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
its | +0.023 |
ters | +0.023 |
ying | +0.021 |
ade | +0.020 |
idy | +0.020 |
Neg logit contributions | |
joy | -0.047 |
Bye | -0.044 |
Sure | -0.042 |
carriage | -0.041 |
icol | -0.041 |
Token | noticed |
Token ID | 6810 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
its | +0.080 |
ters | +0.077 |
ade | +0.075 |
aches | +0.073 |
ying | +0.072 |
Neg logit contributions | |
joy | -0.087 |
Bye | -0.081 |
Sure | -0.076 |
icol | -0.073 |
goodbye | -0.072 |
Token | a |
Token ID | 257 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
joy | +0.014 |
Bye | +0.012 |
Sure | +0.012 |
goodbye | +0.011 |
carriage | +0.011 |
Neg logit contributions | |
its | -0.012 |
ters | -0.010 |
ying | -0.010 |
aches | -0.010 |
ade | -0.010 |
Token | big |
Token ID | 1263 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
joy | +0.012 |
Bye | +0.011 |
Sure | +0.011 |
carriage | +0.010 |
icol | +0.010 |
Neg logit contributions | |
its | -0.008 |
ters | -0.007 |
ying | -0.007 |
aches | -0.006 |
ade | -0.006 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.098 |
ters | +0.092 |
ade | +0.090 |
ying | +0.085 |
aches | +0.084 |
Neg logit contributions | |
joy | -0.149 |
Bye | -0.139 |
Sure | -0.134 |
habitats | -0.128 |
goodbye | -0.125 |
Token | . |
Token ID | 13 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
its | +0.782 |
ying | +0.676 |
ters | +0.675 |
aches | +0.664 |
idy | +0.658 |
Neg logit contributions | |
joy | -0.904 |
Bye | -0.789 |
carriage | -0.745 |
Sure | -0.745 |
goodbye | -0.734 |
Token | She |
Token ID | 1375 |
Feature activation | +9.43e-01 |
Pos logit contributions | |
its | +0.008 |
ters | +0.008 |
she | +0.008 |
ying | +0.007 |
idy | +0.007 |
Neg logit contributions | |
joy | -0.015 |
Bye | -0.013 |
carriage | -0.013 |
habitats | -0.013 |
lair | -0.013 |
Token | felt |
Token ID | 2936 |
Feature activation | -2.51e-01 |
Pos logit contributions | |
its | +0.071 |
ters | +0.067 |
ying | +0.065 |
ade | +0.062 |
aches | +0.061 |
Neg logit contributions | |
joy | -0.086 |
Bye | -0.077 |
Sure | -0.074 |
carriage | -0.070 |
goodbye | -0.070 |
Token | so |
Token ID | 523 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
joy | +0.022 |
goodbye | +0.019 |
Bye | +0.018 |
Sure | +0.017 |
content | +0.016 |
Neg logit contributions | |
its | -0.020 |
ters | -0.019 |
ying | -0.019 |
ikes | -0.019 |
ade | -0.019 |
Token | excited |
Token ID | 6568 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
ters | +0.231 |
its | +0.204 |
ying | +0.192 |
idy | +0.191 |
aches | +0.190 |
Neg logit contributions | |
joy | -0.230 |
Bye | -0.196 |
goodbye | -0.193 |
Sure | -0.191 |
content | -0.173 |
Token | girl |
Token ID | 2576 |
Feature activation | +6.95e-01 |
Pos logit contributions | |
its | +0.045 |
ters | +0.040 |
aches | +0.040 |
ying | +0.040 |
ade | +0.039 |
Neg logit contributions | |
joy | -0.040 |
Bye | -0.034 |
goodbye | -0.032 |
Sure | -0.032 |
carriage | -0.031 |
Token | never |
Token ID | 1239 |
Feature activation | -6.09e+00 |
Pos logit contributions | |
its | +0.038 |
aches | +0.036 |
ade | +0.036 |
ters | +0.034 |
idy | +0.032 |
Neg logit contributions | |
joy | -0.076 |
spine | -0.066 |
Bye | -0.065 |
Sure | -0.065 |
habitats | -0.064 |
Token | forgot |
Token ID | 16453 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
joy | +0.579 |
Sure | +0.533 |
Bye | +0.525 |
carriage | +0.513 |
icol | +0.513 |
Neg logit contributions | |
its | -0.383 |
ade | -0.369 |
ters | -0.355 |
meant | -0.347 |
aches | -0.343 |
Token | her |
Token ID | 607 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
joy | +0.103 |
Bye | +0.093 |
Sure | +0.090 |
icol | +0.086 |
carriage | +0.086 |
Neg logit contributions | |
its | -0.067 |
ters | -0.061 |
ying | -0.059 |
ade | -0.058 |
aches | -0.058 |
Token | special |
Token ID | 2041 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
its | +0.081 |
ters | +0.073 |
ying | +0.069 |
ade | +0.069 |
aches | +0.068 |
Neg logit contributions | |
joy | -0.132 |
Bye | -0.119 |
Sure | -0.114 |
carriage | -0.110 |
icol | -0.110 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.072 |
ters | +0.065 |
ying | +0.061 |
ade | +0.060 |
aches | +0.059 |
Neg logit contributions | |
joy | -0.144 |
Bye | -0.131 |
Sure | -0.126 |
carriage | -0.121 |
goodbye | -0.121 |
Token | . |
Token ID | 13 |
Feature activation | +5.15e-01 |
Pos logit contributions | |
ters | +0.692 |
its | +0.683 |
ade | +0.672 |
ying | +0.652 |
aches | +0.651 |
Neg logit contributions | |
joy | -0.910 |
Bye | -0.854 |
Sure | -0.809 |
icol | -0.794 |
habitats | -0.760 |
Token | As |
Token ID | 1081 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
its | +0.020 |
she | +0.018 |
ying | +0.017 |
ters | +0.017 |
idy | +0.016 |
Neg logit contributions | |
joy | -0.060 |
carriage | -0.057 |
lair | -0.055 |
icol | -0.054 |
spine | -0.053 |
Token | she |
Token ID | 673 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
joy | +0.155 |
Bye | +0.153 |
icol | +0.148 |
lair | +0.146 |
carriage | +0.145 |
Neg logit contributions | |
its | -0.038 |
idy | -0.037 |
aches | -0.037 |
ade | -0.036 |
ying | -0.035 |
Token | grew |
Token ID | 6348 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
its | +0.069 |
ade | +0.062 |
aches | +0.061 |
ters | +0.057 |
ying | +0.054 |
Neg logit contributions | |
joy | -0.115 |
Bye | -0.101 |
Sure | -0.098 |
spine | -0.097 |
icol | -0.095 |
Token | older |
Token ID | 4697 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
joy | +0.267 |
goodbye | +0.225 |
Bye | +0.222 |
Sure | +0.220 |
carriage | +0.214 |
Neg logit contributions | |
its | -0.141 |
ters | -0.123 |
ade | -0.111 |
idy | -0.110 |
ying | -0.108 |
Token | ™ |
Token ID | 8151 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
its | +0.215 |
ters | +0.203 |
ade | +0.200 |
ics | +0.192 |
ying | +0.188 |
Neg logit contributions | |
joy | -0.285 |
Bye | -0.258 |
carriage | -0.253 |
goodbye | -0.252 |
spine | -0.251 |
Token | ve |
Token ID | 303 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
its | +0.033 |
ters | +0.030 |
ying | +0.029 |
ade | +0.028 |
aches | +0.028 |
Neg logit contributions | |
joy | -0.043 |
Bye | -0.038 |
Sure | -0.036 |
goodbye | -0.035 |
carriage | -0.035 |
Token | sent |
Token ID | 1908 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
its | +0.199 |
ters | +0.185 |
ying | +0.178 |
ade | +0.176 |
aches | +0.174 |
Neg logit contributions | |
joy | -0.215 |
Bye | -0.190 |
Sure | -0.180 |
carriage | -0.172 |
icol | -0.171 |
Token | you |
Token ID | 345 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
joy | +0.224 |
Bye | +0.202 |
Sure | +0.191 |
goodbye | +0.186 |
carriage | +0.182 |
Neg logit contributions | |
its | -0.173 |
ters | -0.158 |
ying | -0.152 |
ade | -0.150 |
aches | -0.148 |
Token | this |
Token ID | 428 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
joy | +0.154 |
Bye | +0.138 |
Sure | +0.134 |
icol | +0.131 |
carriage | +0.127 |
Neg logit contributions | |
its | -0.100 |
ters | -0.095 |
ade | -0.090 |
aches | -0.090 |
ying | -0.089 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
joy | +0.127 |
Bye | +0.109 |
Sure | +0.108 |
goodbye | +0.107 |
arium | +0.101 |
Neg logit contributions | |
its | -0.084 |
ters | -0.077 |
ying | -0.072 |
aches | -0.070 |
organ | -0.070 |
Token | . |
Token ID | 13 |
Feature activation | +4.10e-01 |
Pos logit contributions | |
its | +0.721 |
ters | +0.688 |
ade | +0.658 |
ying | +0.646 |
aches | +0.639 |
Neg logit contributions | |
joy | -0.950 |
Bye | -0.841 |
Sure | -0.803 |
icol | -0.772 |
carriage | -0.759 |
Token | I |
Token ID | 314 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
its | +0.035 |
ters | +0.034 |
ying | +0.032 |
ade | +0.031 |
aches | +0.031 |
Neg logit contributions | |
joy | -0.033 |
Bye | -0.028 |
Sure | -0.026 |
carriage | -0.026 |
icol | -0.025 |
Token | hope |
Token ID | 2911 |
Feature activation | -4.66e+00 |
Pos logit contributions | |
joy | +0.265 |
Bye | +0.238 |
Sure | +0.228 |
carriage | +0.218 |
goodbye | +0.218 |
Neg logit contributions | |
its | -0.186 |
ters | -0.171 |
ying | -0.163 |
ade | -0.160 |
aches | -0.159 |
Token | you |
Token ID | 345 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
joy | +0.477 |
Bye | +0.426 |
Sure | +0.415 |
icol | +0.404 |
carriage | +0.397 |
Neg logit contributions | |
its | -0.290 |
ters | -0.271 |
ying | -0.262 |
aches | -0.259 |
ade | -0.256 |
Token | like |
Token ID | 588 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
joy | +0.160 |
Bye | +0.142 |
Sure | +0.137 |
icol | +0.132 |
carriage | +0.129 |
Neg logit contributions | |
its | -0.100 |
ters | -0.092 |
ade | -0.086 |
aches | -0.086 |
ying | -0.084 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
joy | +0.063 |
Bye | +0.058 |
icol | +0.058 |
Sure | +0.055 |
carriage | +0.054 |
Neg logit contributions | |
its | -0.038 |
ters | -0.037 |
ying | -0.034 |
ade | -0.034 |
aches | -0.032 |
Token | The |
Token ID | 383 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
its | +0.019 |
ters | +0.018 |
ying | +0.018 |
ade | +0.017 |
aches | +0.017 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.009 |
Sure | -0.009 |
goodbye | -0.008 |
carriage | -0.008 |
Token | bird |
Token ID | 6512 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
joy | +0.312 |
Bye | +0.264 |
goodbye | +0.254 |
carriage | +0.251 |
Sure | +0.245 |
Neg logit contributions | |
its | -0.238 |
ying | -0.206 |
idy | -0.198 |
ters | -0.194 |
aches | -0.190 |
Token | saw |
Token ID | 2497 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
its | +0.024 |
ters | +0.022 |
ying | +0.021 |
ade | +0.020 |
idy | +0.020 |
Neg logit contributions | |
joy | -0.021 |
Bye | -0.018 |
Sure | -0.017 |
arium | -0.017 |
carriage | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
joy | +0.295 |
Bye | +0.263 |
Sure | +0.243 |
goodbye | +0.242 |
arium | +0.228 |
Neg logit contributions | |
its | -0.319 |
ters | -0.289 |
ying | -0.285 |
ade | -0.282 |
idy | -0.279 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
its | +0.022 |
ying | +0.019 |
affles | +0.018 |
aches | +0.018 |
oons | +0.017 |
Neg logit contributions | |
joy | -0.037 |
Bye | -0.029 |
spine | -0.029 |
goodbye | -0.028 |
Sure | -0.028 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
its | +0.915 |
ters | +0.825 |
ying | +0.805 |
idy | +0.802 |
aches | +0.796 |
Neg logit contributions | |
joy | -0.755 |
Bye | -0.636 |
goodbye | -0.602 |
Sure | -0.601 |
arium | -0.581 |
Token | thought |
Token ID | 1807 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
joy | +0.009 |
Bye | +0.008 |
Sure | +0.008 |
goodbye | +0.007 |
carriage | +0.007 |
Neg logit contributions | |
its | -0.008 |
ters | -0.007 |
ying | -0.007 |
ade | -0.007 |
idy | -0.007 |
Token | it |
Token ID | 340 |
Feature activation | -2.25e-01 |
Pos logit contributions | |
its | +0.093 |
ters | +0.088 |
ying | +0.080 |
ade | +0.079 |
idy | +0.079 |
Neg logit contributions | |
joy | -0.102 |
Bye | -0.088 |
goodbye | -0.086 |
Sure | -0.086 |
carriage | -0.079 |
Token | was |
Token ID | 373 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
joy | +0.014 |
Bye | +0.013 |
Sure | +0.013 |
arium | +0.012 |
goodbye | +0.011 |
Neg logit contributions | |
its | -0.021 |
ters | -0.020 |
ying | -0.020 |
aches | -0.019 |
idy | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | -4.84e-02 |
Pos logit contributions | |
its | +0.102 |
ying | +0.093 |
ters | +0.088 |
idy | +0.086 |
ade | +0.085 |
Neg logit contributions | |
joy | -0.112 |
Bye | -0.096 |
goodbye | -0.091 |
lair | -0.088 |
arium | -0.086 |
Token | funny |
Token ID | 8258 |
Feature activation | +3.50e+00 |
Pos logit contributions | |
its | +0.001 |
ters | +0.001 |
ying | +0.001 |
ade | +0.001 |
aches | +0.001 |
Neg logit contributions | |
joy | -0.001 |
Bye | -0.001 |
Sure | -0.001 |
carriage | -0.001 |
goodbye | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +3.93e-01 |
Pos logit contributions | |
its | +0.277 |
ters | +0.255 |
ying | +0.254 |
aches | +0.246 |
idy | +0.244 |
Neg logit contributions | |
joy | -0.316 |
Bye | -0.266 |
Sure | -0.249 |
goodbye | -0.249 |
icol | -0.244 |
Token | It |
Token ID | 632 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
its | +0.030 |
ters | +0.027 |
ying | +0.026 |
ade | +0.026 |
aches | +0.025 |
Neg logit contributions | |
joy | -0.034 |
Bye | -0.030 |
carriage | -0.029 |
lifetime | -0.028 |
Sure | -0.028 |
Token | was |
Token ID | 373 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
joy | +0.042 |
Bye | +0.038 |
Sure | +0.037 |
icol | +0.033 |
carriage | +0.033 |
Neg logit contributions | |
its | -0.055 |
ying | -0.053 |
ters | -0.050 |
aches | -0.049 |
affles | -0.048 |
Token | a |
Token ID | 257 |
Feature activation | -5.21e-02 |
Pos logit contributions | |
its | +0.101 |
ying | +0.092 |
ters | +0.090 |
ade | +0.088 |
aches | +0.087 |
Neg logit contributions | |
joy | -0.117 |
Bye | -0.103 |
Sure | -0.097 |
goodbye | -0.095 |
icol | -0.093 |
Token | squash |
Token ID | 34613 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
joy | +0.005 |
Bye | +0.005 |
Sure | +0.005 |
goodbye | +0.005 |
carriage | +0.005 |
Neg logit contributions | |
its | -0.003 |
ters | -0.003 |
ade | -0.003 |
aches | -0.003 |
ying | -0.003 |
Token | ! |
Token ID | 0 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
its | +0.831 |
ters | +0.754 |
ying | +0.740 |
aches | +0.723 |
ade | +0.716 |
Neg logit contributions | |
joy | -0.859 |
Bye | -0.760 |
Sure | -0.717 |
carriage | -0.693 |
goodbye | -0.683 |
Token | It |
Token ID | 632 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
joy | +0.110 |
Bye | +0.098 |
Sure | +0.092 |
carriage | +0.092 |
icol | +0.090 |
Neg logit contributions | |
its | -0.097 |
ters | -0.088 |
ying | -0.085 |
ade | -0.085 |
aches | -0.083 |
Token | was |
Token ID | 373 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
joy | +0.037 |
Sure | +0.034 |
Bye | +0.034 |
icol | +0.030 |
arium | +0.029 |
Neg logit contributions | |
its | -0.054 |
ying | -0.054 |
ters | -0.049 |
affles | -0.048 |
aches | -0.048 |
Token | orange |
Token ID | 10912 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
its | +0.107 |
ying | +0.101 |
ade | +0.095 |
ters | +0.095 |
idy | +0.093 |
Neg logit contributions | |
joy | -0.112 |
Bye | -0.096 |
Sure | -0.090 |
goodbye | -0.089 |
icol | -0.087 |
Token | and |
Token ID | 290 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
its | +0.176 |
ying | +0.157 |
ters | +0.157 |
aches | +0.155 |
have | +0.150 |
Neg logit contributions | |
joy | -0.159 |
Bye | -0.137 |
Sure | -0.129 |
icol | -0.124 |
goodbye | -0.124 |
Token | " |
Token ID | 366 |
Feature activation | +4.28e-02 |
Pos logit contributions | |
joy | +0.056 |
habitats | +0.052 |
lair | +0.051 |
icol | +0.050 |
arium | +0.049 |
Neg logit contributions | |
ters | -0.029 |
its | -0.025 |
whip | -0.024 |
ying | -0.023 |
ble | -0.023 |
Token | You |
Token ID | 1639 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
ters | +0.002 |
its | +0.002 |
have | +0.002 |
ying | +0.002 |
idy | +0.002 |
Neg logit contributions | |
joy | -0.005 |
icol | -0.004 |
spine | -0.004 |
carriage | -0.004 |
lair | -0.004 |
Token | 're |
Token ID | 821 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
its | +0.108 |
ters | +0.096 |
ying | +0.089 |
ade | +0.088 |
aches | +0.086 |
Neg logit contributions | |
joy | -0.249 |
Bye | -0.228 |
Sure | -0.219 |
carriage | -0.212 |
goodbye | -0.212 |
Token | welcome |
Token ID | 7062 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
its | +0.144 |
ters | +0.142 |
ying | +0.130 |
aches | +0.129 |
ics | +0.122 |
Neg logit contributions | |
joy | -0.257 |
Sure | -0.232 |
Bye | -0.224 |
icol | -0.224 |
habitats | -0.218 |
Token | . |
Token ID | 13 |
Feature activation | -6.82e-01 |
Pos logit contributions | |
joy | +0.145 |
Sure | +0.138 |
habitats | +0.134 |
Bye | +0.134 |
spine | +0.133 |
Neg logit contributions | |
ters | -0.077 |
its | -0.069 |
ying | -0.062 |
ade | -0.060 |
aches | -0.057 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.071 |
carriage | +0.063 |
lair | +0.063 |
lifetime | +0.061 |
arium | +0.060 |
Neg logit contributions | |
ters | -0.039 |
matters | -0.033 |
its | -0.030 |
ying | -0.028 |
have | -0.028 |
Token | - |
Token ID | 12 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
joy | +1.109 |
lair | +1.109 |
doorway | +1.037 |
nowhere | +1.009 |
habitats | +0.998 |
Neg logit contributions | |
ters | -0.650 |
bles | -0.504 |
ade | -0.495 |
its | -0.493 |
do | -0.471 |
Token | bye |
Token ID | 16390 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
joy | +0.241 |
lair | +0.202 |
icol | +0.182 |
habitats | +0.179 |
arium | +0.177 |
Neg logit contributions | |
ters | -0.436 |
qu | -0.396 |
its | -0.394 |
ade | -0.394 |
aches | -0.389 |
Token | ." |
Token ID | 526 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
joy | +1.140 |
Sure | +1.103 |
Bye | +1.051 |
lair | +1.027 |
habitats | +1.026 |
Neg logit contributions | |
ters | -0.611 |
its | -0.455 |
ying | -0.435 |
ade | -0.399 |
idy | -0.396 |
Token |
|
Token ID | 198 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
joy | +0.012 |
lifetime | +0.011 |
cle | +0.010 |
lair | +0.010 |
icol | +0.010 |
Neg logit contributions | |
ters | -0.007 |
its | -0.005 |
ade | -0.005 |
she | -0.005 |
ying | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -3.83e-01 |
Pos logit contributions | |
joy | +0.039 |
Bye | +0.034 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.032 |
Neg logit contributions | |
its | -0.030 |
ters | -0.027 |
ade | -0.026 |
ying | -0.026 |
aches | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
joy | +0.145 |
Bye | +0.125 |
Sure | +0.117 |
icol | +0.111 |
carriage | +0.110 |
Neg logit contributions | |
its | -0.187 |
ters | -0.177 |
ying | -0.170 |
ade | -0.168 |
aches | -0.167 |
Token | hug |
Token ID | 16225 |
Feature activation | -4.59e+00 |
Pos logit contributions | |
joy | +0.137 |
Bye | +0.116 |
Sure | +0.115 |
icol | +0.114 |
carriage | +0.109 |
Neg logit contributions | |
its | -0.071 |
aches | -0.068 |
ters | -0.066 |
ade | -0.062 |
ying | -0.060 |
Token | you |
Token ID | 345 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
joy | +0.486 |
Bye | +0.427 |
Sure | +0.423 |
icol | +0.411 |
carriage | +0.407 |
Neg logit contributions | |
its | -0.275 |
ters | -0.270 |
aches | -0.239 |
ying | -0.238 |
idy | -0.230 |
Token | too |
Token ID | 1165 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
joy | +0.204 |
Bye | +0.177 |
icol | +0.177 |
Sure | +0.177 |
carriage | +0.166 |
Neg logit contributions | |
ters | -0.127 |
its | -0.126 |
ying | -0.112 |
aches | -0.109 |
ade | -0.108 |
Token | . |
Token ID | 13 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
joy | +0.281 |
icol | +0.251 |
Sure | +0.250 |
Bye | +0.250 |
carriage | +0.243 |
Neg logit contributions | |
its | -0.143 |
ters | -0.129 |
ying | -0.116 |
ade | -0.115 |
aches | -0.114 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.109 |
carriage | +0.091 |
lifetime | +0.091 |
lair | +0.089 |
arium | +0.086 |
Neg logit contributions | |
ters | -0.075 |
its | -0.066 |
matters | -0.063 |
First | -0.061 |
have | -0.059 |
Token | for |
Token ID | 329 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
joy | +1.213 |
lair | +1.154 |
lifetime | +1.088 |
habitats | +1.075 |
generation | +1.065 |
Neg logit contributions | |
ters | -0.580 |
its | -0.488 |
ade | -0.479 |
ying | -0.451 |
do | -0.414 |
Token | now |
Token ID | 783 |
Feature activation | -3.84e+00 |
Pos logit contributions | |
joy | +0.402 |
Sure | +0.371 |
icol | +0.350 |
carriage | +0.342 |
Bye | +0.341 |
Neg logit contributions | |
its | -0.218 |
ters | -0.204 |
aches | -0.193 |
have | -0.175 |
happen | -0.175 |
Token | ." |
Token ID | 526 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
joy | +0.397 |
Bye | +0.345 |
Sure | +0.342 |
carriage | +0.323 |
icol | +0.323 |
Neg logit contributions | |
its | -0.249 |
ters | -0.237 |
ying | -0.217 |
ade | -0.213 |
aches | -0.207 |
Token |
|
Token ID | 198 |
Feature activation | -5.67e-01 |
Pos logit contributions | |
joy | +0.038 |
lifetime | +0.037 |
habitats | +0.036 |
icol | +0.035 |
spine | +0.035 |
Neg logit contributions | |
its | -0.009 |
she | -0.009 |
ters | -0.009 |
ade | -0.008 |
First | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
joy | +0.054 |
Bye | +0.048 |
Sure | +0.045 |
icol | +0.045 |
carriage | +0.044 |
Neg logit contributions | |
its | -0.041 |
ters | -0.037 |
ade | -0.036 |
ying | -0.036 |
aches | -0.035 |
Token | good |
Token ID | 922 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
its | +0.075 |
ters | +0.069 |
ade | +0.063 |
aches | +0.063 |
ying | +0.061 |
Neg logit contributions | |
joy | -0.147 |
Bye | -0.132 |
Sure | -0.128 |
spine | -0.126 |
lair | -0.126 |
Token | care |
Token ID | 1337 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
its | +0.087 |
ters | +0.078 |
ade | +0.076 |
ying | +0.073 |
aches | +0.073 |
Neg logit contributions | |
joy | -0.112 |
Bye | -0.101 |
Sure | -0.099 |
carriage | -0.094 |
arium | -0.093 |
Token | of |
Token ID | 286 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
joy | +0.253 |
Bye | +0.230 |
Sure | +0.222 |
icol | +0.216 |
carriage | +0.213 |
Neg logit contributions | |
its | -0.119 |
ters | -0.109 |
ying | -0.103 |
ade | -0.101 |
aches | -0.098 |
Token | it |
Token ID | 340 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
its | +0.068 |
ters | +0.063 |
ying | +0.059 |
aches | +0.059 |
ade | +0.058 |
Neg logit contributions | |
joy | -0.114 |
Bye | -0.102 |
Sure | -0.099 |
icol | -0.095 |
carriage | -0.094 |
Token | . |
Token ID | 13 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
joy | +0.050 |
Bye | +0.045 |
Sure | +0.043 |
carriage | +0.041 |
goodbye | +0.041 |
Neg logit contributions | |
its | -0.036 |
ters | -0.033 |
ying | -0.032 |
ade | -0.031 |
aches | -0.031 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
ters | +0.013 |
its | +0.013 |
ying | +0.012 |
she | +0.011 |
idy | +0.011 |
Neg logit contributions | |
joy | -0.017 |
lair | -0.014 |
carriage | -0.013 |
spine | -0.013 |
habitats | -0.013 |
Token | !" |
Token ID | 2474 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
joy | +0.865 |
lair | +0.791 |
arium | +0.730 |
habitats | +0.717 |
Sure | +0.701 |
Neg logit contributions | |
ters | -0.916 |
its | -0.837 |
ade | -0.801 |
aches | -0.776 |
ble | -0.772 |
Token |
|
Token ID | 198 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
its | +0.080 |
ters | +0.078 |
ics | +0.072 |
ying | +0.070 |
she | +0.069 |
Neg logit contributions | |
joy | -0.156 |
lair | -0.140 |
icol | -0.134 |
carriage | -0.133 |
habitats | -0.132 |
Token |
|
Token ID | 198 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
its | +0.024 |
ters | +0.022 |
ying | +0.021 |
ade | +0.021 |
aches | +0.021 |
Neg logit contributions | |
joy | -0.030 |
Bye | -0.027 |
Sure | -0.026 |
icol | -0.025 |
carriage | -0.025 |
Token | John |
Token ID | 7554 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
its | +0.027 |
ters | +0.025 |
ying | +0.024 |
ade | +0.024 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.030 |
Bye | -0.027 |
Sure | -0.026 |
carriage | -0.024 |
goodbye | -0.024 |
Token | smiled |
Token ID | 13541 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
its | +0.048 |
ters | +0.045 |
ade | +0.043 |
aches | +0.042 |
idy | +0.041 |
Neg logit contributions | |
joy | -0.069 |
Bye | -0.059 |
Sure | -0.058 |
icol | -0.056 |
lair | -0.054 |
Token | fun |
Token ID | 1257 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
joy | +0.306 |
Sure | +0.280 |
spine | +0.276 |
carriage | +0.271 |
Bye | +0.265 |
Neg logit contributions | |
ade | -0.102 |
its | -0.101 |
ters | -0.094 |
aches | -0.091 |
matters | -0.090 |
Token | with |
Token ID | 351 |
Feature activation | -9.04e-01 |
Pos logit contributions | |
its | +0.026 |
ters | +0.025 |
ying | +0.022 |
ade | +0.021 |
aches | +0.021 |
Neg logit contributions | |
joy | -0.046 |
Sure | -0.043 |
Bye | -0.042 |
icol | -0.041 |
carriage | -0.040 |
Token | the |
Token ID | 262 |
Feature activation | -4.63e-01 |
Pos logit contributions | |
joy | +0.096 |
Sure | +0.085 |
Bye | +0.084 |
icol | +0.083 |
spine | +0.082 |
Neg logit contributions | |
its | -0.055 |
ters | -0.054 |
aches | -0.050 |
ying | -0.048 |
idy | -0.047 |
Token | sail |
Token ID | 14936 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
joy | +0.042 |
Bye | +0.036 |
Sure | +0.034 |
carriage | +0.034 |
goodbye | +0.033 |
Neg logit contributions | |
its | -0.037 |
ters | -0.034 |
ying | -0.032 |
ade | -0.032 |
aches | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
joy | +0.062 |
Bye | +0.053 |
icol | +0.053 |
Sure | +0.052 |
habitats | +0.049 |
Neg logit contributions | |
ters | -0.044 |
its | -0.040 |
ade | -0.040 |
ying | -0.038 |
idy | -0.036 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.074 |
carriage | +0.062 |
lair | +0.062 |
lifetime | +0.059 |
spine | +0.059 |
Neg logit contributions | |
ters | -0.054 |
its | -0.050 |
matters | -0.046 |
Those | -0.043 |
ikes | -0.042 |
Token | - |
Token ID | 12 |
Feature activation | -4.06e+00 |
Pos logit contributions | |
joy | +1.110 |
lair | +1.076 |
doorway | +0.997 |
habitats | +0.986 |
generation | +0.964 |
Neg logit contributions | |
ters | -0.685 |
its | -0.557 |
ade | -0.540 |
bles | -0.532 |
ble | -0.519 |
Token | bye |
Token ID | 16390 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
joy | +0.228 |
lair | +0.176 |
icol | +0.158 |
habitats | +0.155 |
arium | +0.154 |
Neg logit contributions | |
ters | -0.450 |
its | -0.423 |
ade | -0.419 |
qu | -0.412 |
aches | -0.411 |
Token | ." |
Token ID | 526 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
joy | +1.187 |
Sure | +1.154 |
Bye | +1.090 |
habitats | +1.074 |
lair | +1.067 |
Neg logit contributions | |
ters | -0.568 |
its | -0.411 |
ying | -0.377 |
ade | -0.349 |
idy | -0.348 |
Token | The |
Token ID | 383 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
joy | +0.014 |
lifetime | +0.013 |
lair | +0.013 |
carriage | +0.012 |
habitats | +0.012 |
Neg logit contributions | |
ters | -0.007 |
she | -0.006 |
its | -0.006 |
squash | -0.006 |
ics | -0.005 |
Token | man |
Token ID | 582 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
joy | +0.379 |
Bye | +0.347 |
Sure | +0.343 |
icol | +0.330 |
habitats | +0.313 |
Neg logit contributions | |
its | -0.277 |
ters | -0.256 |
ying | -0.242 |
ade | -0.241 |
aches | -0.238 |
Token | " |
Token ID | 1 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
joy | +0.045 |
Bye | +0.040 |
Sure | +0.038 |
icol | +0.037 |
goodbye | +0.037 |
Neg logit contributions | |
its | -0.031 |
ters | -0.028 |
ying | -0.027 |
ade | -0.027 |
aches | -0.026 |
Token | Okay |
Token ID | 16454 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
its | +0.140 |
ying | +0.129 |
ters | +0.128 |
ade | +0.126 |
aches | +0.125 |
Neg logit contributions | |
joy | -0.136 |
Bye | -0.122 |
Sure | -0.115 |
carriage | -0.106 |
goodbye | -0.106 |
Token | , |
Token ID | 11 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
joy | +0.345 |
Bye | +0.306 |
Sure | +0.298 |
habitats | +0.291 |
carriage | +0.285 |
Neg logit contributions | |
its | -0.200 |
ters | -0.193 |
aches | -0.174 |
ying | -0.173 |
ade | -0.173 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
joy | +0.028 |
Bye | +0.023 |
Sure | +0.023 |
icol | +0.023 |
habitats | +0.023 |
Neg logit contributions | |
ters | -0.020 |
its | -0.019 |
aches | -0.018 |
ying | -0.017 |
idea | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | -8.26e-01 |
Pos logit contributions | |
joy | +0.221 |
Bye | +0.200 |
Sure | +0.196 |
icol | +0.192 |
carriage | +0.185 |
Neg logit contributions | |
its | -0.088 |
ters | -0.085 |
ade | -0.076 |
ying | -0.075 |
aches | -0.073 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.085 |
lair | +0.074 |
carriage | +0.071 |
lifetime | +0.068 |
habitats | +0.067 |
Neg logit contributions | |
ters | -0.052 |
do | -0.040 |
its | -0.039 |
ikes | -0.038 |
rake | -0.036 |
Token | , |
Token ID | 11 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
joy | +1.257 |
lair | +1.135 |
habitats | +1.109 |
lifetime | +1.060 |
doorway | +1.041 |
Neg logit contributions | |
ters | -0.536 |
its | -0.450 |
ade | -0.427 |
aches | -0.406 |
idea | -0.401 |
Token | ostr |
Token ID | 42387 |
Feature activation | -8.75e-02 |
Pos logit contributions | |
joy | +0.035 |
Sure | +0.030 |
Bye | +0.029 |
icol | +0.029 |
lair | +0.028 |
Neg logit contributions | |
its | -0.025 |
ters | -0.024 |
aches | -0.023 |
ying | -0.022 |
idy | -0.022 |
Token | ich |
Token ID | 488 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
joy | +0.007 |
Bye | +0.007 |
Sure | +0.006 |
goodbye | +0.006 |
icol | +0.006 |
Neg logit contributions | |
its | -0.007 |
ters | -0.007 |
aches | -0.007 |
ble | -0.006 |
ying | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
joy | +0.401 |
icol | +0.345 |
Sure | +0.341 |
Bye | +0.335 |
habitats | +0.335 |
Neg logit contributions | |
ters | -0.151 |
its | -0.129 |
ade | -0.118 |
aches | -0.110 |
ying | -0.109 |
Token | We |
Token ID | 775 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
joy | +0.090 |
lair | +0.076 |
carriage | +0.073 |
lifetime | +0.070 |
habitats | +0.069 |
Neg logit contributions | |
ters | -0.060 |
its | -0.049 |
do | -0.046 |
matters | -0.046 |
seem | -0.045 |
Token | to |
Token ID | 284 |
Feature activation | -6.05e-01 |
Pos logit contributions | |
its | +0.146 |
ters | +0.140 |
ade | +0.133 |
aches | +0.131 |
idy | +0.130 |
Neg logit contributions | |
joy | -0.183 |
Bye | -0.157 |
Sure | -0.153 |
icol | -0.148 |
carriage | -0.146 |
Token | be |
Token ID | 307 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
joy | +0.065 |
Sure | +0.055 |
Bye | +0.054 |
icol | +0.052 |
spine | +0.049 |
Neg logit contributions | |
its | -0.038 |
aches | -0.036 |
ters | -0.034 |
ade | -0.032 |
ics | -0.032 |
Token | his |
Token ID | 465 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
joy | +0.145 |
Sure | +0.139 |
Bye | +0.133 |
spine | +0.131 |
icol | +0.131 |
Neg logit contributions | |
ters | -0.077 |
aches | -0.071 |
its | -0.068 |
have | -0.066 |
sure | -0.066 |
Token | friends |
Token ID | 2460 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
joy | +0.127 |
icol | +0.113 |
Bye | +0.112 |
Sure | +0.112 |
spine | +0.102 |
Neg logit contributions | |
ters | -0.077 |
its | -0.077 |
idea | -0.070 |
idy | -0.066 |
aches | -0.066 |
Token | . |
Token ID | 13 |
Feature activation | -8.75e-01 |
Pos logit contributions | |
ters | +0.113 |
its | +0.099 |
ying | +0.095 |
aches | +0.093 |
ade | +0.091 |
Neg logit contributions | |
joy | -0.202 |
Sure | -0.188 |
icol | -0.186 |
Bye | -0.178 |
spine | -0.168 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.080 |
carriage | +0.059 |
arium | +0.058 |
lifetime | +0.058 |
lair | +0.057 |
Neg logit contributions | |
ters | -0.069 |
its | -0.061 |
First | -0.056 |
idy | -0.055 |
ikes | -0.055 |
Token | , |
Token ID | 11 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
joy | +1.129 |
lair | +1.024 |
doorway | +0.954 |
habitats | +0.950 |
lifetime | +0.944 |
Neg logit contributions | |
ters | -0.694 |
its | -0.557 |
ying | -0.531 |
ade | -0.531 |
bles | -0.520 |
Token | Roc |
Token ID | 13545 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
joy | +0.041 |
Sure | +0.034 |
icol | +0.033 |
spine | +0.031 |
Bye | +0.030 |
Neg logit contributions | |
ters | -0.037 |
its | -0.034 |
idea | -0.033 |
do | -0.033 |
sure | -0.033 |
Token | co |
Token ID | 1073 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
joy | +0.146 |
Bye | +0.128 |
Sure | +0.124 |
goodbye | +0.123 |
icol | +0.120 |
Neg logit contributions | |
its | -0.096 |
ters | -0.090 |
ying | -0.085 |
ade | -0.083 |
aches | -0.083 |
Token | . |
Token ID | 13 |
Feature activation | -8.67e-01 |
Pos logit contributions | |
its | +0.105 |
aches | +0.102 |
ters | +0.096 |
ying | +0.095 |
ade | +0.094 |
Neg logit contributions | |
joy | -0.169 |
icol | -0.149 |
Sure | -0.146 |
Bye | -0.141 |
lair | -0.135 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.083 |
arium | +0.062 |
lair | +0.061 |
lifetime | +0.060 |
carriage | +0.059 |
Neg logit contributions | |
ters | -0.065 |
its | -0.055 |
matters | -0.052 |
do | -0.052 |
ikes | -0.052 |
Token | You |
Token ID | 921 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
joy | +0.125 |
lifetime | +0.111 |
carriage | +0.108 |
lair | +0.108 |
arium | +0.102 |
Neg logit contributions | |
ters | -0.064 |
its | -0.058 |
ying | -0.049 |
matters | -0.049 |
idy | -0.045 |
Token | are |
Token ID | 389 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
joy | +0.189 |
Bye | +0.181 |
goodbye | +0.166 |
carriage | +0.163 |
Sure | +0.162 |
Neg logit contributions | |
its | -0.108 |
ying | -0.099 |
ters | -0.095 |
idy | -0.090 |
aches | -0.087 |
Token | very |
Token ID | 845 |
Feature activation | -9.92e-01 |
Pos logit contributions | |
its | +0.089 |
ters | +0.081 |
ying | +0.078 |
ade | +0.077 |
aches | +0.076 |
Neg logit contributions | |
joy | -0.125 |
Bye | -0.113 |
Sure | -0.106 |
carriage | -0.103 |
goodbye | -0.103 |
Token | nice |
Token ID | 3621 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
joy | +0.093 |
Bye | +0.086 |
Sure | +0.079 |
goodbye | +0.077 |
carriage | +0.077 |
Neg logit contributions | |
its | -0.071 |
ters | -0.066 |
ying | -0.063 |
ade | -0.061 |
idy | -0.060 |
Token | . |
Token ID | 13 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
joy | +0.031 |
Bye | +0.028 |
Sure | +0.028 |
icol | +0.027 |
carriage | +0.026 |
Neg logit contributions | |
its | -0.022 |
ters | -0.021 |
ying | -0.019 |
ade | -0.019 |
idy | -0.018 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.119 |
lifetime | +0.105 |
carriage | +0.105 |
lair | +0.103 |
spine | +0.097 |
Neg logit contributions | |
ters | -0.070 |
its | -0.062 |
matters | -0.056 |
ying | -0.055 |
idy | -0.052 |
Token | !" |
Token ID | 2474 |
Feature activation | +6.46e-01 |
Pos logit contributions | |
joy | +1.250 |
lair | +1.193 |
doorway | +1.131 |
habitats | +1.119 |
generation | +1.110 |
Neg logit contributions | |
ters | -0.532 |
ade | -0.427 |
its | -0.416 |
bles | -0.374 |
do | -0.367 |
Token | The |
Token ID | 383 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
ters | +0.026 |
noise | +0.025 |
do | +0.025 |
its | +0.024 |
other | +0.024 |
Neg logit contributions | |
joy | -0.072 |
lifetime | -0.065 |
icol | -0.065 |
habitats | -0.064 |
Bye | -0.062 |
Token | man |
Token ID | 582 |
Feature activation | -5.62e-01 |
Pos logit contributions | |
joy | +0.376 |
Bye | +0.337 |
Sure | +0.333 |
icol | +0.327 |
arium | +0.309 |
Neg logit contributions | |
its | -0.274 |
ters | -0.249 |
ade | -0.233 |
aches | -0.233 |
ying | -0.227 |
Token | says |
Token ID | 1139 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
joy | +0.058 |
Bye | +0.052 |
Sure | +0.050 |
icol | +0.048 |
carriage | +0.048 |
Neg logit contributions | |
its | -0.037 |
ters | -0.033 |
ying | -0.031 |
ade | -0.031 |
aches | -0.031 |
Token | . |
Token ID | 13 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
its | +0.071 |
ters | +0.068 |
ying | +0.063 |
ade | +0.060 |
aches | +0.058 |
Neg logit contributions | |
joy | -0.115 |
Bye | -0.106 |
habitats | -0.102 |
icol | -0.101 |
Sure | -0.101 |
Token | said |
Token ID | 531 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
joy | +0.015 |
lair | +0.012 |
Bye | +0.012 |
habitats | +0.012 |
spine | +0.012 |
Neg logit contributions | |
its | -0.007 |
ters | -0.007 |
ade | -0.007 |
aches | -0.006 |
ying | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
its | +0.157 |
ters | +0.149 |
ying | +0.143 |
ade | +0.142 |
aches | +0.140 |
Neg logit contributions | |
joy | -0.174 |
Bye | -0.153 |
Sure | -0.145 |
icol | -0.140 |
carriage | -0.139 |
Token | " |
Token ID | 366 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
its | +0.019 |
ters | +0.019 |
ying | +0.017 |
aches | +0.017 |
ade | +0.016 |
Neg logit contributions | |
joy | -0.025 |
Bye | -0.022 |
habitats | -0.021 |
lair | -0.021 |
carriage | -0.021 |
Token | Sure |
Token ID | 19457 |
Feature activation | -9.35e-01 |
Pos logit contributions | |
its | +0.032 |
ters | +0.032 |
ade | +0.028 |
ying | +0.027 |
aches | +0.027 |
Neg logit contributions | |
joy | -0.045 |
Bye | -0.039 |
lair | -0.038 |
carriage | -0.038 |
goodbye | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
joy | +0.101 |
habitats | +0.092 |
Sure | +0.091 |
lair | +0.089 |
Bye | +0.088 |
Neg logit contributions | |
its | -0.045 |
aches | -0.045 |
idea | -0.044 |
ade | -0.043 |
ters | -0.042 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
ters | +0.015 |
its | +0.013 |
ying | +0.012 |
ikes | +0.011 |
matters | +0.011 |
Neg logit contributions | |
joy | -0.018 |
lair | -0.015 |
carriage | -0.015 |
habitats | -0.015 |
dungeon | -0.014 |
Token | Mia |
Token ID | 32189 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
joy | +0.907 |
lair | +0.845 |
habitats | +0.794 |
arium | +0.770 |
nowhere | +0.761 |
Neg logit contributions | |
ters | -0.860 |
ade | -0.738 |
its | -0.728 |
bles | -0.704 |
ula | -0.699 |
Token | !" |
Token ID | 2474 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
joy | +0.152 |
Sure | +0.133 |
Bye | +0.133 |
icol | +0.131 |
habitats | +0.128 |
Neg logit contributions | |
ters | -0.081 |
its | -0.073 |
ying | -0.068 |
ade | -0.067 |
idy | -0.065 |
Token |
|
Token ID | 198 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
its | +0.085 |
ters | +0.082 |
ade | +0.078 |
ying | +0.077 |
aches | +0.072 |
Neg logit contributions | |
joy | -0.133 |
Bye | -0.118 |
lair | -0.117 |
carriage | -0.115 |
habitats | -0.113 |
Token |
|
Token ID | 198 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
its | +0.027 |
ters | +0.025 |
ying | +0.024 |
ade | +0.023 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.031 |
Bye | -0.027 |
Sure | -0.026 |
goodbye | -0.025 |
carriage | -0.025 |
Token | M |
Token ID | 44 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
its | +0.027 |
ters | +0.025 |
ying | +0.024 |
idy | +0.023 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.032 |
Bye | -0.029 |
Sure | -0.028 |
carriage | -0.026 |
goodbye | -0.026 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.080 |
carriage | +0.059 |
arium | +0.058 |
lifetime | +0.058 |
lair | +0.057 |
Neg logit contributions | |
ters | -0.069 |
its | -0.061 |
First | -0.056 |
idy | -0.055 |
ikes | -0.055 |
Token | , |
Token ID | 11 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
joy | +1.129 |
lair | +1.024 |
doorway | +0.954 |
habitats | +0.950 |
lifetime | +0.944 |
Neg logit contributions | |
ters | -0.694 |
its | -0.557 |
ying | -0.531 |
ade | -0.531 |
bles | -0.520 |
Token | Roc |
Token ID | 13545 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
joy | +0.041 |
Sure | +0.034 |
icol | +0.033 |
spine | +0.031 |
Bye | +0.030 |
Neg logit contributions | |
ters | -0.037 |
its | -0.034 |
idea | -0.033 |
do | -0.033 |
sure | -0.033 |
Token | co |
Token ID | 1073 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
joy | +0.146 |
Bye | +0.128 |
Sure | +0.124 |
goodbye | +0.123 |
icol | +0.120 |
Neg logit contributions | |
its | -0.096 |
ters | -0.090 |
ying | -0.085 |
ade | -0.083 |
aches | -0.083 |
Token | . |
Token ID | 13 |
Feature activation | -8.67e-01 |
Pos logit contributions | |
its | +0.105 |
aches | +0.102 |
ters | +0.096 |
ying | +0.095 |
ade | +0.094 |
Neg logit contributions | |
joy | -0.169 |
icol | -0.149 |
Sure | -0.146 |
Bye | -0.141 |
lair | -0.135 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.083 |
arium | +0.062 |
lair | +0.061 |
lifetime | +0.060 |
carriage | +0.059 |
Neg logit contributions | |
ters | -0.065 |
its | -0.055 |
matters | -0.052 |
do | -0.052 |
ikes | -0.052 |
Token | , |
Token ID | 11 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
joy | +1.078 |
lair | +0.999 |
habitats | +0.931 |
doorway | +0.910 |
lifetime | +0.906 |
Neg logit contributions | |
ters | -0.709 |
its | -0.589 |
ade | -0.572 |
bles | -0.560 |
ying | -0.549 |
Token | man |
Token ID | 582 |
Feature activation | -5.41e-01 |
Pos logit contributions | |
joy | +0.047 |
icol | +0.038 |
Sure | +0.038 |
lair | +0.036 |
habitats | +0.036 |
Neg logit contributions | |
ters | -0.033 |
its | -0.033 |
aches | -0.031 |
do | -0.030 |
sure | -0.030 |
Token | ." |
Token ID | 526 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
joy | +0.066 |
icol | +0.059 |
Sure | +0.058 |
lifetime | +0.058 |
habitats | +0.057 |
Neg logit contributions | |
ters | -0.025 |
its | -0.020 |
ying | -0.018 |
ching | -0.017 |
ade | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
joy | +0.018 |
lifetime | +0.016 |
Bye | +0.016 |
generation | +0.016 |
lair | +0.016 |
Neg logit contributions | |
ters | -0.009 |
its | -0.009 |
she | -0.009 |
ade | -0.008 |
First | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
joy | +0.040 |
Bye | +0.035 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.032 |
Neg logit contributions | |
its | -0.030 |
ters | -0.027 |
ade | -0.026 |
ying | -0.026 |
aches | -0.026 |
Token | Mom |
Token ID | 11254 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
joy | +0.032 |
Bye | +0.026 |
habitats | +0.026 |
icol | +0.026 |
Sure | +0.025 |
Neg logit contributions | |
its | -0.024 |
ters | -0.024 |
ying | -0.022 |
aches | -0.022 |
ade | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
joy | +0.246 |
Bye | +0.217 |
Sure | +0.215 |
icol | +0.213 |
carriage | +0.211 |
Neg logit contributions | |
ters | -0.124 |
its | -0.120 |
ying | -0.109 |
ade | -0.103 |
idy | -0.102 |
Token | I |
Token ID | 314 |
Feature activation | -3.15e+00 |
Pos logit contributions | |
joy | +0.064 |
arium | +0.052 |
lair | +0.051 |
lifetime | +0.050 |
habitats | +0.050 |
Neg logit contributions | |
ters | -0.034 |
do | -0.029 |
its | -0.029 |
matters | -0.028 |
rake | -0.027 |
Token | will |
Token ID | 481 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
joy | +0.298 |
Bye | +0.262 |
Sure | +0.251 |
carriage | +0.242 |
icol | +0.242 |
Neg logit contributions | |
its | -0.233 |
ters | -0.210 |
ade | -0.203 |
aches | -0.200 |
ying | -0.199 |
Token | . |
Token ID | 13 |
Feature activation | -6.77e-01 |
Pos logit contributions | |
joy | +0.171 |
Sure | +0.146 |
Bye | +0.145 |
icol | +0.138 |
arium | +0.137 |
Neg logit contributions | |
its | -0.095 |
ters | -0.085 |
aches | -0.083 |
ade | -0.077 |
ying | -0.076 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.074 |
arium | +0.060 |
lifetime | +0.060 |
lair | +0.059 |
carriage | +0.057 |
Neg logit contributions | |
ters | -0.037 |
do | -0.034 |
matters | -0.032 |
its | -0.032 |
First | -0.032 |
Token | ." |
Token ID | 526 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
joy | +1.154 |
lair | +1.029 |
habitats | +0.996 |
lifetime | +0.968 |
arium | +0.964 |
Neg logit contributions | |
ters | -0.655 |
its | -0.539 |
ade | -0.528 |
ying | -0.521 |
sure | -0.504 |
Token | He |
Token ID | 679 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
its | +0.004 |
ade | +0.003 |
ters | +0.003 |
ying | +0.003 |
she | +0.003 |
Neg logit contributions | |
joy | -0.008 |
Bye | -0.007 |
carriage | -0.007 |
lifetime | -0.007 |
icol | -0.007 |
Token | opened |
Token ID | 4721 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
joy | +0.114 |
Bye | +0.095 |
spine | +0.093 |
Sure | +0.093 |
lifetime | +0.091 |
Neg logit contributions | |
its | -0.072 |
ters | -0.067 |
ade | -0.067 |
aches | -0.063 |
have | -0.061 |
Token | the |
Token ID | 262 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
joy | +0.242 |
Bye | +0.230 |
lifetime | +0.220 |
Sure | +0.211 |
habitats | +0.206 |
Neg logit contributions | |
its | -0.126 |
ters | -0.118 |
ying | -0.107 |
ade | -0.106 |
aches | -0.106 |
Token | door |
Token ID | 3420 |
Feature activation | -4.71e+00 |
Pos logit contributions | |
joy | +0.029 |
Bye | +0.026 |
Sure | +0.025 |
icol | +0.024 |
lifetime | +0.023 |
Neg logit contributions | |
its | -0.026 |
ade | -0.024 |
ters | -0.024 |
dishes | -0.023 |
rake | -0.023 |
Token | are |
Token ID | 389 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
joy | +0.198 |
Bye | +0.186 |
Sure | +0.174 |
goodbye | +0.173 |
carriage | +0.172 |
Neg logit contributions | |
its | -0.096 |
ters | -0.083 |
ying | -0.082 |
ade | -0.078 |
idy | -0.076 |
Token | a |
Token ID | 257 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
its | +0.086 |
ters | +0.086 |
aches | +0.078 |
ying | +0.076 |
ics | +0.072 |
Neg logit contributions | |
joy | -0.162 |
Sure | -0.143 |
Bye | -0.141 |
icol | -0.138 |
spine | -0.133 |
Token | good |
Token ID | 922 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
joy | +0.070 |
spine | +0.067 |
habitats | +0.066 |
Sure | +0.066 |
arium | +0.064 |
Neg logit contributions | |
ters | -0.014 |
whip | -0.014 |
idea | -0.013 |
its | -0.013 |
sure | -0.013 |
Token | friend |
Token ID | 1545 |
Feature activation | -5.30e-01 |
Pos logit contributions | |
its | +0.089 |
ters | +0.088 |
ying | +0.080 |
ade | +0.079 |
idy | +0.078 |
Neg logit contributions | |
joy | -0.108 |
Bye | -0.095 |
Sure | -0.094 |
icol | -0.089 |
arium | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
joy | +0.064 |
icol | +0.061 |
Sure | +0.058 |
spine | +0.055 |
habitats | +0.055 |
Neg logit contributions | |
ters | -0.027 |
its | -0.020 |
ying | -0.020 |
idy | -0.018 |
ade | -0.018 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.075 |
carriage | +0.063 |
lair | +0.062 |
lifetime | +0.062 |
spine | +0.060 |
Neg logit contributions | |
ters | -0.051 |
its | -0.046 |
matters | -0.043 |
First | -0.041 |
ying | -0.041 |
Token | bye |
Token ID | 33847 |
Feature activation | -9.41e+00 |
Pos logit contributions | |
joy | +1.153 |
lair | +1.106 |
doorway | +0.995 |
carriage | +0.994 |
lifetime | +0.991 |
Neg logit contributions | |
ters | -0.644 |
its | -0.542 |
ade | -0.538 |
ying | -0.501 |
aches | -0.474 |
Token | ." |
Token ID | 526 |
Feature activation | -5.67e-02 |
Pos logit contributions | |
joy | +1.051 |
Sure | +0.926 |
Bye | +0.921 |
lifetime | +0.918 |
lair | +0.891 |
Neg logit contributions | |
ters | -0.536 |
its | -0.428 |
ying | -0.394 |
ade | -0.378 |
ble | -0.365 |
Token |
|
Token ID | 198 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
joy | +0.006 |
Bye | +0.005 |
icol | +0.005 |
carriage | +0.005 |
lifetime | +0.005 |
Neg logit contributions | |
its | -0.003 |
ters | -0.003 |
ade | -0.003 |
she | -0.003 |
ying | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
joy | +0.019 |
Bye | +0.017 |
Sure | +0.016 |
goodbye | +0.015 |
carriage | +0.015 |
Neg logit contributions | |
its | -0.018 |
ters | -0.017 |
ying | -0.016 |
ade | -0.016 |
aches | -0.016 |
Token | The |
Token ID | 464 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
joy | +0.021 |
Bye | +0.019 |
Sure | +0.018 |
carriage | +0.017 |
goodbye | +0.017 |
Neg logit contributions | |
its | -0.015 |
ters | -0.014 |
ying | -0.014 |
ade | -0.013 |
aches | -0.013 |
Token | with |
Token ID | 351 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
joy | +0.248 |
icol | +0.215 |
Bye | +0.197 |
Sure | +0.195 |
habitats | +0.195 |
Neg logit contributions | |
ters | -0.125 |
ying | -0.105 |
ics | -0.097 |
its | -0.096 |
ade | -0.096 |
Token | the |
Token ID | 262 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
joy | +0.078 |
Sure | +0.069 |
Bye | +0.068 |
icol | +0.067 |
spine | +0.064 |
Neg logit contributions | |
its | -0.039 |
ters | -0.036 |
aches | -0.034 |
ade | -0.032 |
idy | -0.031 |
Token | number |
Token ID | 1271 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
joy | +0.022 |
Bye | +0.020 |
Sure | +0.019 |
icol | +0.018 |
arium | +0.018 |
Neg logit contributions | |
its | -0.015 |
ters | -0.014 |
aches | -0.013 |
ade | -0.013 |
ying | -0.013 |
Token | nine |
Token ID | 5193 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
ters | +0.079 |
its | +0.078 |
ying | +0.073 |
ade | +0.069 |
aches | +0.069 |
Neg logit contributions | |
joy | -0.154 |
icol | -0.136 |
Bye | -0.134 |
Sure | -0.130 |
habitats | -0.124 |
Token | . |
Token ID | 13 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
joy | +0.405 |
Bye | +0.366 |
Sure | +0.359 |
icol | +0.342 |
arium | +0.327 |
Neg logit contributions | |
its | -0.281 |
ters | -0.261 |
aches | -0.246 |
ying | -0.243 |
ade | -0.237 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.057 |
lair | +0.047 |
carriage | +0.046 |
lifetime | +0.044 |
arium | +0.043 |
Neg logit contributions | |
ters | -0.045 |
First | -0.039 |
its | -0.039 |
she | -0.036 |
sure | -0.036 |
Token | ." |
Token ID | 526 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
joy | +1.182 |
lair | +1.103 |
habitats | +1.037 |
lifetime | +1.022 |
arium | +0.996 |
Neg logit contributions | |
ters | -0.620 |
its | -0.514 |
ade | -0.505 |
ying | -0.483 |
aches | -0.461 |
Token |
|
Token ID | 198 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ters | +0.007 |
its | +0.007 |
ying | +0.006 |
she | +0.006 |
ade | +0.006 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.010 |
lair | -0.010 |
carriage | -0.010 |
icol | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
joy | +0.013 |
Bye | +0.011 |
Sure | +0.011 |
goodbye | +0.010 |
carriage | +0.010 |
Neg logit contributions | |
its | -0.014 |
ters | -0.013 |
ying | -0.013 |
aches | -0.012 |
ade | -0.012 |
Token | Mom |
Token ID | 29252 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
joy | +0.016 |
Bye | +0.015 |
Sure | +0.014 |
carriage | +0.013 |
goodbye | +0.013 |
Neg logit contributions | |
its | -0.012 |
ters | -0.011 |
ying | -0.010 |
ade | -0.010 |
aches | -0.010 |
Token | hung |
Token ID | 9174 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
joy | +0.142 |
Bye | +0.124 |
Sure | +0.118 |
icol | +0.116 |
habitats | +0.116 |
Neg logit contributions | |
its | -0.093 |
ters | -0.088 |
ade | -0.084 |
ying | -0.082 |
aches | -0.079 |
Token | OK |
Token ID | 11380 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
its | +0.000 |
ying | +0.000 |
ters | +0.000 |
ade | +0.000 |
aches | +0.000 |
Neg logit contributions | |
joy | -0.000 |
Bye | -0.000 |
Sure | -0.000 |
goodbye | -0.000 |
icol | -0.000 |
Token | , |
Token ID | 11 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
joy | +0.328 |
Bye | +0.290 |
Sure | +0.282 |
carriage | +0.272 |
icol | +0.270 |
Neg logit contributions | |
its | -0.245 |
ters | -0.232 |
ying | -0.215 |
ade | -0.214 |
aches | -0.209 |
Token | we |
Token ID | 356 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
joy | +0.055 |
Sure | +0.046 |
Bye | +0.046 |
icol | +0.045 |
habitats | +0.044 |
Neg logit contributions | |
its | -0.047 |
ters | -0.047 |
ying | -0.043 |
aches | -0.042 |
ade | -0.041 |
Token | will |
Token ID | 481 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
joy | +0.153 |
Bye | +0.144 |
goodbye | +0.128 |
Sure | +0.112 |
bye | +0.111 |
Neg logit contributions | |
its | -0.220 |
ying | -0.217 |
ters | -0.215 |
idy | -0.206 |
ics | -0.204 |
Token | . |
Token ID | 13 |
Feature activation | -9.16e-01 |
Pos logit contributions | |
joy | +0.151 |
Bye | +0.143 |
goodbye | +0.132 |
Sure | +0.128 |
icol | +0.125 |
Neg logit contributions | |
its | -0.123 |
ying | -0.118 |
ters | -0.118 |
idy | -0.111 |
ade | -0.108 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.089 |
carriage | +0.077 |
lair | +0.077 |
lifetime | +0.073 |
doorway | +0.070 |
Neg logit contributions | |
ters | -0.065 |
matters | -0.056 |
its | -0.055 |
do | -0.053 |
squash | -0.050 |
Token | , |
Token ID | 11 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
joy | +1.229 |
lair | +1.135 |
habitats | +1.072 |
lifetime | +1.068 |
carriage | +1.064 |
Neg logit contributions | |
ters | -0.592 |
its | -0.489 |
ade | -0.470 |
ying | -0.434 |
bles | -0.407 |
Token | sir |
Token ID | 15967 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
joy | +0.058 |
Sure | +0.050 |
Bye | +0.049 |
icol | +0.048 |
habitats | +0.046 |
Neg logit contributions | |
its | -0.047 |
ters | -0.046 |
ade | -0.044 |
aches | -0.043 |
ying | -0.042 |
Token | ." |
Token ID | 526 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
joy | +0.223 |
icol | +0.195 |
Sure | +0.192 |
Bye | +0.191 |
lifetime | +0.187 |
Neg logit contributions | |
ters | -0.116 |
its | -0.108 |
ying | -0.097 |
ade | -0.095 |
idy | -0.090 |
Token |
|
Token ID | 198 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
joy | +0.017 |
lifetime | +0.016 |
lair | +0.016 |
carriage | +0.015 |
icol | +0.015 |
Neg logit contributions | |
ters | -0.007 |
its | -0.006 |
she | -0.006 |
First | -0.005 |
ade | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
joy | +0.038 |
Bye | +0.034 |
Sure | +0.032 |
carriage | +0.031 |
goodbye | +0.031 |
Neg logit contributions | |
its | -0.035 |
ters | -0.032 |
ying | -0.031 |
ade | -0.031 |
aches | -0.030 |
Token | go |
Token ID | 467 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
joy | +0.041 |
Bye | +0.039 |
carriage | +0.036 |
goodbye | +0.036 |
Sure | +0.036 |
Neg logit contributions | |
its | -0.031 |
ters | -0.029 |
ying | -0.029 |
ade | -0.027 |
idy | -0.026 |
Token | home |
Token ID | 1363 |
Feature activation | -4.02e+00 |
Pos logit contributions | |
its | +0.114 |
ters | +0.113 |
ade | +0.113 |
aches | +0.110 |
ying | +0.106 |
Neg logit contributions | |
joy | -0.168 |
Bye | -0.152 |
Sure | -0.142 |
habitats | -0.140 |
icol | -0.136 |
Token | for |
Token ID | 329 |
Feature activation | -3.69e+00 |
Pos logit contributions | |
joy | +0.414 |
Bye | +0.378 |
Sure | +0.372 |
icol | +0.371 |
habitats | +0.350 |
Neg logit contributions | |
ters | -0.230 |
ying | -0.207 |
its | -0.203 |
ble | -0.201 |
ics | -0.199 |
Token | dinner |
Token ID | 8073 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
joy | +0.445 |
Sure | +0.401 |
Bye | +0.385 |
spine | +0.382 |
icol | +0.379 |
Neg logit contributions | |
aches | -0.148 |
its | -0.145 |
happen | -0.142 |
ters | -0.137 |
noise | -0.130 |
Token | . |
Token ID | 13 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
joy | +0.038 |
Bye | +0.034 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.031 |
Neg logit contributions | |
ters | -0.022 |
its | -0.022 |
ade | -0.021 |
ying | -0.021 |
aches | -0.020 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.034 |
carriage | +0.027 |
lair | +0.027 |
lifetime | +0.026 |
habitats | +0.026 |
Neg logit contributions | |
ters | -0.026 |
its | -0.024 |
she | -0.022 |
matters | -0.022 |
First | -0.022 |
Token | !" |
Token ID | 2474 |
Feature activation | +9.59e-01 |
Pos logit contributions | |
joy | +0.987 |
lair | +0.930 |
habitats | +0.880 |
lifetime | +0.835 |
doorway | +0.825 |
Neg logit contributions | |
ters | -0.760 |
ade | -0.633 |
its | -0.630 |
sure | -0.630 |
ying | -0.616 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
she | +0.048 |
ters | +0.047 |
ics | +0.044 |
ade | +0.042 |
herself | +0.042 |
Neg logit contributions | |
joy | -0.098 |
lair | -0.089 |
lifetime | -0.084 |
habitats | -0.084 |
carriage | -0.081 |
Token | Once |
Token ID | 7454 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
its | +0.094 |
ters | +0.087 |
ade | +0.082 |
ying | +0.082 |
aches | +0.078 |
Neg logit contributions | |
joy | -0.120 |
Bye | -0.108 |
Sure | -0.103 |
icol | -0.101 |
carriage | -0.101 |
Token | upon |
Token ID | 2402 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
its | +0.082 |
ters | +0.075 |
ying | +0.074 |
ade | +0.072 |
aches | +0.071 |
Neg logit contributions | |
joy | -0.099 |
Bye | -0.089 |
Sure | -0.084 |
icol | -0.081 |
carriage | -0.080 |
Token | a |
Token ID | 257 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
joy | +0.112 |
Bye | +0.101 |
Sure | +0.096 |
carriage | +0.093 |
goodbye | +0.092 |
Neg logit contributions | |
its | -0.075 |
ters | -0.068 |
ying | -0.065 |
ade | -0.064 |
aches | -0.063 |
Token | hope |
Token ID | 2911 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
joy | +0.445 |
Bye | +0.415 |
carriage | +0.386 |
Sure | +0.384 |
goodbye | +0.381 |
Neg logit contributions | |
its | -0.330 |
ters | -0.307 |
ying | -0.305 |
ade | -0.283 |
idy | -0.282 |
Token | you |
Token ID | 345 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
joy | +0.600 |
icol | +0.530 |
Bye | +0.524 |
Sure | +0.521 |
carriage | +0.508 |
Neg logit contributions | |
ters | -0.226 |
its | -0.216 |
aches | -0.198 |
ying | -0.196 |
happen | -0.196 |
Token | like |
Token ID | 588 |
Feature activation | +9.23e-01 |
Pos logit contributions | |
joy | +0.210 |
Bye | +0.183 |
Sure | +0.179 |
icol | +0.176 |
goodbye | +0.166 |
Neg logit contributions | |
its | -0.118 |
ters | -0.108 |
aches | -0.105 |
ade | -0.101 |
ying | -0.096 |
Token | it |
Token ID | 340 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
its | +0.050 |
ters | +0.045 |
aches | +0.044 |
ade | +0.041 |
ying | +0.041 |
Neg logit contributions | |
joy | -0.104 |
Bye | -0.094 |
Sure | -0.092 |
icol | -0.091 |
spine | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | -9.13e-01 |
Pos logit contributions | |
joy | +0.079 |
Bye | +0.070 |
Sure | +0.068 |
icol | +0.065 |
carriage | +0.064 |
Neg logit contributions | |
its | -0.059 |
ters | -0.055 |
ying | -0.052 |
ade | -0.052 |
aches | -0.051 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
joy | +0.095 |
carriage | +0.078 |
lifetime | +0.077 |
lair | +0.074 |
habitats | +0.072 |
Neg logit contributions | |
ters | -0.062 |
its | -0.058 |
matters | -0.052 |
chini | -0.048 |
shrink | -0.048 |
Token | , |
Token ID | 11 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
joy | +1.216 |
lair | +1.128 |
lifetime | +1.065 |
Sure | +1.061 |
doorway | +1.053 |
Neg logit contributions | |
ters | -0.597 |
its | -0.497 |
ade | -0.455 |
ying | -0.441 |
bles | -0.431 |
Token | bug |
Token ID | 5434 |
Feature activation | +4.23e+00 |
Pos logit contributions | |
joy | +0.062 |
Sure | +0.054 |
Bye | +0.054 |
icol | +0.052 |
habitats | +0.051 |
Neg logit contributions | |
its | -0.044 |
ters | -0.043 |
ade | -0.040 |
aches | -0.040 |
ying | -0.039 |
Token | ." |
Token ID | 526 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
ters | +0.227 |
its | +0.204 |
ade | +0.192 |
ying | +0.177 |
aches | +0.173 |
Neg logit contributions | |
joy | -0.495 |
Sure | -0.437 |
Bye | -0.428 |
icol | -0.423 |
lifetime | -0.416 |
Token |
|
Token ID | 198 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
joy | +0.029 |
lifetime | +0.027 |
carriage | +0.026 |
lair | +0.026 |
icol | +0.026 |
Neg logit contributions | |
ters | -0.011 |
its | -0.010 |
she | -0.010 |
noise | -0.008 |
ade | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
joy | +0.045 |
Bye | +0.040 |
Sure | +0.038 |
carriage | +0.037 |
icol | +0.036 |
Neg logit contributions | |
its | -0.039 |
ters | -0.036 |
ying | -0.035 |
ade | -0.034 |
aches | -0.034 |
Token | to |
Token ID | 284 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
joy | +0.171 |
Bye | +0.147 |
icol | +0.147 |
habitats | +0.144 |
Sure | +0.139 |
Neg logit contributions | |
ters | -0.129 |
its | -0.128 |
ble | -0.121 |
aches | -0.117 |
bles | -0.117 |
Token | visit |
Token ID | 3187 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
joy | +0.070 |
icol | +0.061 |
Bye | +0.059 |
lifetime | +0.059 |
Sure | +0.059 |
Neg logit contributions | |
its | -0.029 |
ters | -0.027 |
whip | -0.027 |
aches | -0.026 |
happen | -0.026 |
Token | you |
Token ID | 345 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
joy | +0.719 |
icol | +0.646 |
lifetime | +0.627 |
spine | +0.625 |
Sure | +0.622 |
Neg logit contributions | |
ters | -0.268 |
its | -0.247 |
ying | -0.226 |
aches | -0.225 |
she | -0.223 |
Token | soon |
Token ID | 2582 |
Feature activation | -4.47e+00 |
Pos logit contributions | |
joy | +0.190 |
Bye | +0.168 |
icol | +0.166 |
Sure | +0.165 |
carriage | +0.153 |
Neg logit contributions | |
ters | -0.138 |
its | -0.136 |
ying | -0.125 |
ade | -0.119 |
aches | -0.119 |
Token | . |
Token ID | 13 |
Feature activation | -9.65e-01 |
Pos logit contributions | |
joy | +0.427 |
Bye | +0.381 |
Sure | +0.365 |
carriage | +0.349 |
icol | +0.349 |
Neg logit contributions | |
its | -0.320 |
ters | -0.295 |
ying | -0.280 |
ade | -0.277 |
aches | -0.274 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
joy | +0.102 |
lifetime | +0.083 |
lair | +0.082 |
carriage | +0.079 |
arium | +0.079 |
Neg logit contributions | |
ters | -0.057 |
matters | -0.051 |
its | -0.049 |
she | -0.049 |
First | -0.049 |
Token | , |
Token ID | 11 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
joy | +1.140 |
lair | +1.076 |
lifetime | +1.017 |
doorway | +1.008 |
habitats | +1.005 |
Neg logit contributions | |
ters | -0.623 |
ade | -0.509 |
its | -0.502 |
bles | -0.479 |
ying | -0.469 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
joy | +0.058 |
Sure | +0.051 |
icol | +0.048 |
Bye | +0.048 |
arium | +0.048 |
Neg logit contributions | |
its | -0.044 |
whip | -0.042 |
aches | -0.042 |
ters | -0.041 |
ade | -0.041 |
Token | ." |
Token ID | 526 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
joy | +0.279 |
Sure | +0.247 |
Bye | +0.244 |
icol | +0.243 |
lifetime | +0.233 |
Neg logit contributions | |
ters | -0.138 |
its | -0.135 |
ying | -0.118 |
ade | -0.117 |
idy | -0.113 |
Token | She |
Token ID | 1375 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
joy | +0.023 |
lifetime | +0.022 |
lair | +0.022 |
carriage | +0.022 |
generation | +0.021 |
Neg logit contributions | |
she | -0.007 |
ade | -0.007 |
its | -0.007 |
First | -0.006 |
do | -0.006 |
Token | waves |
Token ID | 9813 |
Feature activation | +7.71e-01 |
Pos logit contributions | |
its | +0.020 |
ters | +0.018 |
ade | +0.018 |
aches | +0.017 |
ying | +0.017 |
Neg logit contributions | |
joy | -0.027 |
Bye | -0.023 |
Sure | -0.022 |
lifetime | -0.022 |
spine | -0.021 |
Token | and |
Token ID | 290 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
ade | +0.105 |
its | +0.103 |
aches | +0.102 |
ying | +0.099 |
ters | +0.098 |
Neg logit contributions | |
joy | -0.168 |
Bye | -0.149 |
Sure | -0.144 |
icol | -0.143 |
habitats | -0.143 |
Token | visit |
Token ID | 3187 |
Feature activation | -6.19e+00 |
Pos logit contributions | |
joy | +0.096 |
icol | +0.079 |
habitats | +0.077 |
Bye | +0.077 |
Sure | +0.076 |
Neg logit contributions | |
aches | -0.039 |
do | -0.038 |
its | -0.038 |
shrink | -0.037 |
convince | -0.036 |
Token | more |
Token ID | 517 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
joy | +0.716 |
icol | +0.610 |
Sure | +0.606 |
Bye | +0.600 |
spine | +0.589 |
Neg logit contributions | |
ters | -0.279 |
aches | -0.273 |
its | -0.261 |
idy | -0.251 |
ying | -0.251 |
Token | children |
Token ID | 1751 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
joy | +0.246 |
Bye | +0.217 |
Sure | +0.213 |
icol | +0.201 |
carriage | +0.189 |
Neg logit contributions | |
its | -0.220 |
ters | -0.205 |
ying | -0.204 |
ade | -0.200 |
aches | -0.200 |
Token | . |
Token ID | 13 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
ters | +0.158 |
ying | +0.144 |
its | +0.142 |
aches | +0.137 |
have | +0.132 |
Neg logit contributions | |
joy | -0.286 |
icol | -0.263 |
Sure | -0.259 |
Bye | -0.255 |
habitats | -0.237 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
joy | +0.037 |
carriage | +0.030 |
lair | +0.030 |
lifetime | +0.029 |
spine | +0.029 |
Neg logit contributions | |
ters | -0.031 |
its | -0.029 |
First | -0.027 |
she | -0.026 |
have | -0.026 |
Token | bye |
Token ID | 33847 |
Feature activation | -9.51e+00 |
Pos logit contributions | |
joy | +0.974 |
lair | +0.884 |
habitats | +0.822 |
lifetime | +0.800 |
doorway | +0.794 |
Neg logit contributions | |
ters | -0.794 |
its | -0.679 |
ade | -0.670 |
sure | -0.667 |
ying | -0.662 |
Token | !" |
Token ID | 2474 |
Feature activation | +8.52e-01 |
Pos logit contributions | |
joy | +1.034 |
Sure | +0.913 |
lifetime | +0.899 |
Bye | +0.897 |
habitats | +0.878 |
Neg logit contributions | |
ters | -0.541 |
its | -0.417 |
ying | -0.406 |
ade | -0.380 |
idy | -0.379 |
Token | Santa |
Token ID | 8909 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
ters | +0.043 |
its | +0.041 |
she | +0.041 |
ics | +0.036 |
aches | +0.036 |
Neg logit contributions | |
joy | -0.086 |
icol | -0.075 |
lair | -0.075 |
habitats | -0.075 |
lifetime | -0.074 |
Token | said |
Token ID | 531 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
joy | +0.386 |
Bye | +0.331 |
Sure | +0.322 |
icol | +0.311 |
habitats | +0.306 |
Neg logit contributions | |
its | -0.300 |
ters | -0.286 |
ying | -0.263 |
ade | -0.262 |
aches | -0.262 |
Token | . |
Token ID | 13 |
Feature activation | -5.90e-01 |
Pos logit contributions | |
ters | +0.084 |
its | +0.084 |
ying | +0.079 |
ade | +0.073 |
aches | +0.072 |
Neg logit contributions | |
joy | -0.150 |
habitats | -0.135 |
Bye | -0.135 |
icol | -0.130 |
Sure | -0.129 |
Token | wait |
Token ID | 4043 |
Feature activation | -3.24e+00 |
Pos logit contributions | |
joy | +0.182 |
Bye | +0.163 |
Sure | +0.153 |
icol | +0.151 |
carriage | +0.142 |
Neg logit contributions | |
its | -0.146 |
idea | -0.136 |
ters | -0.134 |
dishes | -0.133 |
ade | -0.128 |
Token | for |
Token ID | 329 |
Feature activation | -3.98e+00 |
Pos logit contributions | |
joy | +0.283 |
Bye | +0.250 |
Sure | +0.237 |
goodbye | +0.226 |
carriage | +0.226 |
Neg logit contributions | |
its | -0.258 |
ters | -0.240 |
ying | -0.229 |
ade | -0.228 |
aches | -0.225 |
Token | your |
Token ID | 534 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
joy | +0.407 |
Bye | +0.364 |
Sure | +0.351 |
icol | +0.338 |
carriage | +0.337 |
Neg logit contributions | |
its | -0.255 |
ters | -0.235 |
aches | -0.225 |
ade | -0.221 |
ying | -0.219 |
Token | call |
Token ID | 869 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
joy | +0.206 |
Bye | +0.183 |
Sure | +0.175 |
icol | +0.166 |
carriage | +0.165 |
Neg logit contributions | |
its | -0.162 |
ters | -0.149 |
ade | -0.142 |
aches | -0.141 |
ying | -0.141 |
Token | . |
Token ID | 13 |
Feature activation | -3.45e-01 |
Pos logit contributions | |
joy | +0.039 |
Bye | +0.033 |
Sure | +0.033 |
icol | +0.032 |
carriage | +0.031 |
Neg logit contributions | |
its | -0.027 |
ters | -0.026 |
ying | -0.025 |
ade | -0.024 |
aches | -0.024 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
joy | +0.030 |
carriage | +0.024 |
icol | +0.024 |
Bye | +0.024 |
lair | +0.023 |
Neg logit contributions | |
its | -0.027 |
ters | -0.026 |
ying | -0.024 |
idy | -0.023 |
she | -0.023 |
Token | ." |
Token ID | 526 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
joy | +1.212 |
lair | +1.051 |
habitats | +1.049 |
lifetime | +1.016 |
arium | +0.994 |
Neg logit contributions | |
ters | -0.569 |
its | -0.524 |
ade | -0.475 |
idea | -0.467 |
ying | -0.460 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
its | +0.003 |
ters | +0.003 |
she | +0.003 |
ying | +0.002 |
aches | +0.002 |
Neg logit contributions | |
joy | -0.005 |
icol | -0.004 |
lair | -0.004 |
habitats | -0.004 |
lifetime | -0.004 |
Token | said |
Token ID | 531 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
joy | +0.020 |
Bye | +0.018 |
Sure | +0.017 |
goodbye | +0.017 |
carriage | +0.017 |
Neg logit contributions | |
its | -0.015 |
ters | -0.014 |
ying | -0.013 |
ade | -0.013 |
aches | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -7.21e-01 |
Pos logit contributions | |
its | +0.103 |
ters | +0.098 |
ying | +0.094 |
aches | +0.091 |
ade | +0.089 |
Neg logit contributions | |
joy | -0.155 |
Bye | -0.138 |
habitats | -0.133 |
Sure | -0.133 |
icol | -0.131 |
Token |
|
Token ID | 198 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
joy | +0.074 |
lifetime | +0.067 |
carriage | +0.067 |
lair | +0.066 |
habitats | +0.066 |
Neg logit contributions | |
ters | -0.038 |
its | -0.037 |
she | -0.033 |
ying | -0.030 |
ula | -0.030 |
Token | have |
Token ID | 423 |
Feature activation | +4.68e-01 |
Pos logit contributions | |
joy | +0.207 |
Bye | +0.182 |
Sure | +0.178 |
icol | +0.173 |
carriage | +0.168 |
Neg logit contributions | |
its | -0.123 |
ters | -0.112 |
aches | -0.105 |
ade | -0.104 |
ying | -0.103 |
Token | a |
Token ID | 257 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
its | +0.024 |
ters | +0.023 |
aches | +0.023 |
ade | +0.022 |
have | +0.021 |
Neg logit contributions | |
joy | -0.052 |
Sure | -0.047 |
Bye | -0.046 |
icol | -0.045 |
carriage | -0.045 |
Token | good |
Token ID | 922 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
joy | +0.084 |
Bye | +0.075 |
Sure | +0.073 |
habitats | +0.072 |
icol | +0.071 |
Neg logit contributions | |
its | -0.037 |
ade | -0.036 |
whip | -0.032 |
aches | -0.032 |
idea | -0.031 |
Token | nap |
Token ID | 25422 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
its | +0.082 |
ade | +0.075 |
idea | +0.074 |
ters | +0.070 |
idy | +0.068 |
Neg logit contributions | |
joy | -0.094 |
Bye | -0.085 |
Sure | -0.082 |
carriage | -0.075 |
icol | -0.075 |
Token | . |
Token ID | 13 |
Feature activation | -8.52e-01 |
Pos logit contributions | |
joy | +0.052 |
Bye | +0.047 |
Sure | +0.047 |
icol | +0.046 |
carriage | +0.043 |
Neg logit contributions | |
ters | -0.030 |
its | -0.029 |
ying | -0.027 |
ade | -0.026 |
aches | -0.025 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
joy | +0.083 |
carriage | +0.069 |
lifetime | +0.066 |
lair | +0.065 |
arium | +0.063 |
Neg logit contributions | |
ters | -0.061 |
matters | -0.053 |
its | -0.052 |
sure | -0.047 |
have | -0.047 |
Token | !" |
Token ID | 2474 |
Feature activation | +7.93e-01 |
Pos logit contributions | |
joy | +1.150 |
lair | +1.075 |
lifetime | +1.006 |
habitats | +1.006 |
carriage | +1.001 |
Neg logit contributions | |
ters | -0.654 |
its | -0.550 |
ying | -0.510 |
ade | -0.504 |
sure | -0.483 |
Token |
|
Token ID | 198 |
Feature activation | -4.16e-01 |
Pos logit contributions | |
ters | +0.039 |
its | +0.037 |
she | +0.033 |
ying | +0.031 |
ade | +0.030 |
Neg logit contributions | |
joy | -0.085 |
carriage | -0.077 |
habitats | -0.076 |
lair | -0.076 |
lifetime | -0.076 |
Token |
|
Token ID | 198 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
joy | +0.037 |
Bye | +0.033 |
Sure | +0.031 |
carriage | +0.030 |
goodbye | +0.030 |
Neg logit contributions | |
its | -0.033 |
ters | -0.030 |
ying | -0.029 |
ade | -0.029 |
aches | -0.028 |
Token | They |
Token ID | 2990 |
Feature activation | +2.54e+00 |
Pos logit contributions | |
joy | +0.046 |
Bye | +0.041 |
Sure | +0.040 |
icol | +0.039 |
carriage | +0.039 |
Neg logit contributions | |
its | -0.023 |
ters | -0.021 |
ade | -0.019 |
aches | -0.019 |
ying | -0.019 |
Token | waved |
Token ID | 26834 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
its | +0.177 |
ters | +0.169 |
aches | +0.165 |
ade | +0.165 |
idy | +0.152 |
Neg logit contributions | |
joy | -0.247 |
Sure | -0.211 |
Bye | -0.208 |
icol | -0.196 |
habitats | -0.191 |
Token | talk |
Token ID | 1561 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
its | +0.082 |
ters | +0.074 |
aches | +0.070 |
ying | +0.069 |
ade | +0.069 |
Neg logit contributions | |
joy | -0.127 |
Bye | -0.112 |
Sure | -0.109 |
icol | -0.104 |
carriage | -0.103 |
Token | to |
Token ID | 284 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
joy | +0.130 |
icol | +0.117 |
Sure | +0.110 |
Bye | +0.107 |
carriage | +0.105 |
Neg logit contributions | |
ters | -0.080 |
its | -0.079 |
ying | -0.076 |
ade | -0.073 |
aches | -0.070 |
Token | you |
Token ID | 345 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
joy | +0.065 |
icol | +0.057 |
Sure | +0.057 |
Bye | +0.057 |
carriage | +0.055 |
Neg logit contributions | |
its | -0.028 |
ters | -0.027 |
ying | -0.023 |
aches | -0.023 |
idy | -0.023 |
Token | later |
Token ID | 1568 |
Feature activation | -7.10e-01 |
Pos logit contributions | |
joy | +0.190 |
Bye | +0.167 |
icol | +0.164 |
Sure | +0.164 |
carriage | +0.154 |
Neg logit contributions | |
its | -0.129 |
ters | -0.127 |
ying | -0.117 |
aches | -0.113 |
ade | -0.112 |
Token | . |
Token ID | 13 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
joy | +0.075 |
Bye | +0.068 |
Sure | +0.067 |
icol | +0.067 |
carriage | +0.066 |
Neg logit contributions | |
ters | -0.040 |
its | -0.039 |
ying | -0.036 |
idy | -0.032 |
ade | -0.032 |
Token | Bye |
Token ID | 47843 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
joy | +0.040 |
lair | +0.035 |
carriage | +0.034 |
arium | +0.034 |
lifetime | +0.034 |
Neg logit contributions | |
ters | -0.025 |
its | -0.022 |
First | -0.022 |
matters | -0.022 |
she | -0.021 |
Token | ." |
Token ID | 526 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
joy | +1.090 |
lair | +1.033 |
habitats | +0.965 |
lifetime | +0.941 |
doorway | +0.934 |
Neg logit contributions | |
ters | -0.681 |
its | -0.569 |
ying | -0.552 |
ade | -0.550 |
sure | -0.534 |
Token |
|
Token ID | 198 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
its | +0.009 |
she | +0.009 |
ters | +0.008 |
First | +0.008 |
oons | +0.007 |
Neg logit contributions | |
joy | -0.023 |
habitats | -0.021 |
lifetime | -0.021 |
icol | -0.020 |
carriage | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
joy | +0.018 |
Bye | +0.016 |
Sure | +0.015 |
icol | +0.015 |
carriage | +0.015 |
Neg logit contributions | |
its | -0.014 |
ters | -0.012 |
ade | -0.012 |
ying | -0.012 |
aches | -0.012 |
Token | He |
Token ID | 1544 |
Feature activation | +7.38e-01 |
Pos logit contributions | |
joy | +0.019 |
icol | +0.017 |
Bye | +0.016 |
spine | +0.016 |
habitats | +0.016 |
Neg logit contributions | |
its | -0.011 |
ters | -0.010 |
ade | -0.009 |
ying | -0.009 |
have | -0.009 |
Token | hung |
Token ID | 9174 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
its | +0.048 |
ters | +0.046 |
ade | +0.044 |
aches | +0.042 |
ying | +0.040 |
Neg logit contributions | |
joy | -0.075 |
Bye | -0.063 |
spine | -0.062 |
Sure | -0.062 |
habitats | -0.060 |
Token | played |
Token ID | 2826 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
joy | +0.018 |
lair | +0.016 |
Bye | +0.015 |
Sure | +0.015 |
icol | +0.014 |
Neg logit contributions | |
ters | -0.011 |
aches | -0.011 |
ade | -0.011 |
ics | -0.011 |
its | -0.011 |
Token | together |
Token ID | 1978 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
joy | +0.209 |
Bye | +0.187 |
Sure | +0.178 |
icol | +0.170 |
carriage | +0.169 |
Neg logit contributions | |
its | -0.166 |
ters | -0.156 |
ying | -0.147 |
ade | -0.146 |
aches | -0.145 |
Token | . |
Token ID | 13 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
joy | +0.096 |
Bye | +0.088 |
Sure | +0.084 |
icol | +0.081 |
carriage | +0.078 |
Neg logit contributions | |
its | -0.073 |
ters | -0.070 |
ying | -0.065 |
aches | -0.064 |
ade | -0.064 |
Token | Daisy |
Token ID | 40355 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
ters | +0.024 |
its | +0.023 |
ying | +0.021 |
ade | +0.020 |
idy | +0.020 |
Neg logit contributions | |
joy | -0.032 |
Bye | -0.028 |
carriage | -0.028 |
lair | -0.027 |
icol | -0.026 |
Token | made |
Token ID | 925 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
its | +0.133 |
ters | +0.125 |
ade | +0.120 |
ying | +0.117 |
aches | +0.117 |
Neg logit contributions | |
joy | -0.225 |
Bye | -0.201 |
Sure | -0.198 |
icol | -0.190 |
spine | -0.186 |
Token | sure |
Token ID | 1654 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
joy | +0.136 |
goodbye | +0.120 |
Bye | +0.119 |
carriage | +0.114 |
Sure | +0.113 |
Neg logit contributions | |
its | -0.065 |
ters | -0.057 |
ying | -0.056 |
ade | -0.051 |
idy | -0.049 |
Token | to |
Token ID | 284 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
its | +0.486 |
ters | +0.456 |
ying | +0.446 |
ade | +0.440 |
aches | +0.440 |
Neg logit contributions | |
joy | -0.501 |
Bye | -0.441 |
Sure | -0.422 |
icol | -0.410 |
carriage | -0.399 |
Token | take |
Token ID | 1011 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
joy | +0.031 |
Bye | +0.027 |
Sure | +0.027 |
icol | +0.025 |
carriage | +0.025 |
Neg logit contributions | |
its | -0.019 |
aches | -0.018 |
ters | -0.017 |
ade | -0.017 |
ying | -0.016 |
Token | extra |
Token ID | 3131 |
Feature activation | +5.67e-01 |
Pos logit contributions | |
its | +0.092 |
ters | +0.085 |
ade | +0.080 |
ying | +0.079 |
aches | +0.079 |
Neg logit contributions | |
joy | -0.142 |
Bye | -0.129 |
Sure | -0.124 |
carriage | -0.118 |
icol | -0.118 |
Token | care |
Token ID | 1337 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
its | +0.045 |
ters | +0.043 |
ying | +0.040 |
idy | +0.039 |
aches | +0.038 |
Neg logit contributions | |
joy | -0.049 |
Bye | -0.044 |
Sure | -0.042 |
goodbye | -0.041 |
carriage | -0.040 |
Token | of |
Token ID | 286 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
joy | +0.252 |
Bye | +0.235 |
Sure | +0.224 |
icol | +0.221 |
carriage | +0.215 |
Neg logit contributions | |
its | -0.106 |
ters | -0.099 |
ying | -0.097 |
ade | -0.093 |
idy | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
its | +0.063 |
ters | +0.059 |
ying | +0.057 |
ade | +0.056 |
idy | +0.055 |
Neg logit contributions | |
joy | -0.083 |
Bye | -0.076 |
Sure | -0.072 |
carriage | -0.071 |
icol | -0.069 |
Token | He |
Token ID | 679 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
its | +0.022 |
ters | +0.022 |
ying | +0.020 |
ade | +0.020 |
she | +0.019 |
Neg logit contributions | |
joy | -0.025 |
Bye | -0.022 |
carriage | -0.020 |
lifetime | -0.020 |
icol | -0.020 |
Token | sniff |
Token ID | 26300 |
Feature activation | -8.04e-01 |
Pos logit contributions | |
joy | +0.050 |
Bye | +0.044 |
Sure | +0.042 |
icol | +0.041 |
carriage | +0.040 |
Neg logit contributions | |
its | -0.031 |
ters | -0.028 |
ade | -0.027 |
aches | -0.027 |
ying | -0.025 |
Token | ed |
Token ID | 276 |
Feature activation | -8.33e-01 |
Pos logit contributions | |
joy | +0.061 |
Bye | +0.050 |
goodbye | +0.049 |
Sure | +0.048 |
carriage | +0.045 |
Neg logit contributions | |
its | -0.072 |
aches | -0.065 |
ters | -0.063 |
ying | -0.063 |
ics | -0.062 |
Token | the |
Token ID | 262 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
joy | +0.079 |
Bye | +0.069 |
Sure | +0.066 |
goodbye | +0.066 |
carriage | +0.064 |
Neg logit contributions | |
its | -0.062 |
ters | -0.055 |
ying | -0.054 |
ade | -0.054 |
aches | -0.052 |
Token | herbs |
Token ID | 25411 |
Feature activation | +5.46e+00 |
Pos logit contributions | |
its | +0.020 |
ying | +0.018 |
oving | +0.017 |
ics | +0.017 |
aches | +0.017 |
Neg logit contributions | |
joy | -0.023 |
carriage | -0.019 |
goodbye | -0.018 |
den | -0.018 |
arium | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | -7.93e-02 |
Pos logit contributions | |
its | +0.451 |
ters | +0.405 |
ying | +0.391 |
ade | +0.390 |
aches | +0.389 |
Neg logit contributions | |
joy | -0.464 |
Bye | -0.403 |
Sure | -0.386 |
goodbye | -0.378 |
carriage | -0.369 |
Token | tasted |
Token ID | 29187 |
Feature activation | +5.59e-01 |
Pos logit contributions | |
joy | +0.008 |
Bye | +0.007 |
Sure | +0.007 |
icol | +0.007 |
carriage | +0.007 |
Neg logit contributions | |
its | -0.005 |
ters | -0.005 |
aches | -0.005 |
ade | -0.004 |
ying | -0.004 |
Token | them |
Token ID | 606 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
its | +0.051 |
ying | +0.050 |
ics | +0.049 |
ikes | +0.049 |
organ | +0.049 |
Neg logit contributions | |
joy | -0.038 |
goodbye | -0.033 |
Bye | -0.027 |
content | -0.025 |
hearts | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
its | +0.281 |
ying | +0.260 |
ters | +0.251 |
ade | +0.247 |
idy | +0.247 |
Neg logit contributions | |
joy | -0.225 |
goodbye | -0.204 |
Bye | -0.193 |
Sure | -0.176 |
icol | -0.159 |
Token | The |
Token ID | 383 |
Feature activation | -3.27e+00 |
Pos logit contributions | |
its | +0.027 |
ters | +0.027 |
ade | +0.025 |
ying | +0.025 |
aches | +0.024 |
Neg logit contributions | |
joy | -0.025 |
Bye | -0.021 |
carriage | -0.020 |
lifetime | -0.020 |
icol | -0.019 |
Token | says |
Token ID | 1139 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
joy | +0.170 |
Bye | +0.160 |
goodbye | +0.146 |
Sure | +0.142 |
carriage | +0.132 |
Neg logit contributions | |
its | -0.217 |
aches | -0.209 |
ying | -0.208 |
ade | -0.205 |
ters | -0.202 |
Token | . |
Token ID | 13 |
Feature activation | -7.64e-01 |
Pos logit contributions | |
its | +0.088 |
ters | +0.081 |
ying | +0.077 |
ade | +0.076 |
aches | +0.075 |
Neg logit contributions | |
joy | -0.112 |
Bye | -0.101 |
Sure | -0.095 |
carriage | -0.092 |
icol | -0.092 |
Token | " |
Token ID | 366 |
Feature activation | +6.99e-02 |
Pos logit contributions | |
joy | +0.060 |
Bye | +0.053 |
Sure | +0.050 |
carriage | +0.047 |
goodbye | +0.047 |
Neg logit contributions | |
its | -0.068 |
ters | -0.064 |
ying | -0.061 |
ade | -0.061 |
aches | -0.060 |
Token | This |
Token ID | 1212 |
Feature activation | +7.60e-01 |
Pos logit contributions | |
ying | +0.005 |
its | +0.005 |
idy | +0.005 |
ade | +0.005 |
aches | +0.005 |
Neg logit contributions | |
joy | -0.006 |
Bye | -0.005 |
Sure | -0.005 |
bye | -0.004 |
lan | -0.004 |
Token | lemon |
Token ID | 18873 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
ying | +0.066 |
ters | +0.064 |
its | +0.064 |
oving | +0.062 |
idy | +0.061 |
Neg logit contributions | |
joy | -0.055 |
Bye | -0.047 |
Sure | -0.043 |
goodbye | -0.042 |
icol | -0.040 |
Token | ade |
Token ID | 671 |
Feature activation | +8.77e+00 |
Pos logit contributions | |
its | +0.414 |
convince | +0.410 |
ters | +0.402 |
oving | +0.400 |
have | +0.397 |
Neg logit contributions | |
joy | -0.292 |
Bye | -0.273 |
Sure | -0.246 |
goodbye | -0.237 |
arium | -0.230 |
Token | is |
Token ID | 318 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
its | +0.741 |
ters | +0.731 |
ying | +0.708 |
organ | +0.685 |
idy | +0.682 |
Neg logit contributions | |
joy | -0.606 |
Bye | -0.560 |
Sure | -0.499 |
goodbye | -0.493 |
icol | -0.468 |
Token | bad |
Token ID | 2089 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
joy | +0.162 |
Bye | +0.153 |
goodbye | +0.144 |
Sure | +0.137 |
icol | +0.134 |
Neg logit contributions | |
its | -0.127 |
ying | -0.119 |
ters | -0.115 |
idy | -0.110 |
ics | -0.109 |
Token | . |
Token ID | 13 |
Feature activation | -6.94e-01 |
Pos logit contributions | |
its | +0.201 |
ters | +0.184 |
ying | +0.177 |
aches | +0.176 |
ade | +0.176 |
Neg logit contributions | |
joy | -0.228 |
Bye | -0.204 |
Sure | -0.192 |
goodbye | -0.184 |
carriage | -0.183 |
Token | It |
Token ID | 632 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
joy | +0.058 |
Bye | +0.049 |
carriage | +0.048 |
Sure | +0.046 |
icol | +0.045 |
Neg logit contributions | |
its | -0.059 |
ters | -0.055 |
ying | -0.051 |
ade | -0.051 |
aches | -0.050 |
Token | tastes |
Token ID | 18221 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
Bye | +0.067 |
joy | +0.063 |
Sure | +0.059 |
goodbye | +0.057 |
icol | +0.053 |
Neg logit contributions | |
ying | -0.085 |
its | -0.084 |
ters | -0.081 |
ics | -0.078 |
aches | -0.077 |
Token | very |
Token ID | 845 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
its | +0.071 |
ters | +0.063 |
ying | +0.060 |
ade | +0.060 |
aches | +0.058 |
Neg logit contributions | |
joy | -0.127 |
Bye | -0.115 |
Sure | -0.110 |
goodbye | -0.107 |
carriage | -0.107 |
Token | proud |
Token ID | 6613 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
joy | +0.030 |
Bye | +0.027 |
goodbye | +0.025 |
Sure | +0.025 |
carriage | +0.023 |
Neg logit contributions | |
its | -0.030 |
ters | -0.029 |
ade | -0.027 |
ying | -0.027 |
idy | -0.027 |
Token | of |
Token ID | 286 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
joy | +0.119 |
Bye | +0.112 |
Sure | +0.107 |
icol | +0.105 |
carriage | +0.104 |
Neg logit contributions | |
its | -0.045 |
ters | -0.042 |
ying | -0.040 |
ade | -0.039 |
idy | -0.037 |
Token | her |
Token ID | 607 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
its | +0.065 |
ters | +0.058 |
ade | +0.054 |
ying | +0.053 |
aches | +0.052 |
Neg logit contributions | |
joy | -0.138 |
Bye | -0.125 |
Sure | -0.120 |
goodbye | -0.117 |
carriage | -0.115 |
Token | clever |
Token ID | 14169 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
its | +0.082 |
ters | +0.075 |
ying | +0.071 |
ade | +0.071 |
aches | +0.070 |
Neg logit contributions | |
joy | -0.118 |
Bye | -0.106 |
Sure | -0.101 |
carriage | -0.097 |
goodbye | -0.097 |
Token | idea |
Token ID | 2126 |
Feature activation | +7.71e+00 |
Pos logit contributions | |
its | +0.076 |
ters | +0.070 |
ying | +0.068 |
ade | +0.065 |
aches | +0.065 |
Neg logit contributions | |
joy | -0.116 |
Bye | -0.101 |
goodbye | -0.097 |
Sure | -0.097 |
carriage | -0.095 |
Token | . |
Token ID | 13 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
ters | +0.410 |
its | +0.405 |
ying | +0.405 |
ade | +0.377 |
idy | +0.367 |
Neg logit contributions | |
joy | -0.807 |
Bye | -0.750 |
icol | -0.731 |
Sure | -0.726 |
habitats | -0.707 |
Token |
|
Token ID | 198 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
its | +0.018 |
ters | +0.016 |
ade | +0.016 |
ying | +0.016 |
idy | +0.015 |
Neg logit contributions | |
joy | -0.029 |
Bye | -0.026 |
carriage | -0.025 |
icol | -0.024 |
lair | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
its | +0.029 |
ters | +0.029 |
ying | +0.026 |
aches | +0.026 |
ade | +0.026 |
Neg logit contributions | |
joy | -0.023 |
Sure | -0.020 |
Bye | -0.020 |
goodbye | -0.018 |
arium | -0.018 |
Token | One |
Token ID | 3198 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
its | +0.032 |
ters | +0.032 |
ying | +0.032 |
aches | +0.030 |
ble | +0.029 |
Neg logit contributions | |
joy | -0.021 |
Bye | -0.020 |
Sure | -0.019 |
arium | -0.017 |
habitats | -0.017 |
Token | day |
Token ID | 1110 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
joy | +0.116 |
Bye | +0.100 |
icol | +0.099 |
Sure | +0.095 |
carriage | +0.093 |
Neg logit contributions | |
its | -0.086 |
ade | -0.081 |
ying | -0.080 |
ters | -0.080 |
idy | -0.077 |
Token | so |
Token ID | 523 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
joy | +0.196 |
Bye | +0.177 |
Sure | +0.170 |
carriage | +0.164 |
icol | +0.163 |
Neg logit contributions | |
its | -0.114 |
ters | -0.104 |
ying | -0.098 |
ade | -0.098 |
aches | -0.096 |
Token | much |
Token ID | 881 |
Feature activation | -3.57e+00 |
Pos logit contributions | |
its | +0.206 |
ade | +0.184 |
ters | +0.184 |
aches | +0.178 |
ying | +0.176 |
Neg logit contributions | |
joy | -0.246 |
Bye | -0.217 |
Sure | -0.209 |
icol | -0.205 |
carriage | -0.203 |
Token | fun |
Token ID | 1257 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
joy | +0.324 |
Bye | +0.289 |
Sure | +0.271 |
goodbye | +0.267 |
icol | +0.258 |
Neg logit contributions | |
its | -0.267 |
ters | -0.255 |
ying | -0.247 |
aches | -0.237 |
idy | -0.232 |
Token | with |
Token ID | 351 |
Feature activation | -6.12e-01 |
Pos logit contributions | |
its | +0.051 |
ters | +0.047 |
ying | +0.045 |
ade | +0.044 |
aches | +0.044 |
Neg logit contributions | |
joy | -0.061 |
Bye | -0.054 |
Sure | -0.051 |
goodbye | -0.049 |
carriage | -0.049 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
joy | +0.053 |
Bye | +0.045 |
Sure | +0.043 |
goodbye | +0.043 |
carriage | +0.041 |
Neg logit contributions | |
its | -0.049 |
ters | -0.045 |
ade | -0.044 |
ying | -0.044 |
aches | -0.043 |
Token | bubbles |
Token ID | 25037 |
Feature activation | +6.95e+00 |
Pos logit contributions | |
its | +0.007 |
ying | +0.007 |
ters | +0.007 |
aches | +0.006 |
organ | +0.006 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.009 |
goodbye | -0.009 |
carriage | -0.009 |
habitats | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +4.24e-02 |
Pos logit contributions | |
its | +0.503 |
ters | +0.471 |
ying | +0.446 |
ade | +0.445 |
aches | +0.434 |
Neg logit contributions | |
joy | -0.657 |
Bye | -0.588 |
Sure | -0.562 |
icol | -0.539 |
carriage | -0.534 |
Token | When |
Token ID | 1649 |
Feature activation | -6.25e-01 |
Pos logit contributions | |
its | +0.003 |
ters | +0.003 |
ade | +0.002 |
idea | +0.002 |
organ | +0.002 |
Neg logit contributions | |
joy | -0.004 |
carriage | -0.004 |
lifetime | -0.004 |
Bye | -0.003 |
icol | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
joy | +0.074 |
icol | +0.067 |
Bye | +0.066 |
spine | +0.066 |
Sure | +0.065 |
Neg logit contributions | |
its | -0.028 |
ters | -0.025 |
ade | -0.025 |
aches | -0.025 |
ics | -0.022 |
Token | was |
Token ID | 373 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
joy | +0.031 |
Bye | +0.028 |
Sure | +0.026 |
goodbye | +0.025 |
carriage | +0.025 |
Neg logit contributions | |
its | -0.027 |
ters | -0.025 |
ying | -0.024 |
aches | -0.024 |
idy | -0.023 |
Token | time |
Token ID | 640 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
its | +0.075 |
ters | +0.068 |
ying | +0.065 |
ade | +0.063 |
aches | +0.063 |
Neg logit contributions | |
joy | -0.114 |
Bye | -0.103 |
Sure | -0.097 |
goodbye | -0.095 |
carriage | -0.094 |
Token | Lily |
Token ID | 20037 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
its | +0.000 |
ying | +0.000 |
aches | +0.000 |
ters | +0.000 |
ade | +0.000 |
Neg logit contributions | |
joy | -0.000 |
Bye | -0.000 |
Sure | -0.000 |
goodbye | -0.000 |
icol | -0.000 |
Token | 's |
Token ID | 338 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
its | +0.023 |
ters | +0.021 |
ying | +0.020 |
ade | +0.020 |
aches | +0.020 |
Neg logit contributions | |
joy | -0.028 |
Bye | -0.025 |
Sure | -0.024 |
carriage | -0.023 |
goodbye | -0.023 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
its | +0.228 |
ters | +0.213 |
ade | +0.208 |
aches | +0.205 |
ying | +0.200 |
Neg logit contributions | |
joy | -0.274 |
Bye | -0.247 |
Sure | -0.235 |
icol | -0.224 |
lifetime | -0.212 |
Token | packed |
Token ID | 11856 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
joy | +0.115 |
Bye | +0.102 |
Sure | +0.100 |
carriage | +0.096 |
arium | +0.092 |
Neg logit contributions | |
its | -0.124 |
ters | -0.112 |
ying | -0.108 |
aches | -0.105 |
ade | -0.103 |
Token | a |
Token ID | 257 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
joy | +0.309 |
goodbye | +0.273 |
Bye | +0.268 |
Sure | +0.266 |
icol | +0.254 |
Neg logit contributions | |
its | -0.248 |
ters | -0.227 |
ying | -0.222 |
idy | -0.208 |
aches | -0.205 |
Token | green |
Token ID | 4077 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
joy | +0.023 |
Bye | +0.020 |
Sure | +0.019 |
carriage | +0.019 |
goodbye | +0.019 |
Neg logit contributions | |
its | -0.021 |
ters | -0.020 |
ying | -0.019 |
idy | -0.018 |
aches | -0.018 |
Token | basket |
Token ID | 7988 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
its | +0.043 |
ters | +0.040 |
ade | +0.038 |
ying | +0.038 |
aches | +0.037 |
Neg logit contributions | |
joy | -0.053 |
Bye | -0.047 |
Sure | -0.045 |
icol | -0.043 |
goodbye | -0.043 |
Token | with |
Token ID | 351 |
Feature activation | -5.92e-01 |
Pos logit contributions | |
joy | +0.162 |
Bye | +0.145 |
habitats | +0.140 |
icol | +0.140 |
Sure | +0.132 |
Neg logit contributions | |
ters | -0.077 |
ade | -0.073 |
its | -0.071 |
ying | -0.071 |
ics | -0.066 |
Token | y |
Token ID | 331 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
joy | +0.058 |
Bye | +0.051 |
goodbye | +0.050 |
carriage | +0.049 |
Sure | +0.048 |
Neg logit contributions | |
its | -0.043 |
ying | -0.039 |
ters | -0.037 |
aches | -0.035 |
idy | -0.035 |
Token | ummy |
Token ID | 13513 |
Feature activation | +6.86e-02 |
Pos logit contributions | |
its | +0.236 |
ters | +0.226 |
ying | +0.217 |
aches | +0.212 |
ade | +0.205 |
Neg logit contributions | |
joy | -0.229 |
Bye | -0.197 |
Sure | -0.185 |
icol | -0.181 |
goodbye | -0.179 |
Token | sandwiches |
Token ID | 29777 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
its | +0.005 |
ying | +0.005 |
ters | +0.005 |
oving | +0.005 |
ble | +0.005 |
Neg logit contributions | |
joy | -0.006 |
goodbye | -0.005 |
carriage | -0.005 |
Bye | -0.005 |
Sure | -0.005 |
Token | soft |
Token ID | 2705 |
Feature activation | +7.48e-01 |
Pos logit contributions | |
joy | +0.070 |
Bye | +0.062 |
Sure | +0.059 |
goodbye | +0.057 |
carriage | +0.057 |
Neg logit contributions | |
its | -0.050 |
ters | -0.045 |
ying | -0.044 |
ade | -0.043 |
aches | -0.042 |
Token | and |
Token ID | 290 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
its | +0.057 |
ters | +0.053 |
ying | +0.050 |
ade | +0.050 |
aches | +0.049 |
Neg logit contributions | |
joy | -0.068 |
Bye | -0.061 |
Sure | -0.058 |
carriage | -0.055 |
icol | -0.055 |
Token | wet |
Token ID | 9583 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
joy | +0.130 |
Bye | +0.115 |
Sure | +0.113 |
icol | +0.110 |
carriage | +0.110 |
Neg logit contributions | |
its | -0.058 |
ters | -0.052 |
aches | -0.049 |
ade | -0.048 |
ying | -0.046 |
Token | . |
Token ID | 13 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
its | +0.166 |
ters | +0.153 |
ying | +0.146 |
ade | +0.145 |
aches | +0.144 |
Neg logit contributions | |
joy | -0.199 |
Bye | -0.177 |
Sure | -0.168 |
carriage | -0.161 |
goodbye | -0.161 |
Token | It |
Token ID | 632 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
joy | +0.085 |
carriage | +0.076 |
Bye | +0.073 |
icol | +0.071 |
lifetime | +0.071 |
Neg logit contributions | |
its | -0.053 |
ters | -0.049 |
idy | -0.043 |
ying | -0.043 |
she | -0.042 |
Token | was |
Token ID | 373 |
Feature activation | +4.92e-01 |
Pos logit contributions | |
joy | +0.114 |
Bye | +0.101 |
Sure | +0.098 |
icol | +0.094 |
carriage | +0.093 |
Neg logit contributions | |
its | -0.076 |
ters | -0.068 |
ade | -0.065 |
aches | -0.064 |
ying | -0.064 |
Token | an |
Token ID | 281 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
its | +0.032 |
ters | +0.029 |
ying | +0.027 |
ade | +0.027 |
aches | +0.027 |
Neg logit contributions | |
joy | -0.051 |
Bye | -0.046 |
Sure | -0.044 |
carriage | -0.042 |
icol | -0.042 |
Token | unusual |
Token ID | 8468 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
joy | +0.011 |
Bye | +0.010 |
Sure | +0.009 |
goodbye | +0.009 |
carriage | +0.009 |
Neg logit contributions | |
its | -0.008 |
ters | -0.008 |
ade | -0.007 |
aches | -0.007 |
ying | -0.007 |
Token | word |
Token ID | 1573 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
its | +0.191 |
ade | +0.170 |
ters | +0.170 |
aches | +0.162 |
ying | +0.161 |
Neg logit contributions | |
joy | -0.270 |
Bye | -0.244 |
Sure | -0.232 |
carriage | -0.226 |
icol | -0.223 |
Token | . |
Token ID | 13 |
Feature activation | -7.68e-01 |
Pos logit contributions | |
joy | +0.062 |
Bye | +0.054 |
Sure | +0.052 |
icol | +0.051 |
carriage | +0.050 |
Neg logit contributions | |
its | -0.047 |
ters | -0.045 |
ying | -0.042 |
ade | -0.042 |
aches | -0.041 |
Token | They |
Token ID | 1119 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
joy | +0.072 |
carriage | +0.063 |
Bye | +0.062 |
icol | +0.060 |
goodbye | +0.059 |
Neg logit contributions | |
its | -0.055 |
ters | -0.052 |
ying | -0.047 |
ade | -0.046 |
idy | -0.046 |
Token | smiled |
Token ID | 13541 |
Feature activation | -4.35e+00 |
Pos logit contributions | |
its | +0.139 |
ters | +0.129 |
ying | +0.126 |
aches | +0.123 |
ade | +0.123 |
Neg logit contributions | |
joy | -0.103 |
Bye | -0.087 |
Sure | -0.083 |
carriage | -0.079 |
goodbye | -0.079 |
Token | and |
Token ID | 290 |
Feature activation | -9.75e-02 |
Pos logit contributions | |
joy | +0.421 |
Bye | +0.410 |
Sure | +0.386 |
habitats | +0.382 |
carriage | +0.366 |
Neg logit contributions | |
ters | -0.266 |
its | -0.265 |
ying | -0.235 |
ade | -0.228 |
idy | -0.227 |
Token | said |
Token ID | 531 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
joy | +0.011 |
Bye | +0.010 |
Sure | +0.009 |
carriage | +0.009 |
habitats | +0.009 |
Neg logit contributions | |
its | -0.005 |
ters | -0.005 |
ade | -0.004 |
ying | -0.004 |
aches | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
its | +0.182 |
ters | +0.164 |
ying | +0.160 |
ade | +0.159 |
aches | +0.157 |
Neg logit contributions | |
joy | -0.173 |
Bye | -0.151 |
Sure | -0.144 |
goodbye | -0.141 |
icol | -0.135 |
Token | " |
Token ID | 366 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
its | +0.033 |
ters | +0.030 |
ade | +0.030 |
ying | +0.030 |
aches | +0.029 |
Neg logit contributions | |
joy | -0.028 |
Bye | -0.024 |
Sure | -0.023 |
goodbye | -0.022 |
carriage | -0.022 |
Token | Well |
Token ID | 5779 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
its | +0.041 |
ters | +0.037 |
ying | +0.035 |
ade | +0.035 |
aches | +0.035 |
Neg logit contributions | |
joy | -0.064 |
Bye | -0.057 |
Sure | -0.055 |
carriage | -0.052 |
icol | -0.052 |
Token | , |
Token ID | 11 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
its | +0.049 |
ters | +0.045 |
ying | +0.044 |
aches | +0.043 |
ade | +0.042 |
Neg logit contributions | |
joy | -0.065 |
Bye | -0.058 |
Sure | -0.056 |
carriage | -0.054 |
icol | -0.053 |
Token | it |
Token ID | 340 |
Feature activation | -4.12e-01 |
Pos logit contributions | |
its | +0.028 |
ters | +0.026 |
ying | +0.025 |
ade | +0.024 |
aches | +0.024 |
Neg logit contributions | |
joy | -0.036 |
Bye | -0.032 |
Sure | -0.030 |
carriage | -0.029 |
goodbye | -0.029 |
Token | looks |
Token ID | 3073 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
joy | +0.030 |
Bye | +0.029 |
Sure | +0.028 |
arium | +0.025 |
goodbye | +0.025 |
Neg logit contributions | |
its | -0.033 |
ying | -0.029 |
ters | -0.029 |
aches | -0.029 |
ade | -0.029 |
Token | like |
Token ID | 588 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
joy | +0.436 |
Bye | +0.391 |
Sure | +0.376 |
goodbye | +0.366 |
icol | +0.364 |
Neg logit contributions | |
its | -0.260 |
ters | -0.234 |
ying | -0.228 |
ade | -0.218 |
aches | -0.216 |
Token | you |
Token ID | 345 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
its | +0.071 |
ters | +0.067 |
ade | +0.062 |
aches | +0.062 |
ying | +0.061 |
Neg logit contributions | |
joy | -0.122 |
Bye | -0.110 |
Sure | -0.106 |
carriage | -0.102 |
icol | -0.102 |
Token | coat |
Token ID | 31434 |
Feature activation | +2.69e+00 |
Pos logit contributions | |
its | +0.121 |
ters | +0.116 |
ade | +0.115 |
ying | +0.106 |
aches | +0.105 |
Neg logit contributions | |
joy | -0.259 |
Bye | -0.236 |
Sure | -0.225 |
lifetime | -0.212 |
icol | -0.210 |
Token | and |
Token ID | 290 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ters | +0.149 |
its | +0.141 |
ying | +0.137 |
ade | +0.136 |
aches | +0.125 |
Neg logit contributions | |
joy | -0.288 |
Bye | -0.260 |
Sure | -0.251 |
lair | -0.240 |
habitats | -0.239 |
Token | boots |
Token ID | 14412 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
joy | +0.012 |
Bye | +0.010 |
Sure | +0.010 |
icol | +0.009 |
carriage | +0.009 |
Neg logit contributions | |
its | -0.007 |
ters | -0.007 |
ade | -0.007 |
aches | -0.006 |
ying | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
ters | +0.224 |
its | +0.222 |
ade | +0.213 |
ying | +0.206 |
aches | +0.195 |
Neg logit contributions | |
joy | -0.354 |
Bye | -0.320 |
Sure | -0.304 |
icol | -0.293 |
habitats | -0.289 |
Token | ran |
Token ID | 4966 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
joy | +0.013 |
Bye | +0.011 |
Sure | +0.011 |
icol | +0.010 |
carriage | +0.010 |
Neg logit contributions | |
its | -0.009 |
ters | -0.008 |
ade | -0.008 |
ying | -0.008 |
aches | -0.008 |
Token | outside |
Token ID | 2354 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
joy | +0.018 |
Bye | +0.017 |
Sure | +0.016 |
icol | +0.015 |
habitats | +0.015 |
Neg logit contributions | |
its | -0.010 |
ters | -0.009 |
ade | -0.009 |
ying | -0.009 |
aches | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
its | +0.060 |
ters | +0.060 |
ying | +0.056 |
ade | +0.054 |
aches | +0.050 |
Neg logit contributions | |
joy | -0.112 |
Bye | -0.106 |
icol | -0.100 |
habitats | -0.098 |
Sure | -0.097 |
Token | play |
Token ID | 711 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
joy | +0.035 |
Bye | +0.031 |
Sure | +0.029 |
goodbye | +0.029 |
carriage | +0.028 |
Neg logit contributions | |
its | -0.041 |
ters | -0.038 |
ying | -0.036 |
idy | -0.035 |
ade | -0.035 |
Token | in |
Token ID | 287 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
joy | +0.103 |
Bye | +0.089 |
Sure | +0.085 |
goodbye | +0.085 |
carriage | +0.082 |
Neg logit contributions | |
its | -0.105 |
ters | -0.092 |
ying | -0.091 |
idy | -0.091 |
aches | -0.090 |
Token | the |
Token ID | 262 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
its | +0.118 |
ters | +0.108 |
ade | +0.103 |
ying | +0.101 |
aches | +0.100 |
Neg logit contributions | |
joy | -0.190 |
Bye | -0.173 |
Sure | -0.164 |
icol | -0.160 |
goodbye | -0.158 |
Token | rain |
Token ID | 6290 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
its | +0.006 |
ters | +0.005 |
ade | +0.005 |
ying | +0.005 |
aches | +0.005 |
Neg logit contributions | |
joy | -0.012 |
Bye | -0.011 |
Sure | -0.011 |
goodbye | -0.010 |
carriage | -0.010 |
Token | years |
Token ID | 812 |
Feature activation | -7.42e+00 |
Pos logit contributions | |
its | +0.025 |
ters | +0.024 |
ying | +0.023 |
ade | +0.023 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.009 |
Sure | -0.008 |
carriage | -0.008 |
goodbye | -0.008 |
Token | old |
Token ID | 1468 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
joy | +0.776 |
Bye | +0.709 |
Sure | +0.675 |
icol | +0.651 |
goodbye | +0.629 |
Neg logit contributions | |
its | -0.458 |
ying | -0.420 |
ters | -0.415 |
ade | -0.409 |
idy | -0.401 |
Token | and |
Token ID | 290 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ters | +0.015 |
its | +0.013 |
idy | +0.012 |
ying | +0.011 |
ade | +0.011 |
Neg logit contributions | |
joy | -0.026 |
Bye | -0.024 |
Sure | -0.024 |
icol | -0.023 |
lifetime | -0.022 |
Token | loved |
Token ID | 6151 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
joy | +0.017 |
Bye | +0.015 |
Sure | +0.014 |
icol | +0.014 |
carriage | +0.014 |
Neg logit contributions | |
its | -0.013 |
ters | -0.012 |
aches | -0.012 |
ying | -0.012 |
ade | -0.011 |
Token | animals |
Token ID | 4695 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
joy | +0.103 |
Bye | +0.090 |
Sure | +0.085 |
carriage | +0.080 |
icol | +0.080 |
Neg logit contributions | |
its | -0.119 |
ters | -0.111 |
ying | -0.107 |
ade | -0.107 |
aches | -0.106 |
Token | . |
Token ID | 13 |
Feature activation | +9.23e-02 |
Pos logit contributions | |
its | +0.123 |
ters | +0.112 |
ying | +0.108 |
ade | +0.107 |
aches | +0.106 |
Neg logit contributions | |
joy | -0.134 |
Bye | -0.118 |
Sure | -0.111 |
goodbye | -0.108 |
carriage | -0.107 |
Token | |
Token ID | 220 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
its | +0.007 |
ters | +0.006 |
ying | +0.006 |
aches | +0.006 |
ade | +0.006 |
Neg logit contributions | |
joy | -0.009 |
Bye | -0.008 |
icol | -0.007 |
goodbye | -0.007 |
Sure | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
its | +0.010 |
ters | +0.010 |
aches | +0.009 |
ade | +0.009 |
idy | +0.009 |
Neg logit contributions | |
joy | -0.007 |
Sure | -0.006 |
Bye | -0.005 |
arium | -0.005 |
goodbye | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
its | +0.031 |
ters | +0.029 |
ying | +0.028 |
ade | +0.028 |
aches | +0.027 |
Neg logit contributions | |
joy | -0.028 |
Bye | -0.025 |
Sure | -0.024 |
carriage | -0.022 |
goodbye | -0.022 |
Token | One |
Token ID | 3198 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
its | +0.028 |
ters | +0.026 |
ying | +0.025 |
ade | +0.025 |
aches | +0.025 |
Neg logit contributions | |
joy | -0.034 |
Bye | -0.030 |
Sure | -0.029 |
goodbye | -0.027 |
icol | -0.027 |
Token | day |
Token ID | 1110 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
joy | +0.115 |
Bye | +0.098 |
icol | +0.096 |
Sure | +0.092 |
carriage | +0.092 |
Neg logit contributions | |
its | -0.083 |
ade | -0.078 |
ying | -0.078 |
idy | -0.076 |
ters | -0.076 |
Token | knew |
Token ID | 2993 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
its | +0.002 |
aches | +0.002 |
ade | +0.002 |
ters | +0.002 |
ying | +0.002 |
Neg logit contributions | |
joy | -0.004 |
Bye | -0.003 |
Sure | -0.003 |
spine | -0.003 |
icol | -0.003 |
Token | his |
Token ID | 465 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
joy | +0.230 |
Bye | +0.206 |
Sure | +0.195 |
icol | +0.194 |
carriage | +0.188 |
Neg logit contributions | |
its | -0.161 |
ying | -0.154 |
aches | -0.153 |
ters | -0.153 |
ade | -0.147 |
Token | wish |
Token ID | 4601 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
joy | +0.058 |
Bye | +0.051 |
Sure | +0.049 |
icol | +0.047 |
carriage | +0.046 |
Neg logit contributions | |
its | -0.046 |
ade | -0.042 |
ters | -0.041 |
idea | -0.041 |
aches | -0.041 |
Token | had |
Token ID | 550 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
joy | +0.274 |
Bye | +0.246 |
Sure | +0.236 |
icol | +0.232 |
habitats | +0.217 |
Neg logit contributions | |
its | -0.164 |
ade | -0.156 |
ying | -0.153 |
aches | -0.151 |
ters | -0.151 |
Token | come |
Token ID | 1282 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
joy | +0.210 |
Sure | +0.195 |
Bye | +0.194 |
icol | +0.190 |
carriage | +0.181 |
Neg logit contributions | |
its | -0.120 |
aches | -0.117 |
ters | -0.116 |
ade | -0.114 |
happen | -0.108 |
Token | true |
Token ID | 2081 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
joy | +0.158 |
Bye | +0.145 |
Sure | +0.138 |
icol | +0.136 |
habitats | +0.129 |
Neg logit contributions | |
its | -0.112 |
ters | -0.111 |
ying | -0.101 |
aches | -0.100 |
idy | -0.098 |
Token | . |
Token ID | 13 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
joy | +0.364 |
Bye | +0.353 |
Sure | +0.343 |
icol | +0.331 |
ugg | +0.312 |
Neg logit contributions | |
ters | -0.146 |
its | -0.137 |
ying | -0.127 |
idea | -0.124 |
ade | -0.124 |
Token | In |
Token ID | 554 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
its | +0.011 |
she | +0.010 |
ying | +0.010 |
ters | +0.009 |
sure | +0.009 |
Neg logit contributions | |
joy | -0.017 |
carriage | -0.015 |
icol | -0.014 |
habitats | -0.014 |
spine | -0.014 |
Token | his |
Token ID | 465 |
Feature activation | -8.12e-01 |
Pos logit contributions | |
Bye | +0.223 |
joy | +0.220 |
icol | +0.216 |
habitats | +0.210 |
Sure | +0.210 |
Neg logit contributions | |
its | -0.065 |
idea | -0.056 |
dishes | -0.055 |
happen | -0.054 |
ics | -0.053 |
Token | pocket |
Token ID | 10000 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
joy | +0.074 |
Bye | +0.066 |
Sure | +0.062 |
icol | +0.062 |
lan | +0.060 |
Neg logit contributions | |
idea | -0.054 |
do | -0.050 |
other | -0.049 |
chores | -0.048 |
plan | -0.047 |
Token | , |
Token ID | 11 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
joy | +0.623 |
Bye | +0.583 |
Sure | +0.538 |
icol | +0.537 |
habitats | +0.512 |
Neg logit contributions | |
its | -0.457 |
ters | -0.433 |
ying | -0.427 |
ade | -0.422 |
aches | -0.421 |
Token | . |
Token ID | 13 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
joy | +0.137 |
Bye | +0.121 |
Sure | +0.115 |
carriage | +0.110 |
goodbye | +0.110 |
Neg logit contributions | |
its | -0.115 |
ters | -0.106 |
ying | -0.102 |
ade | -0.101 |
aches | -0.100 |
Token | So |
Token ID | 1406 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
its | +0.001 |
ters | +0.001 |
ying | +0.001 |
she | +0.001 |
ade | +0.001 |
Neg logit contributions | |
joy | -0.002 |
carriage | -0.002 |
Bye | -0.002 |
icol | -0.002 |
lair | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -3.07e-02 |
Pos logit contributions | |
ters | +0.115 |
its | +0.105 |
aches | +0.099 |
ying | +0.095 |
idea | +0.089 |
Neg logit contributions | |
joy | -0.264 |
Bye | -0.241 |
icol | -0.232 |
habitats | -0.231 |
lair | -0.228 |
Token | farmer |
Token ID | 18739 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
joy | +0.003 |
Bye | +0.002 |
Sure | +0.002 |
carriage | +0.002 |
goodbye | +0.002 |
Neg logit contributions | |
its | -0.003 |
ters | -0.002 |
ying | -0.002 |
ade | -0.002 |
idy | -0.002 |
Token | decided |
Token ID | 3066 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
its | +0.026 |
ters | +0.024 |
ade | +0.023 |
ying | +0.023 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.035 |
Bye | -0.031 |
Sure | -0.029 |
icol | -0.029 |
carriage | -0.028 |
Token | to |
Token ID | 284 |
Feature activation | -4.28e-01 |
Pos logit contributions | |
its | +0.209 |
ters | +0.201 |
aches | +0.195 |
ying | +0.195 |
ade | +0.192 |
Neg logit contributions | |
joy | -0.242 |
Bye | -0.216 |
Sure | -0.206 |
icol | -0.202 |
carriage | -0.200 |
Token | give |
Token ID | 1577 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
joy | +0.038 |
Bye | +0.037 |
goodbye | +0.035 |
Sure | +0.034 |
carriage | +0.033 |
Neg logit contributions | |
its | -0.029 |
ters | -0.027 |
ying | -0.027 |
ade | -0.025 |
idy | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
its | +0.106 |
ters | +0.096 |
ying | +0.092 |
ade | +0.091 |
aches | +0.090 |
Neg logit contributions | |
joy | -0.145 |
Bye | -0.130 |
Sure | -0.124 |
goodbye | -0.120 |
carriage | -0.118 |
Token | lazy |
Token ID | 16931 |
Feature activation | +7.65e-01 |
Pos logit contributions | |
joy | +0.003 |
Bye | +0.003 |
goodbye | +0.003 |
carriage | +0.003 |
Sure | +0.003 |
Neg logit contributions | |
its | -0.003 |
ying | -0.002 |
ters | -0.002 |
ade | -0.002 |
idy | -0.002 |
Token | pig |
Token ID | 12967 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
its | +0.059 |
ters | +0.054 |
ying | +0.052 |
ade | +0.052 |
aches | +0.051 |
Neg logit contributions | |
joy | -0.070 |
Bye | -0.062 |
Sure | -0.058 |
carriage | -0.056 |
goodbye | -0.056 |
Token | a |
Token ID | 257 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
its | +0.137 |
ters | +0.130 |
ade | +0.124 |
aches | +0.123 |
ying | +0.122 |
Neg logit contributions | |
joy | -0.179 |
Bye | -0.160 |
Sure | -0.153 |
icol | -0.148 |
carriage | -0.145 |
Token | wished |
Token ID | 16555 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
its | +0.025 |
aches | +0.022 |
ters | +0.021 |
ade | +0.021 |
idy | +0.021 |
Neg logit contributions | |
joy | -0.040 |
Bye | -0.034 |
Sure | -0.033 |
icol | -0.032 |
carriage | -0.031 |
Token | Rose |
Token ID | 8049 |
Feature activation | -2.82e+00 |
Pos logit contributions | |
joy | +0.280 |
Bye | +0.259 |
icol | +0.250 |
carriage | +0.250 |
Sure | +0.243 |
Neg logit contributions | |
ters | -0.112 |
its | -0.107 |
ying | -0.103 |
aches | -0.095 |
idy | -0.092 |
Token | was |
Token ID | 373 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
joy | +0.263 |
Bye | +0.231 |
Sure | +0.222 |
icol | +0.220 |
carriage | +0.207 |
Neg logit contributions | |
its | -0.209 |
ters | -0.197 |
ade | -0.195 |
aches | -0.192 |
ying | -0.191 |
Token | with |
Token ID | 351 |
Feature activation | -9.03e-01 |
Pos logit contributions | |
its | +0.021 |
ters | +0.020 |
aches | +0.019 |
ying | +0.019 |
ade | +0.018 |
Neg logit contributions | |
joy | -0.034 |
Bye | -0.031 |
Sure | -0.030 |
icol | -0.029 |
carriage | -0.028 |
Token | her |
Token ID | 607 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
joy | +0.109 |
Bye | +0.099 |
Sure | +0.096 |
icol | +0.093 |
carriage | +0.093 |
Neg logit contributions | |
its | -0.043 |
ters | -0.037 |
idy | -0.035 |
aches | -0.034 |
ade | -0.034 |
Token | , |
Token ID | 11 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
its | +0.032 |
ters | +0.031 |
aches | +0.028 |
ade | +0.028 |
ying | +0.028 |
Neg logit contributions | |
joy | -0.049 |
Bye | -0.047 |
Sure | -0.044 |
icol | -0.042 |
carriage | -0.040 |
Token | she |
Token ID | 673 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
joy | +0.068 |
Bye | +0.062 |
icol | +0.060 |
Sure | +0.060 |
carriage | +0.058 |
Neg logit contributions | |
its | -0.028 |
ters | -0.027 |
ying | -0.025 |
aches | -0.024 |
idy | -0.023 |
Token | missed |
Token ID | 6825 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
its | +0.028 |
ters | +0.025 |
idy | +0.024 |
ade | +0.024 |
aches | +0.023 |
Neg logit contributions | |
joy | -0.047 |
Bye | -0.040 |
Sure | -0.040 |
icol | -0.039 |
spine | -0.037 |
Token | her |
Token ID | 607 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
joy | +0.423 |
Bye | +0.394 |
Sure | +0.379 |
carriage | +0.372 |
icol | +0.371 |
Neg logit contributions | |
its | -0.165 |
ters | -0.154 |
aches | -0.137 |
ying | -0.135 |
ade | -0.132 |
Token | so |
Token ID | 523 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
its | +0.030 |
ters | +0.029 |
ade | +0.027 |
ying | +0.027 |
aches | +0.027 |
Neg logit contributions | |
joy | -0.040 |
Bye | -0.037 |
Sure | -0.035 |
icol | -0.034 |
carriage | -0.032 |
Token | much |
Token ID | 881 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
its | +0.157 |
idy | +0.132 |
aches | +0.131 |
ade | +0.130 |
ters | +0.122 |
Neg logit contributions | |
joy | -0.246 |
Bye | -0.225 |
icol | -0.221 |
Sure | -0.215 |
carriage | -0.207 |
Token | didn |
Token ID | 1422 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
joy | +0.263 |
Bye | +0.238 |
Sure | +0.228 |
goodbye | +0.217 |
icol | +0.214 |
Neg logit contributions | |
its | -0.195 |
ters | -0.185 |
ying | -0.176 |
aches | -0.171 |
ade | -0.168 |
Token | 't |
Token ID | 470 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
ins | +0.109 |
its | +0.107 |
ters | +0.105 |
ying | +0.105 |
aches | +0.104 |
Neg logit contributions | |
Bye | -0.103 |
Sure | -0.087 |
joy | -0.084 |
goodbye | -0.083 |
Goodbye | -0.078 |
Token | mean |
Token ID | 1612 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
its | +0.231 |
ics | +0.224 |
ying | +0.223 |
ters | +0.219 |
oons | +0.214 |
Neg logit contributions | |
joy | -0.284 |
Bye | -0.280 |
bye | -0.248 |
dreamed | -0.236 |
bye | -0.236 |
Token | to |
Token ID | 284 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
its | +0.398 |
ters | +0.375 |
ying | +0.361 |
aches | +0.359 |
ade | +0.358 |
Neg logit contributions | |
joy | -0.259 |
Bye | -0.222 |
goodbye | -0.200 |
Sure | -0.195 |
icol | -0.180 |
Token | break |
Token ID | 2270 |
Feature activation | +7.53e-01 |
Pos logit contributions | |
joy | +0.017 |
Bye | +0.017 |
Sure | +0.015 |
bye | +0.015 |
goodbye | +0.015 |
Neg logit contributions | |
its | -0.013 |
ying | -0.013 |
ters | -0.012 |
ade | -0.012 |
aches | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
its | +0.062 |
ade | +0.056 |
ters | +0.055 |
ying | +0.055 |
aches | +0.054 |
Neg logit contributions | |
joy | -0.063 |
Bye | -0.055 |
Sure | -0.051 |
goodbye | -0.050 |
icol | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | +6.60e-01 |
Pos logit contributions | |
joy | +0.012 |
Bye | +0.012 |
goodbye | +0.011 |
Sure | +0.010 |
bye | +0.010 |
Neg logit contributions | |
its | -0.017 |
aches | -0.016 |
affles | -0.015 |
ying | -0.015 |
ters | -0.015 |
Token | I |
Token ID | 314 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
ters | +0.045 |
its | +0.045 |
ying | +0.039 |
she | +0.039 |
idy | +0.039 |
Neg logit contributions | |
joy | -0.064 |
carriage | -0.053 |
arium | -0.051 |
lair | -0.051 |
lifetime | -0.049 |
Token | will |
Token ID | 481 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
joy | +0.266 |
Bye | +0.240 |
Sure | +0.229 |
goodbye | +0.219 |
icol | +0.217 |
Neg logit contributions | |
its | -0.191 |
ters | -0.179 |
ying | -0.171 |
ade | -0.165 |
aches | -0.165 |
Token | help |
Token ID | 1037 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
joy | +0.098 |
Bye | +0.092 |
Sure | +0.085 |
goodbye | +0.084 |
icol | +0.082 |
Neg logit contributions | |
its | -0.087 |
ters | -0.083 |
ying | -0.081 |
ade | -0.078 |
idy | -0.076 |
Token | you |
Token ID | 345 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
its | +0.090 |
ade | +0.081 |
ying | +0.078 |
ters | +0.077 |
aches | +0.076 |
Neg logit contributions | |
joy | -0.088 |
Bye | -0.085 |
Sure | -0.079 |
goodbye | -0.075 |
bye | -0.071 |
Token | ! |
Token ID | 0 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
joy | +0.213 |
Bye | +0.190 |
Sure | +0.181 |
carriage | +0.174 |
goodbye | +0.173 |
Neg logit contributions | |
its | -0.165 |
ters | -0.153 |
ying | -0.145 |
ade | -0.144 |
aches | -0.142 |
Token | Soup |
Token ID | 34011 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
joy | +0.193 |
carriage | +0.158 |
lifetime | +0.155 |
habitats | +0.152 |
icol | +0.150 |
Neg logit contributions | |
its | -0.182 |
ters | -0.175 |
ying | -0.156 |
ade | -0.154 |
idy | -0.152 |
Token | !" |
Token ID | 2474 |
Feature activation | +8.43e-01 |
Pos logit contributions | |
joy | +0.083 |
Bye | +0.080 |
Sure | +0.073 |
goodbye | +0.070 |
icol | +0.069 |
Neg logit contributions | |
its | -0.084 |
ters | -0.077 |
ying | -0.076 |
aches | -0.075 |
idy | -0.074 |
Token | Tom |
Token ID | 4186 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
its | +0.069 |
ters | +0.065 |
ying | +0.061 |
ade | +0.061 |
aches | +0.061 |
Neg logit contributions | |
joy | -0.071 |
Bye | -0.062 |
Sure | -0.058 |
carriage | -0.057 |
icol | -0.057 |
Token | laughs |
Token ID | 22051 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
joy | +0.184 |
Bye | +0.168 |
Sure | +0.157 |
goodbye | +0.150 |
icol | +0.146 |
Neg logit contributions | |
its | -0.192 |
ters | -0.187 |
ying | -0.185 |
aches | -0.177 |
idy | -0.176 |
Token | and |
Token ID | 290 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
its | +0.115 |
ters | +0.107 |
ying | +0.102 |
ade | +0.101 |
aches | +0.100 |
Neg logit contributions | |
joy | -0.130 |
Bye | -0.115 |
Sure | -0.110 |
carriage | -0.105 |
icol | -0.104 |
Token | says |
Token ID | 1139 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
joy | +0.099 |
Bye | +0.090 |
Sure | +0.085 |
goodbye | +0.082 |
carriage | +0.081 |
Neg logit contributions | |
its | -0.072 |
ters | -0.066 |
ying | -0.064 |
ade | -0.063 |
aches | -0.062 |
Token | " |
Token ID | 366 |
Feature activation | +6.12e-02 |
Pos logit contributions | |
its | +0.089 |
ters | +0.083 |
ying | +0.079 |
ade | +0.079 |
aches | +0.078 |
Neg logit contributions | |
joy | -0.088 |
Bye | -0.077 |
Sure | -0.074 |
carriage | -0.071 |
icol | -0.070 |
Token | Good |
Token ID | 10248 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
its | +0.005 |
ying | +0.004 |
ters | +0.004 |
aches | +0.004 |
idy | +0.004 |
Neg logit contributions | |
joy | -0.005 |
Bye | -0.005 |
Sure | -0.005 |
icol | -0.004 |
goodbye | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -5.20e-01 |
Pos logit contributions | |
joy | +0.191 |
Bye | +0.164 |
Sure | +0.160 |
carriage | +0.157 |
arium | +0.153 |
Neg logit contributions | |
its | -0.138 |
ters | -0.127 |
ade | -0.120 |
ying | -0.114 |
aches | -0.113 |
Token | tank |
Token ID | 6873 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
joy | +0.047 |
Bye | +0.042 |
Sure | +0.040 |
carriage | +0.038 |
icol | +0.038 |
Neg logit contributions | |
its | -0.040 |
ters | -0.037 |
ying | -0.035 |
ade | -0.035 |
aches | -0.035 |
Token | they |
Token ID | 484 |
Feature activation | -4.65e-02 |
Pos logit contributions | |
its | +0.052 |
ters | +0.050 |
aches | +0.048 |
ade | +0.046 |
ying | +0.045 |
Neg logit contributions | |
joy | -0.109 |
icol | -0.094 |
Bye | -0.094 |
carriage | -0.091 |
Sure | -0.090 |
Token | could |
Token ID | 714 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
joy | +0.005 |
icol | +0.004 |
Sure | +0.004 |
Bye | +0.004 |
spine | +0.004 |
Neg logit contributions | |
its | -0.003 |
ade | -0.003 |
aches | -0.002 |
ters | -0.002 |
ics | -0.002 |
Token | find |
Token ID | 1064 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
joy | +0.162 |
Bye | +0.148 |
Sure | +0.140 |
goodbye | +0.139 |
carriage | +0.137 |
Neg logit contributions | |
its | -0.106 |
ters | -0.100 |
ying | -0.094 |
ade | -0.091 |
idy | -0.089 |
Token | a |
Token ID | 257 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
its | +0.018 |
ters | +0.018 |
ade | +0.016 |
aches | +0.016 |
idy | +0.016 |
Neg logit contributions | |
joy | -0.043 |
Bye | -0.039 |
icol | -0.037 |
spine | -0.037 |
Sure | -0.037 |
Token | park |
Token ID | 3952 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
joy | +0.064 |
Bye | +0.059 |
Sure | +0.056 |
icol | +0.055 |
habitats | +0.053 |
Neg logit contributions | |
its | -0.036 |
ade | -0.033 |
ters | -0.033 |
aches | -0.032 |
whip | -0.030 |
Token | where |
Token ID | 810 |
Feature activation | -6.65e+00 |
Pos logit contributions | |
joy | +0.125 |
icol | +0.116 |
Bye | +0.114 |
Sure | +0.111 |
spine | +0.108 |
Neg logit contributions | |
ade | -0.059 |
ters | -0.058 |
aches | -0.055 |
ying | -0.054 |
its | -0.053 |
Token | dogs |
Token ID | 6844 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
joy | +0.650 |
Bye | +0.577 |
Sure | +0.554 |
icol | +0.541 |
carriage | +0.530 |
Neg logit contributions | |
its | -0.459 |
ters | -0.427 |
ade | -0.408 |
ying | -0.408 |
aches | -0.401 |
Token | were |
Token ID | 547 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
its | +0.164 |
ters | +0.151 |
ying | +0.144 |
ade | +0.143 |
aches | +0.141 |
Neg logit contributions | |
joy | -0.213 |
Bye | -0.189 |
Sure | -0.181 |
carriage | -0.173 |
icol | -0.173 |
Token | allowed |
Token ID | 3142 |
Feature activation | +2.53e+00 |
Pos logit contributions | |
its | +0.086 |
ters | +0.079 |
ying | +0.076 |
ade | +0.075 |
aches | +0.074 |
Neg logit contributions | |
joy | -0.114 |
Bye | -0.102 |
Sure | -0.097 |
carriage | -0.093 |
goodbye | -0.093 |
Token | . |
Token ID | 13 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
its | +0.196 |
ters | +0.193 |
ying | +0.181 |
ade | +0.178 |
idy | +0.174 |
Neg logit contributions | |
joy | -0.221 |
Bye | -0.193 |
Sure | -0.184 |
icol | -0.184 |
carriage | -0.179 |
Token | A |
Token ID | 317 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
joy | +0.068 |
carriage | +0.059 |
Bye | +0.057 |
lifetime | +0.057 |
goodbye | +0.057 |
Neg logit contributions | |
its | -0.042 |
ters | -0.036 |
ade | -0.034 |
ying | -0.032 |
aches | -0.031 |
Token | And |
Token ID | 843 |
Feature activation | -4.90e+00 |
Pos logit contributions | |
joy | +0.017 |
Bye | +0.013 |
icol | +0.013 |
carriage | +0.013 |
Sure | +0.013 |
Neg logit contributions | |
its | -0.015 |
ters | -0.015 |
ying | -0.014 |
idy | -0.013 |
have | -0.013 |
Token | yes |
Token ID | 3763 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
joy | +0.493 |
Bye | +0.438 |
Sure | +0.420 |
icol | +0.408 |
carriage | +0.405 |
Neg logit contributions | |
its | -0.327 |
ters | -0.304 |
ying | -0.287 |
aches | -0.284 |
ade | -0.280 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
joy | +0.234 |
Bye | +0.210 |
Sure | +0.197 |
goodbye | +0.190 |
carriage | +0.188 |
Neg logit contributions | |
its | -0.229 |
ters | -0.212 |
ying | -0.204 |
ade | -0.202 |
aches | -0.199 |
Token | it |
Token ID | 340 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
joy | +0.010 |
Bye | +0.009 |
Sure | +0.009 |
carriage | +0.008 |
icol | +0.008 |
Neg logit contributions | |
its | -0.007 |
ters | -0.007 |
ying | -0.006 |
ade | -0.006 |
aches | -0.006 |
Token | is |
Token ID | 318 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
joy | +0.047 |
Bye | +0.042 |
Sure | +0.040 |
carriage | +0.038 |
goodbye | +0.038 |
Neg logit contributions | |
its | -0.041 |
ters | -0.038 |
ying | -0.036 |
ade | -0.036 |
aches | -0.035 |
Token | far |
Token ID | 1290 |
Feature activation | -6.91e+00 |
Pos logit contributions | |
joy | +0.169 |
Bye | +0.150 |
Sure | +0.146 |
icol | +0.141 |
carriage | +0.139 |
Neg logit contributions | |
its | -0.097 |
ters | -0.089 |
aches | -0.085 |
ying | -0.083 |
ade | -0.082 |
Token | . |
Token ID | 13 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
joy | +0.624 |
Bye | +0.554 |
Sure | +0.525 |
goodbye | +0.507 |
carriage | +0.506 |
Neg logit contributions | |
its | -0.533 |
ters | -0.490 |
ying | -0.470 |
ade | -0.468 |
aches | -0.462 |
Token | We |
Token ID | 775 |
Feature activation | -4.80e+00 |
Pos logit contributions | |
joy | +0.019 |
icol | +0.014 |
carriage | +0.014 |
lair | +0.014 |
Bye | +0.014 |
Neg logit contributions | |
ters | -0.017 |
its | -0.017 |
ying | -0.015 |
have | -0.015 |
idy | -0.014 |
Token | have |
Token ID | 423 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
joy | +0.426 |
Bye | +0.393 |
Sure | +0.368 |
carriage | +0.365 |
goodbye | +0.360 |
Neg logit contributions | |
its | -0.354 |
ters | -0.329 |
ying | -0.318 |
ade | -0.312 |
idy | -0.309 |
Token | to |
Token ID | 284 |
Feature activation | -4.55e-01 |
Pos logit contributions | |
aches | +0.041 |
its | +0.039 |
ters | +0.038 |
ade | +0.036 |
have | +0.035 |
Neg logit contributions | |
joy | -0.063 |
icol | -0.059 |
Sure | -0.057 |
Bye | -0.056 |
spine | -0.053 |
Token | drive |
Token ID | 3708 |
Feature activation | -3.03e+00 |
Pos logit contributions | |
joy | +0.041 |
Bye | +0.039 |
goodbye | +0.036 |
carriage | +0.036 |
Sure | +0.036 |
Neg logit contributions | |
its | -0.032 |
ying | -0.030 |
ters | -0.030 |
ade | -0.029 |
idy | -0.029 |
Token | . |
Token ID | 13 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
joy | +0.763 |
Bye | +0.691 |
icol | +0.676 |
Sure | +0.672 |
carriage | +0.619 |
Neg logit contributions | |
its | -0.492 |
ters | -0.491 |
ying | -0.451 |
ade | -0.436 |
aches | -0.436 |
Token | The |
Token ID | 383 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
its | +0.007 |
ters | +0.007 |
ade | +0.006 |
ying | +0.006 |
she | +0.006 |
Neg logit contributions | |
joy | -0.010 |
carriage | -0.009 |
spine | -0.008 |
icol | -0.008 |
lair | -0.008 |
Token | rock |
Token ID | 3881 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
joy | +0.353 |
Bye | +0.330 |
Sure | +0.322 |
icol | +0.313 |
goodbye | +0.290 |
Neg logit contributions | |
its | -0.226 |
ters | -0.220 |
aches | -0.202 |
ade | -0.198 |
ying | -0.190 |
Token | sung |
Token ID | 23568 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
its | +0.165 |
ters | +0.152 |
ade | +0.150 |
aches | +0.149 |
ying | +0.143 |
Neg logit contributions | |
joy | -0.267 |
Bye | -0.242 |
Sure | -0.231 |
icol | -0.228 |
spine | -0.211 |
Token | so |
Token ID | 523 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
joy | +0.247 |
Bye | +0.227 |
Sure | +0.215 |
icol | +0.211 |
carriage | +0.207 |
Neg logit contributions | |
ters | -0.163 |
its | -0.163 |
ade | -0.146 |
ying | -0.145 |
idy | -0.138 |
Token | beautifully |
Token ID | 21104 |
Feature activation | -6.32e+00 |
Pos logit contributions | |
its | +0.173 |
ters | +0.149 |
ade | +0.145 |
aches | +0.143 |
ying | +0.142 |
Neg logit contributions | |
joy | -0.278 |
Bye | -0.242 |
icol | -0.238 |
spine | -0.236 |
lair | -0.235 |
Token | that |
Token ID | 326 |
Feature activation | -6.02e-01 |
Pos logit contributions | |
joy | +0.619 |
Bye | +0.563 |
Sure | +0.523 |
lair | +0.513 |
carriage | +0.506 |
Neg logit contributions | |
its | -0.426 |
ters | -0.405 |
ying | -0.393 |
ade | -0.382 |
aches | -0.380 |
Token | people |
Token ID | 661 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
joy | +0.070 |
Bye | +0.063 |
icol | +0.062 |
Sure | +0.061 |
carriage | +0.061 |
Neg logit contributions | |
its | -0.028 |
ters | -0.027 |
ying | -0.026 |
aches | -0.024 |
idy | -0.024 |
Token | from |
Token ID | 422 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
its | +0.136 |
ters | +0.127 |
ying | +0.122 |
aches | +0.118 |
ade | +0.118 |
Neg logit contributions | |
joy | -0.189 |
Bye | -0.167 |
Sure | -0.161 |
icol | -0.156 |
carriage | -0.151 |
Token | far |
Token ID | 1290 |
Feature activation | -6.88e+00 |
Pos logit contributions | |
its | +0.124 |
squash | +0.123 |
ters | +0.118 |
happen | +0.112 |
lled | +0.111 |
Neg logit contributions | |
joy | -0.340 |
Sure | -0.316 |
Bye | -0.314 |
ari | -0.306 |
icol | -0.302 |
Token | away |
Token ID | 1497 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
joy | +0.705 |
Bye | +0.656 |
Sure | +0.627 |
icol | +0.590 |
lair | +0.581 |
Neg logit contributions | |
its | -0.443 |
ters | -0.423 |
ying | -0.393 |
ade | -0.374 |
idy | -0.369 |
Token | learned |
Token ID | 4499 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
its | +0.068 |
ade | +0.062 |
aches | +0.061 |
idy | +0.059 |
ters | +0.059 |
Neg logit contributions | |
joy | -0.105 |
Sure | -0.089 |
Bye | -0.089 |
spine | -0.088 |
icol | -0.084 |
Token | an |
Token ID | 281 |
Feature activation | +1.29e-01 |
Pos logit contributions | |
joy | +0.361 |
Bye | +0.319 |
Sure | +0.302 |
goodbye | +0.295 |
carriage | +0.285 |
Neg logit contributions | |
its | -0.352 |
ters | -0.325 |
ying | -0.311 |
ade | -0.307 |
aches | -0.303 |
Token | important |
Token ID | 1593 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
ters | +0.009 |
its | +0.009 |
ics | +0.008 |
aches | +0.008 |
ade | +0.008 |
Neg logit contributions | |
joy | -0.011 |
Bye | -0.010 |
goodbye | -0.010 |
habitats | -0.009 |
bye | -0.009 |
Token | lesson |
Token ID | 11483 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
its | +0.147 |
ade | +0.126 |
ters | +0.123 |
ying | +0.117 |
aches | +0.115 |
Neg logit contributions | |
joy | -0.327 |
Bye | -0.295 |
carriage | -0.280 |
Sure | -0.277 |
icol | -0.274 |
Token | : |
Token ID | 25 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ying | +0.135 |
its | +0.135 |
ters | +0.128 |
idy | +0.126 |
ade | +0.120 |
Neg logit contributions | |
joy | -0.220 |
Bye | -0.195 |
icol | -0.190 |
carriage | -0.188 |
Sure | -0.186 |
Token | never |
Token ID | 1239 |
Feature activation | -6.18e+00 |
Pos logit contributions | |
its | +0.090 |
ters | +0.083 |
ying | +0.077 |
idy | +0.076 |
aches | +0.075 |
Neg logit contributions | |
joy | -0.120 |
Bye | -0.103 |
carriage | -0.100 |
icol | -0.100 |
Sure | -0.100 |
Token | be |
Token ID | 307 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
joy | +0.579 |
Bye | +0.520 |
Sure | +0.486 |
goodbye | +0.483 |
carriage | +0.461 |
Neg logit contributions | |
its | -0.457 |
ters | -0.415 |
ying | -0.396 |
ade | -0.394 |
aches | -0.384 |
Token | afraid |
Token ID | 7787 |
Feature activation | +5.13e-01 |
Pos logit contributions | |
joy | +0.113 |
Bye | +0.100 |
Sure | +0.095 |
goodbye | +0.093 |
carriage | +0.092 |
Neg logit contributions | |
its | -0.070 |
ters | -0.061 |
ade | -0.059 |
ying | -0.059 |
aches | -0.057 |
Token | to |
Token ID | 284 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
its | +0.040 |
ters | +0.037 |
ying | +0.035 |
ade | +0.035 |
aches | +0.035 |
Neg logit contributions | |
joy | -0.046 |
Bye | -0.041 |
Sure | -0.039 |
goodbye | -0.037 |
carriage | -0.037 |
Token | express |
Token ID | 4911 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
joy | +0.020 |
Bye | +0.019 |
goodbye | +0.017 |
icol | +0.017 |
Sure | +0.017 |
Neg logit contributions | |
its | -0.019 |
ying | -0.018 |
ters | -0.018 |
ade | -0.017 |
oons | -0.017 |
Token | her |
Token ID | 607 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
its | +0.073 |
ters | +0.067 |
ying | +0.063 |
aches | +0.061 |
ade | +0.060 |
Neg logit contributions | |
joy | -0.142 |
Bye | -0.130 |
Sure | -0.125 |
carriage | -0.121 |
icol | -0.120 |
Token | day |
Token ID | 1110 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
its | +0.161 |
ade | +0.149 |
aches | +0.144 |
ying | +0.143 |
ters | +0.143 |
Neg logit contributions | |
joy | -0.191 |
Bye | -0.175 |
icol | -0.167 |
Sure | -0.166 |
carriage | -0.152 |
Token | the |
Token ID | 262 |
Feature activation | +3.97e-01 |
Pos logit contributions | |
joy | +0.108 |
Bye | +0.095 |
Sure | +0.091 |
goodbye | +0.087 |
carriage | +0.087 |
Neg logit contributions | |
its | -0.095 |
ters | -0.087 |
ying | -0.084 |
ade | -0.083 |
aches | -0.082 |
Token | fountain |
Token ID | 29420 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
its | +0.029 |
ters | +0.026 |
ying | +0.026 |
ade | +0.025 |
aches | +0.025 |
Neg logit contributions | |
joy | -0.037 |
Bye | -0.033 |
Sure | -0.032 |
carriage | -0.031 |
goodbye | -0.031 |
Token | made |
Token ID | 925 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
its | +0.151 |
ters | +0.139 |
ying | +0.133 |
ade | +0.132 |
aches | +0.131 |
Neg logit contributions | |
joy | -0.175 |
Bye | -0.155 |
Sure | -0.147 |
goodbye | -0.141 |
carriage | -0.141 |
Token | his |
Token ID | 465 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
joy | +0.092 |
goodbye | +0.079 |
Bye | +0.078 |
Sure | +0.076 |
carriage | +0.070 |
Neg logit contributions | |
its | -0.087 |
ying | -0.079 |
ters | -0.077 |
aches | -0.077 |
ade | -0.075 |
Token | heart |
Token ID | 2612 |
Feature activation | -7.43e+00 |
Pos logit contributions | |
joy | +0.053 |
Bye | +0.048 |
Sure | +0.045 |
icol | +0.043 |
carriage | +0.042 |
Neg logit contributions | |
its | -0.043 |
ters | -0.039 |
aches | -0.038 |
ade | -0.038 |
ying | -0.037 |
Token | feel |
Token ID | 1254 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
joy | +0.743 |
Bye | +0.660 |
goodbye | +0.637 |
Sure | +0.632 |
carriage | +0.627 |
Neg logit contributions | |
its | -0.486 |
ters | -0.440 |
ying | -0.424 |
ade | -0.408 |
idy | -0.403 |
Token | happy |
Token ID | 3772 |
Feature activation | -7.94e-01 |
Pos logit contributions | |
its | +0.223 |
ters | +0.203 |
ying | +0.194 |
ade | +0.190 |
aches | +0.188 |
Neg logit contributions | |
joy | -0.344 |
Bye | -0.308 |
Sure | -0.292 |
goodbye | -0.289 |
carriage | -0.283 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
joy | +0.076 |
Bye | +0.071 |
Sure | +0.068 |
icol | +0.064 |
carriage | +0.064 |
Neg logit contributions | |
its | -0.053 |
ters | -0.051 |
ying | -0.048 |
ade | -0.048 |
aches | -0.046 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
its | +0.001 |
ters | +0.001 |
ying | +0.001 |
ade | +0.001 |
idy | +0.001 |
Neg logit contributions | |
joy | -0.002 |
Bye | -0.001 |
carriage | -0.001 |
icol | -0.001 |
goodbye | -0.001 |
Token | Once |
Token ID | 7454 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
its | +0.114 |
ters | +0.106 |
ying | +0.102 |
ade | +0.101 |
aches | +0.100 |
Neg logit contributions | |
joy | -0.124 |
Bye | -0.109 |
Sure | -0.104 |
carriage | -0.098 |
goodbye | -0.098 |