Token | . |
Token ID | 13 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
mie | +0.339 |
elope | +0.327 |
etsy | +0.321 |
jo | +0.316 |
hew | +0.316 |
Neg logit contributions | |
trick | -0.212 |
show | -0.209 |
my | -0.191 |
test | -0.190 |
new | -0.189 |
Token | The |
Token ID | 383 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
mie | +0.051 |
hew | +0.048 |
ppy | +0.048 |
etsy | +0.048 |
lves | +0.047 |
Neg logit contributions | |
show | -0.044 |
new | -0.042 |
grown | -0.041 |
my | -0.041 |
to | -0.040 |
Token | next |
Token ID | 1306 |
Feature activation | -6.70e-02 |
Pos logit contributions | |
show | +0.014 |
new | +0.013 |
trick | +0.012 |
grown | +0.012 |
magic | +0.012 |
Neg logit contributions | |
mie | -0.028 |
etsy | -0.027 |
jo | -0.027 |
storms | -0.027 |
ppy | -0.026 |
Token | day |
Token ID | 1110 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
show | +0.063 |
trick | +0.059 |
making | +0.056 |
new | +0.054 |
grown | +0.051 |
Neg logit contributions | |
mie | -0.156 |
elope | -0.154 |
etsy | -0.153 |
jo | -0.151 |
pillar | -0.148 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
mie | +0.058 |
etsy | +0.057 |
hew | +0.056 |
jo | +0.056 |
lves | +0.055 |
Neg logit contributions | |
show | -0.011 |
new | -0.010 |
trick | -0.009 |
grown | -0.009 |
to | -0.008 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
och | +0.221 |
oled | +0.193 |
cases | +0.184 |
etsy | +0.181 |
oped | +0.180 |
Neg logit contributions | |
show | -0.578 |
to | -0.567 |
new | -0.567 |
for | -0.566 |
time | -0.559 |
Token | went |
Token ID | 1816 |
Feature activation | -9.86e-02 |
Pos logit contributions | |
mie | +0.798 |
etsy | +0.788 |
elope | +0.754 |
hew | +0.751 |
jo | +0.746 |
Neg logit contributions | |
show | -0.729 |
trick | -0.675 |
new | -0.670 |
grown | -0.652 |
to | -0.635 |
Token | outside |
Token ID | 2354 |
Feature activation | -4.27e-02 |
Pos logit contributions | |
trick | +0.096 |
color | +0.091 |
original | +0.086 |
show | +0.086 |
style | +0.082 |
Neg logit contributions | |
mie | -0.220 |
etsy | -0.204 |
jo | -0.201 |
elope | -0.199 |
och | -0.195 |
Token | to |
Token ID | 284 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
trick | +0.042 |
show | +0.038 |
test | +0.036 |
new | +0.036 |
magic | +0.035 |
Neg logit contributions | |
mie | -0.097 |
elope | -0.095 |
jo | -0.093 |
storms | -0.091 |
etsy | -0.091 |
Token | pick |
Token ID | 2298 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
trick | +0.237 |
new | +0.226 |
making | +0.213 |
matching | +0.211 |
for | +0.210 |
Neg logit contributions | |
mie | -0.519 |
elope | -0.508 |
etsy | -0.475 |
hew | -0.460 |
jo | -0.459 |
Token | more |
Token ID | 517 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
show | +0.077 |
new | +0.072 |
trick | +0.065 |
my | +0.055 |
for | +0.055 |
Neg logit contributions | |
mie | -0.357 |
etsy | -0.355 |
jo | -0.348 |
elope | -0.347 |
hew | -0.347 |
Token | this |
Token ID | 428 |
Feature activation | -4.51e-02 |
Pos logit contributions | |
show | +0.118 |
trick | +0.104 |
new | +0.102 |
grown | +0.090 |
making | +0.088 |
Neg logit contributions | |
mie | -0.444 |
etsy | -0.434 |
hew | -0.424 |
elope | -0.424 |
jo | -0.420 |
Token | special |
Token ID | 2041 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
show | +0.045 |
trick | +0.044 |
my | +0.041 |
test | +0.040 |
grown | +0.040 |
Neg logit contributions | |
mie | -0.096 |
elope | -0.092 |
jo | -0.092 |
storms | -0.089 |
hew | -0.088 |
Token | lamp |
Token ID | 20450 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
show | +0.109 |
trick | +0.105 |
my | +0.103 |
new | +0.099 |
making | +0.098 |
Neg logit contributions | |
mie | -0.257 |
elope | -0.253 |
jo | -0.250 |
etsy | -0.246 |
pillar | -0.245 |
Token | that |
Token ID | 326 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
mie | +0.557 |
etsy | +0.543 |
elope | +0.530 |
hew | +0.529 |
jo | +0.523 |
Neg logit contributions | |
show | -0.259 |
trick | -0.241 |
new | -0.233 |
grown | -0.216 |
test | -0.213 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
mie | +0.016 |
etsy | +0.016 |
hew | +0.015 |
elope | +0.015 |
jo | +0.015 |
Neg logit contributions | |
show | -0.010 |
trick | -0.009 |
new | -0.009 |
grown | -0.009 |
making | -0.009 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
etsy | +0.265 |
lves | +0.257 |
mie | +0.250 |
ongo | +0.244 |
och | +0.243 |
Neg logit contributions | |
show | -0.518 |
trick | -0.496 |
new | -0.477 |
grown | -0.477 |
for | -0.475 |
Token | had |
Token ID | 550 |
Feature activation | -3.85e-02 |
Pos logit contributions | |
etsy | +0.825 |
mie | +0.813 |
rified | +0.775 |
uddy | +0.774 |
hew | +0.774 |
Neg logit contributions | |
show | -0.721 |
trick | -0.650 |
new | -0.647 |
grown | -0.634 |
making | -0.634 |
Token | ! |
Token ID | 0 |
Feature activation | +3.31e-02 |
Pos logit contributions | |
show | +0.056 |
trick | +0.054 |
new | +0.052 |
test | +0.050 |
my | +0.048 |
Neg logit contributions | |
mie | -0.072 |
etsy | -0.068 |
elope | -0.067 |
hew | -0.067 |
jo | -0.066 |
Token | |
Token ID | 220 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
ppa | +0.077 |
ppers | +0.076 |
lves | +0.075 |
mie | +0.074 |
pper | +0.074 |
Neg logit contributions | |
my | -0.038 |
the | -0.036 |
show | -0.035 |
your | -0.035 |
to | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
mie | +0.471 |
rified | +0.470 |
lves | +0.469 |
ley | +0.464 |
ppa | +0.453 |
Neg logit contributions | |
new | -0.177 |
to | -0.169 |
the | -0.164 |
big | -0.146 |
your | -0.146 |
Token |
|
Token ID | 198 |
Feature activation | +8.43e-02 |
Pos logit contributions | |
rified | +0.214 |
storms | +0.210 |
lves | +0.208 |
mie | +0.207 |
ley | +0.207 |
Neg logit contributions | |
new | -0.084 |
show | -0.081 |
the | -0.078 |
grown | -0.076 |
big | -0.073 |
Token | " |
Token ID | 1 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
mie | +0.117 |
etsy | +0.108 |
jo | +0.106 |
hew | +0.106 |
ongo | +0.105 |
Neg logit contributions | |
show | -0.185 |
trick | -0.175 |
new | -0.175 |
grown | -0.174 |
my | -0.174 |
Token | Hello |
Token ID | 15496 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
jo | +0.193 |
mie | +0.189 |
hew | +0.186 |
uddy | +0.184 |
apa | +0.178 |
Neg logit contributions | |
show | -0.201 |
color | -0.190 |
trick | -0.188 |
grown | -0.184 |
blue | -0.184 |
Token | !" |
Token ID | 2474 |
Feature activation | +7.26e-02 |
Pos logit contributions | |
etsy | +0.044 |
mie | +0.044 |
jo | +0.044 |
hew | +0.043 |
storms | +0.043 |
Neg logit contributions | |
show | -0.011 |
new | -0.011 |
my | -0.009 |
trick | -0.009 |
for | -0.008 |
Token | said |
Token ID | 531 |
Feature activation | +3.22e-02 |
Pos logit contributions | |
mie | +0.127 |
hew | +0.125 |
etsy | +0.125 |
ongo | +0.124 |
x | +0.122 |
Neg logit contributions | |
show | -0.129 |
the | -0.118 |
new | -0.113 |
my | -0.113 |
trick | -0.111 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
mie | +0.057 |
hew | +0.056 |
etsy | +0.055 |
jo | +0.053 |
ongo | +0.052 |
Neg logit contributions | |
show | -0.054 |
new | -0.050 |
trick | -0.050 |
my | -0.048 |
to | -0.048 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
och | +0.234 |
lves | +0.228 |
oled | +0.217 |
oped | +0.213 |
aden | +0.206 |
Neg logit contributions | |
to | -0.581 |
trick | -0.544 |
the | -0.543 |
new | -0.543 |
show | -0.537 |
Token | in |
Token ID | 287 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
mie | +1.143 |
etsy | +1.126 |
hew | +1.118 |
storms | +1.089 |
lves | +1.088 |
Neg logit contributions | |
show | -0.386 |
trick | -0.339 |
new | -0.335 |
to | -0.323 |
making | -0.306 |
Token | a |
Token ID | 257 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
trick | +0.146 |
show | +0.145 |
new | +0.133 |
for | +0.129 |
making | +0.122 |
Neg logit contributions | |
mie | -0.534 |
elope | -0.527 |
etsy | -0.507 |
rified | -0.505 |
pillar | -0.502 |
Token | cautious |
Token ID | 21205 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
show | +0.103 |
trick | +0.097 |
new | +0.088 |
test | +0.084 |
making | +0.084 |
Neg logit contributions | |
mie | -0.308 |
elope | -0.299 |
etsy | -0.298 |
jo | -0.292 |
pillar | -0.289 |
Token | voice |
Token ID | 3809 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
show | +0.019 |
trick | +0.017 |
new | +0.017 |
grown | +0.016 |
test | +0.016 |
Neg logit contributions | |
mie | -0.034 |
etsy | -0.033 |
elope | -0.033 |
hew | -0.032 |
jo | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
mie | +0.256 |
etsy | +0.247 |
elope | +0.244 |
jo | +0.241 |
hew | +0.239 |
Neg logit contributions | |
show | -0.119 |
trick | -0.112 |
new | -0.109 |
grown | -0.102 |
test | -0.100 |
Token | . |
Token ID | 13 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
mie | +0.217 |
etsy | +0.212 |
hew | +0.210 |
elope | +0.210 |
jo | +0.206 |
Neg logit contributions | |
show | -0.078 |
new | -0.073 |
trick | -0.072 |
for | -0.068 |
to | -0.068 |
Token | |
Token ID | 220 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
x | +0.070 |
ppers | +0.069 |
ppa | +0.069 |
pper | +0.069 |
ppy | +0.068 |
Neg logit contributions | |
the | -0.032 |
show | -0.031 |
new | -0.031 |
to | -0.031 |
my | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | +8.65e-02 |
Pos logit contributions | |
rified | +0.443 |
ley | +0.440 |
mie | +0.433 |
storms | +0.430 |
lves | +0.424 |
Neg logit contributions | |
new | -0.201 |
to | -0.194 |
the | -0.190 |
show | -0.184 |
your | -0.183 |
Token |
|
Token ID | 198 |
Feature activation | +8.53e-02 |
Pos logit contributions | |
mie | +0.190 |
storms | +0.185 |
rified | +0.183 |
lves | +0.183 |
x | +0.181 |
Neg logit contributions | |
show | -0.107 |
new | -0.103 |
trick | -0.096 |
grown | -0.095 |
the | -0.095 |
Token | Pen |
Token ID | 25553 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
mie | +0.154 |
storms | +0.146 |
etsy | +0.144 |
ongo | +0.142 |
jo | +0.141 |
Neg logit contributions | |
show | -0.137 |
trick | -0.129 |
new | -0.128 |
grown | -0.127 |
my | -0.125 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
mie | +0.129 |
och | +0.126 |
etsy | +0.126 |
storms | +0.116 |
ongo | +0.111 |
Neg logit contributions | |
show | -0.620 |
trick | -0.598 |
new | -0.591 |
grown | -0.586 |
making | -0.580 |
Token | and |
Token ID | 290 |
Feature activation | -9.93e-02 |
Pos logit contributions | |
mie | +0.812 |
etsy | +0.795 |
elope | +0.762 |
hew | +0.762 |
jo | +0.756 |
Neg logit contributions | |
show | -0.705 |
trick | -0.659 |
new | -0.649 |
grown | -0.628 |
making | -0.612 |
Token | the |
Token ID | 262 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
show | +0.056 |
the | +0.043 |
new | +0.042 |
for | +0.037 |
trick | +0.036 |
Neg logit contributions | |
etsy | -0.291 |
mie | -0.289 |
hew | -0.285 |
oped | -0.283 |
och | -0.282 |
Token | bird |
Token ID | 6512 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
show | +0.191 |
new | +0.182 |
trick | +0.176 |
grown | +0.171 |
magic | +0.170 |
Neg logit contributions | |
jo | -0.261 |
mie | -0.259 |
etsy | -0.258 |
storms | -0.257 |
oped | -0.251 |
Token | stayed |
Token ID | 9658 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
mie | +0.528 |
etsy | +0.526 |
thel | +0.501 |
hew | +0.496 |
ongo | +0.496 |
Neg logit contributions | |
show | -0.458 |
new | -0.420 |
for | -0.406 |
trick | -0.406 |
to | -0.396 |
Token | friends |
Token ID | 2460 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
trick | +0.157 |
test | +0.148 |
math | +0.142 |
show | +0.141 |
quiz | +0.128 |
Neg logit contributions | |
mie | -0.274 |
elope | -0.273 |
hew | -0.248 |
ley | -0.242 |
etsy | -0.237 |
Token | very |
Token ID | 845 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
show | +0.104 |
trick | +0.094 |
new | +0.092 |
grown | +0.082 |
test | +0.079 |
Neg logit contributions | |
mie | -0.336 |
etsy | -0.323 |
hew | -0.320 |
elope | -0.318 |
jo | -0.318 |
Token | long |
Token ID | 890 |
Feature activation | -4.38e-02 |
Pos logit contributions | |
show | +0.138 |
trick | +0.135 |
making | +0.128 |
math | +0.119 |
test | +0.116 |
Neg logit contributions | |
elope | -0.395 |
etsy | -0.392 |
mie | -0.391 |
hew | -0.380 |
jo | -0.378 |
Token | time |
Token ID | 640 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
show | +0.024 |
trick | +0.020 |
new | +0.019 |
grown | +0.016 |
test | +0.015 |
Neg logit contributions | |
mie | -0.125 |
etsy | -0.122 |
elope | -0.120 |
hew | -0.120 |
jo | -0.119 |
Token | . |
Token ID | 13 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
show | +0.097 |
trick | +0.091 |
new | +0.086 |
test | +0.079 |
grown | +0.079 |
Neg logit contributions | |
mie | -0.255 |
etsy | -0.247 |
elope | -0.245 |
hew | -0.242 |
jo | -0.241 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
mie | +0.048 |
ppa | +0.047 |
ongo | +0.045 |
etsy | +0.045 |
och | +0.044 |
Neg logit contributions | |
show | -0.032 |
new | -0.030 |
to | -0.029 |
for | -0.029 |
the | -0.029 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
och | +0.145 |
etsy | +0.137 |
ongo | +0.135 |
mie | +0.130 |
oled | +0.120 |
Neg logit contributions | |
show | -0.626 |
trick | -0.606 |
new | -0.604 |
for | -0.595 |
the | -0.588 |
Token | was |
Token ID | 373 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.807 |
etsy | +0.782 |
elope | +0.756 |
hew | +0.753 |
jo | +0.747 |
Neg logit contributions | |
show | -0.707 |
trick | -0.668 |
new | -0.656 |
grown | -0.629 |
making | -0.618 |
Token | always |
Token ID | 1464 |
Feature activation | -8.87e-02 |
Pos logit contributions | |
show | +0.146 |
trick | +0.146 |
test | +0.131 |
new | +0.127 |
math | +0.121 |
Neg logit contributions | |
mie | -0.301 |
elope | -0.288 |
etsy | -0.280 |
jo | -0.272 |
hew | -0.270 |
Token | thankful |
Token ID | 25535 |
Feature activation | -5.59e-02 |
Pos logit contributions | |
trick | +0.108 |
show | +0.108 |
test | +0.100 |
math | +0.092 |
new | +0.089 |
Neg logit contributions | |
mie | -0.192 |
elope | -0.183 |
etsy | -0.172 |
rified | -0.169 |
jo | -0.168 |
Token | for |
Token ID | 329 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
trick | +0.035 |
show | +0.034 |
test | +0.031 |
matching | +0.027 |
design | +0.027 |
Neg logit contributions | |
mie | -0.144 |
elope | -0.141 |
etsy | -0.141 |
jo | -0.138 |
hew | -0.138 |
Token | how |
Token ID | 703 |
Feature activation | -9.75e-02 |
Pos logit contributions | |
show | +0.128 |
trick | +0.125 |
new | +0.101 |
test | +0.101 |
grown | +0.095 |
Neg logit contributions | |
mie | -0.573 |
elope | -0.556 |
etsy | -0.549 |
hew | -0.536 |
thel | -0.536 |
Token | in |
Token ID | 287 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
mie | +0.310 |
etsy | +0.306 |
ppy | +0.294 |
elope | +0.291 |
als | +0.290 |
Neg logit contributions | |
trick | -0.152 |
show | -0.139 |
math | -0.131 |
test | -0.129 |
new | -0.126 |
Token | her |
Token ID | 607 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
trick | +0.190 |
show | +0.175 |
test | +0.152 |
job | +0.144 |
quiz | +0.131 |
Neg logit contributions | |
mie | -0.504 |
elope | -0.499 |
Bear | -0.465 |
etsy | -0.459 |
Max | -0.458 |
Token | garden |
Token ID | 11376 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
show | +0.046 |
trick | +0.046 |
making | +0.040 |
test | +0.040 |
new | +0.040 |
Neg logit contributions | |
mie | -0.076 |
etsy | -0.073 |
elope | -0.073 |
hew | -0.071 |
pillar | -0.069 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
mie | +0.381 |
elope | +0.370 |
etsy | +0.369 |
hew | +0.357 |
storms | +0.349 |
Neg logit contributions | |
trick | -0.188 |
show | -0.177 |
test | -0.156 |
chance | -0.144 |
power | -0.143 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
new | +0.155 |
show | +0.152 |
the | +0.149 |
to | +0.144 |
grown | +0.141 |
Neg logit contributions | |
hew | -0.217 |
mie | -0.216 |
x | -0.212 |
ongo | -0.212 |
jo | -0.211 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
cases | +0.229 |
och | +0.221 |
oled | +0.209 |
oped | +0.207 |
rified | +0.203 |
Neg logit contributions | |
show | -0.559 |
to | -0.559 |
new | -0.549 |
the | -0.548 |
trick | -0.543 |
Token | heard |
Token ID | 2982 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
mie | +0.829 |
etsy | +0.811 |
jo | +0.788 |
elope | +0.774 |
storms | +0.774 |
Neg logit contributions | |
show | -0.692 |
new | -0.637 |
grown | -0.636 |
trick | -0.631 |
making | -0.617 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.071 |
trick | +0.063 |
new | +0.053 |
test | +0.051 |
making | +0.048 |
Neg logit contributions | |
mie | -0.315 |
etsy | -0.304 |
elope | -0.302 |
jo | -0.300 |
hew | -0.297 |
Token | whisper |
Token ID | 31992 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
show | +0.110 |
trick | +0.101 |
new | +0.096 |
grown | +0.088 |
test | +0.087 |
Neg logit contributions | |
mie | -0.316 |
etsy | -0.307 |
elope | -0.303 |
hew | -0.300 |
jo | -0.299 |
Token | coming |
Token ID | 2406 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
mie | +0.072 |
jo | +0.070 |
elope | +0.069 |
etsy | +0.068 |
storms | +0.068 |
Neg logit contributions | |
show | -0.041 |
my | -0.040 |
trick | -0.040 |
new | -0.039 |
your | -0.038 |
Token | from |
Token ID | 422 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
show | +0.086 |
trick | +0.079 |
new | +0.074 |
grown | +0.067 |
test | +0.067 |
Neg logit contributions | |
mie | -0.306 |
etsy | -0.298 |
elope | -0.296 |
jo | -0.293 |
hew | -0.289 |
Token | kind |
Token ID | 1611 |
Feature activation | -5.73e-02 |
Pos logit contributions | |
show | +0.141 |
trick | +0.132 |
new | +0.128 |
my | +0.124 |
making | +0.123 |
Neg logit contributions | |
mie | -0.270 |
etsy | -0.266 |
elope | -0.261 |
pillar | -0.255 |
jo | -0.254 |
Token | of |
Token ID | 286 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
show | +0.059 |
trick | +0.055 |
new | +0.053 |
grown | +0.049 |
test | +0.049 |
Neg logit contributions | |
mie | -0.135 |
etsy | -0.131 |
elope | -0.129 |
jo | -0.128 |
hew | -0.127 |
Token | answer |
Token ID | 3280 |
Feature activation | -7.69e-02 |
Pos logit contributions | |
show | +0.238 |
trick | +0.232 |
math | +0.225 |
matching | +0.225 |
my | +0.221 |
Neg logit contributions | |
elope | -0.480 |
mie | -0.480 |
pillar | -0.470 |
etsy | -0.457 |
jo | -0.456 |
Token | . |
Token ID | 13 |
Feature activation | +2.81e-02 |
Pos logit contributions | |
show | +0.074 |
trick | +0.069 |
new | +0.067 |
grown | +0.061 |
making | +0.060 |
Neg logit contributions | |
mie | -0.188 |
etsy | -0.183 |
hew | -0.179 |
elope | -0.178 |
jo | -0.176 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
mie | +0.052 |
etsy | +0.049 |
hew | +0.049 |
ppa | +0.048 |
lves | +0.048 |
Neg logit contributions | |
show | -0.045 |
new | -0.043 |
to | -0.042 |
grown | -0.041 |
my | -0.041 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
och | +0.193 |
ongo | +0.161 |
oled | +0.153 |
mie | +0.152 |
lves | +0.150 |
Neg logit contributions | |
show | -0.598 |
trick | -0.590 |
to | -0.583 |
new | -0.581 |
the | -0.570 |
Token | knew |
Token ID | 2993 |
Feature activation | -8.08e-02 |
Pos logit contributions | |
mie | +0.858 |
etsy | +0.839 |
hew | +0.812 |
elope | +0.805 |
jo | +0.804 |
Neg logit contributions | |
show | -0.661 |
trick | -0.615 |
new | -0.597 |
grown | -0.584 |
making | -0.566 |
Token | there |
Token ID | 612 |
Feature activation | +8.32e-02 |
Pos logit contributions | |
show | +0.088 |
new | +0.086 |
trick | +0.079 |
to | +0.077 |
for | +0.077 |
Neg logit contributions | |
etsy | -0.189 |
mie | -0.189 |
hew | -0.187 |
jo | -0.186 |
oped | -0.183 |
Token | must |
Token ID | 1276 |
Feature activation | -6.70e-02 |
Pos logit contributions | |
mie | +0.163 |
etsy | +0.159 |
hew | +0.156 |
ppa | +0.152 |
jo | +0.151 |
Neg logit contributions | |
show | -0.125 |
new | -0.119 |
trick | -0.117 |
grown | -0.112 |
making | -0.111 |
Token | be |
Token ID | 307 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
new | +0.056 |
show | +0.056 |
matching | +0.053 |
trick | +0.053 |
math | +0.053 |
Neg logit contributions | |
elope | -0.153 |
mie | -0.147 |
etsy | -0.143 |
hew | -0.142 |
jo | -0.139 |
Token | a |
Token ID | 257 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.097 |
trick | +0.088 |
new | +0.080 |
test | +0.078 |
grown | +0.073 |
Neg logit contributions | |
mie | -0.269 |
etsy | -0.261 |
elope | -0.259 |
hew | -0.255 |
jo | -0.253 |
Token | ! |
Token ID | 0 |
Feature activation | +3.31e-02 |
Pos logit contributions | |
show | +0.056 |
trick | +0.054 |
new | +0.052 |
test | +0.050 |
my | +0.048 |
Neg logit contributions | |
mie | -0.072 |
etsy | -0.068 |
elope | -0.067 |
hew | -0.067 |
jo | -0.066 |
Token | |
Token ID | 220 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
ppa | +0.077 |
ppers | +0.076 |
lves | +0.075 |
mie | +0.074 |
pper | +0.074 |
Neg logit contributions | |
my | -0.038 |
the | -0.036 |
show | -0.035 |
your | -0.035 |
to | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
mie | +0.471 |
rified | +0.470 |
lves | +0.469 |
ley | +0.464 |
ppa | +0.453 |
Neg logit contributions | |
new | -0.177 |
to | -0.169 |
the | -0.164 |
big | -0.146 |
your | -0.146 |
Token |
|
Token ID | 198 |
Feature activation | +8.43e-02 |
Pos logit contributions | |
rified | +0.214 |
storms | +0.210 |
lves | +0.208 |
mie | +0.207 |
ley | +0.207 |
Neg logit contributions | |
new | -0.084 |
show | -0.081 |
the | -0.078 |
grown | -0.076 |
big | -0.073 |
Token | Pen |
Token ID | 25553 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
mie | +0.162 |
storms | +0.160 |
rified | +0.159 |
ley | +0.154 |
lves | +0.152 |
Neg logit contributions | |
show | -0.125 |
grown | -0.118 |
trick | -0.117 |
my | -0.116 |
new | -0.116 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
mie | +0.146 |
etsy | +0.142 |
och | +0.140 |
lves | +0.136 |
ongo | +0.132 |
Neg logit contributions | |
show | -0.605 |
trick | -0.576 |
grown | -0.571 |
the | -0.566 |
new | -0.563 |
Token | used |
Token ID | 973 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
mie | +0.842 |
etsy | +0.827 |
elope | +0.793 |
hew | +0.792 |
jo | +0.786 |
Neg logit contributions | |
show | -0.670 |
trick | -0.624 |
new | -0.611 |
grown | -0.593 |
making | -0.579 |
Token | her |
Token ID | 607 |
Feature activation | -3.55e-02 |
Pos logit contributions | |
show | +0.137 |
trick | +0.129 |
test | +0.118 |
job | +0.107 |
grown | +0.106 |
Neg logit contributions | |
mie | -0.393 |
etsy | -0.378 |
elope | -0.368 |
jo | -0.366 |
apa | -0.364 |
Token | lamp |
Token ID | 20450 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
show | +0.030 |
trick | +0.029 |
making | +0.027 |
grown | +0.027 |
my | +0.026 |
Neg logit contributions | |
jo | -0.078 |
elope | -0.078 |
mie | -0.077 |
hew | -0.074 |
apa | -0.073 |
Token | every |
Token ID | 790 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.697 |
etsy | +0.680 |
elope | +0.673 |
jo | +0.668 |
hew | +0.662 |
Neg logit contributions | |
show | -0.119 |
trick | -0.100 |
new | -0.088 |
grown | -0.080 |
test | -0.074 |
Token | night |
Token ID | 1755 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
my | +0.147 |
your | +0.143 |
new | +0.142 |
matching | +0.140 |
trick | +0.138 |
Neg logit contributions | |
elope | -0.252 |
jo | -0.246 |
pillar | -0.240 |
mie | -0.239 |
etsy | -0.226 |
Token | , |
Token ID | 11 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
show | +0.116 |
new | +0.111 |
trick | +0.107 |
grown | +0.104 |
red | +0.102 |
Neg logit contributions | |
mie | -0.159 |
hew | -0.156 |
oped | -0.150 |
etsy | -0.149 |
storms | -0.148 |
Token | bright |
Token ID | 6016 |
Feature activation | -8.08e-02 |
Pos logit contributions | |
show | +0.077 |
trick | +0.071 |
new | +0.063 |
test | +0.058 |
grown | +0.057 |
Neg logit contributions | |
mie | -0.287 |
etsy | -0.280 |
elope | -0.276 |
hew | -0.272 |
jo | -0.271 |
Token | girl |
Token ID | 2576 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
show | +0.092 |
trick | +0.090 |
new | +0.082 |
making | +0.081 |
test | +0.079 |
Neg logit contributions | |
mie | -0.175 |
etsy | -0.169 |
elope | -0.167 |
pillar | -0.165 |
jo | -0.165 |
Token | named |
Token ID | 3706 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
mie | +0.476 |
etsy | +0.456 |
elope | +0.451 |
jo | +0.441 |
hew | +0.438 |
Neg logit contributions | |
show | -0.435 |
trick | -0.422 |
new | -0.410 |
grown | -0.391 |
test | -0.390 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
mie | +0.056 |
etsy | +0.053 |
elope | +0.053 |
jo | +0.053 |
hew | +0.052 |
Neg logit contributions | |
show | -0.039 |
trick | -0.037 |
new | -0.037 |
grown | -0.034 |
test | -0.034 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
rified | +0.345 |
cases | +0.343 |
lves | +0.343 |
och | +0.342 |
storms | +0.337 |
Neg logit contributions | |
to | -0.415 |
the | -0.408 |
show | -0.405 |
new | -0.405 |
time | -0.398 |
Token | . |
Token ID | 13 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
mie | +1.059 |
etsy | +1.031 |
hew | +1.007 |
elope | +1.002 |
jo | +0.998 |
Neg logit contributions | |
show | -0.460 |
trick | -0.420 |
new | -0.414 |
grown | -0.385 |
making | -0.376 |
Token | One |
Token ID | 1881 |
Feature activation | +4.79e-02 |
Pos logit contributions | |
mie | +0.038 |
hew | +0.035 |
etsy | +0.035 |
ppa | +0.034 |
lves | +0.034 |
Neg logit contributions | |
show | -0.050 |
new | -0.048 |
trick | -0.046 |
to | -0.046 |
grown | -0.046 |
Token | day |
Token ID | 1110 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
mie | +0.115 |
elope | +0.114 |
etsy | +0.113 |
jo | +0.111 |
pillar | +0.110 |
Neg logit contributions | |
show | -0.043 |
trick | -0.040 |
new | -0.036 |
making | -0.035 |
matching | -0.035 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
mie | +0.052 |
etsy | +0.051 |
elope | +0.050 |
jo | +0.048 |
hew | +0.048 |
Neg logit contributions | |
show | -0.016 |
trick | -0.015 |
new | -0.013 |
test | -0.012 |
grown | -0.012 |
Token | while |
Token ID | 981 |
Feature activation | -5.55e-02 |
Pos logit contributions | |
show | +0.183 |
new | +0.174 |
trick | +0.169 |
grown | +0.164 |
to | +0.164 |
Neg logit contributions | |
mie | -0.185 |
hew | -0.177 |
etsy | -0.173 |
jo | -0.173 |
storms | -0.168 |
Token | her |
Token ID | 607 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
show | +0.199 |
trick | +0.196 |
new | +0.191 |
grown | +0.169 |
making | +0.164 |
Neg logit contributions | |
mie | -0.645 |
elope | -0.623 |
etsy | -0.620 |
jo | -0.603 |
hew | -0.600 |
Token | and |
Token ID | 290 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
show | +0.043 |
trick | +0.043 |
grown | +0.039 |
new | +0.039 |
making | +0.038 |
Neg logit contributions | |
mie | -0.074 |
elope | -0.071 |
etsy | -0.070 |
jo | -0.068 |
hew | -0.068 |
Token | comfort |
Token ID | 4467 |
Feature activation | -5.75e-02 |
Pos logit contributions | |
show | +0.146 |
trick | +0.143 |
new | +0.138 |
grown | +0.131 |
test | +0.130 |
Neg logit contributions | |
mie | -0.193 |
etsy | -0.183 |
elope | -0.180 |
jo | -0.177 |
hew | -0.176 |
Token | ed |
Token ID | 276 |
Feature activation | -5.63e-02 |
Pos logit contributions | |
show | +0.038 |
to | +0.034 |
your | +0.032 |
new | +0.032 |
trick | +0.031 |
Neg logit contributions | |
mie | -0.154 |
lves | -0.154 |
hew | -0.153 |
elope | -0.153 |
etsy | -0.152 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
show | +0.049 |
trick | +0.043 |
new | +0.043 |
for | +0.038 |
grown | +0.038 |
Neg logit contributions | |
mie | -0.144 |
etsy | -0.141 |
elope | -0.139 |
hew | -0.139 |
jo | -0.137 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
lves | +0.323 |
storms | +0.314 |
och | +0.306 |
ongo | +0.304 |
cases | +0.301 |
Neg logit contributions | |
to | -0.442 |
the | -0.435 |
show | -0.434 |
for | -0.430 |
new | -0.425 |
Token | . |
Token ID | 13 |
Feature activation | +2.00e-02 |
Pos logit contributions | |
mie | +0.944 |
etsy | +0.924 |
hew | +0.896 |
jo | +0.894 |
elope | +0.890 |
Neg logit contributions | |
show | -0.570 |
new | -0.529 |
trick | -0.516 |
for | -0.495 |
to | -0.492 |
Token | " |
Token ID | 366 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
x | +0.043 |
lves | +0.043 |
ppers | +0.043 |
pper | +0.042 |
hew | +0.042 |
Neg logit contributions | |
my | -0.025 |
the | -0.024 |
to | -0.023 |
your | -0.023 |
new | -0.022 |
Token | I |
Token ID | 40 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
uddy | +0.171 |
cases | +0.166 |
jo | +0.165 |
storms | +0.163 |
isc | +0.163 |
Neg logit contributions | |
show | -0.155 |
my | -0.152 |
trick | -0.147 |
your | -0.145 |
color | -0.144 |
Token | told |
Token ID | 1297 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
mie | +0.203 |
etsy | +0.196 |
elope | +0.191 |
hew | +0.189 |
jo | +0.188 |
Neg logit contributions | |
show | -0.166 |
trick | -0.159 |
new | -0.155 |
grown | -0.148 |
test | -0.146 |
Token | you |
Token ID | 345 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
show | +0.138 |
my | +0.136 |
your | +0.130 |
new | +0.127 |
the | +0.126 |
Neg logit contributions | |
oped | -0.221 |
mie | -0.220 |
etsy | -0.215 |
lves | -0.214 |
ongo | -0.213 |
Token | mom |
Token ID | 1995 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
show | +0.034 |
trick | +0.032 |
new | +0.030 |
grown | +0.029 |
my | +0.028 |
Neg logit contributions | |
mie | -0.078 |
elope | -0.075 |
etsy | -0.075 |
jo | -0.074 |
hew | -0.073 |
Token | and |
Token ID | 290 |
Feature activation | -9.74e-02 |
Pos logit contributions | |
mie | +0.776 |
etsy | +0.772 |
hew | +0.753 |
elope | +0.746 |
storms | +0.745 |
Neg logit contributions | |
show | -0.250 |
new | -0.218 |
trick | -0.214 |
for | -0.213 |
to | -0.211 |
Token | dad |
Token ID | 9955 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
show | +0.127 |
trick | +0.117 |
new | +0.116 |
grown | +0.112 |
making | +0.111 |
Neg logit contributions | |
mie | -0.208 |
etsy | -0.204 |
hew | -0.201 |
jo | -0.199 |
storms | -0.197 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
mie | +0.779 |
etsy | +0.768 |
elope | +0.751 |
hew | +0.746 |
storms | +0.739 |
Neg logit contributions | |
show | -0.377 |
trick | -0.337 |
new | -0.326 |
to | -0.315 |
making | -0.314 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
show | +0.167 |
new | +0.161 |
the | +0.158 |
making | +0.154 |
to | +0.153 |
Neg logit contributions | |
ongo | -0.195 |
hew | -0.193 |
mie | -0.190 |
etsy | -0.188 |
jo | -0.182 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
och | +0.188 |
ongo | +0.169 |
Mic | +0.163 |
lves | +0.161 |
azz | +0.158 |
Neg logit contributions | |
show | -0.599 |
for | -0.586 |
the | -0.581 |
to | -0.578 |
trick | -0.575 |
Token | was |
Token ID | 373 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.851 |
etsy | +0.826 |
elope | +0.801 |
hew | +0.798 |
jo | +0.793 |
Neg logit contributions | |
show | -0.658 |
trick | -0.621 |
new | -0.609 |
grown | -0.582 |
making | -0.575 |
Token | able |
Token ID | 1498 |
Feature activation | -8.94e-02 |
Pos logit contributions | |
show | +0.187 |
trick | +0.181 |
test | +0.169 |
new | +0.166 |
job | +0.160 |
Neg logit contributions | |
mie | -0.263 |
elope | -0.243 |
etsy | -0.235 |
ppa | -0.228 |
hew | -0.225 |
Token | to |
Token ID | 284 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
show | +0.058 |
trick | +0.050 |
test | +0.046 |
design | +0.038 |
my | +0.037 |
Neg logit contributions | |
mie | -0.235 |
etsy | -0.229 |
elope | -0.221 |
hew | -0.215 |
storms | -0.214 |
Token | fix |
Token ID | 4259 |
Feature activation | -7.27e-02 |
Pos logit contributions | |
new | +0.258 |
my | +0.247 |
your | +0.236 |
for | +0.233 |
red | +0.232 |
Neg logit contributions | |
mie | -0.488 |
elope | -0.484 |
hew | -0.457 |
jo | -0.451 |
Bear | -0.444 |
Token | the |
Token ID | 262 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.061 |
new | +0.055 |
trick | +0.055 |
making | +0.047 |
my | +0.047 |
Neg logit contributions | |
mie | -0.187 |
etsy | -0.186 |
hew | -0.180 |
jo | -0.178 |
elope | -0.178 |
Token | One |
Token ID | 1881 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
mie | +0.053 |
etsy | +0.051 |
hew | +0.050 |
ppa | +0.050 |
lves | +0.049 |
Neg logit contributions | |
show | -0.037 |
new | -0.035 |
trick | -0.033 |
to | -0.033 |
grown | -0.032 |
Token | day |
Token ID | 1110 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
mie | +0.122 |
elope | +0.122 |
etsy | +0.120 |
jo | +0.119 |
uddy | +0.115 |
Neg logit contributions | |
show | -0.049 |
trick | -0.049 |
matching | -0.042 |
making | -0.042 |
test | -0.041 |
Token | , |
Token ID | 11 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
etsy | +0.053 |
mie | +0.053 |
elope | +0.052 |
uddy | +0.050 |
rified | +0.050 |
Neg logit contributions | |
show | -0.020 |
trick | -0.020 |
new | -0.017 |
original | -0.016 |
design | -0.016 |
Token | when |
Token ID | 618 |
Feature activation | -3.78e-02 |
Pos logit contributions | |
show | +0.181 |
trick | +0.172 |
new | +0.170 |
grown | +0.162 |
making | +0.161 |
Neg logit contributions | |
mie | -0.179 |
etsy | -0.171 |
hew | -0.167 |
elope | -0.167 |
jo | -0.165 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
show | +0.066 |
trick | +0.064 |
new | +0.061 |
test | +0.059 |
grown | +0.059 |
Neg logit contributions | |
mie | -0.062 |
etsy | -0.059 |
elope | -0.059 |
hew | -0.056 |
jo | -0.056 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
mie | +0.406 |
etsy | +0.397 |
och | +0.396 |
ongo | +0.392 |
storms | +0.390 |
Neg logit contributions | |
show | -0.382 |
trick | -0.352 |
to | -0.339 |
grown | -0.336 |
new | -0.335 |
Token | was |
Token ID | 373 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
mie | +0.799 |
etsy | +0.766 |
elope | +0.749 |
hew | +0.742 |
jo | +0.735 |
Neg logit contributions | |
show | -0.707 |
trick | -0.678 |
new | -0.663 |
grown | -0.629 |
test | -0.626 |
Token | exploring |
Token ID | 13504 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
trick | +0.205 |
show | +0.180 |
common | +0.179 |
color | +0.176 |
my | +0.176 |
Neg logit contributions | |
mie | -0.224 |
oped | -0.195 |
etsy | -0.191 |
ppy | -0.191 |
elope | -0.190 |
Token | , |
Token ID | 11 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
trick | +0.042 |
show | +0.039 |
style | +0.034 |
test | +0.033 |
grown | +0.033 |
Neg logit contributions | |
mie | -0.095 |
elope | -0.092 |
etsy | -0.088 |
ley | -0.086 |
Hop | -0.086 |
Token | she |
Token ID | 673 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
new | +0.151 |
the | +0.148 |
show | +0.146 |
to | +0.145 |
grown | +0.138 |
Neg logit contributions | |
hew | -0.213 |
mie | -0.209 |
ongo | -0.206 |
x | -0.205 |
och | -0.203 |
Token | found |
Token ID | 1043 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
etsy | +0.495 |
mie | +0.482 |
uddy | +0.472 |
thel | +0.462 |
jo | +0.462 |
Neg logit contributions | |
show | -0.345 |
grown | -0.334 |
new | -0.320 |
to | -0.311 |
trick | -0.309 |
Token | bird |
Token ID | 6512 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
show | +0.189 |
trick | +0.181 |
new | +0.175 |
making | +0.168 |
my | +0.168 |
Neg logit contributions | |
mie | -0.235 |
etsy | -0.225 |
elope | -0.222 |
hew | -0.217 |
pillar | -0.215 |
Token | began |
Token ID | 2540 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.528 |
etsy | +0.521 |
hew | +0.503 |
thel | +0.503 |
ongo | +0.488 |
Neg logit contributions | |
show | -0.459 |
trick | -0.424 |
new | -0.423 |
grown | -0.404 |
to | -0.401 |
Token | to |
Token ID | 284 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
show | +0.089 |
test | +0.087 |
my | +0.082 |
job | +0.081 |
trick | +0.080 |
Neg logit contributions | |
elope | -0.327 |
jo | -0.320 |
storms | -0.317 |
mie | -0.315 |
etsy | -0.313 |
Token | tell |
Token ID | 1560 |
Feature activation | -7.21e-02 |
Pos logit contributions | |
show | +0.273 |
new | +0.271 |
trick | +0.265 |
math | +0.260 |
matching | +0.257 |
Neg logit contributions | |
elope | -0.467 |
mie | -0.463 |
etsy | -0.439 |
jo | -0.436 |
storms | -0.436 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
show | +0.066 |
new | +0.061 |
trick | +0.059 |
grown | +0.054 |
for | +0.054 |
Neg logit contributions | |
mie | -0.183 |
etsy | -0.178 |
hew | -0.175 |
ongo | -0.173 |
oped | -0.172 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
lves | +0.251 |
och | +0.250 |
oped | +0.242 |
oled | +0.228 |
mie | +0.207 |
Neg logit contributions | |
to | -0.575 |
new | -0.551 |
for | -0.548 |
the | -0.537 |
trick | -0.533 |
Token | it |
Token ID | 340 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
mie | +1.214 |
etsy | +1.187 |
hew | +1.173 |
jo | +1.153 |
elope | +1.148 |
Neg logit contributions | |
show | -0.301 |
new | -0.285 |
trick | -0.265 |
to | -0.243 |
for | -0.243 |
Token | 's |
Token ID | 338 |
Feature activation | -4.27e-02 |
Pos logit contributions | |
mie | +0.322 |
etsy | +0.313 |
hew | +0.304 |
elope | +0.300 |
jo | +0.299 |
Neg logit contributions | |
show | -0.178 |
trick | -0.168 |
new | -0.166 |
grown | -0.153 |
for | -0.150 |
Token | story |
Token ID | 1621 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
show | +0.046 |
trick | +0.042 |
my | +0.041 |
making | +0.040 |
your | +0.040 |
Neg logit contributions | |
elope | -0.092 |
mie | -0.091 |
etsy | -0.090 |
jo | -0.088 |
hew | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
mie | +0.278 |
etsy | +0.269 |
elope | +0.265 |
hew | +0.263 |
jo | +0.262 |
Neg logit contributions | |
show | -0.113 |
trick | -0.104 |
new | -0.100 |
grown | -0.093 |
test | -0.091 |
Token | |
Token ID | 220 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
x | +0.053 |
mie | +0.053 |
ppa | +0.052 |
lves | +0.052 |
ongo | +0.051 |
Neg logit contributions | |
show | -0.038 |
new | -0.038 |
the | -0.038 |
to | -0.037 |
my | -0.036 |
Token | |
Token ID | 220 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
ppa | +0.055 |
x | +0.054 |
pper | +0.054 |
mie | +0.053 |
lves | +0.053 |
Neg logit contributions | |
to | -0.032 |
show | -0.032 |
the | -0.032 |
new | -0.031 |
my | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | +8.67e-02 |
Pos logit contributions | |
rified | +0.459 |
ley | +0.458 |
mie | +0.452 |
lves | +0.450 |
pillar | +0.443 |
Neg logit contributions | |
new | -0.190 |
to | -0.184 |
the | -0.179 |
for | -0.161 |
your | -0.161 |
Token |
|
Token ID | 198 |
Feature activation | +8.51e-02 |
Pos logit contributions | |
mie | +0.193 |
rified | +0.189 |
storms | +0.189 |
lves | +0.188 |
x | +0.187 |
Neg logit contributions | |
show | -0.102 |
new | -0.096 |
the | -0.093 |
grown | -0.092 |
to | -0.090 |
Token | Now |
Token ID | 3844 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
mie | +0.123 |
storms | +0.116 |
ongo | +0.114 |
etsy | +0.114 |
jo | +0.112 |
Neg logit contributions | |
show | -0.166 |
trick | -0.157 |
my | -0.155 |
grown | -0.155 |
new | -0.154 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
mie | +0.039 |
etsy | +0.038 |
hew | +0.037 |
jo | +0.037 |
elope | +0.036 |
Neg logit contributions | |
show | -0.032 |
new | -0.030 |
trick | -0.030 |
my | -0.028 |
grown | -0.028 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
och | +0.133 |
mie | +0.128 |
etsy | +0.127 |
ongo | +0.122 |
lves | +0.118 |
Neg logit contributions | |
show | -0.631 |
trick | -0.612 |
new | -0.609 |
for | -0.601 |
my | -0.594 |
Token | 's |
Token ID | 338 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
mie | +0.805 |
etsy | +0.794 |
elope | +0.759 |
hew | +0.753 |
jo | +0.749 |
Neg logit contributions | |
show | -0.702 |
trick | -0.658 |
new | -0.642 |
grown | -0.622 |
making | -0.613 |
Token | special |
Token ID | 2041 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
show | +0.069 |
trick | +0.067 |
my | +0.064 |
grown | +0.063 |
your | +0.063 |
Neg logit contributions | |
mie | -0.074 |
elope | -0.073 |
hew | -0.070 |
jo | -0.069 |
etsy | -0.067 |
Token | lamp |
Token ID | 20450 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
show | +0.166 |
trick | +0.160 |
grown | +0.152 |
making | +0.152 |
your | +0.151 |
Neg logit contributions | |
elope | -0.194 |
mie | -0.191 |
jo | -0.189 |
hew | -0.180 |
Brown | -0.175 |
Token | works |
Token ID | 2499 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
mie | +0.462 |
etsy | +0.447 |
elope | +0.434 |
hew | +0.432 |
jo | +0.427 |
Neg logit contributions | |
show | -0.372 |
trick | -0.353 |
new | -0.345 |
grown | -0.328 |
test | -0.325 |
Token | better |
Token ID | 1365 |
Feature activation | -9.96e-02 |
Pos logit contributions | |
show | +0.126 |
trick | +0.118 |
new | +0.110 |
test | +0.107 |
grown | +0.107 |
Neg logit contributions | |
mie | -0.238 |
etsy | -0.224 |
hew | -0.221 |
jo | -0.221 |
elope | -0.220 |
Token | excited |
Token ID | 6568 |
Feature activation | -9.15e-02 |
Pos logit contributions | |
show | +0.162 |
trick | +0.156 |
new | +0.144 |
test | +0.139 |
making | +0.136 |
Neg logit contributions | |
mie | -0.269 |
etsy | -0.257 |
elope | -0.254 |
hew | -0.251 |
jo | -0.248 |
Token | . |
Token ID | 13 |
Feature activation | +2.33e-02 |
Pos logit contributions | |
show | +0.082 |
trick | +0.075 |
new | +0.074 |
making | +0.066 |
for | +0.066 |
Neg logit contributions | |
mie | -0.230 |
etsy | -0.225 |
elope | -0.222 |
hew | -0.221 |
jo | -0.218 |
Token |
|
Token ID | 198 |
Feature activation | +8.47e-02 |
Pos logit contributions | |
ppers | +0.060 |
pper | +0.060 |
ache | +0.057 |
ppy | +0.057 |
ppa | +0.057 |
Neg logit contributions | |
to | -0.025 |
the | -0.024 |
new | -0.021 |
my | -0.021 |
show | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | +8.39e-02 |
Pos logit contributions | |
ksh | +0.232 |
storms | +0.231 |
ley | +0.229 |
rified | +0.225 |
x | +0.220 |
Neg logit contributions | |
new | -0.068 |
the | -0.065 |
big | -0.062 |
to | -0.061 |
grown | -0.058 |
Token | Pen |
Token ID | 25553 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
storms | +0.184 |
ley | +0.180 |
Claus | +0.175 |
ksh | +0.171 |
rified | +0.170 |
Neg logit contributions | |
grown | -0.105 |
my | -0.096 |
show | -0.096 |
new | -0.094 |
your | -0.094 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
och | +0.160 |
etsy | +0.152 |
mie | +0.151 |
lves | +0.149 |
ongo | +0.146 |
Neg logit contributions | |
show | -0.585 |
grown | -0.560 |
the | -0.556 |
trick | -0.553 |
to | -0.549 |
Token | started |
Token ID | 2067 |
Feature activation | -1.56e-01 |
Pos logit contributions | |
etsy | +0.847 |
mie | +0.840 |
storms | +0.803 |
hew | +0.799 |
uddy | +0.794 |
Neg logit contributions | |
show | -0.670 |
trick | -0.602 |
grown | -0.596 |
new | -0.596 |
to | -0.590 |
Token | to |
Token ID | 284 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
show | +0.109 |
my | +0.106 |
trick | +0.103 |
job | +0.093 |
original | +0.093 |
Neg logit contributions | |
elope | -0.368 |
mie | -0.368 |
jo | -0.362 |
storms | -0.358 |
etsy | -0.348 |
Token | call |
Token ID | 869 |
Feature activation | -4.18e-03 |
Pos logit contributions | |
show | +0.265 |
new | +0.259 |
trick | +0.259 |
my | +0.235 |
for | +0.234 |
Neg logit contributions | |
mie | -0.527 |
elope | -0.513 |
etsy | -0.499 |
jo | -0.497 |
hew | -0.489 |
Token | her |
Token ID | 607 |
Feature activation | -3.60e-02 |
Pos logit contributions | |
show | +0.003 |
trick | +0.003 |
new | +0.002 |
grown | +0.002 |
test | +0.002 |
Neg logit contributions | |
mie | -0.011 |
etsy | -0.011 |
elope | -0.011 |
jo | -0.011 |
hew | -0.010 |
Token | mom |
Token ID | 1995 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
show | +0.047 |
trick | +0.044 |
new | +0.043 |
grown | +0.040 |
test | +0.039 |
Neg logit contributions | |
mie | -0.078 |
etsy | -0.076 |
hew | -0.074 |
jo | -0.073 |
elope | -0.073 |
Token | went |
Token ID | 1816 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
mie | +0.362 |
jo | +0.321 |
elope | +0.317 |
bo | +0.313 |
ppy | +0.309 |
Neg logit contributions | |
new | -0.440 |
trick | -0.434 |
show | -0.433 |
my | -0.417 |
making | -0.411 |
Token | to |
Token ID | 284 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
trick | +0.119 |
common | +0.117 |
color | +0.115 |
original | +0.112 |
idea | +0.110 |
Neg logit contributions | |
mie | -0.190 |
storms | -0.173 |
jo | -0.173 |
Hop | -0.172 |
Snow | -0.170 |
Token | bed |
Token ID | 3996 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
trick | +0.316 |
matching | +0.309 |
original | +0.301 |
skills | +0.300 |
example | +0.300 |
Neg logit contributions | |
elope | -0.365 |
mie | -0.363 |
jo | -0.334 |
Snow | -0.333 |
Snow | -0.333 |
Token | , |
Token ID | 11 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
mie | +0.278 |
storms | +0.268 |
etsy | +0.262 |
jo | +0.251 |
uffy | +0.251 |
Neg logit contributions | |
trick | -0.142 |
show | -0.139 |
chance | -0.137 |
power | -0.134 |
my | -0.130 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
show | +0.176 |
new | +0.168 |
trick | +0.163 |
grown | +0.158 |
making | +0.158 |
Neg logit contributions | |
mie | -0.187 |
etsy | -0.182 |
hew | -0.181 |
jo | -0.175 |
ongo | -0.173 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
och | +0.220 |
cases | +0.218 |
oled | +0.217 |
etsy | +0.216 |
oped | +0.214 |
Neg logit contributions | |
show | -0.564 |
to | -0.551 |
new | -0.550 |
trick | -0.548 |
the | -0.539 |
Token | would |
Token ID | 561 |
Feature activation | -7.18e-02 |
Pos logit contributions | |
mie | +0.693 |
etsy | +0.645 |
elope | +0.640 |
jo | +0.630 |
hew | +0.629 |
Neg logit contributions | |
show | -0.805 |
trick | -0.786 |
new | -0.766 |
test | -0.727 |
grown | -0.725 |
Token | turn |
Token ID | 1210 |
Feature activation | -9.71e-02 |
Pos logit contributions | |
new | +0.073 |
trick | +0.070 |
show | +0.066 |
grown | +0.062 |
matching | +0.062 |
Neg logit contributions | |
mie | -0.157 |
elope | -0.149 |
jo | -0.147 |
etsy | -0.147 |
hew | -0.145 |
Token | the |
Token ID | 262 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
trick | +0.114 |
show | +0.113 |
grown | +0.103 |
test | +0.099 |
new | +0.098 |
Neg logit contributions | |
mie | -0.208 |
jo | -0.191 |
storms | -0.187 |
hew | -0.185 |
pillar | -0.185 |
Token | lamp |
Token ID | 20450 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
show | +0.170 |
trick | +0.166 |
meeting | +0.159 |
making | +0.156 |
grown | +0.156 |
Neg logit contributions | |
mie | -0.213 |
jo | -0.209 |
Brown | -0.205 |
hew | -0.205 |
elope | -0.204 |
Token | on |
Token ID | 319 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
mie | +0.572 |
storms | +0.546 |
elope | +0.543 |
jo | +0.543 |
etsy | +0.535 |
Neg logit contributions | |
show | -0.224 |
trick | -0.215 |
grown | -0.203 |
new | -0.195 |
my | -0.191 |
Token | this |
Token ID | 428 |
Feature activation | -5.09e-02 |
Pos logit contributions | |
show | +0.171 |
trick | +0.161 |
new | +0.149 |
grown | +0.139 |
test | +0.133 |
Neg logit contributions | |
mie | -0.587 |
elope | -0.566 |
etsy | -0.562 |
hew | -0.557 |
jo | -0.552 |
Token | weird |
Token ID | 7650 |
Feature activation | -9.27e-02 |
Pos logit contributions | |
show | +0.060 |
trick | +0.057 |
matching | +0.055 |
grown | +0.055 |
new | +0.054 |
Neg logit contributions | |
mie | -0.104 |
elope | -0.100 |
pillar | -0.098 |
jo | -0.096 |
etsy | -0.096 |
Token | owl |
Token ID | 39610 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
show | +0.173 |
trick | +0.165 |
new | +0.160 |
making | +0.160 |
matching | +0.160 |
Neg logit contributions | |
mie | -0.128 |
elope | -0.123 |
pillar | -0.121 |
jo | -0.119 |
etsy | -0.118 |
Token | !" |
Token ID | 2474 |
Feature activation | +5.64e-02 |
Pos logit contributions | |
mie | +0.711 |
etsy | +0.686 |
elope | +0.676 |
hew | +0.670 |
jo | +0.667 |
Neg logit contributions | |
show | -0.372 |
trick | -0.351 |
new | -0.341 |
grown | -0.320 |
test | -0.314 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
mie | +0.106 |
hew | +0.106 |
lves | +0.105 |
x | +0.104 |
ongo | +0.103 |
Neg logit contributions | |
show | -0.092 |
to | -0.085 |
the | -0.084 |
new | -0.082 |
grown | -0.080 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
och | +0.200 |
lves | +0.176 |
storms | +0.171 |
oled | +0.164 |
ongo | +0.161 |
Neg logit contributions | |
show | -0.575 |
to | -0.571 |
the | -0.559 |
trick | -0.553 |
new | -0.552 |
Token | 's |
Token ID | 338 |
Feature activation | -4.54e-02 |
Pos logit contributions | |
mie | +0.813 |
etsy | +0.811 |
hew | +0.775 |
storms | +0.774 |
jo | +0.762 |
Neg logit contributions | |
show | -0.706 |
trick | -0.647 |
new | -0.640 |
grown | -0.623 |
to | -0.615 |
Token | mom |
Token ID | 1995 |
Feature activation | +3.02e-01 |
Pos logit contributions | |
show | +0.060 |
trick | +0.056 |
new | +0.056 |
grown | +0.052 |
test | +0.051 |
Neg logit contributions | |
mie | -0.096 |
etsy | -0.093 |
elope | -0.091 |
hew | -0.090 |
jo | -0.090 |
Token | came |
Token ID | 1625 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
etsy | +0.640 |
storms | +0.635 |
lves | +0.628 |
pillar | +0.616 |
hew | +0.615 |
Neg logit contributions | |
show | -0.437 |
making | -0.376 |
to | -0.374 |
trick | -0.368 |
the | -0.364 |
Token | over |
Token ID | 625 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
show | +0.077 |
trick | +0.069 |
new | +0.066 |
grown | +0.059 |
making | +0.058 |
Neg logit contributions | |
mie | -0.265 |
etsy | -0.259 |
elope | -0.254 |
hew | -0.253 |
jo | -0.252 |
Token | to |
Token ID | 284 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
trick | +0.159 |
show | +0.154 |
test | +0.142 |
job | +0.140 |
original | +0.137 |
Neg logit contributions | |
mie | -0.353 |
elope | -0.339 |
etsy | -0.332 |
rified | -0.332 |
jo | -0.329 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.085 |
trick | +0.078 |
new | +0.064 |
test | +0.062 |
grown | +0.058 |
Neg logit contributions | |
mie | -0.359 |
etsy | -0.350 |
elope | -0.346 |
hew | -0.340 |
jo | -0.338 |
Token | little |
Token ID | 1310 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
show | +0.109 |
new | +0.099 |
trick | +0.096 |
grown | +0.088 |
test | +0.084 |
Neg logit contributions | |
mie | -0.326 |
etsy | -0.318 |
hew | -0.316 |
jo | -0.313 |
elope | -0.311 |
Token | girl |
Token ID | 2576 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
show | +0.025 |
new | +0.024 |
red | +0.023 |
blue | +0.023 |
trick | +0.022 |
Neg logit contributions | |
hew | -0.029 |
mie | -0.029 |
etsy | -0.028 |
jo | -0.028 |
lor | -0.027 |
Token | named |
Token ID | 3706 |
Feature activation | +3.05e-02 |
Pos logit contributions | |
mie | +0.495 |
etsy | +0.476 |
elope | +0.464 |
hew | +0.462 |
jo | +0.457 |
Neg logit contributions | |
show | -0.424 |
trick | -0.403 |
new | -0.394 |
grown | -0.376 |
test | -0.372 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
mie | +0.067 |
jo | +0.063 |
storms | +0.063 |
elope | +0.063 |
hew | +0.062 |
Neg logit contributions | |
show | -0.039 |
new | -0.036 |
grown | -0.035 |
trick | -0.034 |
my | -0.034 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
lves | +0.321 |
rus | +0.318 |
storms | +0.318 |
cases | +0.317 |
rified | +0.315 |
Neg logit contributions | |
show | -0.441 |
to | -0.431 |
time | -0.428 |
new | -0.425 |
the | -0.425 |
Token | . |
Token ID | 13 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
mie | +1.037 |
etsy | +1.008 |
hew | +0.989 |
elope | +0.978 |
jo | +0.974 |
Neg logit contributions | |
show | -0.479 |
trick | -0.439 |
new | -0.432 |
grown | -0.401 |
making | -0.393 |
Token | She |
Token ID | 1375 |
Feature activation | +2.69e-01 |
Pos logit contributions | |
mie | +0.040 |
hew | +0.037 |
etsy | +0.037 |
ppa | +0.037 |
lves | +0.037 |
Neg logit contributions | |
show | -0.047 |
new | -0.046 |
to | -0.044 |
my | -0.044 |
grown | -0.044 |
Token | loved |
Token ID | 6151 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
mie | +0.523 |
etsy | +0.506 |
hew | +0.494 |
elope | +0.491 |
jo | +0.484 |
Neg logit contributions | |
show | -0.400 |
trick | -0.376 |
new | -0.370 |
grown | -0.358 |
making | -0.347 |
Token | to |
Token ID | 284 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
trick | +0.133 |
show | +0.126 |
chance | +0.117 |
match | +0.106 |
answer | +0.104 |
Neg logit contributions | |
storms | -0.431 |
mie | -0.418 |
jo | -0.396 |
Brown | -0.392 |
thel | -0.390 |
Token | explore |
Token ID | 7301 |
Feature activation | -4.17e-02 |
Pos logit contributions | |
new | +0.284 |
for | +0.278 |
my | +0.272 |
chance | +0.271 |
trick | +0.258 |
Neg logit contributions | |
mie | -0.397 |
elope | -0.392 |
jo | -0.390 |
etsy | -0.381 |
Snow | -0.375 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.050 |
new | +0.041 |
trick | +0.038 |
grown | +0.029 |
making | +0.027 |
Neg logit contributions | |
mie | -0.404 |
etsy | -0.395 |
hew | -0.389 |
jo | -0.388 |
elope | -0.387 |
Token | little |
Token ID | 1310 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
show | +0.096 |
new | +0.090 |
trick | +0.081 |
grown | +0.076 |
big | +0.071 |
Neg logit contributions | |
mie | -0.347 |
hew | -0.340 |
etsy | -0.337 |
jo | -0.335 |
storms | -0.332 |
Token | girl |
Token ID | 2576 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
show | +0.022 |
new | +0.022 |
red | +0.021 |
blue | +0.020 |
green | +0.020 |
Neg logit contributions | |
hew | -0.027 |
mie | -0.026 |
lor | -0.026 |
etsy | -0.026 |
jo | -0.026 |
Token | named |
Token ID | 3706 |
Feature activation | +2.71e-02 |
Pos logit contributions | |
mie | +0.468 |
etsy | +0.448 |
elope | +0.443 |
jo | +0.432 |
hew | +0.428 |
Neg logit contributions | |
show | -0.444 |
trick | -0.432 |
new | -0.420 |
grown | -0.401 |
test | -0.398 |
Token | Pen |
Token ID | 7507 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
mie | +0.059 |
jo | +0.056 |
hew | +0.055 |
elope | +0.055 |
rified | +0.054 |
Neg logit contributions | |
show | -0.035 |
new | -0.033 |
trick | -0.032 |
grown | -0.032 |
my | -0.031 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
cases | +0.321 |
lves | +0.316 |
rified | +0.313 |
storms | +0.310 |
rus | +0.308 |
Neg logit contributions | |
to | -0.459 |
show | -0.454 |
time | -0.446 |
the | -0.446 |
new | -0.443 |
Token | . |
Token ID | 13 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
mie | +1.014 |
etsy | +0.983 |
elope | +0.962 |
hew | +0.960 |
jo | +0.952 |
Neg logit contributions | |
show | -0.495 |
trick | -0.461 |
new | -0.449 |
grown | -0.419 |
test | -0.411 |
Token | She |
Token ID | 1375 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
mie | +0.040 |
hew | +0.037 |
etsy | +0.037 |
ppa | +0.037 |
lves | +0.037 |
Neg logit contributions | |
show | -0.050 |
new | -0.048 |
trick | -0.047 |
to | -0.047 |
grown | -0.046 |
Token | had |
Token ID | 550 |
Feature activation | -4.73e-02 |
Pos logit contributions | |
mie | +0.484 |
etsy | +0.463 |
elope | +0.455 |
jo | +0.447 |
hew | +0.446 |
Neg logit contributions | |
show | -0.424 |
trick | -0.408 |
new | -0.397 |
test | -0.377 |
grown | -0.374 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.017 |
new | +0.015 |
trick | +0.013 |
grown | +0.011 |
making | +0.010 |
Neg logit contributions | |
mie | -0.144 |
etsy | -0.141 |
hew | -0.140 |
jo | -0.139 |
elope | -0.139 |
Token | really |
Token ID | 1107 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
show | +0.103 |
trick | +0.099 |
making | +0.090 |
my | +0.088 |
for | +0.084 |
Neg logit contributions | |
mie | -0.303 |
etsy | -0.300 |
elope | -0.295 |
pillar | -0.285 |
mi | -0.282 |
Token | had |
Token ID | 550 |
Feature activation | -4.84e-02 |
Pos logit contributions | |
etsy | +0.630 |
mie | +0.618 |
elope | +0.604 |
rified | +0.601 |
lves | +0.599 |
Neg logit contributions | |
show | -0.468 |
trick | -0.429 |
grown | -0.412 |
to | -0.408 |
new | -0.405 |
Token | hoped |
Token ID | 10719 |
Feature activation | -4.04e-02 |
Pos logit contributions | |
show | +0.055 |
test | +0.054 |
job | +0.053 |
trick | +0.052 |
quiz | +0.050 |
Neg logit contributions | |
mie | -0.097 |
hew | -0.093 |
la | -0.087 |
ppy | -0.085 |
apa | -0.084 |
Token | ! |
Token ID | 0 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
show | +0.038 |
trick | +0.036 |
new | +0.032 |
test | +0.032 |
grown | +0.031 |
Neg logit contributions | |
mie | -0.096 |
hew | -0.091 |
etsy | -0.091 |
jo | -0.091 |
elope | -0.091 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +9.76e-02 |
Pos logit contributions | |
ppa | +0.062 |
mie | +0.062 |
ppy | +0.062 |
ley | +0.061 |
etsy | +0.060 |
Neg logit contributions | |
to | -0.033 |
new | -0.033 |
show | -0.033 |
his | -0.030 |
math | -0.030 |
Token | Pen |
Token ID | 25553 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
etsy | +0.219 |
lves | +0.218 |
mie | +0.218 |
ppa | +0.216 |
hew | +0.211 |
Neg logit contributions | |
show | -0.117 |
new | -0.113 |
the | -0.111 |
to | -0.111 |
trick | -0.104 |
Token | elope |
Token ID | 47329 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
mie | +0.402 |
etsy | +0.398 |
storms | +0.396 |
lves | +0.391 |
rified | +0.384 |
Neg logit contributions | |
show | -0.358 |
trick | -0.336 |
to | -0.334 |
the | -0.324 |
for | -0.321 |
Token | was |
Token ID | 373 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.890 |
etsy | +0.854 |
elope | +0.841 |
hew | +0.833 |
jo | +0.827 |
Neg logit contributions | |
show | -0.610 |
trick | -0.584 |
new | -0.566 |
grown | -0.533 |
test | -0.531 |
Token | a |
Token ID | 257 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
trick | +0.171 |
show | +0.152 |
test | +0.141 |
new | +0.129 |
design | +0.127 |
Neg logit contributions | |
mie | -0.286 |
elope | -0.267 |
etsy | -0.257 |
rified | -0.252 |
mi | -0.251 |
Token | lovely |
Token ID | 14081 |
Feature activation | -7.35e-02 |
Pos logit contributions | |
show | +0.108 |
new | +0.097 |
trick | +0.093 |
grown | +0.087 |
test | +0.083 |
Neg logit contributions | |
mie | -0.321 |
etsy | -0.315 |
hew | -0.312 |
jo | -0.307 |
elope | -0.306 |
Token | little |
Token ID | 1310 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
show | +0.103 |
trick | +0.099 |
new | +0.095 |
grown | +0.090 |
test | +0.090 |
Neg logit contributions | |
mie | -0.145 |
etsy | -0.140 |
elope | -0.137 |
jo | -0.135 |
hew | -0.134 |
Token | girl |
Token ID | 2576 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
show | +0.022 |
new | +0.021 |
red | +0.020 |
blue | +0.020 |
for | +0.019 |
Neg logit contributions | |
hew | -0.025 |
etsy | -0.024 |
mie | -0.024 |
lor | -0.023 |
elope | -0.023 |
Token | they |
Token ID | 484 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
mie | +0.352 |
etsy | +0.343 |
hew | +0.336 |
elope | +0.336 |
jo | +0.335 |
Neg logit contributions | |
show | -0.059 |
trick | -0.050 |
new | -0.041 |
grown | -0.038 |
test | -0.037 |
Token | do |
Token ID | 466 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
mie | +0.390 |
etsy | +0.381 |
elope | +0.368 |
hew | +0.364 |
jo | +0.364 |
Neg logit contributions | |
show | -0.351 |
trick | -0.321 |
new | -0.311 |
grown | -0.308 |
for | -0.303 |
Token | , |
Token ID | 11 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
show | +0.133 |
trick | +0.124 |
new | +0.120 |
test | +0.113 |
red | +0.113 |
Neg logit contributions | |
mie | -0.273 |
elope | -0.266 |
hew | -0.265 |
jo | -0.259 |
etsy | -0.254 |
Token | they |
Token ID | 484 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
show | +0.157 |
new | +0.144 |
trick | +0.143 |
making | +0.137 |
for | +0.135 |
Neg logit contributions | |
mie | -0.257 |
etsy | -0.250 |
hew | -0.245 |
elope | -0.241 |
jo | -0.241 |
Token | bump |
Token ID | 13852 |
Feature activation | -8.24e-02 |
Pos logit contributions | |
mie | +0.482 |
etsy | +0.476 |
elope | +0.461 |
hew | +0.458 |
jo | +0.457 |
Neg logit contributions | |
show | -0.301 |
trick | -0.269 |
grown | -0.253 |
new | -0.253 |
test | -0.251 |
Token | into |
Token ID | 656 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
show | +0.086 |
trick | +0.079 |
new | +0.075 |
test | +0.071 |
grown | +0.071 |
Neg logit contributions | |
mie | -0.196 |
etsy | -0.187 |
hew | -0.184 |
elope | -0.184 |
jo | -0.183 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
show | +0.170 |
trick | +0.149 |
new | +0.140 |
grown | +0.121 |
test | +0.117 |
Neg logit contributions | |
mie | -0.798 |
etsy | -0.779 |
elope | -0.766 |
hew | -0.763 |
jo | -0.759 |
Token | tower |
Token ID | 10580 |
Feature activation | +2.37e-01 |
Pos logit contributions | |
show | +0.172 |
trick | +0.167 |
new | +0.155 |
grown | +0.151 |
making | +0.151 |
Neg logit contributions | |
mie | -0.255 |
elope | -0.246 |
etsy | -0.241 |
pillar | -0.238 |
hew | -0.238 |
Token | . |
Token ID | 13 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
mie | +0.511 |
elope | +0.499 |
hew | +0.491 |
jo | +0.491 |
etsy | +0.488 |
Neg logit contributions | |
show | -0.265 |
trick | -0.253 |
new | -0.244 |
grown | -0.234 |
test | -0.227 |
Token | The |
Token ID | 383 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
mie | +0.036 |
ppa | +0.034 |
ley | +0.033 |
thel | +0.033 |
mi | +0.033 |
Neg logit contributions | |
show | -0.020 |
my | -0.019 |
new | -0.019 |
your | -0.019 |
the | -0.019 |
Token | tower |
Token ID | 10580 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
show | +0.030 |
trick | +0.028 |
new | +0.027 |
grown | +0.025 |
making | +0.025 |
Neg logit contributions | |
mie | -0.052 |
etsy | -0.050 |
elope | -0.049 |
hew | -0.049 |
jo | -0.048 |
Token | hits |
Token ID | 7127 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
mie | +0.024 |
etsy | +0.022 |
elope | +0.022 |
jo | +0.022 |
hew | +0.022 |
Neg logit contributions | |
show | -0.022 |
trick | -0.020 |
new | -0.020 |
grown | -0.019 |
making | -0.019 |
Token | the |
Token ID | 262 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
show | +0.103 |
trick | +0.091 |
new | +0.090 |
my | +0.077 |
for | +0.075 |
Neg logit contributions | |
mie | -0.480 |
etsy | -0.473 |
elope | -0.460 |
hew | -0.456 |
jo | -0.453 |
Token | wall |
Token ID | 3355 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
show | +0.172 |
trick | +0.163 |
new | +0.158 |
grown | +0.150 |
test | +0.148 |
Neg logit contributions | |
mie | -0.263 |
etsy | -0.253 |
elope | -0.249 |
hew | -0.247 |
jo | -0.245 |
Token | and |
Token ID | 290 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
mie | +0.289 |
jo | +0.287 |
storms | +0.283 |
hew | +0.282 |
elope | +0.277 |
Neg logit contributions | |
show | -0.194 |
trick | -0.185 |
new | -0.183 |
grown | -0.176 |
matching | -0.174 |
Token | breaks |
Token ID | 9457 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
trick | +0.136 |
show | +0.135 |
new | +0.131 |
grown | +0.122 |
chance | +0.121 |
Neg logit contributions | |
mie | -0.229 |
storms | -0.217 |
elope | -0.217 |
rified | -0.212 |
hew | -0.212 |
Token | into |
Token ID | 656 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
show | +0.136 |
trick | +0.126 |
new | +0.122 |
grown | +0.111 |
making | +0.110 |
Neg logit contributions | |
mie | -0.361 |
etsy | -0.352 |
elope | -0.345 |
hew | -0.343 |
jo | -0.341 |
Token | pieces |
Token ID | 5207 |
Feature activation | +7.43e-02 |
Pos logit contributions | |
show | +0.281 |
trick | +0.261 |
new | +0.255 |
grown | +0.237 |
making | +0.230 |
Neg logit contributions | |
mie | -0.691 |
etsy | -0.674 |
elope | -0.655 |
hew | -0.652 |
jo | -0.651 |
Token | . |
Token ID | 13 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
mie | +0.166 |
etsy | +0.160 |
hew | +0.157 |
elope | +0.156 |
jo | +0.156 |
Neg logit contributions | |
show | -0.084 |
trick | -0.079 |
new | -0.076 |
test | -0.071 |
grown | -0.071 |
Token | Mia |
Token ID | 32189 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
mie | +0.016 |
lves | +0.015 |
etsy | +0.015 |
thel | +0.015 |
ley | +0.015 |
Neg logit contributions | |
my | -0.010 |
your | -0.010 |
show | -0.010 |
new | -0.009 |
to | -0.009 |
Token | is |
Token ID | 318 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
mie | +0.562 |
etsy | +0.544 |
elope | +0.532 |
hew | +0.528 |
jo | +0.525 |
Neg logit contributions | |
show | -0.357 |
trick | -0.337 |
new | -0.328 |
grown | -0.310 |
test | -0.307 |
Token | sad |
Token ID | 6507 |
Feature activation | -8.65e-02 |
Pos logit contributions | |
trick | +0.219 |
show | +0.216 |
test | +0.206 |
design | +0.205 |
job | +0.201 |
Neg logit contributions | |
mie | -0.210 |
ppa | -0.179 |
lves | -0.176 |
bo | -0.174 |
mi | -0.168 |
Token | a |
Token ID | 257 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
storms | +0.115 |
jo | +0.114 |
mie | +0.114 |
ppy | +0.112 |
elope | +0.112 |
Neg logit contributions | |
show | -0.057 |
test | -0.052 |
trick | -0.052 |
matching | -0.048 |
style | -0.047 |
Token | harsh |
Token ID | 11859 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
show | +0.106 |
trick | +0.098 |
new | +0.093 |
grown | +0.086 |
making | +0.085 |
Neg logit contributions | |
mie | -0.287 |
etsy | -0.279 |
elope | -0.275 |
hew | -0.271 |
jo | -0.271 |
Token | sound |
Token ID | 2128 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
show | +0.144 |
new | +0.137 |
trick | +0.131 |
matching | +0.131 |
my | +0.123 |
Neg logit contributions | |
jo | -0.253 |
elope | -0.253 |
mie | -0.251 |
etsy | -0.245 |
storms | -0.245 |
Token | and |
Token ID | 290 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
mie | +0.038 |
jo | +0.037 |
storms | +0.037 |
elope | +0.036 |
etsy | +0.036 |
Neg logit contributions | |
show | -0.021 |
new | -0.021 |
trick | -0.021 |
test | -0.019 |
math | -0.019 |
Token | broke |
Token ID | 6265 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
show | +0.128 |
trick | +0.120 |
new | +0.117 |
grown | +0.110 |
test | +0.108 |
Neg logit contributions | |
mie | -0.220 |
etsy | -0.214 |
elope | -0.208 |
hew | -0.208 |
jo | -0.206 |
Token | into |
Token ID | 656 |
Feature activation | -2.84e-01 |
Pos logit contributions | |
new | +0.077 |
show | +0.075 |
my | +0.073 |
the | +0.072 |
to | +0.070 |
Neg logit contributions | |
etsy | -0.344 |
mie | -0.339 |
oped | -0.331 |
hew | -0.330 |
pillar | -0.329 |
Token | pieces |
Token ID | 5207 |
Feature activation | +7.73e-02 |
Pos logit contributions | |
show | +0.204 |
new | +0.185 |
trick | +0.181 |
grown | +0.169 |
my | +0.161 |
Neg logit contributions | |
mie | -0.772 |
etsy | -0.762 |
hew | -0.736 |
jo | -0.730 |
elope | -0.727 |
Token | . |
Token ID | 13 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
mie | +0.181 |
etsy | +0.175 |
elope | +0.172 |
hew | +0.171 |
jo | +0.171 |
Neg logit contributions | |
show | -0.080 |
trick | -0.075 |
new | -0.072 |
grown | -0.067 |
test | -0.067 |
Token |
|
Token ID | 198 |
Feature activation | +7.62e-02 |
Pos logit contributions | |
mie | +0.034 |
pper | +0.033 |
ppa | +0.033 |
lves | +0.033 |
thel | +0.033 |
Neg logit contributions | |
my | -0.019 |
the | -0.018 |
to | -0.018 |
your | -0.018 |
his | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | +7.53e-02 |
Pos logit contributions | |
rified | +0.207 |
storms | +0.202 |
mie | +0.200 |
ley | +0.199 |
lves | +0.198 |
Neg logit contributions | |
new | -0.066 |
the | -0.063 |
to | -0.062 |
big | -0.061 |
his | -0.059 |
Token | " |
Token ID | 1 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
storms | +0.164 |
rified | +0.157 |
ley | +0.154 |
mie | +0.152 |
als | +0.149 |
Neg logit contributions | |
your | -0.102 |
my | -0.101 |
grown | -0.097 |
show | -0.090 |
his | -0.089 |
Token | didn |
Token ID | 1422 |
Feature activation | -9.08e-02 |
Pos logit contributions | |
mie | +0.346 |
etsy | +0.334 |
elope | +0.328 |
jo | +0.325 |
storms | +0.324 |
Neg logit contributions | |
show | -0.273 |
trick | -0.256 |
new | -0.243 |
grown | -0.237 |
test | -0.232 |
Token | 't |
Token ID | 470 |
Feature activation | -5.95e-02 |
Pos logit contributions | |
show | +0.137 |
trick | +0.131 |
new | +0.129 |
grown | +0.124 |
making | +0.120 |
Neg logit contributions | |
mie | -0.167 |
etsy | -0.161 |
elope | -0.156 |
jo | -0.155 |
hew | -0.155 |
Token | mean |
Token ID | 1612 |
Feature activation | -9.69e-02 |
Pos logit contributions | |
show | +0.069 |
new | +0.065 |
trick | +0.064 |
making | +0.059 |
matching | +0.059 |
Neg logit contributions | |
mie | -0.130 |
etsy | -0.124 |
hew | -0.123 |
elope | -0.121 |
jo | -0.121 |
Token | to |
Token ID | 284 |
Feature activation | -2.50e-01 |
Pos logit contributions | |
show | +0.039 |
trick | +0.030 |
new | +0.026 |
grown | +0.021 |
test | +0.020 |
Neg logit contributions | |
mie | -0.289 |
etsy | -0.281 |
hew | -0.278 |
jo | -0.277 |
storms | -0.276 |
Token | bump |
Token ID | 13852 |
Feature activation | -7.70e-02 |
Pos logit contributions | |
show | +0.239 |
trick | +0.221 |
new | +0.211 |
grown | +0.194 |
test | +0.192 |
Neg logit contributions | |
mie | -0.615 |
etsy | -0.598 |
elope | -0.588 |
hew | -0.585 |
jo | -0.581 |
Token | into |
Token ID | 656 |
Feature activation | -2.84e-01 |
Pos logit contributions | |
show | +0.052 |
trick | +0.046 |
new | +0.044 |
my | +0.039 |
making | +0.039 |
Neg logit contributions | |
mie | -0.210 |
etsy | -0.206 |
elope | -0.203 |
hew | -0.202 |
jo | -0.200 |
Token | you |
Token ID | 345 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
show | +0.195 |
trick | +0.177 |
new | +0.161 |
grown | +0.143 |
test | +0.143 |
Neg logit contributions | |
mie | -0.765 |
etsy | -0.735 |
elope | -0.731 |
hew | -0.727 |
jo | -0.718 |
Token | . |
Token ID | 13 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
mie | +0.344 |
etsy | +0.329 |
hew | +0.326 |
elope | +0.323 |
storms | +0.319 |
Neg logit contributions | |
show | -0.174 |
trick | -0.166 |
new | -0.157 |
grown | -0.149 |
test | -0.147 |
Token | Please |
Token ID | 4222 |
Feature activation | +5.60e-02 |
Pos logit contributions | |
mie | +0.031 |
lves | +0.030 |
ppa | +0.029 |
hew | +0.029 |
etsy | +0.029 |
Neg logit contributions | |
my | -0.022 |
show | -0.022 |
your | -0.020 |
new | -0.019 |
to | -0.018 |
Token | forgive |
Token ID | 20927 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
mie | +0.131 |
etsy | +0.127 |
hew | +0.124 |
elope | +0.124 |
jo | +0.122 |
Neg logit contributions | |
show | -0.059 |
trick | -0.055 |
new | -0.054 |
grown | -0.050 |
making | -0.049 |
Token | me |
Token ID | 502 |
Feature activation | +4.36e-02 |
Pos logit contributions | |
show | +0.044 |
trick | +0.041 |
new | +0.040 |
my | +0.038 |
making | +0.037 |
Neg logit contributions | |
mie | -0.075 |
etsy | -0.074 |
elope | -0.072 |
hew | -0.071 |
jo | -0.071 |
Token | that |
Token ID | 326 |
Feature activation | -7.37e-03 |
Pos logit contributions | |
show | +0.082 |
trick | +0.078 |
test | +0.071 |
new | +0.068 |
grown | +0.067 |
Neg logit contributions | |
mie | -0.202 |
etsy | -0.192 |
hew | -0.189 |
elope | -0.189 |
storms | -0.188 |
Token | they |
Token ID | 484 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
show | +0.009 |
trick | +0.009 |
new | +0.008 |
test | +0.008 |
grown | +0.008 |
Neg logit contributions | |
mie | -0.015 |
etsy | -0.015 |
elope | -0.015 |
hew | -0.014 |
jo | -0.014 |
Token | should |
Token ID | 815 |
Feature activation | -5.61e-02 |
Pos logit contributions | |
mie | +0.410 |
etsy | +0.407 |
elope | +0.392 |
jo | +0.386 |
hew | +0.385 |
Neg logit contributions | |
show | -0.395 |
trick | -0.354 |
grown | -0.344 |
new | -0.343 |
for | -0.341 |
Token | not |
Token ID | 407 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
show | +0.048 |
trick | +0.043 |
new | +0.041 |
grown | +0.038 |
test | +0.037 |
Neg logit contributions | |
mie | -0.143 |
etsy | -0.140 |
elope | -0.137 |
hew | -0.136 |
jo | -0.136 |
Token | go |
Token ID | 467 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
show | +0.027 |
new | +0.025 |
trick | +0.025 |
grown | +0.022 |
making | +0.022 |
Neg logit contributions | |
mie | -0.076 |
etsy | -0.074 |
elope | -0.073 |
hew | -0.072 |
jo | -0.072 |
Token | into |
Token ID | 656 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
trick | +0.095 |
show | +0.092 |
math | +0.082 |
grown | +0.081 |
magic | +0.080 |
Neg logit contributions | |
mie | -0.245 |
etsy | -0.227 |
elope | -0.220 |
hew | -0.219 |
lves | -0.219 |
Token | places |
Token ID | 4113 |
Feature activation | +4.32e-02 |
Pos logit contributions | |
show | +0.253 |
trick | +0.245 |
new | +0.205 |
test | +0.204 |
grown | +0.195 |
Neg logit contributions | |
mie | -0.680 |
elope | -0.662 |
hew | -0.641 |
etsy | -0.634 |
jo | -0.633 |
Token | they |
Token ID | 484 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
mie | +0.100 |
etsy | +0.096 |
hew | +0.094 |
elope | +0.094 |
jo | +0.093 |
Neg logit contributions | |
show | -0.045 |
trick | -0.044 |
new | -0.041 |
grown | -0.039 |
test | -0.038 |
Token | did |
Token ID | 750 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
mie | +0.441 |
etsy | +0.436 |
elope | +0.420 |
jo | +0.413 |
pillar | +0.412 |
Neg logit contributions | |
show | -0.374 |
trick | -0.332 |
test | -0.324 |
grown | -0.324 |
to | -0.320 |
Token | not |
Token ID | 407 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
show | +0.135 |
trick | +0.127 |
new | +0.118 |
test | +0.114 |
matching | +0.113 |
Neg logit contributions | |
mie | -0.242 |
hew | -0.231 |
elope | -0.230 |
jo | -0.226 |
etsy | -0.225 |
Token | know |
Token ID | 760 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
show | +0.036 |
trick | +0.034 |
new | +0.033 |
grown | +0.030 |
making | +0.030 |
Neg logit contributions | |
mie | -0.076 |
etsy | -0.074 |
elope | -0.073 |
hew | -0.072 |
jo | -0.072 |
Token | your |
Token ID | 534 |
Feature activation | -7.76e-02 |
Pos logit contributions | |
show | +0.048 |
trick | +0.046 |
test | +0.042 |
new | +0.039 |
matching | +0.039 |
Neg logit contributions | |
mie | -0.102 |
elope | -0.098 |
hew | -0.098 |
etsy | -0.098 |
ppa | -0.092 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
show | +0.088 |
trick | +0.083 |
grown | +0.078 |
new | +0.077 |
making | +0.076 |
Neg logit contributions | |
mie | -0.166 |
etsy | -0.160 |
elope | -0.158 |
hew | -0.156 |
jo | -0.152 |
Token | , |
Token ID | 11 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
mie | +0.289 |
etsy | +0.283 |
elope | +0.279 |
lves | +0.276 |
hew | +0.274 |
Neg logit contributions | |
show | -0.125 |
trick | -0.114 |
new | -0.113 |
for | -0.112 |
to | -0.107 |
Token | you |
Token ID | 345 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
show | +0.160 |
my | +0.159 |
new | +0.155 |
your | +0.150 |
trick | +0.147 |
Neg logit contributions | |
oped | -0.253 |
etsy | -0.246 |
mie | -0.245 |
jo | -0.244 |
storms | -0.239 |
Token | crashed |
Token ID | 14997 |
Feature activation | -6.15e-02 |
Pos logit contributions | |
mie | +0.340 |
elope | +0.340 |
etsy | +0.337 |
thel | +0.336 |
jo | +0.333 |
Neg logit contributions | |
show | -0.175 |
my | -0.153 |
grown | -0.153 |
new | -0.150 |
trick | -0.148 |
Token | into |
Token ID | 656 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
show | +0.060 |
trick | +0.055 |
new | +0.050 |
test | +0.049 |
grown | +0.049 |
Neg logit contributions | |
mie | -0.149 |
etsy | -0.142 |
hew | -0.142 |
jo | -0.139 |
elope | -0.139 |
Token | me |
Token ID | 502 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
show | +0.182 |
trick | +0.164 |
new | +0.141 |
test | +0.134 |
grown | +0.123 |
Neg logit contributions | |
mie | -0.755 |
elope | -0.722 |
hew | -0.718 |
etsy | -0.716 |
pillar | -0.702 |
Token | !" |
Token ID | 2474 |
Feature activation | +6.00e-02 |
Pos logit contributions | |
mie | +0.098 |
hew | +0.093 |
etsy | +0.092 |
elope | +0.092 |
jo | +0.091 |
Neg logit contributions | |
show | -0.054 |
trick | -0.052 |
new | -0.050 |
grown | -0.047 |
matching | -0.046 |
Token | Ben |
Token ID | 3932 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
mie | +0.127 |
hew | +0.126 |
etsy | +0.126 |
oped | +0.122 |
lves | +0.121 |
Neg logit contributions | |
show | -0.085 |
the | -0.077 |
my | -0.074 |
to | -0.074 |
new | -0.073 |
Token | said |
Token ID | 531 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
etsy | +0.585 |
mie | +0.582 |
hew | +0.548 |
elope | +0.545 |
lves | +0.544 |
Neg logit contributions | |
show | -0.519 |
trick | -0.479 |
new | -0.466 |
grown | -0.453 |
to | -0.452 |
Token | , |
Token ID | 11 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
mie | +0.057 |
etsy | +0.056 |
elope | +0.055 |
jo | +0.054 |
hew | +0.054 |
Neg logit contributions | |
show | -0.026 |
trick | -0.025 |
new | -0.023 |
test | -0.022 |
grown | -0.022 |
Token | ." |
Token ID | 526 |
Feature activation | +5.64e-02 |
Pos logit contributions | |
mie | +0.611 |
etsy | +0.589 |
hew | +0.576 |
elope | +0.576 |
jo | +0.573 |
Neg logit contributions | |
show | -0.255 |
trick | -0.241 |
new | -0.236 |
grown | -0.219 |
test | -0.212 |
Token |
|
Token ID | 198 |
Feature activation | +6.81e-02 |
Pos logit contributions | |
mie | +0.123 |
lves | +0.123 |
hew | +0.120 |
rified | +0.119 |
storms | +0.118 |
Neg logit contributions | |
show | -0.072 |
to | -0.069 |
the | -0.069 |
your | -0.068 |
my | -0.067 |
Token |
|
Token ID | 198 |
Feature activation | +6.86e-02 |
Pos logit contributions | |
rified | +0.174 |
storms | +0.173 |
mie | +0.170 |
ley | +0.163 |
als | +0.163 |
Neg logit contributions | |
your | -0.069 |
new | -0.069 |
the | -0.067 |
show | -0.066 |
my | -0.065 |
Token | They |
Token ID | 2990 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
storms | +0.140 |
rified | +0.138 |
mie | +0.133 |
als | +0.127 |
ley | +0.126 |
Neg logit contributions | |
your | -0.104 |
my | -0.101 |
show | -0.100 |
grown | -0.094 |
trick | -0.093 |
Token | crawl |
Token ID | 27318 |
Feature activation | -4.14e-02 |
Pos logit contributions | |
mie | +0.571 |
etsy | +0.562 |
elope | +0.547 |
hew | +0.546 |
jo | +0.545 |
Neg logit contributions | |
show | -0.284 |
trick | -0.255 |
new | -0.241 |
grown | -0.232 |
test | -0.231 |
Token | into |
Token ID | 656 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
show | +0.041 |
trick | +0.038 |
new | +0.035 |
grown | +0.034 |
test | +0.034 |
Neg logit contributions | |
mie | -0.099 |
etsy | -0.096 |
elope | -0.094 |
hew | -0.093 |
jo | -0.093 |
Token | the |
Token ID | 262 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
show | +0.125 |
trick | +0.107 |
new | +0.090 |
grown | +0.077 |
test | +0.076 |
Neg logit contributions | |
mie | -0.822 |
etsy | -0.798 |
elope | -0.793 |
hew | -0.785 |
jo | -0.782 |
Token | box |
Token ID | 3091 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
show | +0.195 |
trick | +0.183 |
new | +0.182 |
grown | +0.171 |
test | +0.170 |
Neg logit contributions | |
mie | -0.274 |
etsy | -0.266 |
hew | -0.258 |
elope | -0.256 |
jo | -0.255 |
Token | and |
Token ID | 290 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
mie | +0.466 |
elope | +0.454 |
jo | +0.450 |
etsy | +0.449 |
hew | +0.443 |
Neg logit contributions | |
show | -0.201 |
trick | -0.192 |
new | -0.177 |
test | -0.177 |
my | -0.173 |
Token | peek |
Token ID | 27185 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
show | +0.125 |
trick | +0.111 |
new | +0.108 |
grown | +0.101 |
test | +0.100 |
Neg logit contributions | |
mie | -0.260 |
etsy | -0.256 |
hew | -0.249 |
jo | -0.247 |
elope | -0.247 |
Token | out |
Token ID | 503 |
Feature activation | -7.25e-02 |
Pos logit contributions | |
show | +0.027 |
trick | +0.026 |
new | +0.026 |
grown | +0.025 |
for | +0.024 |
Neg logit contributions | |
mie | -0.015 |
etsy | -0.014 |
elope | -0.013 |
hew | -0.013 |
jo | -0.013 |
Token | dog |
Token ID | 3290 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
show | +0.059 |
trick | +0.056 |
new | +0.054 |
grown | +0.051 |
test | +0.050 |
Neg logit contributions | |
mie | -0.099 |
etsy | -0.096 |
elope | -0.094 |
hew | -0.094 |
jo | -0.093 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
mie | +0.614 |
etsy | +0.608 |
hew | +0.597 |
thel | +0.586 |
ppa | +0.582 |
Neg logit contributions | |
show | -0.312 |
trick | -0.279 |
new | -0.276 |
to | -0.271 |
for | -0.265 |
Token | Spot |
Token ID | 15899 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
show | +0.172 |
the | +0.171 |
to | +0.171 |
his | +0.165 |
for | +0.165 |
Neg logit contributions | |
hew | -0.216 |
mie | -0.206 |
etsy | -0.205 |
lves | -0.197 |
thel | -0.194 |
Token | , |
Token ID | 11 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
etsy | +0.976 |
mie | +0.973 |
hew | +0.953 |
thel | +0.941 |
jo | +0.938 |
Neg logit contributions | |
show | -0.219 |
for | -0.178 |
to | -0.178 |
new | -0.173 |
trick | -0.172 |
Token | comes |
Token ID | 2058 |
Feature activation | -9.82e-02 |
Pos logit contributions | |
show | +0.140 |
new | +0.127 |
trick | +0.126 |
to | +0.125 |
making | +0.124 |
Neg logit contributions | |
mie | -0.245 |
etsy | -0.240 |
hew | -0.237 |
elope | -0.234 |
thel | -0.229 |
Token | into |
Token ID | 656 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
show | +0.090 |
trick | +0.082 |
new | +0.078 |
test | +0.073 |
grown | +0.073 |
Neg logit contributions | |
mie | -0.241 |
etsy | -0.235 |
elope | -0.232 |
jo | -0.230 |
hew | -0.230 |
Token | the |
Token ID | 262 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
show | +0.150 |
trick | +0.138 |
new | +0.118 |
test | +0.113 |
grown | +0.101 |
Neg logit contributions | |
mie | -0.771 |
elope | -0.761 |
jo | -0.743 |
etsy | -0.734 |
Bear | -0.725 |
Token | room |
Token ID | 2119 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
show | +0.185 |
trick | +0.181 |
new | +0.167 |
grown | +0.164 |
making | +0.164 |
Neg logit contributions | |
mie | -0.259 |
elope | -0.249 |
etsy | -0.244 |
pillar | -0.242 |
jo | -0.241 |
Token | . |
Token ID | 13 |
Feature activation | +7.75e-03 |
Pos logit contributions | |
mie | +0.253 |
elope | +0.242 |
etsy | +0.242 |
jo | +0.240 |
hew | +0.238 |
Neg logit contributions | |
show | -0.136 |
trick | -0.131 |
new | -0.127 |
test | -0.118 |
grown | -0.118 |
Token | Spot |
Token ID | 15899 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
mie | +0.013 |
hew | +0.013 |
etsy | +0.012 |
ppa | +0.012 |
thel | +0.012 |
Neg logit contributions | |
show | -0.013 |
new | -0.013 |
my | -0.013 |
trick | -0.012 |
your | -0.012 |
Token | is |
Token ID | 318 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
mie | +0.774 |
etsy | +0.751 |
elope | +0.735 |
hew | +0.731 |
jo | +0.727 |
Neg logit contributions | |
show | -0.404 |
trick | -0.378 |
new | -0.367 |
grown | -0.343 |
test | -0.338 |
Token | don |
Token ID | 836 |
Feature activation | +3.06e-02 |
Pos logit contributions | |
elope | +0.413 |
jo | +0.407 |
storms | +0.403 |
etsy | +0.402 |
mie | +0.399 |
Neg logit contributions | |
show | -0.338 |
trick | -0.290 |
for | -0.286 |
test | -0.283 |
to | -0.280 |
Token | 't |
Token ID | 470 |
Feature activation | -5.47e-02 |
Pos logit contributions | |
mie | +0.057 |
etsy | +0.054 |
hew | +0.053 |
elope | +0.052 |
jo | +0.052 |
Neg logit contributions | |
show | -0.046 |
trick | -0.044 |
new | -0.044 |
grown | -0.042 |
magic | -0.041 |
Token | want |
Token ID | 765 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
show | +0.066 |
trick | +0.061 |
new | +0.056 |
test | +0.056 |
grown | +0.055 |
Neg logit contributions | |
mie | -0.123 |
etsy | -0.120 |
elope | -0.119 |
jo | -0.117 |
hew | -0.116 |
Token | to |
Token ID | 284 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
show | +0.058 |
trick | +0.050 |
grown | +0.043 |
test | +0.040 |
new | +0.039 |
Neg logit contributions | |
mie | -0.299 |
storms | -0.287 |
etsy | -0.284 |
hew | -0.282 |
pillar | -0.278 |
Token | get |
Token ID | 651 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
show | +0.205 |
new | +0.198 |
trick | +0.192 |
grown | +0.175 |
magic | +0.171 |
Neg logit contributions | |
mie | -0.609 |
etsy | -0.584 |
elope | -0.575 |
hew | -0.572 |
jo | -0.565 |
Token | into |
Token ID | 656 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
show | +0.184 |
trick | +0.178 |
new | +0.161 |
grown | +0.155 |
test | +0.155 |
Neg logit contributions | |
mie | -0.425 |
etsy | -0.402 |
hew | -0.395 |
elope | -0.386 |
lves | -0.384 |
Token | trouble |
Token ID | 5876 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
show | +0.266 |
trick | +0.260 |
test | +0.220 |
new | +0.219 |
grown | +0.218 |
Neg logit contributions | |
mie | -0.655 |
elope | -0.620 |
hew | -0.615 |
lves | -0.594 |
storms | -0.592 |
Token | ." |
Token ID | 526 |
Feature activation | +7.68e-02 |
Pos logit contributions | |
show | +0.012 |
trick | +0.012 |
new | +0.012 |
grown | +0.011 |
test | +0.011 |
Neg logit contributions | |
mie | -0.021 |
storms | -0.020 |
hew | -0.020 |
etsy | -0.020 |
jo | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +8.28e-02 |
Pos logit contributions | |
lves | +0.173 |
ppy | +0.171 |
mie | +0.171 |
ppings | +0.170 |
x | +0.168 |
Neg logit contributions | |
the | -0.091 |
show | -0.089 |
to | -0.089 |
your | -0.084 |
his | -0.083 |
Token |
|
Token ID | 198 |
Feature activation | +8.08e-02 |
Pos logit contributions | |
storms | +0.218 |
rified | +0.216 |
lves | +0.211 |
als | +0.209 |
mie | +0.208 |
Neg logit contributions | |
the | -0.074 |
new | -0.074 |
show | -0.070 |
his | -0.069 |
your | -0.067 |
Token | Lisa |
Token ID | 44203 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
storms | +0.171 |
rified | +0.164 |
mie | +0.157 |
ley | +0.155 |
als | +0.155 |
Neg logit contributions | |
show | -0.109 |
your | -0.108 |
my | -0.106 |
trick | -0.105 |
grown | -0.102 |
Token | didn |
Token ID | 1422 |
Feature activation | -7.82e-02 |
Pos logit contributions | |
show | +0.086 |
trick | +0.081 |
new | +0.077 |
grown | +0.073 |
making | +0.072 |
Neg logit contributions | |
mie | -0.183 |
etsy | -0.177 |
elope | -0.175 |
hew | -0.172 |
jo | -0.171 |
Token | 't |
Token ID | 470 |
Feature activation | -5.07e-02 |
Pos logit contributions | |
show | +0.101 |
trick | +0.094 |
new | +0.092 |
to | +0.088 |
grown | +0.087 |
Neg logit contributions | |
mie | -0.167 |
etsy | -0.162 |
elope | -0.162 |
hew | -0.158 |
thel | -0.156 |
Token | want |
Token ID | 765 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
show | +0.059 |
trick | +0.055 |
new | +0.053 |
grown | +0.050 |
test | +0.049 |
Neg logit contributions | |
mie | -0.115 |
etsy | -0.112 |
elope | -0.110 |
hew | -0.109 |
jo | -0.108 |
Token | to |
Token ID | 284 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
show | +0.062 |
trick | +0.054 |
new | +0.048 |
grown | +0.045 |
test | +0.043 |
Neg logit contributions | |
mie | -0.288 |
etsy | -0.280 |
storms | -0.276 |
jo | -0.273 |
elope | -0.272 |
Token | get |
Token ID | 651 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
show | +0.208 |
trick | +0.193 |
new | +0.191 |
grown | +0.171 |
making | +0.167 |
Neg logit contributions | |
mie | -0.612 |
etsy | -0.593 |
elope | -0.584 |
hew | -0.579 |
jo | -0.576 |
Token | into |
Token ID | 656 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
show | +0.190 |
trick | +0.183 |
new | +0.168 |
test | +0.160 |
grown | +0.160 |
Neg logit contributions | |
mie | -0.422 |
etsy | -0.403 |
hew | -0.392 |
elope | -0.390 |
jo | -0.384 |
Token | trouble |
Token ID | 5876 |
Feature activation | -8.89e-03 |
Pos logit contributions | |
show | +0.272 |
trick | +0.268 |
new | +0.231 |
test | +0.227 |
grown | +0.224 |
Neg logit contributions | |
mie | -0.650 |
elope | -0.624 |
etsy | -0.601 |
hew | -0.601 |
jo | -0.598 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
show | +0.010 |
trick | +0.009 |
new | +0.009 |
grown | +0.008 |
test | +0.008 |
Neg logit contributions | |
mie | -0.020 |
etsy | -0.019 |
elope | -0.019 |
hew | -0.019 |
jo | -0.019 |
Token | |
Token ID | 220 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
ppers | +0.045 |
ppa | +0.045 |
pper | +0.045 |
mie | +0.044 |
ppy | +0.044 |
Neg logit contributions | |
my | -0.022 |
to | -0.021 |
your | -0.021 |
the | -0.020 |
his | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +7.82e-02 |
Pos logit contributions | |
mie | +0.446 |
lves | +0.439 |
ley | +0.439 |
thel | +0.435 |
rified | +0.432 |
Neg logit contributions | |
new | -0.189 |
to | -0.179 |
the | -0.160 |
for | -0.157 |
big | -0.148 |
Token |
|
Token ID | 198 |
Feature activation | +7.79e-02 |
Pos logit contributions | |
storms | +0.193 |
rified | +0.191 |
als | +0.190 |
ley | +0.189 |
mie | +0.185 |
Neg logit contributions | |
new | -0.076 |
grown | -0.068 |
to | -0.068 |
his | -0.067 |
the | -0.067 |
Token | You |
Token ID | 921 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
mie | +0.009 |
lves | +0.008 |
etsy | +0.008 |
storms | +0.008 |
mi | +0.008 |
Neg logit contributions | |
my | -0.006 |
your | -0.006 |
show | -0.006 |
the | -0.005 |
new | -0.005 |
Token | could |
Token ID | 714 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
mie | +0.418 |
etsy | +0.417 |
jo | +0.408 |
elope | +0.406 |
storms | +0.397 |
Neg logit contributions | |
show | -0.290 |
trick | -0.252 |
test | -0.246 |
to | -0.242 |
grown | -0.240 |
Token | fall |
Token ID | 2121 |
Feature activation | -5.02e-02 |
Pos logit contributions | |
show | +0.039 |
trick | +0.037 |
new | +0.036 |
grown | +0.033 |
making | +0.032 |
Neg logit contributions | |
mie | -0.102 |
etsy | -0.099 |
elope | -0.098 |
hew | -0.096 |
jo | -0.095 |
Token | or |
Token ID | 393 |
Feature activation | -9.78e-02 |
Pos logit contributions | |
show | +0.054 |
trick | +0.051 |
new | +0.048 |
grown | +0.047 |
test | +0.045 |
Neg logit contributions | |
mie | -0.114 |
etsy | -0.108 |
storms | -0.107 |
jo | -0.107 |
elope | -0.106 |
Token | bump |
Token ID | 13852 |
Feature activation | -7.34e-02 |
Pos logit contributions | |
show | +0.106 |
new | +0.103 |
trick | +0.103 |
grown | +0.096 |
original | +0.092 |
Neg logit contributions | |
mie | -0.214 |
etsy | -0.201 |
elope | -0.200 |
storms | -0.198 |
hew | -0.197 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
show | +0.059 |
new | +0.055 |
trick | +0.055 |
my | +0.055 |
your | +0.054 |
Neg logit contributions | |
etsy | -0.187 |
mie | -0.186 |
elope | -0.183 |
hew | -0.180 |
jo | -0.179 |
Token | someone |
Token ID | 2130 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
show | +0.179 |
trick | +0.159 |
new | +0.148 |
grown | +0.129 |
test | +0.127 |
Neg logit contributions | |
mie | -0.774 |
etsy | -0.752 |
elope | -0.742 |
hew | -0.738 |
jo | -0.733 |
Token | or |
Token ID | 393 |
Feature activation | -9.39e-02 |
Pos logit contributions | |
mie | +0.418 |
etsy | +0.407 |
elope | +0.398 |
hew | +0.395 |
jo | +0.393 |
Neg logit contributions | |
show | -0.254 |
trick | -0.238 |
new | -0.233 |
grown | -0.218 |
test | -0.217 |
Token | get |
Token ID | 651 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
show | +0.089 |
trick | +0.088 |
new | +0.086 |
grown | +0.081 |
matching | +0.076 |
Neg logit contributions | |
mie | -0.215 |
elope | -0.204 |
etsy | -0.202 |
hew | -0.199 |
storms | -0.199 |
Token | lost |
Token ID | 2626 |
Feature activation | -8.94e-02 |
Pos logit contributions | |
show | +0.192 |
trick | +0.179 |
new | +0.174 |
grown | +0.161 |
test | +0.158 |
Neg logit contributions | |
mie | -0.419 |
etsy | -0.408 |
elope | -0.401 |
hew | -0.397 |
jo | -0.396 |
Token | . |
Token ID | 13 |
Feature activation | +5.20e-03 |
Pos logit contributions | |
show | +0.087 |
trick | +0.080 |
new | +0.078 |
my | +0.073 |
for | +0.071 |
Neg logit contributions | |
mie | -0.217 |
etsy | -0.214 |
elope | -0.209 |
hew | -0.208 |
jo | -0.207 |
Token | hugged |
Token ID | 41130 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
mie | +0.415 |
etsy | +0.383 |
elope | +0.368 |
oped | +0.361 |
pillar | +0.360 |
Neg logit contributions | |
trick | -0.378 |
new | -0.376 |
show | -0.375 |
original | -0.349 |
making | -0.349 |
Token | it |
Token ID | 340 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
show | +0.109 |
new | +0.099 |
trick | +0.097 |
my | +0.090 |
your | +0.088 |
Neg logit contributions | |
mie | -0.284 |
etsy | -0.282 |
hew | -0.276 |
elope | -0.276 |
jo | -0.275 |
Token | , |
Token ID | 11 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
mie | +0.367 |
etsy | +0.353 |
elope | +0.346 |
hew | +0.337 |
jo | +0.336 |
Neg logit contributions | |
show | -0.117 |
trick | -0.114 |
grown | -0.103 |
test | -0.097 |
making | -0.095 |
Token | it |
Token ID | 340 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
show | +0.149 |
new | +0.142 |
the | +0.137 |
grown | +0.131 |
making | +0.131 |
Neg logit contributions | |
hew | -0.228 |
jo | -0.225 |
mie | -0.224 |
etsy | -0.221 |
elope | -0.216 |
Token | broke |
Token ID | 6265 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
mie | +0.294 |
etsy | +0.293 |
hew | +0.287 |
thel | +0.284 |
jo | +0.283 |
Neg logit contributions | |
show | -0.207 |
trick | -0.195 |
new | -0.191 |
grown | -0.184 |
making | -0.183 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
show | +0.096 |
new | +0.090 |
trick | +0.088 |
my | +0.079 |
grown | +0.079 |
Neg logit contributions | |
mie | -0.289 |
etsy | -0.284 |
elope | -0.279 |
jo | -0.277 |
hew | -0.276 |
Token | tiny |
Token ID | 7009 |
Feature activation | -3.99e-02 |
Pos logit contributions | |
show | +0.247 |
trick | +0.227 |
new | +0.221 |
grown | +0.203 |
making | +0.195 |
Neg logit contributions | |
mie | -0.708 |
etsy | -0.689 |
elope | -0.675 |
hew | -0.673 |
jo | -0.670 |
Token | pieces |
Token ID | 5207 |
Feature activation | +8.21e-02 |
Pos logit contributions | |
show | +0.052 |
trick | +0.049 |
new | +0.047 |
grown | +0.045 |
test | +0.045 |
Neg logit contributions | |
mie | -0.083 |
etsy | -0.080 |
elope | -0.079 |
hew | -0.078 |
jo | -0.078 |
Token | . |
Token ID | 13 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
mie | +0.185 |
etsy | +0.177 |
hew | +0.173 |
elope | +0.173 |
jo | +0.173 |
Neg logit contributions | |
show | -0.090 |
trick | -0.086 |
new | -0.082 |
test | -0.077 |
grown | -0.077 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
pper | +0.038 |
ley | +0.037 |
ppers | +0.037 |
x | +0.037 |
mie | +0.036 |
Neg logit contributions | |
my | -0.020 |
to | -0.019 |
the | -0.019 |
new | -0.019 |
grown | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
etsy | +0.526 |
storms | +0.516 |
mie | +0.514 |
och | +0.506 |
uddy | +0.505 |
Neg logit contributions | |
show | -0.338 |
grown | -0.308 |
trick | -0.306 |
making | -0.301 |
to | -0.300 |
Token | does |
Token ID | 857 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
mie | +0.468 |
etsy | +0.462 |
elope | +0.442 |
hew | +0.438 |
jo | +0.436 |
Neg logit contributions | |
show | -0.332 |
trick | -0.309 |
new | -0.302 |
grown | -0.289 |
test | -0.285 |
Token | not |
Token ID | 407 |
Feature activation | -3.97e-02 |
Pos logit contributions | |
matching | +0.158 |
color | +0.152 |
show | +0.152 |
style | +0.147 |
design | +0.146 |
Neg logit contributions | |
elope | -0.218 |
Snow | -0.217 |
mie | -0.213 |
Rex | -0.206 |
jo | -0.204 |
Token | want |
Token ID | 765 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
show | +0.042 |
trick | +0.039 |
new | +0.036 |
test | +0.034 |
grown | +0.034 |
Neg logit contributions | |
mie | -0.096 |
etsy | -0.094 |
hew | -0.092 |
elope | -0.091 |
jo | -0.090 |
Token | to |
Token ID | 284 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
show | +0.056 |
trick | +0.044 |
new | +0.039 |
grown | +0.036 |
matching | +0.035 |
Neg logit contributions | |
mie | -0.330 |
etsy | -0.322 |
jo | -0.321 |
storms | -0.320 |
elope | -0.319 |
Token | fly |
Token ID | 6129 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
show | +0.227 |
new | +0.215 |
trick | +0.212 |
grown | +0.194 |
matching | +0.190 |
Neg logit contributions | |
mie | -0.591 |
etsy | -0.570 |
elope | -0.568 |
hew | -0.557 |
jo | -0.556 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
mie | +0.066 |
etsy | +0.063 |
elope | +0.063 |
storms | +0.063 |
jo | +0.063 |
Neg logit contributions | |
show | -0.038 |
trick | -0.035 |
grown | -0.033 |
new | -0.033 |
test | -0.032 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
show | +0.129 |
trick | +0.110 |
new | +0.094 |
grown | +0.079 |
test | +0.078 |
Neg logit contributions | |
mie | -0.816 |
etsy | -0.787 |
elope | -0.787 |
hew | -0.779 |
jo | -0.777 |
Token | storm |
Token ID | 6388 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
show | +0.176 |
trick | +0.167 |
new | +0.162 |
grown | +0.153 |
test | +0.152 |
Neg logit contributions | |
mie | -0.267 |
etsy | -0.258 |
elope | -0.253 |
hew | -0.251 |
jo | -0.249 |
Token | . |
Token ID | 13 |
Feature activation | +4.58e-03 |
Pos logit contributions | |
mie | +0.412 |
etsy | +0.407 |
hew | +0.394 |
elope | +0.390 |
thel | +0.388 |
Neg logit contributions | |
show | -0.157 |
trick | -0.143 |
new | -0.134 |
making | -0.127 |
to | -0.125 |
Token | He |
Token ID | 679 |
Feature activation | +2.37e-01 |
Pos logit contributions | |
mie | +0.010 |
ppa | +0.009 |
etsy | +0.009 |
ley | +0.009 |
ppy | +0.009 |
Neg logit contributions | |
my | -0.006 |
show | -0.006 |
new | -0.006 |
your | -0.006 |
to | -0.006 |
Token | tries |
Token ID | 8404 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
mie | +0.487 |
etsy | +0.479 |
elope | +0.461 |
hew | +0.457 |
jo | +0.456 |
Neg logit contributions | |
show | -0.324 |
trick | -0.301 |
new | -0.294 |
grown | -0.279 |
test | -0.277 |
Token | But |
Token ID | 1537 |
Feature activation | -3.24e-03 |
Pos logit contributions | |
storms | +0.208 |
rified | +0.205 |
mie | +0.203 |
ley | +0.198 |
als | +0.196 |
Neg logit contributions | |
your | -0.120 |
my | -0.118 |
show | -0.109 |
his | -0.108 |
grown | -0.108 |
Token | then |
Token ID | 788 |
Feature activation | +5.58e-02 |
Pos logit contributions | |
show | +0.004 |
my | +0.004 |
your | +0.003 |
the | +0.003 |
making | +0.003 |
Neg logit contributions | |
mie | -0.007 |
etsy | -0.007 |
jo | -0.007 |
hew | -0.007 |
storms | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
etsy | +0.152 |
hew | +0.151 |
mie | +0.149 |
lves | +0.149 |
jo | +0.148 |
Neg logit contributions | |
show | -0.040 |
the | -0.037 |
my | -0.035 |
your | -0.035 |
new | -0.034 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
show | +0.119 |
the | +0.105 |
new | +0.105 |
my | +0.104 |
your | +0.103 |
Neg logit contributions | |
hew | -0.255 |
mie | -0.252 |
etsy | -0.252 |
jo | -0.252 |
oped | -0.247 |
Token | bit |
Token ID | 1643 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
etsy | +0.510 |
lves | +0.476 |
uddy | +0.467 |
mie | +0.458 |
hew | +0.457 |
Neg logit contributions | |
show | -0.360 |
to | -0.337 |
grown | -0.334 |
making | -0.322 |
the | -0.312 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
show | +0.212 |
trick | +0.193 |
new | +0.191 |
grown | +0.176 |
making | +0.176 |
Neg logit contributions | |
mie | -0.512 |
etsy | -0.501 |
elope | -0.496 |
hew | -0.490 |
jo | -0.486 |
Token | her |
Token ID | 607 |
Feature activation | -3.94e-02 |
Pos logit contributions | |
show | +0.165 |
trick | +0.145 |
new | +0.136 |
grown | +0.117 |
test | +0.113 |
Neg logit contributions | |
mie | -0.788 |
etsy | -0.769 |
elope | -0.756 |
hew | -0.753 |
jo | -0.749 |
Token | sandwich |
Token ID | 20433 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
trick | +0.053 |
show | +0.051 |
grown | +0.049 |
making | +0.048 |
for | +0.046 |
Neg logit contributions | |
mie | -0.073 |
elope | -0.072 |
etsy | -0.067 |
jo | -0.066 |
pillar | -0.066 |
Token | and |
Token ID | 290 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
mie | +0.504 |
etsy | +0.486 |
hew | +0.475 |
elope | +0.473 |
jo | +0.468 |
Neg logit contributions | |
show | -0.213 |
trick | -0.199 |
new | -0.192 |
test | -0.180 |
grown | -0.177 |
Token | made |
Token ID | 925 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
show | +0.142 |
trick | +0.132 |
new | +0.128 |
grown | +0.122 |
making | +0.121 |
Neg logit contributions | |
mie | -0.213 |
etsy | -0.208 |
elope | -0.202 |
hew | -0.202 |
jo | -0.202 |
Token | a |
Token ID | 257 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
show | +0.163 |
new | +0.153 |
trick | +0.148 |
grown | +0.126 |
my | +0.124 |
Neg logit contributions | |
mie | -0.646 |
etsy | -0.645 |
jo | -0.630 |
elope | -0.629 |
hew | -0.620 |
Token | I |
Token ID | 314 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
mie | +0.016 |
etsy | +0.015 |
hew | +0.015 |
jo | +0.015 |
elope | +0.015 |
Neg logit contributions | |
show | -0.013 |
my | -0.012 |
trick | -0.011 |
your | -0.011 |
new | -0.011 |
Token | will |
Token ID | 481 |
Feature activation | -4.43e-02 |
Pos logit contributions | |
mie | +0.345 |
etsy | +0.331 |
hew | +0.322 |
elope | +0.322 |
jo | +0.316 |
Neg logit contributions | |
show | -0.278 |
trick | -0.266 |
new | -0.265 |
grown | -0.249 |
making | -0.248 |
Token | hit |
Token ID | 2277 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
new | +0.042 |
chance | +0.036 |
trick | +0.034 |
magic | +0.034 |
original | +0.033 |
Neg logit contributions | |
mie | -0.094 |
pper | -0.089 |
etsy | -0.088 |
hew | -0.088 |
ppa | -0.086 |
Token | the |
Token ID | 262 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
show | +0.202 |
trick | +0.189 |
new | +0.186 |
my | +0.172 |
grown | +0.171 |
Neg logit contributions | |
mie | -0.371 |
etsy | -0.364 |
elope | -0.355 |
jo | -0.352 |
hew | -0.350 |
Token | ball |
Token ID | 2613 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
show | +0.167 |
trick | +0.159 |
new | +0.150 |
grown | +0.145 |
test | +0.144 |
Neg logit contributions | |
mie | -0.270 |
hew | -0.257 |
etsy | -0.257 |
elope | -0.253 |
pillar | -0.253 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
mie | +0.369 |
etsy | +0.355 |
hew | +0.353 |
storms | +0.349 |
pillar | +0.348 |
Neg logit contributions | |
show | -0.179 |
trick | -0.169 |
new | -0.163 |
grown | -0.162 |
test | -0.153 |
Token | the |
Token ID | 262 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
show | +0.169 |
trick | +0.159 |
new | +0.137 |
test | +0.126 |
job | +0.118 |
Neg logit contributions | |
mie | -0.739 |
hew | -0.715 |
elope | -0.709 |
pillar | -0.705 |
etsy | -0.698 |
Token | hole |
Token ID | 7604 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
show | +0.175 |
trick | +0.170 |
new | +0.158 |
grown | +0.154 |
making | +0.153 |
Neg logit contributions | |
mie | -0.255 |
elope | -0.243 |
hew | -0.242 |
etsy | -0.240 |
pillar | -0.238 |
Token | better |
Token ID | 1365 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
mie | +0.352 |
hew | +0.339 |
etsy | +0.337 |
elope | +0.335 |
ppy | +0.333 |
Neg logit contributions | |
show | -0.200 |
trick | -0.191 |
test | -0.180 |
new | -0.176 |
grown | -0.172 |
Token | than |
Token ID | 621 |
Feature activation | -8.53e-02 |
Pos logit contributions | |
show | +0.127 |
trick | +0.120 |
new | +0.114 |
grown | +0.112 |
test | +0.109 |
Neg logit contributions | |
mie | -0.232 |
elope | -0.220 |
etsy | -0.220 |
hew | -0.219 |
storms | -0.214 |
Token | you |
Token ID | 345 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
show | +0.110 |
trick | +0.105 |
new | +0.099 |
test | +0.095 |
grown | +0.093 |
Neg logit contributions | |
mie | -0.168 |
etsy | -0.163 |
hew | -0.156 |
storms | -0.156 |
ppy | -0.154 |
Token | But |
Token ID | 887 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
ppa | +0.033 |
mie | +0.032 |
ppers | +0.032 |
thel | +0.032 |
lves | +0.032 |
Neg logit contributions | |
my | -0.017 |
your | -0.016 |
to | -0.016 |
the | -0.016 |
show | -0.016 |
Token | then |
Token ID | 788 |
Feature activation | +5.14e-02 |
Pos logit contributions | |
mie | +0.054 |
etsy | +0.053 |
jo | +0.052 |
hew | +0.052 |
elope | +0.051 |
Neg logit contributions | |
show | -0.030 |
trick | -0.028 |
new | -0.027 |
my | -0.027 |
making | -0.026 |
Token | , |
Token ID | 11 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
etsy | +0.150 |
lves | +0.147 |
hew | +0.146 |
mie | +0.146 |
jo | +0.146 |
Neg logit contributions | |
show | -0.027 |
your | -0.026 |
the | -0.026 |
my | -0.026 |
new | -0.024 |
Token | Tim |
Token ID | 5045 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
show | +0.123 |
new | +0.109 |
the | +0.106 |
my | +0.106 |
trick | +0.106 |
Neg logit contributions | |
mie | -0.258 |
hew | -0.257 |
etsy | -0.255 |
jo | -0.254 |
oped | -0.247 |
Token | fell |
Token ID | 3214 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
etsy | +0.455 |
mie | +0.423 |
lves | +0.418 |
thel | +0.416 |
elope | +0.415 |
Neg logit contributions | |
show | -0.520 |
to | -0.505 |
grown | -0.494 |
new | -0.493 |
trick | -0.492 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
show | +0.016 |
trick | +0.016 |
test | +0.015 |
grown | +0.014 |
talent | +0.014 |
Neg logit contributions | |
mie | -0.022 |
storms | -0.022 |
jo | -0.021 |
rified | -0.021 |
bo | -0.021 |
Token | a |
Token ID | 257 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
show | +0.135 |
trick | +0.120 |
new | +0.100 |
test | +0.090 |
grown | +0.084 |
Neg logit contributions | |
mie | -0.795 |
elope | -0.765 |
etsy | -0.762 |
jo | -0.751 |
hew | -0.749 |
Token | deep |
Token ID | 2769 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
show | +0.146 |
trick | +0.138 |
new | +0.128 |
making | +0.124 |
grown | +0.122 |
Neg logit contributions | |
mie | -0.290 |
etsy | -0.279 |
elope | -0.277 |
pillar | -0.272 |
jo | -0.271 |
Token | hole |
Token ID | 7604 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
trick | +0.134 |
new | +0.133 |
show | +0.133 |
math | +0.127 |
grown | +0.125 |
Neg logit contributions | |
elope | -0.210 |
mie | -0.207 |
jo | -0.200 |
ley | -0.197 |
storms | -0.194 |
Token | and |
Token ID | 290 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
oped | +0.314 |
storms | +0.312 |
mie | +0.310 |
rified | +0.307 |
jo | +0.306 |
Neg logit contributions | |
math | -0.228 |
show | -0.224 |
test | -0.220 |
job | -0.220 |
new | -0.220 |
Token | couldn |
Token ID | 3521 |
Feature activation | -6.89e-02 |
Pos logit contributions | |
show | +0.165 |
trick | +0.160 |
new | +0.155 |
grown | +0.148 |
test | +0.147 |
Neg logit contributions | |
mie | -0.184 |
etsy | -0.175 |
elope | -0.173 |
hew | -0.170 |
jo | -0.168 |
Token | I |
Token ID | 314 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
mie | +0.036 |
ppa | +0.035 |
thel | +0.034 |
lves | +0.034 |
hew | +0.034 |
Neg logit contributions | |
show | -0.022 |
my | -0.022 |
your | -0.020 |
to | -0.019 |
for | -0.018 |
Token | hope |
Token ID | 2911 |
Feature activation | -8.32e-02 |
Pos logit contributions | |
mie | +0.321 |
etsy | +0.309 |
elope | +0.301 |
jo | +0.298 |
hew | +0.296 |
Neg logit contributions | |
show | -0.328 |
trick | -0.311 |
new | -0.300 |
grown | -0.291 |
test | -0.290 |
Token | we |
Token ID | 356 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
show | +0.102 |
trick | +0.102 |
test | +0.092 |
new | +0.090 |
grown | +0.089 |
Neg logit contributions | |
mie | -0.165 |
hew | -0.156 |
etsy | -0.155 |
elope | -0.154 |
jo | -0.152 |
Token | can |
Token ID | 460 |
Feature activation | -6.65e-02 |
Pos logit contributions | |
mie | +0.346 |
etsy | +0.343 |
jo | +0.340 |
elope | +0.339 |
storms | +0.330 |
Neg logit contributions | |
show | -0.263 |
trick | -0.234 |
test | -0.227 |
new | -0.227 |
grown | -0.224 |
Token | get |
Token ID | 651 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
show | +0.053 |
trick | +0.048 |
new | +0.046 |
grown | +0.042 |
test | +0.041 |
Neg logit contributions | |
mie | -0.173 |
etsy | -0.169 |
elope | -0.166 |
hew | -0.165 |
jo | -0.164 |
Token | into |
Token ID | 656 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
show | +0.176 |
trick | +0.161 |
new | +0.158 |
grown | +0.143 |
making | +0.141 |
Neg logit contributions | |
mie | -0.447 |
etsy | -0.437 |
elope | -0.430 |
jo | -0.426 |
hew | -0.426 |
Token | the |
Token ID | 262 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
show | +0.196 |
trick | +0.192 |
test | +0.155 |
new | +0.152 |
grown | +0.150 |
Neg logit contributions | |
mie | -0.725 |
elope | -0.692 |
hew | -0.687 |
etsy | -0.665 |
lves | -0.660 |
Token | opera |
Token ID | 27296 |
Feature activation | +7.17e-02 |
Pos logit contributions | |
show | +0.174 |
trick | +0.166 |
new | +0.158 |
grown | +0.152 |
making | +0.151 |
Neg logit contributions | |
mie | -0.258 |
etsy | -0.246 |
elope | -0.245 |
hew | -0.241 |
jo | -0.237 |
Token | . |
Token ID | 13 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
mie | +0.160 |
elope | +0.153 |
jo | +0.151 |
etsy | +0.150 |
hew | +0.150 |
Neg logit contributions | |
show | -0.075 |
trick | -0.074 |
new | -0.070 |
grown | -0.068 |
test | -0.066 |
Token | I |
Token ID | 314 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
mie | +0.029 |
ppa | +0.028 |
etsy | +0.027 |
lves | +0.027 |
thel | +0.027 |
Neg logit contributions | |
show | -0.022 |
my | -0.021 |
your | -0.019 |
to | -0.019 |
new | -0.019 |
Token | have |
Token ID | 423 |
Feature activation | -6.87e-02 |
Pos logit contributions | |
mie | +0.321 |
etsy | +0.309 |
elope | +0.301 |
jo | +0.297 |
hew | +0.297 |
Neg logit contributions | |
show | -0.333 |
trick | -0.316 |
new | -0.307 |
grown | -0.296 |
test | -0.296 |
Token | neighbor |
Token ID | 4780 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
show | +0.085 |
trick | +0.080 |
new | +0.077 |
grown | +0.075 |
making | +0.074 |
Neg logit contributions | |
mie | -0.126 |
etsy | -0.121 |
elope | -0.120 |
hew | -0.117 |
jo | -0.116 |
Token | 's |
Token ID | 338 |
Feature activation | -5.28e-02 |
Pos logit contributions | |
etsy | +0.612 |
mie | +0.607 |
hew | +0.588 |
elope | +0.587 |
jo | +0.585 |
Neg logit contributions | |
show | -0.354 |
new | -0.318 |
trick | -0.317 |
my | -0.305 |
making | -0.304 |
Token | cat |
Token ID | 3797 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
show | +0.070 |
trick | +0.067 |
new | +0.064 |
grown | +0.061 |
making | +0.060 |
Neg logit contributions | |
mie | -0.105 |
etsy | -0.101 |
elope | -0.100 |
hew | -0.098 |
jo | -0.097 |
Token | keeps |
Token ID | 7622 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
mie | +0.602 |
etsy | +0.587 |
hew | +0.574 |
elope | +0.573 |
jo | +0.569 |
Neg logit contributions | |
show | -0.272 |
trick | -0.251 |
new | -0.243 |
grown | -0.226 |
making | -0.224 |
Token | coming |
Token ID | 2406 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.185 |
trick | +0.175 |
new | +0.169 |
grown | +0.158 |
test | +0.157 |
Neg logit contributions | |
mie | -0.352 |
etsy | -0.339 |
elope | -0.333 |
hew | -0.331 |
jo | -0.328 |
Token | into |
Token ID | 656 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
show | +0.110 |
trick | +0.100 |
new | +0.096 |
grown | +0.088 |
test | +0.086 |
Neg logit contributions | |
mie | -0.314 |
etsy | -0.306 |
elope | -0.301 |
hew | -0.299 |
jo | -0.297 |
Token | my |
Token ID | 616 |
Feature activation | -8.49e-02 |
Pos logit contributions | |
show | +0.193 |
trick | +0.183 |
new | +0.161 |
test | +0.147 |
grown | +0.144 |
Neg logit contributions | |
mie | -0.732 |
elope | -0.707 |
hew | -0.694 |
etsy | -0.692 |
jo | -0.686 |
Token | yard |
Token ID | 12699 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
show | +0.118 |
trick | +0.115 |
new | +0.107 |
making | +0.104 |
grown | +0.104 |
Neg logit contributions | |
mie | -0.165 |
elope | -0.160 |
etsy | -0.157 |
hew | -0.154 |
jo | -0.152 |
Token | and |
Token ID | 290 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
mie | +0.394 |
etsy | +0.380 |
elope | +0.377 |
hew | +0.374 |
jo | +0.371 |
Neg logit contributions | |
show | -0.185 |
trick | -0.175 |
new | -0.167 |
grown | -0.157 |
test | -0.155 |
Token | eating |
Token ID | 6600 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.138 |
new | +0.124 |
trick | +0.124 |
my | +0.120 |
making | +0.120 |
Neg logit contributions | |
mie | -0.227 |
etsy | -0.223 |
hew | -0.218 |
jo | -0.216 |
elope | -0.215 |
Token | all |
Token ID | 477 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
show | +0.122 |
trick | +0.115 |
new | +0.105 |
grown | +0.101 |
test | +0.101 |
Neg logit contributions | |
mie | -0.296 |
etsy | -0.283 |
hew | -0.281 |
elope | -0.280 |
jo | -0.273 |
Token | and |
Token ID | 290 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
show | +0.093 |
new | +0.082 |
trick | +0.082 |
for | +0.074 |
to | +0.074 |
Neg logit contributions | |
mie | -0.311 |
etsy | -0.303 |
hew | -0.298 |
elope | -0.297 |
pillar | -0.293 |
Token | watched |
Token ID | 7342 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
show | +0.172 |
new | +0.155 |
trick | +0.148 |
for | +0.146 |
the | +0.146 |
Neg logit contributions | |
etsy | -0.246 |
mie | -0.242 |
pillar | -0.238 |
hew | -0.237 |
storms | -0.236 |
Token | as |
Token ID | 355 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
show | +0.145 |
new | +0.130 |
trick | +0.129 |
for | +0.119 |
making | +0.117 |
Neg logit contributions | |
mie | -0.372 |
etsy | -0.364 |
hew | -0.357 |
elope | -0.355 |
pillar | -0.351 |
Token | he |
Token ID | 339 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
show | +0.107 |
new | +0.106 |
the | +0.098 |
good | +0.092 |
big | +0.091 |
Neg logit contributions | |
hew | -0.288 |
mie | -0.287 |
etsy | -0.286 |
pillar | -0.279 |
lves | -0.275 |
Token | disappeared |
Token ID | 12120 |
Feature activation | -8.45e-02 |
Pos logit contributions | |
etsy | +0.395 |
mie | +0.382 |
storms | +0.373 |
uddy | +0.368 |
lves | +0.367 |
Neg logit contributions | |
show | -0.352 |
trick | -0.317 |
grown | -0.313 |
new | -0.307 |
to | -0.301 |
Token | into |
Token ID | 656 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
show | +0.088 |
trick | +0.083 |
test | +0.077 |
new | +0.074 |
grown | +0.072 |
Neg logit contributions | |
mie | -0.197 |
etsy | -0.187 |
elope | -0.187 |
jo | -0.184 |
storms | -0.183 |
Token | the |
Token ID | 262 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.147 |
trick | +0.137 |
new | +0.111 |
test | +0.106 |
grown | +0.096 |
Neg logit contributions | |
mie | -0.780 |
elope | -0.758 |
jo | -0.746 |
etsy | -0.744 |
hew | -0.736 |
Token | distance |
Token ID | 5253 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
show | +0.151 |
new | +0.145 |
trick | +0.133 |
grown | +0.129 |
magic | +0.127 |
Neg logit contributions | |
mie | -0.280 |
etsy | -0.279 |
hew | -0.272 |
ppy | -0.267 |
jo | -0.266 |
Token | . |
Token ID | 13 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
mie | +0.055 |
etsy | +0.055 |
hew | +0.054 |
elope | +0.053 |
lves | +0.052 |
Neg logit contributions | |
show | -0.020 |
new | -0.019 |
trick | -0.018 |
for | -0.017 |
to | -0.017 |
Token | Gig |
Token ID | 19525 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
ppers | +0.051 |
ppa | +0.050 |
ppy | +0.050 |
lves | +0.050 |
x | +0.050 |
Neg logit contributions | |
his | -0.021 |
the | -0.020 |
my | -0.020 |
new | -0.019 |
to | -0.019 |
Token | i |
Token ID | 72 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
uddy | +0.430 |
och | +0.409 |
Rex | +0.406 |
storms | +0.404 |
â„¢ | +0.396 |
Neg logit contributions | |
new | -0.605 |
the | -0.604 |
for | -0.586 |
show | -0.580 |
to | -0.572 |
Token |
|
Token ID | 198 |
Feature activation | +9.36e-02 |
Pos logit contributions | |
mie | +0.041 |
elope | +0.039 |
etsy | +0.039 |
jo | +0.038 |
hew | +0.038 |
Neg logit contributions | |
show | -0.039 |
new | -0.037 |
trick | -0.036 |
grown | -0.036 |
making | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | +9.10e-02 |
Pos logit contributions | |
storms | +0.208 |
rified | +0.205 |
mie | +0.203 |
ley | +0.198 |
als | +0.196 |
Neg logit contributions | |
your | -0.120 |
my | -0.118 |
show | -0.109 |
his | -0.108 |
grown | -0.108 |
Token | They |
Token ID | 2990 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
storms | +0.190 |
rified | +0.182 |
mie | +0.176 |
ley | +0.175 |
als | +0.173 |
Neg logit contributions | |
your | -0.131 |
my | -0.130 |
show | -0.123 |
grown | -0.121 |
his | -0.115 |
Token | cracked |
Token ID | 21368 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
etsy | +0.538 |
storms | +0.527 |
mie | +0.525 |
jo | +0.523 |
elope | +0.514 |
Neg logit contributions | |
show | -0.364 |
trick | -0.297 |
grown | -0.292 |
test | -0.292 |
the | -0.288 |
Token | eggs |
Token ID | 9653 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
show | +0.135 |
trick | +0.124 |
test | +0.108 |
grown | +0.103 |
new | +0.102 |
Neg logit contributions | |
mie | -0.493 |
elope | -0.469 |
hew | -0.468 |
etsy | -0.466 |
rified | -0.464 |
Token | into |
Token ID | 656 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
mie | +0.521 |
etsy | +0.501 |
elope | +0.495 |
hew | +0.489 |
ppy | +0.482 |
Neg logit contributions | |
show | -0.209 |
trick | -0.204 |
new | -0.190 |
grown | -0.183 |
test | -0.178 |
Token | a |
Token ID | 257 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
show | +0.164 |
trick | +0.147 |
new | +0.129 |
test | +0.116 |
grown | +0.108 |
Neg logit contributions | |
mie | -0.776 |
etsy | -0.751 |
elope | -0.751 |
hew | -0.741 |
jo | -0.735 |
Token | bowl |
Token ID | 9396 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
show | +0.116 |
trick | +0.106 |
new | +0.105 |
grown | +0.095 |
test | +0.092 |
Neg logit contributions | |
mie | -0.319 |
etsy | -0.310 |
hew | -0.304 |
elope | -0.303 |
jo | -0.302 |
Token | , |
Token ID | 11 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
mie | +0.400 |
etsy | +0.389 |
elope | +0.383 |
hew | +0.379 |
jo | +0.376 |
Neg logit contributions | |
show | -0.177 |
trick | -0.172 |
new | -0.166 |
test | -0.156 |
grown | -0.153 |
Token | stirred |
Token ID | 33091 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
trick | +0.132 |
show | +0.122 |
test | +0.117 |
new | +0.111 |
job | +0.109 |
Neg logit contributions | |
mie | -0.232 |
elope | -0.223 |
etsy | -0.217 |
ppa | -0.211 |
hew | -0.209 |
Token | them |
Token ID | 606 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
show | +0.144 |
trick | +0.135 |
new | +0.123 |
test | +0.123 |
grown | +0.120 |
Neg logit contributions | |
mie | -0.298 |
etsy | -0.284 |
elope | -0.284 |
hew | -0.283 |
jo | -0.275 |
Token | Larry |
Token ID | 13633 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
my | +0.187 |
show | +0.187 |
new | +0.187 |
the | +0.182 |
your | +0.182 |
Neg logit contributions | |
hew | -0.211 |
etsy | -0.208 |
oped | -0.203 |
mie | -0.203 |
ppa | -0.202 |
Token | . |
Token ID | 13 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
mie | +0.911 |
etsy | +0.904 |
hew | +0.885 |
elope | +0.877 |
storms | +0.867 |
Neg logit contributions | |
show | -0.348 |
new | -0.324 |
trick | -0.315 |
my | -0.297 |
for | -0.293 |
Token | What |
Token ID | 1867 |
Feature activation | +7.32e-02 |
Pos logit contributions | |
mie | +0.045 |
ppa | +0.045 |
hew | +0.044 |
lves | +0.043 |
thel | +0.043 |
Neg logit contributions | |
my | -0.034 |
show | -0.033 |
your | -0.032 |
new | -0.031 |
to | -0.031 |
Token | â |
Token ID | 22940 |
Feature activation | +3.34e-02 |
Pos logit contributions | |
mie | +0.165 |
etsy | +0.157 |
elope | +0.157 |
jo | +0.156 |
hew | +0.155 |
Neg logit contributions | |
show | -0.079 |
trick | -0.073 |
new | -0.067 |
making | -0.065 |
test | -0.064 |
Token | € |
Token ID | 26391 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
mie | +0.049 |
etsy | +0.048 |
elope | +0.046 |
hew | +0.046 |
jo | +0.045 |
Neg logit contributions | |
show | -0.064 |
trick | -0.061 |
new | -0.060 |
test | -0.058 |
grown | -0.058 |
Token | â„¢ |
Token ID | 8151 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
ley | +0.309 |
rified | +0.303 |
lves | +0.301 |
ppa | +0.298 |
mie | +0.296 |
Neg logit contributions | |
show | -0.228 |
to | -0.213 |
grown | -0.211 |
my | -0.210 |
time | -0.207 |
Token | s |
Token ID | 82 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
elope | +0.478 |
mie | +0.450 |
etsy | +0.441 |
lves | +0.431 |
hew | +0.429 |
Neg logit contributions | |
show | -0.595 |
new | -0.571 |
to | -0.570 |
my | -0.551 |
for | -0.548 |
Token | yours |
Token ID | 12431 |
Feature activation | +9.61e-02 |
Pos logit contributions | |
trick | +0.041 |
show | +0.040 |
new | +0.035 |
grown | +0.034 |
matching | +0.034 |
Neg logit contributions | |
mie | -0.108 |
jo | -0.103 |
elope | -0.100 |
thel | -0.100 |
etsy | -0.100 |
Token | ? |
Token ID | 30 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
mie | +0.218 |
pillar | +0.200 |
etsy | +0.200 |
elope | +0.199 |
jo | +0.199 |
Neg logit contributions | |
trick | -0.092 |
show | -0.090 |
new | -0.089 |
grown | -0.085 |
matching | -0.083 |
Token | â |
Token ID | 22940 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
ppa | +0.018 |
hew | +0.018 |
lves | +0.018 |
mie | +0.017 |
ppers | +0.017 |
Neg logit contributions | |
my | -0.012 |
show | -0.012 |
your | -0.011 |
to | -0.011 |
the | -0.011 |
Token | € |
Token ID | 26391 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
mie | +0.049 |
etsy | +0.049 |
elope | +0.046 |
hew | +0.045 |
lves | +0.045 |
Neg logit contributions | |
show | -0.064 |
trick | -0.061 |
new | -0.058 |
test | -0.058 |
grown | -0.056 |
Token | car |
Token ID | 1097 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
show | +0.106 |
trick | +0.102 |
new | +0.100 |
grown | +0.096 |
test | +0.095 |
Neg logit contributions | |
mie | -0.095 |
etsy | -0.091 |
elope | -0.088 |
hew | -0.088 |
jo | -0.086 |
Token | came |
Token ID | 1625 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
mie | +0.388 |
etsy | +0.374 |
elope | +0.363 |
hew | +0.360 |
jo | +0.356 |
Neg logit contributions | |
show | -0.389 |
trick | -0.370 |
new | -0.362 |
grown | -0.348 |
making | -0.345 |
Token | speeding |
Token ID | 26347 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
show | +0.095 |
trick | +0.087 |
new | +0.083 |
grown | +0.077 |
test | +0.076 |
Neg logit contributions | |
mie | -0.255 |
etsy | -0.248 |
elope | -0.244 |
hew | -0.243 |
jo | -0.241 |
Token | by |
Token ID | 416 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
mie | +0.030 |
etsy | +0.029 |
elope | +0.029 |
hew | +0.028 |
jo | +0.028 |
Neg logit contributions | |
show | -0.011 |
trick | -0.010 |
new | -0.010 |
to | -0.009 |
for | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
show | +0.187 |
trick | +0.173 |
new | +0.166 |
test | +0.160 |
grown | +0.157 |
Neg logit contributions | |
mie | -0.362 |
elope | -0.350 |
etsy | -0.346 |
hew | -0.344 |
jo | -0.336 |
Token | Nut |
Token ID | 11959 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
show | +0.171 |
new | +0.165 |
making | +0.164 |
the | +0.157 |
to | +0.157 |
Neg logit contributions | |
jo | -0.181 |
mie | -0.177 |
etsy | -0.176 |
hew | -0.175 |
ppy | -0.174 |
Token | ty |
Token ID | 774 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
och | +0.616 |
apa | +0.605 |
etsy | +0.598 |
emic | +0.587 |
storms | +0.585 |
Neg logit contributions | |
trick | -0.550 |
new | -0.522 |
show | -0.517 |
the | -0.512 |
for | -0.507 |
Token | was |
Token ID | 373 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
etsy | +0.501 |
och | +0.498 |
thel | +0.490 |
mie | +0.472 |
Mic | +0.471 |
Neg logit contributions | |
show | -0.309 |
grown | -0.289 |
to | -0.279 |
trick | -0.269 |
big | -0.264 |
Token | hit |
Token ID | 2277 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
show | +0.187 |
trick | +0.183 |
test | +0.172 |
new | +0.170 |
math | +0.168 |
Neg logit contributions | |
mie | -0.256 |
elope | -0.236 |
etsy | -0.229 |
lves | -0.229 |
storms | -0.227 |
Token | . |
Token ID | 13 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
new | +0.132 |
to | +0.128 |
for | +0.125 |
the | +0.124 |
show | +0.121 |
Neg logit contributions | |
elope | -0.390 |
etsy | -0.387 |
mie | -0.385 |
jo | -0.382 |
thel | -0.381 |
Token | |
Token ID | 220 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
mie | +0.036 |
ppy | +0.036 |
jo | +0.035 |
la | +0.034 |
hew | +0.033 |
Neg logit contributions | |
new | -0.036 |
to | -0.036 |
show | -0.036 |
the | -0.034 |
grown | -0.034 |
Token | playing |
Token ID | 2712 |
Feature activation | -7.89e-02 |
Pos logit contributions | |
show | +0.060 |
trick | +0.055 |
new | +0.052 |
grown | +0.047 |
test | +0.047 |
Neg logit contributions | |
mie | -0.181 |
etsy | -0.175 |
elope | -0.172 |
hew | -0.172 |
jo | -0.170 |
Token | on |
Token ID | 319 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
show | +0.071 |
trick | +0.071 |
new | +0.066 |
grown | +0.064 |
chance | +0.064 |
Neg logit contributions | |
mie | -0.179 |
elope | -0.172 |
Hop | -0.170 |
Max | -0.169 |
rified | -0.166 |
Token | the |
Token ID | 262 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
trick | +0.130 |
show | +0.126 |
chance | +0.095 |
grown | +0.093 |
test | +0.092 |
Neg logit contributions | |
mie | -0.538 |
elope | -0.528 |
Max | -0.499 |
jo | -0.496 |
storms | -0.496 |
Token | beach |
Token ID | 10481 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
show | +0.157 |
trick | +0.151 |
new | +0.140 |
grown | +0.138 |
my | +0.137 |
Neg logit contributions | |
mie | -0.253 |
elope | -0.241 |
etsy | -0.237 |
jo | -0.234 |
hew | -0.233 |
Token | . |
Token ID | 13 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
mie | +0.441 |
elope | +0.424 |
etsy | +0.423 |
jo | +0.414 |
hew | +0.413 |
Neg logit contributions | |
show | -0.211 |
trick | -0.202 |
new | -0.192 |
grown | -0.183 |
my | -0.182 |
Token | Jack |
Token ID | 3619 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
mie | +0.044 |
etsy | +0.043 |
elope | +0.042 |
hew | +0.041 |
jo | +0.041 |
Neg logit contributions | |
show | -0.037 |
trick | -0.036 |
new | -0.035 |
grown | -0.033 |
test | -0.033 |
Token | had |
Token ID | 550 |
Feature activation | -4.54e-02 |
Pos logit contributions | |
etsy | +0.680 |
rified | +0.661 |
hew | +0.650 |
lor | +0.643 |
mie | +0.640 |
Neg logit contributions | |
show | -0.476 |
making | -0.437 |
to | -0.437 |
new | -0.429 |
grown | -0.422 |
Token | a |
Token ID | 257 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.032 |
trick | +0.028 |
new | +0.025 |
test | +0.024 |
for | +0.021 |
Neg logit contributions | |
mie | -0.123 |
etsy | -0.118 |
elope | -0.116 |
hew | -0.116 |
jo | -0.115 |
Token | bucket |
Token ID | 19236 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
show | +0.119 |
trick | +0.112 |
making | +0.104 |
my | +0.102 |
for | +0.099 |
Neg logit contributions | |
mie | -0.292 |
etsy | -0.284 |
elope | -0.277 |
pillar | -0.270 |
jo | -0.269 |
Token | and |
Token ID | 290 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
mie | +0.372 |
etsy | +0.350 |
jo | +0.345 |
ongo | +0.343 |
storms | +0.341 |
Neg logit contributions | |
show | -0.178 |
trick | -0.176 |
grown | -0.163 |
test | -0.163 |
new | -0.159 |
Token | Jill |
Token ID | 22772 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
show | +0.161 |
trick | +0.157 |
new | +0.148 |
test | +0.146 |
grown | +0.141 |
Neg logit contributions | |
mie | -0.177 |
etsy | -0.166 |
elope | -0.162 |
hew | -0.161 |
jo | -0.161 |
Token | walking |
Token ID | 6155 |
Feature activation | -4.59e-02 |
Pos logit contributions | |
trick | +0.104 |
show | +0.103 |
test | +0.091 |
new | +0.091 |
style | +0.088 |
Neg logit contributions | |
mie | -0.156 |
etsy | -0.145 |
ppa | -0.141 |
elope | -0.141 |
hew | -0.140 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
show | +0.033 |
trick | +0.031 |
new | +0.028 |
grown | +0.026 |
test | +0.025 |
Neg logit contributions | |
mie | -0.122 |
etsy | -0.119 |
elope | -0.117 |
jo | -0.116 |
hew | -0.116 |
Token | they |
Token ID | 484 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
the | +0.135 |
making | +0.127 |
new | +0.126 |
show | +0.124 |
to | +0.119 |
Neg logit contributions | |
hew | -0.233 |
mie | -0.228 |
pillar | -0.227 |
jo | -0.225 |
lor | -0.223 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
jo | +0.544 |
uddy | +0.543 |
etsy | +0.536 |
hew | +0.531 |
elope | +0.530 |
Neg logit contributions | |
the | -0.254 |
grown | -0.253 |
show | -0.253 |
to | -0.245 |
making | -0.229 |
Token | a |
Token ID | 257 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
new | +0.033 |
the | +0.017 |
show | +0.014 |
big | +0.010 |
a | +0.007 |
Neg logit contributions | |
etsy | -0.497 |
mie | -0.493 |
hew | -0.488 |
ppy | -0.484 |
jo | -0.482 |
Token | man |
Token ID | 582 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
show | +0.105 |
new | +0.096 |
trick | +0.095 |
grown | +0.084 |
test | +0.081 |
Neg logit contributions | |
mie | -0.328 |
etsy | -0.319 |
hew | -0.317 |
jo | -0.313 |
elope | -0.312 |
Token | who |
Token ID | 508 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
mie | +0.713 |
etsy | +0.680 |
elope | +0.673 |
jo | +0.665 |
hew | +0.663 |
Neg logit contributions | |
show | -0.352 |
trick | -0.338 |
new | -0.325 |
grown | -0.305 |
test | -0.298 |
Token | looked |
Token ID | 3114 |
Feature activation | -7.91e-02 |
Pos logit contributions | |
hew | +0.314 |
etsy | +0.311 |
unny | +0.298 |
ppy | +0.296 |
uddy | +0.291 |
Neg logit contributions | |
show | -0.189 |
the | -0.177 |
new | -0.167 |
making | -0.166 |
his | -0.163 |
Token | very |
Token ID | 845 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
trick | +0.113 |
show | +0.105 |
test | +0.099 |
grown | +0.094 |
design | +0.094 |
Neg logit contributions | |
mie | -0.157 |
rified | -0.141 |
lves | -0.141 |
etsy | -0.135 |
mi | -0.133 |
Token | sad |
Token ID | 6507 |
Feature activation | -7.84e-02 |
Pos logit contributions | |
show | +0.190 |
trick | +0.188 |
test | +0.169 |
making | +0.166 |
grown | +0.159 |
Neg logit contributions | |
mie | -0.368 |
etsy | -0.345 |
elope | -0.334 |
hew | -0.332 |
jo | -0.332 |
Token | . |
Token ID | 13 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
show | +0.096 |
trick | +0.093 |
new | +0.086 |
test | +0.084 |
grown | +0.083 |
Neg logit contributions | |
mie | -0.166 |
etsy | -0.157 |
jo | -0.155 |
storms | -0.155 |
elope | -0.155 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +8.96e-02 |
Pos logit contributions | |
lves | +0.041 |
ppa | +0.040 |
mie | +0.040 |
ley | +0.040 |
mi | +0.039 |
Neg logit contributions | |
my | -0.027 |
your | -0.025 |
show | -0.025 |
to | -0.023 |
the | -0.023 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
ppa | +0.191 |
etsy | +0.191 |
mie | +0.190 |
lves | +0.189 |
hew | +0.182 |
Neg logit contributions | |
show | -0.114 |
the | -0.110 |
new | -0.110 |
to | -0.108 |
trick | -0.102 |
Token | there |
Token ID | 612 |
Feature activation | +7.86e-02 |
Pos logit contributions | |
new | +0.026 |
show | +0.025 |
for | +0.023 |
to | +0.023 |
trick | +0.023 |
Neg logit contributions | |
mie | -0.047 |
etsy | -0.045 |
elope | -0.045 |
thel | -0.044 |
hew | -0.044 |
Token | was |
Token ID | 373 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
mie | +0.170 |
etsy | +0.167 |
ppa | +0.165 |
storms | +0.163 |
thel | +0.163 |
Neg logit contributions | |
show | -0.095 |
new | -0.093 |
trick | -0.087 |
to | -0.085 |
the | -0.083 |
Token | a |
Token ID | 257 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
show | +0.088 |
trick | +0.080 |
new | +0.072 |
test | +0.065 |
grown | +0.064 |
Neg logit contributions | |
mie | -0.365 |
etsy | -0.355 |
elope | -0.351 |
hew | -0.349 |
jo | -0.346 |
Token | boy |
Token ID | 2933 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
show | +0.093 |
new | +0.089 |
trick | +0.075 |
grown | +0.075 |
big | +0.073 |
Neg logit contributions | |
mie | -0.365 |
hew | -0.361 |
storms | -0.359 |
rified | -0.358 |
etsy | -0.357 |
Token | called |
Token ID | 1444 |
Feature activation | -3.80e-02 |
Pos logit contributions | |
mie | +0.542 |
elope | +0.515 |
etsy | +0.513 |
jo | +0.503 |
hew | +0.494 |
Neg logit contributions | |
show | -0.551 |
trick | -0.538 |
new | -0.525 |
grown | -0.502 |
test | -0.498 |
Token | J |
Token ID | 449 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
show | +0.062 |
my | +0.058 |
your | +0.057 |
new | +0.057 |
trick | +0.057 |
Neg logit contributions | |
mie | -0.072 |
etsy | -0.067 |
pillar | -0.067 |
hew | -0.066 |
elope | -0.065 |
Token | ax |
Token ID | 897 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
mie | +0.135 |
etsy | +0.130 |
elope | +0.129 |
hew | +0.118 |
storms | +0.116 |
Neg logit contributions | |
show | -0.308 |
trick | -0.300 |
new | -0.294 |
grown | -0.287 |
test | -0.284 |
Token | . |
Token ID | 13 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
etsy | +0.749 |
mie | +0.743 |
rified | +0.732 |
hew | +0.729 |
storms | +0.719 |
Neg logit contributions | |
show | -0.245 |
new | -0.212 |
trick | -0.210 |
to | -0.208 |
for | -0.202 |
Token | He |
Token ID | 679 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
mie | +0.034 |
etsy | +0.032 |
hew | +0.031 |
elope | +0.031 |
jo | +0.031 |
Neg logit contributions | |
show | -0.043 |
trick | -0.042 |
new | -0.040 |
test | -0.039 |
grown | -0.039 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ppa | +0.213 |
etsy | +0.213 |
lves | +0.211 |
mie | +0.211 |
hew | +0.202 |
Neg logit contributions | |
show | -0.105 |
the | -0.104 |
new | -0.101 |
to | -0.100 |
big | -0.093 |
Token | upon |
Token ID | 2402 |
Feature activation | -6.94e-02 |
Pos logit contributions | |
new | +0.028 |
show | +0.027 |
for | +0.025 |
trick | +0.025 |
to | +0.025 |
Neg logit contributions | |
mie | -0.050 |
etsy | -0.048 |
elope | -0.047 |
thel | -0.047 |
storms | -0.047 |
Token | a |
Token ID | 257 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
show | +0.026 |
trick | +0.021 |
new | +0.021 |
grown | +0.015 |
making | +0.013 |
Neg logit contributions | |
mie | -0.211 |
etsy | -0.208 |
hew | -0.203 |
elope | -0.203 |
jo | -0.202 |
Token | time |
Token ID | 640 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
show | +0.054 |
trick | +0.045 |
new | +0.042 |
grown | +0.033 |
test | +0.031 |
Neg logit contributions | |
mie | -0.378 |
etsy | -0.368 |
elope | -0.362 |
hew | -0.360 |
jo | -0.360 |
Token | , |
Token ID | 11 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
show | +0.061 |
trick | +0.053 |
new | +0.051 |
grown | +0.044 |
making | +0.042 |
Neg logit contributions | |
mie | -0.298 |
etsy | -0.290 |
elope | -0.286 |
hew | -0.284 |
jo | -0.283 |
Token | there |
Token ID | 612 |
Feature activation | +7.90e-02 |
Pos logit contributions | |
show | +0.108 |
new | +0.105 |
trick | +0.100 |
making | +0.095 |
for | +0.095 |
Neg logit contributions | |
mie | -0.260 |
etsy | -0.253 |
storms | -0.249 |
jo | -0.249 |
hew | -0.247 |
Token | was |
Token ID | 373 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
mie | +0.166 |
etsy | +0.162 |
hew | +0.155 |
jo | +0.155 |
ppa | +0.154 |
Neg logit contributions | |
show | -0.104 |
new | -0.099 |
trick | -0.098 |
grown | -0.093 |
making | -0.091 |
Token | a |
Token ID | 257 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
show | +0.063 |
trick | +0.052 |
new | +0.050 |
grown | +0.040 |
making | +0.037 |
Neg logit contributions | |
mie | -0.398 |
etsy | -0.389 |
elope | -0.383 |
hew | -0.381 |
jo | -0.380 |
Token | little |
Token ID | 1310 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
show | +0.101 |
new | +0.094 |
trick | +0.085 |
grown | +0.081 |
red | +0.076 |
Neg logit contributions | |
mie | -0.349 |
hew | -0.344 |
etsy | -0.342 |
jo | -0.339 |
storms | -0.337 |
Token | boy |
Token ID | 2933 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
show | +0.026 |
new | +0.025 |
red | +0.025 |
blue | +0.024 |
green | +0.024 |
Neg logit contributions | |
hew | -0.033 |
mie | -0.032 |
lor | -0.032 |
etsy | -0.032 |
jo | -0.032 |
Token | named |
Token ID | 3706 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
mie | +0.530 |
elope | +0.507 |
etsy | +0.499 |
jo | +0.495 |
hew | +0.478 |
Neg logit contributions | |
show | -0.556 |
trick | -0.546 |
new | -0.536 |
grown | -0.511 |
test | -0.506 |
Token | to |
Token ID | 284 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
show | +0.093 |
new | +0.082 |
trick | +0.082 |
for | +0.074 |
to | +0.074 |
Neg logit contributions | |
mie | -0.311 |
etsy | -0.303 |
hew | -0.298 |
elope | -0.297 |
pillar | -0.293 |
Token | the |
Token ID | 262 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
show | +0.188 |
new | +0.156 |
trick | +0.151 |
for | +0.133 |
my | +0.128 |
Neg logit contributions | |
mie | -0.723 |
etsy | -0.717 |
hew | -0.707 |
elope | -0.689 |
jo | -0.687 |
Token | other |
Token ID | 584 |
Feature activation | -1.52e-02 |
Pos logit contributions | |
show | +0.175 |
new | +0.165 |
trick | +0.161 |
grown | +0.151 |
test | +0.147 |
Neg logit contributions | |
mie | -0.269 |
etsy | -0.266 |
hew | -0.258 |
jo | -0.255 |
oped | -0.255 |
Token | animals |
Token ID | 4695 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
show | +0.018 |
new | +0.016 |
trick | +0.016 |
grown | +0.015 |
for | +0.015 |
Neg logit contributions | |
mie | -0.034 |
etsy | -0.034 |
hew | -0.033 |
elope | -0.033 |
jo | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
mie | +0.493 |
etsy | +0.483 |
hew | +0.473 |
elope | +0.473 |
jo | +0.468 |
Neg logit contributions | |
show | -0.166 |
trick | -0.147 |
new | -0.144 |
making | -0.128 |
grown | -0.128 |
Token | They |
Token ID | 1119 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ppers | +0.038 |
ppa | +0.038 |
lves | +0.038 |
mie | +0.037 |
pper | +0.036 |
Neg logit contributions | |
the | -0.016 |
my | -0.016 |
his | -0.015 |
your | -0.015 |
to | -0.014 |
Token | say |
Token ID | 910 |
Feature activation | -1.78e-02 |
Pos logit contributions | |
etsy | +0.468 |
hew | +0.454 |
mie | +0.453 |
storms | +0.453 |
uddy | +0.445 |
Neg logit contributions | |
show | -0.367 |
the | -0.307 |
grown | -0.300 |
new | -0.297 |
for | -0.297 |
Token | thank |
Token ID | 5875 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
show | +0.020 |
new | +0.019 |
trick | +0.019 |
grown | +0.018 |
to | +0.017 |
Neg logit contributions | |
mie | -0.041 |
etsy | -0.040 |
elope | -0.039 |
hew | -0.039 |
jo | -0.039 |
Token | you |
Token ID | 345 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
show | +0.183 |
new | +0.165 |
trick | +0.164 |
your | +0.161 |
for | +0.161 |
Neg logit contributions | |
mie | -0.261 |
etsy | -0.257 |
jo | -0.249 |
elope | -0.247 |
pillar | -0.246 |
Token | to |
Token ID | 284 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
mie | +0.477 |
etsy | +0.468 |
elope | +0.462 |
lves | +0.460 |
oped | +0.456 |
Neg logit contributions | |
show | -0.057 |
new | -0.051 |
for | -0.050 |
to | -0.049 |
trick | -0.042 |
Token | the |
Token ID | 262 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
show | +0.157 |
trick | +0.137 |
new | +0.129 |
grown | +0.112 |
test | +0.108 |
Neg logit contributions | |
mie | -0.693 |
etsy | -0.676 |
elope | -0.664 |
hew | -0.662 |
jo | -0.658 |
Token | He |
Token ID | 679 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
mie | +0.057 |
etsy | +0.054 |
elope | +0.052 |
hew | +0.051 |
lves | +0.051 |
Neg logit contributions | |
show | -0.052 |
new | -0.049 |
trick | -0.049 |
grown | -0.047 |
to | -0.046 |
Token | was |
Token ID | 373 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
mie | +0.463 |
etsy | +0.453 |
elope | +0.438 |
hew | +0.436 |
jo | +0.429 |
Neg logit contributions | |
show | -0.416 |
trick | -0.389 |
new | -0.384 |
grown | -0.375 |
making | -0.362 |
Token | so |
Token ID | 523 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
trick | +0.185 |
show | +0.169 |
test | +0.162 |
new | +0.150 |
skills | +0.148 |
Neg logit contributions | |
mie | -0.251 |
elope | -0.226 |
storms | -0.222 |
lves | -0.220 |
la | -0.219 |
Token | excited |
Token ID | 6568 |
Feature activation | -8.88e-02 |
Pos logit contributions | |
trick | +0.180 |
show | +0.172 |
test | +0.158 |
new | +0.157 |
math | +0.155 |
Neg logit contributions | |
mie | -0.231 |
etsy | -0.219 |
jo | -0.209 |
hew | -0.209 |
elope | -0.207 |
Token | ! |
Token ID | 0 |
Feature activation | +3.40e-02 |
Pos logit contributions | |
show | +0.072 |
trick | +0.067 |
new | +0.062 |
grown | +0.058 |
test | +0.057 |
Neg logit contributions | |
mie | -0.227 |
etsy | -0.219 |
jo | -0.217 |
elope | -0.216 |
hew | -0.215 |
Token |
|
Token ID | 198 |
Feature activation | +9.31e-02 |
Pos logit contributions | |
mie | +0.070 |
etsy | +0.067 |
ppa | +0.067 |
lves | +0.066 |
ppy | +0.066 |
Neg logit contributions | |
show | -0.049 |
new | -0.047 |
to | -0.045 |
trick | -0.044 |
grown | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | +9.17e-02 |
Pos logit contributions | |
mie | +0.211 |
etsy | +0.202 |
lves | +0.202 |
storms | +0.200 |
ppy | +0.199 |
Neg logit contributions | |
new | -0.112 |
show | -0.112 |
to | -0.108 |
trick | -0.105 |
the | -0.101 |
Token | He |
Token ID | 1544 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
mie | +0.123 |
etsy | +0.116 |
elope | +0.111 |
hew | +0.109 |
jo | +0.108 |
Neg logit contributions | |
show | -0.191 |
trick | -0.185 |
new | -0.182 |
grown | -0.177 |
test | -0.174 |
Token | put |
Token ID | 1234 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
mie | +0.369 |
etsy | +0.348 |
elope | +0.342 |
jo | +0.339 |
hew | +0.339 |
Neg logit contributions | |
show | -0.365 |
trick | -0.358 |
new | -0.348 |
test | -0.332 |
making | -0.327 |
Token | on |
Token ID | 319 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
trick | +0.111 |
show | +0.103 |
grown | +0.093 |
test | +0.091 |
new | +0.086 |
Neg logit contributions | |
mie | -0.329 |
mi | -0.296 |
hew | -0.296 |
ley | -0.295 |
thel | -0.294 |
Token | his |
Token ID | 465 |
Feature activation | -5.08e-02 |
Pos logit contributions | |
trick | +0.165 |
show | +0.151 |
chance | +0.139 |
test | +0.131 |
answer | +0.124 |
Neg logit contributions | |
mie | -0.501 |
hew | -0.457 |
jo | -0.452 |
elope | -0.450 |
mi | -0.447 |
Token | with |
Token ID | 351 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
show | +0.072 |
grown | +0.068 |
trick | +0.068 |
new | +0.066 |
test | +0.062 |
Neg logit contributions | |
mie | -0.250 |
etsy | -0.235 |
hew | -0.233 |
Hop | -0.233 |
elope | -0.232 |
Token | you |
Token ID | 345 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
show | +0.259 |
my | +0.256 |
new | +0.247 |
your | +0.246 |
the | +0.230 |
Neg logit contributions | |
elope | -0.405 |
jo | -0.403 |
etsy | -0.401 |
mie | -0.401 |
hew | -0.388 |
Token | , |
Token ID | 11 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
mie | +0.370 |
etsy | +0.356 |
hew | +0.350 |
elope | +0.350 |
jo | +0.346 |
Neg logit contributions | |
show | -0.170 |
trick | -0.160 |
new | -0.152 |
grown | -0.144 |
test | -0.143 |
Token | Spot |
Token ID | 15899 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
show | +0.188 |
new | +0.183 |
my | +0.177 |
trick | +0.172 |
for | +0.167 |
Neg logit contributions | |
oped | -0.220 |
elope | -0.218 |
jo | -0.216 |
mie | -0.216 |
hew | -0.213 |
Token | !" |
Token ID | 2474 |
Feature activation | +5.57e-02 |
Pos logit contributions | |
etsy | +0.923 |
mie | +0.915 |
hew | +0.895 |
jo | +0.885 |
oped | +0.885 |
Neg logit contributions | |
show | -0.284 |
for | -0.257 |
new | -0.253 |
my | -0.249 |
trick | -0.246 |
Token |
|
Token ID | 198 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
ppy | +0.107 |
mie | +0.105 |
hew | +0.104 |
lves | +0.104 |
jo | +0.103 |
Neg logit contributions | |
show | -0.086 |
to | -0.083 |
the | -0.081 |
new | -0.080 |
his | -0.078 |
Token |
|
Token ID | 198 |
Feature activation | +7.96e-02 |
Pos logit contributions | |
mie | +0.187 |
rified | +0.186 |
storms | +0.184 |
lves | +0.180 |
ley | +0.178 |
Neg logit contributions | |
new | -0.091 |
show | -0.087 |
to | -0.084 |
the | -0.081 |
trick | -0.081 |
Token | They |
Token ID | 2990 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
storms | +0.114 |
rified | +0.109 |
mie | +0.108 |
jo | +0.108 |
ley | +0.105 |
Neg logit contributions | |
show | -0.155 |
trick | -0.154 |
my | -0.150 |
new | -0.150 |
your | -0.147 |
Token | played |
Token ID | 2826 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
mie | +0.519 |
etsy | +0.510 |
elope | +0.506 |
jo | +0.504 |
storms | +0.500 |
Neg logit contributions | |
show | -0.362 |
trick | -0.323 |
new | -0.318 |
grown | -0.313 |
for | -0.305 |
Token | all |
Token ID | 477 |
Feature activation | -1.71e-02 |
Pos logit contributions | |
show | +0.187 |
trick | +0.184 |
test | +0.181 |
grown | +0.177 |
design | +0.175 |
Neg logit contributions | |
mie | -0.295 |
elope | -0.285 |
Hop | -0.284 |
hew | -0.282 |
Max | -0.280 |
Token | day |
Token ID | 1110 |
Feature activation | +1.83e-02 |
Pos logit contributions | |
trick | +0.017 |
show | +0.017 |
test | +0.016 |
grown | +0.016 |
magic | +0.015 |
Neg logit contributions | |
jo | -0.037 |
elope | -0.037 |
mie | -0.037 |
Rex | -0.036 |
Max | -0.035 |
Token | They |
Token ID | 2990 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
mie | +0.143 |
jo | +0.143 |
storms | +0.139 |
elope | +0.138 |
etsy | +0.133 |
Neg logit contributions | |
show | -0.143 |
new | -0.139 |
trick | -0.135 |
grown | -0.135 |
my | -0.133 |
Token | ran |
Token ID | 4966 |
Feature activation | -6.41e-02 |
Pos logit contributions | |
etsy | +0.492 |
jo | +0.488 |
storms | +0.485 |
mie | +0.483 |
elope | +0.471 |
Neg logit contributions | |
show | -0.399 |
grown | -0.351 |
trick | -0.344 |
new | -0.335 |
the | -0.334 |
Token | back |
Token ID | 736 |
Feature activation | -5.02e-02 |
Pos logit contributions | |
show | +0.050 |
trick | +0.047 |
new | +0.043 |
test | +0.040 |
grown | +0.040 |
Neg logit contributions | |
mie | -0.166 |
etsy | -0.161 |
elope | -0.158 |
hew | -0.157 |
jo | -0.156 |
Token | to |
Token ID | 284 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
trick | +0.032 |
show | +0.031 |
grown | +0.027 |
design | +0.026 |
test | +0.026 |
Neg logit contributions | |
mie | -0.130 |
elope | -0.128 |
etsy | -0.125 |
uddy | -0.123 |
jo | -0.122 |
Token | the |
Token ID | 262 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
trick | +0.262 |
show | +0.251 |
test | +0.234 |
grown | +0.231 |
style | +0.229 |
Neg logit contributions | |
mie | -0.516 |
etsy | -0.495 |
elope | -0.491 |
lves | -0.467 |
hew | -0.466 |
Token | house |
Token ID | 2156 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
trick | +0.145 |
show | +0.144 |
making | +0.139 |
for | +0.134 |
matching | +0.126 |
Neg logit contributions | |
mie | -0.254 |
elope | -0.238 |
pillar | -0.236 |
Hop | -0.236 |
etsy | -0.231 |
Token | , |
Token ID | 11 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
mie | +0.367 |
elope | +0.361 |
storms | +0.348 |
jo | +0.344 |
oped | +0.337 |
Neg logit contributions | |
trick | -0.205 |
my | -0.198 |
show | -0.192 |
test | -0.191 |
your | -0.188 |
Token | happy |
Token ID | 3772 |
Feature activation | -6.69e-02 |
Pos logit contributions | |
show | +0.123 |
trick | +0.119 |
new | +0.112 |
test | +0.107 |
grown | +0.105 |
Neg logit contributions | |
mie | -0.253 |
etsy | -0.244 |
elope | -0.241 |
hew | -0.235 |
jo | -0.234 |
Token | and |
Token ID | 290 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
show | +0.058 |
trick | +0.054 |
new | +0.051 |
test | +0.049 |
grown | +0.047 |
Neg logit contributions | |
mie | -0.165 |
etsy | -0.159 |
elope | -0.159 |
storms | -0.157 |
hew | -0.155 |
Token | hungry |
Token ID | 14720 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
trick | +0.139 |
math | +0.134 |
test | +0.132 |
show | +0.131 |
new | +0.125 |
Neg logit contributions | |
mie | -0.208 |
elope | -0.202 |
etsy | -0.197 |
hew | -0.187 |
oped | -0.185 |
Token | . |
Token ID | 13 |
Feature activation | +9.93e-03 |
Pos logit contributions | |
show | +0.037 |
trick | +0.035 |
new | +0.033 |
test | +0.032 |
grown | +0.031 |
Neg logit contributions | |
mie | -0.070 |
etsy | -0.067 |
elope | -0.067 |
storms | -0.066 |
hew | -0.065 |
Token | a |
Token ID | 257 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
show | +0.058 |
new | +0.054 |
trick | +0.053 |
grown | +0.049 |
making | +0.047 |
Neg logit contributions | |
mie | -0.143 |
etsy | -0.139 |
elope | -0.136 |
hew | -0.135 |
jo | -0.135 |
Token | dog |
Token ID | 3290 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
show | +0.109 |
trick | +0.099 |
new | +0.095 |
grown | +0.087 |
test | +0.085 |
Neg logit contributions | |
mie | -0.324 |
etsy | -0.314 |
elope | -0.309 |
hew | -0.308 |
jo | -0.306 |
Token | named |
Token ID | 3706 |
Feature activation | +2.75e-02 |
Pos logit contributions | |
mie | +0.485 |
etsy | +0.466 |
elope | +0.454 |
hew | +0.450 |
jo | +0.446 |
Neg logit contributions | |
show | -0.461 |
trick | -0.440 |
new | -0.431 |
grown | -0.413 |
test | -0.409 |
Token | Max |
Token ID | 5436 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
mie | +0.051 |
oped | +0.049 |
etsy | +0.048 |
hew | +0.048 |
ppa | +0.047 |
Neg logit contributions | |
show | -0.047 |
new | -0.045 |
my | -0.044 |
the | -0.044 |
trick | -0.043 |
Token | lived |
Token ID | 5615 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
mie | +0.905 |
etsy | +0.890 |
hew | +0.873 |
elope | +0.865 |
jo | +0.854 |
Neg logit contributions | |
show | -0.381 |
trick | -0.343 |
new | -0.333 |
grown | -0.315 |
making | -0.312 |
Token | . |
Token ID | 13 |
Feature activation | +2.44e-02 |
Pos logit contributions | |
show | +0.014 |
trick | +0.013 |
test | +0.012 |
new | +0.011 |
my | +0.011 |
Neg logit contributions | |
mie | -0.027 |
etsy | -0.026 |
elope | -0.026 |
Hop | -0.026 |
hew | -0.025 |
Token | Max |
Token ID | 5436 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
mie | +0.040 |
etsy | +0.038 |
elope | +0.037 |
hew | +0.037 |
jo | +0.035 |
Neg logit contributions | |
show | -0.044 |
new | -0.042 |
trick | -0.042 |
grown | -0.039 |
making | -0.039 |
Token | was |
Token ID | 373 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
mie | +0.761 |
etsy | +0.755 |
hew | +0.728 |
rified | +0.725 |
jo | +0.711 |
Neg logit contributions | |
show | -0.522 |
trick | -0.482 |
new | -0.481 |
grown | -0.466 |
to | -0.451 |
Token | a |
Token ID | 257 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
trick | +0.182 |
show | +0.170 |
test | +0.161 |
skills | +0.155 |
design | +0.150 |
Neg logit contributions | |
mie | -0.242 |
elope | -0.238 |
lves | -0.222 |
K | -0.218 |
bo | -0.217 |
Token | happy |
Token ID | 3772 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
trick | +0.110 |
show | +0.110 |
making | +0.097 |
skills | +0.096 |
for | +0.094 |
Neg logit contributions | |
mie | -0.282 |
elope | -0.278 |
etsy | -0.277 |
Max | -0.269 |
lves | -0.268 |
Token | dog |
Token ID | 3290 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
show | +0.113 |
trick | +0.111 |
new | +0.105 |
my | +0.105 |
making | +0.104 |
Neg logit contributions | |
elope | -0.105 |
mie | -0.105 |
etsy | -0.104 |
jo | -0.101 |
pillar | -0.100 |
Token | see |
Token ID | 766 |
Feature activation | -9.01e-02 |
Pos logit contributions | |
math | +0.364 |
new | +0.357 |
red | +0.324 |
cream | +0.318 |
original | +0.318 |
Neg logit contributions | |
jo | -0.345 |
elope | -0.343 |
mie | -0.342 |
bo | -0.317 |
ppy | -0.316 |
Token | her |
Token ID | 607 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
new | +0.055 |
show | +0.052 |
the | +0.049 |
to | +0.041 |
for | +0.038 |
Neg logit contributions | |
etsy | -0.268 |
hew | -0.261 |
ppy | -0.260 |
uddy | -0.259 |
elope | -0.258 |
Token | music |
Token ID | 2647 |
Feature activation | +9.12e-02 |
Pos logit contributions | |
show | +0.029 |
trick | +0.028 |
grown | +0.027 |
my | +0.027 |
your | +0.026 |
Neg logit contributions | |
mie | -0.081 |
elope | -0.079 |
jo | -0.077 |
pillar | -0.076 |
etsy | -0.076 |
Token | had |
Token ID | 550 |
Feature activation | -4.61e-02 |
Pos logit contributions | |
mie | +0.210 |
elope | +0.201 |
etsy | +0.200 |
storms | +0.199 |
jo | +0.199 |
Neg logit contributions | |
show | -0.088 |
trick | -0.084 |
new | -0.080 |
my | -0.079 |
grown | -0.076 |
Token | made |
Token ID | 925 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
show | +0.063 |
trick | +0.059 |
test | +0.059 |
new | +0.057 |
math | +0.057 |
Neg logit contributions | |
mie | -0.087 |
etsy | -0.081 |
jo | -0.081 |
storms | -0.080 |
pillar | -0.079 |
Token | something |
Token ID | 1223 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
show | +0.172 |
trick | +0.155 |
new | +0.148 |
grown | +0.132 |
test | +0.128 |
Neg logit contributions | |
mie | -0.619 |
etsy | -0.603 |
elope | -0.593 |
hew | -0.590 |
jo | -0.586 |
Token | so |
Token ID | 523 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
mie | +0.041 |
storms | +0.038 |
etsy | +0.037 |
elope | +0.037 |
jo | +0.036 |
Neg logit contributions | |
show | -0.014 |
trick | -0.014 |
test | -0.014 |
order | -0.014 |
my | -0.014 |
Token | big |
Token ID | 1263 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.097 |
trick | +0.093 |
test | +0.081 |
making | +0.080 |
new | +0.075 |
Neg logit contributions | |
mie | -0.317 |
etsy | -0.307 |
elope | -0.300 |
hew | -0.297 |
jo | -0.295 |
Token | and |
Token ID | 290 |
Feature activation | -9.86e-02 |
Pos logit contributions | |
show | +0.126 |
trick | +0.120 |
new | +0.113 |
grown | +0.109 |
test | +0.108 |
Neg logit contributions | |
mie | -0.295 |
storms | -0.279 |
etsy | -0.278 |
elope | -0.277 |
jo | -0.277 |
Token | strong |
Token ID | 1913 |
Feature activation | -8.56e-02 |
Pos logit contributions | |
show | +0.081 |
trick | +0.078 |
test | +0.069 |
grown | +0.066 |
new | +0.064 |
Neg logit contributions | |
mie | -0.242 |
etsy | -0.230 |
elope | -0.229 |
storms | -0.225 |
jo | -0.224 |
Token | so |
Token ID | 523 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.088 |
trick | +0.080 |
new | +0.079 |
making | +0.072 |
grown | +0.071 |
Neg logit contributions | |
mie | -0.205 |
etsy | -0.202 |
hew | -0.198 |
elope | -0.197 |
jo | -0.194 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
mie | +0.730 |
etsy | +0.729 |
hew | +0.721 |
apa | +0.701 |
jo | +0.696 |
Neg logit contributions | |
show | -0.257 |
making | -0.205 |
for | -0.204 |
trick | -0.199 |
to | -0.199 |
Token | and |
Token ID | 290 |
Feature activation | -9.87e-02 |
Pos logit contributions | |
show | +0.105 |
trick | +0.104 |
new | +0.094 |
test | +0.091 |
grown | +0.087 |
Neg logit contributions | |
mie | -0.249 |
elope | -0.240 |
etsy | -0.237 |
rified | -0.235 |
hew | -0.234 |
Token | a |
Token ID | 257 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
show | +0.059 |
new | +0.050 |
trick | +0.049 |
grown | +0.042 |
making | +0.041 |
Neg logit contributions | |
mie | -0.282 |
etsy | -0.277 |
hew | -0.273 |
jo | -0.270 |
elope | -0.270 |
Token | pretty |
Token ID | 2495 |
Feature activation | -6.99e-02 |
Pos logit contributions | |
show | +0.181 |
new | +0.178 |
trick | +0.171 |
grown | +0.165 |
magic | +0.160 |
Neg logit contributions | |
mie | -0.249 |
hew | -0.240 |
etsy | -0.238 |
jo | -0.236 |
storms | -0.233 |
Token | flower |
Token ID | 15061 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
show | +0.109 |
trick | +0.105 |
making | +0.101 |
new | +0.098 |
test | +0.097 |
Neg logit contributions | |
mie | -0.120 |
etsy | -0.117 |
elope | -0.115 |
pillar | -0.112 |
jo | -0.109 |
Token | . |
Token ID | 13 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
mie | +0.368 |
etsy | +0.356 |
elope | +0.352 |
hew | +0.347 |
jo | +0.346 |
Neg logit contributions | |
show | -0.175 |
trick | -0.165 |
new | -0.159 |
grown | -0.149 |
test | -0.146 |
Token |
|
Token ID | 198 |
Feature activation | +8.75e-02 |
Pos logit contributions | |
mie | +0.064 |
etsy | +0.061 |
ppa | +0.060 |
hew | +0.060 |
jo | +0.059 |
Neg logit contributions | |
show | -0.026 |
new | -0.024 |
to | -0.023 |
trick | -0.022 |
grown | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | +8.60e-02 |
Pos logit contributions | |
mie | +0.178 |
etsy | +0.167 |
rified | +0.162 |
lves | +0.162 |
storms | +0.161 |
Neg logit contributions | |
show | -0.128 |
trick | -0.121 |
new | -0.121 |
to | -0.114 |
grown | -0.112 |
Token | At |
Token ID | 2953 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
mie | +0.152 |
etsy | +0.145 |
elope | +0.141 |
hew | +0.140 |
jo | +0.139 |
Neg logit contributions | |
show | -0.143 |
trick | -0.137 |
new | -0.134 |
grown | -0.129 |
test | -0.127 |
Token | the |
Token ID | 262 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
grown | +0.124 |
style | +0.124 |
trick | +0.123 |
show | +0.119 |
design | +0.108 |
Neg logit contributions | |
elope | -0.370 |
mie | -0.357 |
Rex | -0.349 |
Max | -0.345 |
mi | -0.341 |
Token | end |
Token ID | 886 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
show | +0.152 |
trick | +0.146 |
new | +0.133 |
making | +0.131 |
matching | +0.130 |
Neg logit contributions | |
mie | -0.278 |
elope | -0.266 |
etsy | -0.265 |
hew | -0.260 |
rified | -0.256 |
Token | people |
Token ID | 661 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
mie | +0.005 |
elope | +0.005 |
hew | +0.005 |
storms | +0.004 |
etsy | +0.004 |
Neg logit contributions | |
trick | -0.003 |
show | -0.003 |
test | -0.003 |
new | -0.003 |
chance | -0.003 |
Token | can |
Token ID | 460 |
Feature activation | -6.30e-02 |
Pos logit contributions | |
mie | +0.358 |
etsy | +0.337 |
hew | +0.330 |
elope | +0.324 |
storms | +0.322 |
Neg logit contributions | |
show | -0.265 |
trick | -0.262 |
new | -0.251 |
grown | -0.239 |
my | -0.232 |
Token | feel |
Token ID | 1254 |
Feature activation | -9.06e-02 |
Pos logit contributions | |
show | +0.051 |
trick | +0.048 |
new | +0.048 |
grown | +0.044 |
my | +0.043 |
Neg logit contributions | |
mie | -0.156 |
etsy | -0.150 |
elope | -0.147 |
hew | -0.147 |
jo | -0.144 |
Token | worried |
Token ID | 7960 |
Feature activation | -7.36e-02 |
Pos logit contributions | |
trick | +0.110 |
show | +0.109 |
test | +0.101 |
balance | +0.094 |
matching | +0.094 |
Neg logit contributions | |
mie | -0.184 |
etsy | -0.173 |
storms | -0.170 |
lves | -0.166 |
rified | -0.165 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
show | +0.075 |
trick | +0.072 |
test | +0.063 |
new | +0.061 |
grown | +0.059 |
Neg logit contributions | |
mie | -0.168 |
storms | -0.162 |
hew | -0.160 |
jo | -0.159 |
etsy | -0.159 |
Token | but |
Token ID | 475 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
show | +0.128 |
trick | +0.120 |
new | +0.118 |
grown | +0.110 |
making | +0.109 |
Neg logit contributions | |
mie | -0.237 |
etsy | -0.230 |
elope | -0.226 |
hew | -0.223 |
jo | -0.223 |
Token | a |
Token ID | 257 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
mie | +0.033 |
elope | +0.030 |
etsy | +0.030 |
hew | +0.029 |
storms | +0.029 |
Neg logit contributions | |
trick | -0.031 |
show | -0.030 |
test | -0.028 |
grown | -0.027 |
new | -0.027 |
Token | little |
Token ID | 1310 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
show | +0.117 |
trick | +0.107 |
making | +0.099 |
for | +0.098 |
my | +0.097 |
Neg logit contributions | |
mie | -0.296 |
etsy | -0.293 |
elope | -0.290 |
pillar | -0.279 |
hew | -0.276 |
Token | kindness |
Token ID | 23887 |
Feature activation | +3.64e-02 |
Pos logit contributions | |
show | +0.025 |
trick | +0.025 |
grown | +0.023 |
matching | +0.022 |
my | +0.022 |
Neg logit contributions | |
mie | -0.033 |
elope | -0.032 |
etsy | -0.031 |
storms | -0.031 |
rified | -0.031 |
Token | can |
Token ID | 460 |
Feature activation | -6.36e-02 |
Pos logit contributions | |
mie | +0.067 |
etsy | +0.065 |
jo | +0.063 |
elope | +0.063 |
storms | +0.063 |
Neg logit contributions | |
show | -0.053 |
trick | -0.051 |
new | -0.050 |
grown | -0.047 |
test | -0.047 |
Token | make |
Token ID | 787 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
show | +0.045 |
trick | +0.043 |
new | +0.041 |
math | +0.039 |
grown | +0.038 |
Neg logit contributions | |
mie | -0.161 |
etsy | -0.155 |
elope | -0.155 |
hew | -0.153 |
jo | -0.152 |
Token | park |
Token ID | 3952 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
show | +0.202 |
trick | +0.200 |
new | +0.186 |
grown | +0.181 |
making | +0.180 |
Neg logit contributions | |
mie | -0.227 |
elope | -0.214 |
etsy | -0.212 |
hew | -0.208 |
jo | -0.207 |
Token | . |
Token ID | 13 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
mie | +0.240 |
elope | +0.237 |
etsy | +0.232 |
jo | +0.226 |
storms | +0.225 |
Neg logit contributions | |
trick | -0.155 |
show | -0.152 |
new | -0.144 |
test | -0.140 |
grown | -0.138 |
Token | The |
Token ID | 383 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
mie | +0.055 |
etsy | +0.053 |
hew | +0.052 |
elope | +0.051 |
jo | +0.051 |
Neg logit contributions | |
show | -0.036 |
trick | -0.034 |
new | -0.033 |
grown | -0.032 |
test | -0.031 |
Token | tree |
Token ID | 5509 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
show | +0.017 |
trick | +0.017 |
new | +0.015 |
making | +0.015 |
matching | +0.015 |
Neg logit contributions | |
mie | -0.022 |
etsy | -0.021 |
elope | -0.020 |
hew | -0.020 |
pillar | -0.020 |
Token | had |
Token ID | 550 |
Feature activation | -4.55e-02 |
Pos logit contributions | |
mie | +0.423 |
etsy | +0.414 |
hew | +0.399 |
elope | +0.394 |
rified | +0.392 |
Neg logit contributions | |
show | -0.350 |
new | -0.328 |
trick | -0.327 |
grown | -0.311 |
making | -0.306 |
Token | two |
Token ID | 734 |
Feature activation | +6.12e-02 |
Pos logit contributions | |
show | +0.043 |
trick | +0.040 |
test | +0.037 |
design | +0.034 |
for | +0.032 |
Neg logit contributions | |
mie | -0.104 |
elope | -0.101 |
etsy | -0.100 |
hew | -0.100 |
Snow | -0.100 |
Token | branches |
Token ID | 13737 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
mie | +0.142 |
etsy | +0.141 |
jo | +0.136 |
elope | +0.136 |
storms | +0.135 |
Neg logit contributions | |
show | -0.066 |
new | -0.065 |
grown | -0.060 |
trick | -0.059 |
red | -0.057 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
mie | +0.290 |
etsy | +0.281 |
elope | +0.275 |
jo | +0.274 |
hew | +0.271 |
Neg logit contributions | |
show | -0.152 |
trick | -0.146 |
new | -0.136 |
test | -0.130 |
my | -0.129 |
Token | one |
Token ID | 530 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
show | +0.077 |
trick | +0.068 |
new | +0.066 |
grown | +0.059 |
making | +0.057 |
Neg logit contributions | |
mie | -0.291 |
etsy | -0.284 |
elope | -0.279 |
hew | -0.278 |
jo | -0.277 |
Token | for |
Token ID | 329 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
elope | +0.073 |
mie | +0.072 |
etsy | +0.070 |
pillar | +0.069 |
jo | +0.069 |
Neg logit contributions | |
show | -0.035 |
trick | -0.034 |
test | -0.031 |
grown | -0.031 |
new | -0.030 |
Token | a |
Token ID | 257 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
show | +0.175 |
trick | +0.163 |
new | +0.145 |
test | +0.140 |
grown | +0.130 |
Neg logit contributions | |
mie | -0.519 |
elope | -0.502 |
etsy | -0.500 |
hew | -0.496 |
jo | -0.490 |
Token | his |
Token ID | 465 |
Feature activation | -4.70e-02 |
Pos logit contributions | |
show | +0.046 |
trick | +0.045 |
new | +0.041 |
test | +0.040 |
my | +0.038 |
Neg logit contributions | |
mie | -0.092 |
etsy | -0.088 |
elope | -0.087 |
hew | -0.086 |
jo | -0.085 |
Token | bath |
Token ID | 7837 |
Feature activation | +6.88e-02 |
Pos logit contributions | |
trick | +0.047 |
show | +0.047 |
making | +0.045 |
your | +0.044 |
my | +0.044 |
Neg logit contributions | |
mie | -0.102 |
etsy | -0.100 |
elope | -0.099 |
uddy | -0.097 |
hew | -0.096 |
Token | he |
Token ID | 339 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
mie | +0.157 |
etsy | +0.152 |
elope | +0.149 |
hew | +0.148 |
jo | +0.147 |
Neg logit contributions | |
show | -0.077 |
trick | -0.072 |
new | -0.070 |
grown | -0.065 |
test | -0.064 |
Token | felt |
Token ID | 2936 |
Feature activation | -9.57e-02 |
Pos logit contributions | |
mie | +0.471 |
etsy | +0.444 |
hew | +0.441 |
elope | +0.441 |
jo | +0.432 |
Neg logit contributions | |
show | -0.310 |
trick | -0.300 |
new | -0.294 |
test | -0.274 |
making | -0.273 |
Token | so |
Token ID | 523 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
trick | +0.155 |
test | +0.145 |
show | +0.143 |
math | +0.141 |
quiz | +0.138 |
Neg logit contributions | |
mie | -0.164 |
etsy | -0.142 |
hew | -0.135 |
Snow | -0.134 |
bo | -0.132 |
Token | good |
Token ID | 922 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
trick | +0.148 |
show | +0.143 |
test | +0.130 |
making | +0.127 |
math | +0.126 |
Neg logit contributions | |
mie | -0.269 |
hew | -0.262 |
etsy | -0.254 |
oped | -0.243 |
elope | -0.243 |
Token | and |
Token ID | 290 |
Feature activation | -9.83e-02 |
Pos logit contributions | |
show | +0.145 |
trick | +0.143 |
new | +0.139 |
my | +0.129 |
grown | +0.129 |
Neg logit contributions | |
mie | -0.305 |
storms | -0.282 |
etsy | -0.281 |
hew | -0.277 |
jo | -0.276 |
Token | clean |
Token ID | 3424 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
trick | +0.129 |
show | +0.128 |
test | +0.119 |
new | +0.115 |
math | +0.111 |
Neg logit contributions | |
mie | -0.199 |
hew | -0.184 |
elope | -0.182 |
etsy | -0.181 |
jo | -0.177 |
Token | . |
Token ID | 13 |
Feature activation | +2.31e-02 |
Pos logit contributions | |
show | +0.127 |
trick | +0.119 |
new | +0.114 |
grown | +0.106 |
test | +0.105 |
Neg logit contributions | |
mie | -0.287 |
etsy | -0.277 |
elope | -0.273 |
hew | -0.271 |
jo | -0.269 |
Token | The |
Token ID | 383 |
Feature activation | -4.25e-03 |
Pos logit contributions | |
ppy | +0.051 |
ppa | +0.051 |
ley | +0.050 |
mie | +0.049 |
pper | +0.049 |
Neg logit contributions | |
new | -0.029 |
show | -0.029 |
his | -0.028 |
the | -0.027 |
to | -0.027 |
Token | end |
Token ID | 886 |
Feature activation | -6.38e-02 |
Pos logit contributions | |
trick | +0.005 |
show | +0.005 |
your | +0.005 |
my | +0.004 |
new | +0.004 |
Neg logit contributions | |
mie | -0.009 |
etsy | -0.009 |
elope | -0.008 |
hew | -0.008 |
rified | -0.008 |
Token | play |
Token ID | 711 |
Feature activation | -9.48e-02 |
Pos logit contributions | |
trick | +0.082 |
new | +0.082 |
grown | +0.077 |
show | +0.077 |
chance | +0.075 |
Neg logit contributions | |
mie | -0.245 |
elope | -0.239 |
etsy | -0.230 |
hew | -0.222 |
thel | -0.221 |
Token | together |
Token ID | 1978 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
test | +0.085 |
show | +0.083 |
chance | +0.082 |
grown | +0.080 |
job | +0.079 |
Neg logit contributions | |
mie | -0.203 |
elope | -0.198 |
Hop | -0.198 |
hew | -0.195 |
Rex | -0.193 |
Token | . |
Token ID | 13 |
Feature activation | +7.86e-03 |
Pos logit contributions | |
mie | +0.043 |
elope | +0.041 |
ppy | +0.040 |
storms | +0.040 |
etsy | +0.039 |
Neg logit contributions | |
show | -0.035 |
my | -0.035 |
trick | -0.034 |
test | -0.034 |
new | -0.034 |
Token | They |
Token ID | 1119 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
mie | +0.014 |
etsy | +0.013 |
jo | +0.013 |
hew | +0.013 |
elope | +0.013 |
Neg logit contributions | |
show | -0.013 |
new | -0.013 |
trick | -0.012 |
grown | -0.012 |
my | -0.012 |
Token | learned |
Token ID | 4499 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
mie | +0.474 |
etsy | +0.464 |
jo | +0.455 |
elope | +0.455 |
hew | +0.451 |
Neg logit contributions | |
show | -0.375 |
trick | -0.348 |
new | -0.336 |
grown | -0.326 |
making | -0.321 |
Token | to |
Token ID | 284 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
show | +0.184 |
test | +0.183 |
design | +0.170 |
balance | +0.170 |
matching | +0.167 |
Neg logit contributions | |
ess | -0.283 |
mie | -0.283 |
Snow | -0.282 |
ocular | -0.282 |
rots | -0.280 |
Token | be |
Token ID | 307 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
new | +0.199 |
show | +0.188 |
trick | +0.173 |
making | +0.170 |
grown | +0.167 |
Neg logit contributions | |
mie | -0.565 |
elope | -0.553 |
etsy | -0.549 |
hew | -0.547 |
ppy | -0.527 |
Token | nice |
Token ID | 3621 |
Feature activation | -8.36e-02 |
Pos logit contributions | |
show | +0.149 |
test | +0.147 |
trick | +0.137 |
design | +0.135 |
balance | +0.129 |
Neg logit contributions | |
mie | -0.213 |
elope | -0.199 |
Rex | -0.197 |
ppa | -0.193 |
Snow | -0.190 |
Token | and |
Token ID | 290 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
show | +0.075 |
trick | +0.068 |
test | +0.063 |
new | +0.062 |
grown | +0.059 |
Neg logit contributions | |
mie | -0.202 |
etsy | -0.195 |
elope | -0.194 |
storms | -0.193 |
jo | -0.193 |
Token | not |
Token ID | 407 |
Feature activation | -3.61e-02 |
Pos logit contributions | |
trick | +0.097 |
test | +0.097 |
show | +0.096 |
chance | +0.094 |
math | +0.093 |
Neg logit contributions | |
mie | -0.207 |
etsy | -0.204 |
elope | -0.204 |
Hop | -0.201 |
rice | -0.200 |
Token | fight |
Token ID | 1907 |
Feature activation | -2.68e-02 |
Pos logit contributions | |
show | +0.040 |
trick | +0.038 |
new | +0.037 |
test | +0.034 |
matching | +0.034 |
Neg logit contributions | |
mie | -0.071 |
ety | -0.070 |
ppy | -0.069 |
storms | -0.069 |
lves | -0.069 |
Token | day |
Token ID | 1110 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
elope | +0.029 |
mie | +0.028 |
jo | +0.028 |
etsy | +0.028 |
pillar | +0.027 |
Neg logit contributions | |
show | -0.012 |
trick | -0.012 |
making | -0.010 |
test | -0.010 |
matching | -0.010 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
mie | +0.061 |
etsy | +0.059 |
elope | +0.058 |
hew | +0.058 |
jo | +0.058 |
Neg logit contributions | |
show | -0.014 |
trick | -0.013 |
new | -0.012 |
grown | -0.010 |
test | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
show | +0.050 |
new | +0.040 |
trick | +0.038 |
making | +0.031 |
grown | +0.030 |
Neg logit contributions | |
mie | -0.308 |
etsy | -0.302 |
hew | -0.299 |
jo | -0.297 |
elope | -0.294 |
Token | little |
Token ID | 1310 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
show | +0.105 |
new | +0.097 |
trick | +0.095 |
grown | +0.086 |
magic | +0.081 |
Neg logit contributions | |
mie | -0.326 |
hew | -0.315 |
etsy | -0.314 |
jo | -0.310 |
storms | -0.308 |
Token | girl |
Token ID | 2576 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
show | +0.023 |
new | +0.022 |
trick | +0.022 |
red | +0.021 |
to | +0.021 |
Neg logit contributions | |
mie | -0.025 |
hew | -0.025 |
etsy | -0.024 |
jo | -0.024 |
elope | -0.023 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
mie | +0.504 |
etsy | +0.495 |
hew | +0.488 |
elope | +0.475 |
storms | +0.473 |
Neg logit contributions | |
show | -0.425 |
trick | -0.385 |
new | -0.379 |
grown | -0.376 |
to | -0.372 |
Token | the |
Token ID | 262 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
show | +0.031 |
new | +0.027 |
the | +0.022 |
to | +0.014 |
trick | +0.014 |
Neg logit contributions | |
mie | -0.467 |
etsy | -0.464 |
hew | -0.463 |
jo | -0.456 |
elope | -0.454 |
Token | glowing |
Token ID | 21377 |
Feature activation | -7.13e-02 |
Pos logit contributions | |
show | +0.148 |
trick | +0.139 |
new | +0.135 |
grown | +0.126 |
test | +0.124 |
Neg logit contributions | |
mie | -0.286 |
etsy | -0.278 |
elope | -0.272 |
hew | -0.270 |
jo | -0.270 |
Token | pond |
Token ID | 16723 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
show | +0.098 |
trick | +0.092 |
making | +0.089 |
your | +0.089 |
my | +0.088 |
Neg logit contributions | |
mie | -0.134 |
pillar | -0.127 |
etsy | -0.126 |
elope | -0.124 |
ley | -0.122 |
Token | . |
Token ID | 13 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
mie | +0.440 |
etsy | +0.422 |
elope | +0.421 |
jo | +0.411 |
hew | +0.410 |
Neg logit contributions | |
show | -0.183 |
trick | -0.175 |
new | -0.160 |
test | -0.155 |
my | -0.152 |
Token | She |
Token ID | 1375 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
mie | +0.045 |
hew | +0.044 |
etsy | +0.041 |
ppa | +0.041 |
elope | +0.041 |
Neg logit contributions | |
show | -0.047 |
new | -0.045 |
to | -0.044 |
grown | -0.044 |
my | -0.042 |
Token | said |
Token ID | 531 |
Feature activation | +3.64e-02 |
Pos logit contributions | |
show | +0.149 |
trick | +0.140 |
new | +0.138 |
grown | +0.132 |
making | +0.130 |
Neg logit contributions | |
mie | -0.183 |
etsy | -0.178 |
hew | -0.173 |
elope | -0.172 |
jo | -0.171 |
Token | : |
Token ID | 25 |
Feature activation | -8.32e-02 |
Pos logit contributions | |
mie | +0.093 |
etsy | +0.091 |
elope | +0.089 |
hew | +0.088 |
jo | +0.088 |
Neg logit contributions | |
show | -0.030 |
trick | -0.028 |
new | -0.026 |
test | -0.024 |
grown | -0.024 |
Token | " |
Token ID | 366 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
show | +0.111 |
trick | +0.103 |
new | +0.102 |
grown | +0.097 |
making | +0.095 |
Neg logit contributions | |
mie | -0.174 |
etsy | -0.167 |
hew | -0.164 |
elope | -0.163 |
jo | -0.162 |
Token | Thank |
Token ID | 10449 |
Feature activation | -8.35e-02 |
Pos logit contributions | |
uddy | +0.191 |
cases | +0.190 |
uffy | +0.189 |
anda | +0.185 |
lves | +0.185 |
Neg logit contributions | |
show | -0.165 |
color | -0.164 |
my | -0.160 |
the | -0.157 |
five | -0.157 |
Token | you |
Token ID | 345 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
show | +0.114 |
my | +0.105 |
your | +0.102 |
trick | +0.102 |
new | +0.101 |
Neg logit contributions | |
mie | -0.177 |
etsy | -0.170 |
lves | -0.169 |
jo | -0.168 |
storms | -0.167 |
Token | for |
Token ID | 329 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
mie | +0.465 |
etsy | +0.452 |
elope | +0.445 |
hew | +0.442 |
jo | +0.441 |
Neg logit contributions | |
show | -0.082 |
new | -0.067 |
trick | -0.066 |
for | -0.057 |
my | -0.054 |
Token | helping |
Token ID | 5742 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
chance | +0.196 |
new | +0.176 |
trick | +0.176 |
blue | +0.171 |
show | +0.171 |
Neg logit contributions | |
elope | -0.462 |
mie | -0.450 |
ppa | -0.441 |
thel | -0.439 |
Rust | -0.429 |
Token | me |
Token ID | 502 |
Feature activation | +5.11e-02 |
Pos logit contributions | |
show | +0.211 |
trick | +0.199 |
new | +0.193 |
grown | +0.182 |
test | +0.180 |
Neg logit contributions | |
mie | -0.356 |
etsy | -0.344 |
elope | -0.338 |
hew | -0.335 |
jo | -0.333 |
Token | to |
Token ID | 284 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
mie | +0.110 |
elope | +0.108 |
hew | +0.105 |
etsy | +0.105 |
ppy | +0.104 |
Neg logit contributions | |
new | -0.048 |
trick | -0.048 |
show | -0.047 |
red | -0.045 |
grown | -0.044 |
Token | cook |
Token ID | 4255 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
new | +0.188 |
trick | +0.177 |
red | +0.173 |
show | +0.169 |
chance | +0.167 |
Neg logit contributions | |
mie | -0.563 |
elope | -0.558 |
etsy | -0.540 |
hew | -0.529 |
ppy | -0.526 |
Token | dinner |
Token ID | 8073 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
mie | +0.057 |
hew | +0.055 |
elope | +0.054 |
etsy | +0.053 |
thel | +0.053 |
Neg logit contributions | |
show | -0.021 |
trick | -0.021 |
test | -0.018 |
grown | -0.018 |
new | -0.018 |
Token | to |
Token ID | 284 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
show | +0.054 |
trick | +0.046 |
new | +0.039 |
test | +0.036 |
grown | +0.036 |
Neg logit contributions | |
mie | -0.308 |
etsy | -0.298 |
jo | -0.295 |
elope | -0.294 |
hew | -0.293 |
Token | the |
Token ID | 262 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
show | +0.183 |
trick | +0.169 |
new | +0.162 |
grown | +0.148 |
making | +0.141 |
Neg logit contributions | |
mie | -0.618 |
elope | -0.597 |
etsy | -0.589 |
hew | -0.584 |
jo | -0.580 |
Token | desk |
Token ID | 6915 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
show | +0.147 |
trick | +0.139 |
new | +0.133 |
grown | +0.126 |
making | +0.125 |
Neg logit contributions | |
mie | -0.276 |
etsy | -0.266 |
elope | -0.262 |
hew | -0.259 |
jo | -0.257 |
Token | and |
Token ID | 290 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
mie | +0.483 |
etsy | +0.465 |
elope | +0.459 |
hew | +0.457 |
jo | +0.456 |
Neg logit contributions | |
show | -0.210 |
trick | -0.197 |
new | -0.191 |
grown | -0.176 |
test | -0.174 |
Token | he |
Token ID | 339 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
show | +0.152 |
trick | +0.140 |
new | +0.139 |
grown | +0.135 |
making | +0.133 |
Neg logit contributions | |
mie | -0.194 |
etsy | -0.192 |
jo | -0.186 |
hew | -0.186 |
elope | -0.185 |
Token | bumped |
Token ID | 38034 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
etsy | +0.420 |
mie | +0.412 |
thel | +0.403 |
och | +0.400 |
storms | +0.399 |
Neg logit contributions | |
show | -0.360 |
trick | -0.329 |
grown | -0.328 |
to | -0.321 |
new | -0.319 |
Token | into |
Token ID | 656 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
show | +0.072 |
trick | +0.064 |
new | +0.061 |
grown | +0.053 |
making | +0.051 |
Neg logit contributions | |
mie | -0.356 |
etsy | -0.349 |
elope | -0.344 |
hew | -0.342 |
jo | -0.340 |
Token | it |
Token ID | 340 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
show | +0.121 |
trick | +0.102 |
new | +0.101 |
grown | +0.082 |
making | +0.071 |
Neg logit contributions | |
mie | -0.808 |
etsy | -0.799 |
hew | -0.777 |
jo | -0.775 |
elope | -0.775 |
Token | . |
Token ID | 13 |
Feature activation | +2.44e-02 |
Pos logit contributions | |
mie | +0.324 |
etsy | +0.310 |
elope | +0.309 |
hew | +0.306 |
jo | +0.303 |
Neg logit contributions | |
show | -0.176 |
trick | -0.165 |
new | -0.159 |
grown | -0.154 |
test | -0.152 |
Token | The |
Token ID | 383 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
mie | +0.052 |
ppy | +0.050 |
ppa | +0.050 |
ley | +0.050 |
jo | +0.049 |
Neg logit contributions | |
show | -0.030 |
new | -0.030 |
grown | -0.029 |
to | -0.029 |
the | -0.028 |
Token | sudden |
Token ID | 4802 |
Feature activation | +7.45e-02 |
Pos logit contributions | |
show | +0.014 |
trick | +0.013 |
new | +0.012 |
grown | +0.011 |
making | +0.011 |
Neg logit contributions | |
mie | -0.030 |
etsy | -0.029 |
elope | -0.029 |
hew | -0.029 |
jo | -0.028 |