Token | family |
Token ID | 1641 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
asis | +0.340 |
ymes | +0.339 |
andel | +0.339 |
robat | +0.335 |
Ta | +0.332 |
Neg logit contributions | |
not | -0.302 |
and | -0.288 |
because | -0.259 |
but | -0.242 |
, | -0.240 |
Token | and |
Token ID | 290 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
asis | +0.520 |
ymes | +0.517 |
robat | +0.506 |
ites | +0.499 |
andel | +0.494 |
Neg logit contributions | |
not | -0.207 |
and | -0.163 |
because | -0.146 |
but | -0.137 |
" | -0.133 |
Token | our |
Token ID | 674 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
not | +0.033 |
and | +0.031 |
because | +0.029 |
but | +0.028 |
: | +0.028 |
Neg logit contributions | |
ymes | -0.044 |
nests | -0.042 |
keeping | -0.042 |
asis | -0.042 |
Ta | -0.042 |
Token | friends |
Token ID | 2460 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
asis | +0.319 |
andel | +0.319 |
ymes | +0.318 |
robat | +0.314 |
Ta | +0.311 |
Neg logit contributions | |
not | -0.341 |
and | -0.327 |
because | -0.297 |
but | -0.279 |
, | -0.277 |
Token | . |
Token ID | 13 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
ymes | +0.412 |
asis | +0.407 |
robat | +0.401 |
ites | +0.393 |
ival | +0.385 |
Neg logit contributions | |
not | -0.221 |
and | -0.178 |
because | -0.170 |
but | -0.162 |
they | -0.157 |
Token | Amen |
Token ID | 34717 |
Feature activation | +7.18e+01 |
Pos logit contributions | |
Ta | +0.039 |
umm | +0.037 |
pter | +0.036 |
crow | +0.036 |
andel | +0.035 |
Neg logit contributions | |
not | -0.051 |
and | -0.048 |
because | -0.044 |
, | -0.042 |
but | -0.041 |
Token | ." |
Token ID | 526 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
ymes | +1.372 |
asis | +1.370 |
andel | +1.343 |
ites | +1.341 |
robat | +1.325 |
Neg logit contributions | |
not | -0.712 |
and | -0.661 |
because | -0.581 |
but | -0.550 |
" | -0.514 |
Token |
|
Token ID | 198 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
pill | +0.153 |
pter | +0.153 |
Ta | +0.151 |
ymes | +0.151 |
pillar | +0.151 |
Neg logit contributions | |
not | -0.087 |
because | -0.069 |
and | -0.069 |
just | -0.062 |
for | -0.062 |
Token |
|
Token ID | 198 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
ymes | +0.305 |
Ta | +0.302 |
asis | +0.299 |
andel | +0.298 |
robat | +0.298 |
Neg logit contributions | |
not | -0.097 |
and | -0.085 |
because | -0.077 |
but | -0.063 |
, | -0.055 |
Token | Anna |
Token ID | 31160 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
ymes | +0.169 |
Ta | +0.162 |
robat | +0.157 |
asis | +0.157 |
ites | +0.155 |
Neg logit contributions | |
not | -0.243 |
and | -0.235 |
because | -0.224 |
but | -0.209 |
, | -0.206 |
Token | said |
Token ID | 531 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
ymes | +0.229 |
asis | +0.229 |
Ta | +0.228 |
pillar | +0.222 |
robat | +0.218 |
Neg logit contributions | |
not | -0.171 |
because | -0.152 |
and | -0.145 |
for | -0.143 |
but | -0.140 |
Token | house |
Token ID | 2156 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
andel | +0.319 |
asis | +0.317 |
robat | +0.313 |
Ta | +0.310 |
ymes | +0.309 |
Neg logit contributions | |
not | -0.296 |
and | -0.283 |
because | -0.251 |
, | -0.238 |
. | -0.235 |
Token | and |
Token ID | 290 |
Feature activation | -3.73e+00 |
Pos logit contributions | |
ymes | +0.486 |
asis | +0.484 |
keeping | +0.480 |
ites | +0.479 |
robat | +0.467 |
Neg logit contributions | |
not | -0.142 |
but | -0.089 |
because | -0.088 |
" | -0.087 |
and | -0.084 |
Token | our |
Token ID | 674 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
not | +0.039 |
and | +0.039 |
because | +0.036 |
but | +0.036 |
: | +0.033 |
Neg logit contributions | |
keeping | -0.061 |
ymes | -0.059 |
nests | -0.058 |
ites | -0.058 |
pige | -0.057 |
Token | family |
Token ID | 1641 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
andel | +0.340 |
asis | +0.334 |
robat | +0.332 |
Ta | +0.331 |
ymes | +0.329 |
Neg logit contributions | |
not | -0.297 |
and | -0.284 |
because | -0.250 |
, | -0.236 |
. | -0.235 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
ymes | +0.465 |
asis | +0.459 |
robat | +0.446 |
ites | +0.445 |
keeping | +0.438 |
Neg logit contributions | |
not | -0.232 |
and | -0.174 |
but | -0.172 |
because | -0.169 |
" | -0.161 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.98e+01 |
Pos logit contributions | |
Ta | +0.025 |
umm | +0.025 |
crow | +0.024 |
pter | +0.023 |
ocol | +0.023 |
Neg logit contributions | |
not | -0.032 |
and | -0.030 |
because | -0.027 |
but | -0.026 |
, | -0.026 |
Token | ." |
Token ID | 526 |
Feature activation | +7.45e+00 |
Pos logit contributions | |
ymes | +1.322 |
asis | +1.317 |
ites | +1.300 |
andel | +1.292 |
robat | +1.271 |
Neg logit contributions | |
not | -0.695 |
and | -0.642 |
because | -0.570 |
but | -0.551 |
" | -0.514 |
Token |
|
Token ID | 198 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
pige | +0.144 |
ites | +0.142 |
andel | +0.142 |
crow | +0.142 |
pill | +0.141 |
Neg logit contributions | |
not | -0.064 |
and | -0.051 |
because | -0.048 |
for | -0.044 |
just | -0.040 |
Token |
|
Token ID | 198 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
asis | +0.281 |
ymes | +0.280 |
andel | +0.280 |
Ta | +0.278 |
robat | +0.275 |
Neg logit contributions | |
not | -0.083 |
and | -0.073 |
because | -0.063 |
but | -0.053 |
, | -0.047 |
Token | Mom |
Token ID | 29252 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
ymes | +0.194 |
asis | +0.194 |
andel | +0.192 |
robat | +0.190 |
Ta | +0.190 |
Neg logit contributions | |
not | -0.175 |
and | -0.167 |
because | -0.153 |
but | -0.143 |
, | -0.140 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
ymes | +0.392 |
Ta | +0.388 |
asis | +0.381 |
robat | +0.381 |
ites | +0.376 |
Neg logit contributions | |
not | -0.167 |
because | -0.131 |
and | -0.129 |
but | -0.111 |
they | -0.104 |
Token | like |
Token ID | 588 |
Feature activation | +2.82e+01 |
Pos logit contributions | |
seas | +0.943 |
ites | +0.943 |
asis | +0.933 |
orns | +0.916 |
nests | +0.912 |
Neg logit contributions | |
not | -0.308 |
and | -0.214 |
" | -0.204 |
because | -0.189 |
but | -0.163 |
Token | lettuce |
Token ID | 39406 |
Feature activation | +5.57e+01 |
Pos logit contributions | |
ymes | +0.473 |
seas | +0.471 |
nests | +0.469 |
ocol | +0.469 |
andel | +0.466 |
Neg logit contributions | |
not | -0.321 |
and | -0.292 |
because | -0.262 |
but | -0.243 |
" | -0.234 |
Token | , |
Token ID | 11 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
orns | +1.244 |
asis | +1.243 |
nests | +1.170 |
robat | +1.168 |
seas | +1.166 |
Neg logit contributions | |
not | -0.306 |
" | -0.181 |
because | -0.151 |
and | -0.134 |
: | -0.111 |
Token | tomatoes |
Token ID | 23972 |
Feature activation | +5.23e+01 |
Pos logit contributions | |
seas | +0.256 |
ocol | +0.251 |
nests | +0.250 |
orns | +0.241 |
pige | +0.241 |
Neg logit contributions | |
not | -0.379 |
and | -0.353 |
because | -0.334 |
: | -0.327 |
" | -0.318 |
Token | and |
Token ID | 290 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
asis | +1.145 |
orns | +1.139 |
nests | +1.074 |
ites | +1.073 |
robat | +1.070 |
Neg logit contributions | |
not | -0.281 |
" | -0.151 |
because | -0.149 |
and | -0.113 |
but | -0.099 |
Token | cuc |
Token ID | 38421 |
Feature activation | +6.88e+01 |
Pos logit contributions | |
seas | +0.124 |
ocol | +0.123 |
nests | +0.123 |
andel | +0.121 |
orns | +0.121 |
Neg logit contributions | |
not | -0.282 |
and | -0.270 |
because | -0.256 |
but | -0.242 |
: | -0.242 |
Token | umbers |
Token ID | 17024 |
Feature activation | +4.47e+01 |
Pos logit contributions | |
asis | +0.392 |
ymes | +0.388 |
andel | +0.387 |
Ta | +0.374 |
robat | +0.372 |
Neg logit contributions | |
not | -1.651 |
and | -1.617 |
because | -1.514 |
but | -1.462 |
, | -1.459 |
Token | . |
Token ID | 13 |
Feature activation | +1.49e+01 |
Pos logit contributions | |
orns | +0.958 |
asis | +0.956 |
pter | +0.933 |
ocol | +0.933 |
keeping | +0.930 |
Neg logit contributions | |
not | -0.251 |
because | -0.152 |
and | -0.138 |
but | -0.130 |
" | -0.129 |
Token | He |
Token ID | 679 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
andel | +0.303 |
asis | +0.299 |
ites | +0.298 |
Ta | +0.298 |
ymes | +0.298 |
Neg logit contributions | |
not | -0.134 |
and | -0.119 |
because | -0.100 |
, | -0.087 |
but | -0.086 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
asis | +0.226 |
pill | +0.220 |
arrow | +0.219 |
pter | +0.217 |
nests | +0.215 |
Neg logit contributions | |
not | -0.123 |
because | -0.113 |
and | -0.108 |
but | -0.106 |
" | -0.096 |
Token | as |
Token ID | 355 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
oceans | +0.412 |
andel | +0.407 |
umm | +0.406 |
seas | +0.402 |
kingdom | +0.398 |
Neg logit contributions | |
not | -0.094 |
they | -0.029 |
because | -0.027 |
making | -0.025 |
but | -0.024 |
Token | make |
Token ID | 787 |
Feature activation | +9.06e+00 |
Pos logit contributions | |
not | +0.003 |
and | +0.003 |
because | +0.003 |
: | +0.003 |
but | +0.003 |
Neg logit contributions | |
Ta | -0.006 |
ites | -0.006 |
ymes | -0.006 |
nests | -0.006 |
keeping | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
asis | +0.207 |
andel | +0.205 |
robat | +0.205 |
ymes | +0.202 |
umm | +0.201 |
Neg logit contributions | |
not | -0.075 |
and | -0.067 |
because | -0.052 |
. | -0.047 |
, | -0.046 |
Token | whole |
Token ID | 2187 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
asis | +0.298 |
nests | +0.293 |
ymes | +0.287 |
seas | +0.280 |
bridge | +0.279 |
Neg logit contributions | |
not | -0.186 |
and | -0.181 |
because | -0.170 |
: | -0.170 |
" | -0.168 |
Token | again |
Token ID | 757 |
Feature activation | +6.28e+00 |
Pos logit contributions | |
ymes | +0.190 |
asis | +0.189 |
nests | +0.188 |
umm | +0.186 |
orns | +0.185 |
Neg logit contributions | |
not | -0.114 |
and | -0.098 |
" | -0.094 |
because | -0.090 |
they | -0.090 |
Token | . |
Token ID | 13 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
asis | +0.105 |
ymes | +0.103 |
ites | +0.103 |
nests | +0.100 |
keeping | +0.098 |
Neg logit contributions | |
not | -0.065 |
" | -0.052 |
and | -0.052 |
because | -0.051 |
: | -0.050 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.79e+01 |
Pos logit contributions | |
not | +0.002 |
and | +0.002 |
because | +0.002 |
for | +0.002 |
, | +0.002 |
Neg logit contributions | |
Ta | -0.003 |
ites | -0.003 |
umm | -0.003 |
asis | -0.003 |
andel | -0.003 |
Token | ." |
Token ID | 526 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
asis | +1.238 |
ites | +1.230 |
ymes | +1.206 |
pter | +1.187 |
ulture | +1.180 |
Neg logit contributions | |
not | -0.658 |
and | -0.594 |
because | -0.565 |
but | -0.560 |
" | -0.519 |
Token |
|
Token ID | 198 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
crow | +0.037 |
keeping | +0.037 |
ites | +0.037 |
pige | +0.037 |
folk | +0.036 |
Neg logit contributions | |
not | -0.019 |
and | -0.016 |
because | -0.015 |
for | -0.015 |
just | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
ymes | +0.087 |
asis | +0.087 |
andel | +0.086 |
Ta | +0.086 |
robat | +0.086 |
Neg logit contributions | |
not | -0.025 |
and | -0.022 |
because | -0.019 |
but | -0.015 |
, | -0.014 |
Token | Then |
Token ID | 6423 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
ymes | +0.034 |
asis | +0.033 |
andel | +0.033 |
robat | +0.033 |
Ta | +0.033 |
Neg logit contributions | |
not | -0.028 |
and | -0.026 |
because | -0.024 |
but | -0.022 |
, | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+00 |
Pos logit contributions | |
not | +0.094 |
and | +0.082 |
because | +0.070 |
but | +0.054 |
" | +0.045 |
Neg logit contributions | |
asis | -0.349 |
seas | -0.348 |
crow | -0.346 |
ymes | -0.346 |
ites | -0.345 |
Token | saw |
Token ID | 2497 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
ymes | +0.122 |
asis | +0.119 |
Ta | +0.118 |
seas | +0.117 |
ites | +0.116 |
Neg logit contributions | |
not | -0.058 |
and | -0.052 |
because | -0.050 |
but | -0.044 |
for | -0.043 |
Token | clown |
Token ID | 25573 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
asis | +0.136 |
robat | +0.134 |
andel | +0.134 |
ymes | +0.133 |
umm | +0.131 |
Neg logit contributions | |
not | -0.065 |
and | -0.063 |
because | -0.052 |
, | -0.047 |
but | -0.047 |
Token | s |
Token ID | 82 |
Feature activation | +5.96e+00 |
Pos logit contributions | |
asis | +0.528 |
ymes | +0.528 |
andel | +0.526 |
robat | +0.521 |
Ta | +0.515 |
Neg logit contributions | |
not | -0.326 |
and | -0.304 |
because | -0.268 |
but | -0.245 |
, | -0.240 |
Token | and |
Token ID | 290 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
asis | +0.140 |
nests | +0.139 |
ymes | +0.137 |
ites | +0.136 |
keeping | +0.135 |
Neg logit contributions | |
not | -0.023 |
because | -0.013 |
and | -0.007 |
but | -0.006 |
they | -0.005 |
Token | ac |
Token ID | 936 |
Feature activation | +4.23e+01 |
Pos logit contributions | |
not | +0.028 |
and | +0.026 |
because | +0.024 |
but | +0.023 |
, | +0.022 |
Neg logit contributions | |
ymes | -0.026 |
asis | -0.026 |
andel | -0.026 |
robat | -0.025 |
Ta | -0.025 |
Token | rob |
Token ID | 22609 |
Feature activation | +6.78e+01 |
Pos logit contributions | |
andel | +0.270 |
umm | +0.245 |
Ta | +0.225 |
ocol | +0.197 |
igsaw | +0.189 |
Neg logit contributions | |
and | -1.079 |
not | -1.029 |
. | -0.962 |
, | -0.962 |
because | -0.958 |
Token | ats |
Token ID | 1381 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
andel | +0.585 |
asis | +0.583 |
ymes | +0.579 |
robat | +0.562 |
Ta | +0.561 |
Neg logit contributions | |
not | -1.448 |
and | -1.401 |
because | -1.308 |
, | -1.252 |
but | -1.250 |
Token | and |
Token ID | 290 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
robat | +0.399 |
crow | +0.395 |
asis | +0.395 |
orns | +0.394 |
ymes | +0.394 |
Neg logit contributions | |
not | -0.069 |
because | -0.026 |
and | -0.022 |
but | -0.011 |
" | -0.003 |
Token | lions |
Token ID | 31420 |
Feature activation | +3.44e+01 |
Pos logit contributions | |
not | +0.029 |
and | +0.028 |
because | +0.026 |
but | +0.024 |
, | +0.024 |
Neg logit contributions | |
asis | -0.019 |
ymes | -0.019 |
andel | -0.019 |
robat | -0.018 |
Ta | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -9.09e-01 |
Pos logit contributions | |
asis | +0.870 |
ymes | +0.865 |
robat | +0.861 |
orns | +0.849 |
andel | +0.847 |
Neg logit contributions | |
not | -0.146 |
and | -0.084 |
because | -0.066 |
but | -0.037 |
" | -0.030 |
Token | elephants |
Token ID | 25368 |
Feature activation | +2.92e+01 |
Pos logit contributions | |
not | +0.017 |
and | +0.017 |
because | +0.016 |
but | +0.015 |
, | +0.015 |
Neg logit contributions | |
asis | -0.010 |
andel | -0.010 |
ymes | -0.010 |
robat | -0.010 |
umm | -0.010 |
Token | soon |
Token ID | 2582 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
not | +0.038 |
and | +0.037 |
because | +0.033 |
but | +0.031 |
" | +0.030 |
Neg logit contributions | |
andel | -0.072 |
asis | -0.072 |
nests | -0.072 |
ymes | -0.070 |
Ta | -0.069 |
Token | nothing |
Token ID | 2147 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
not | +0.040 |
and | +0.034 |
because | +0.033 |
" | +0.032 |
: | +0.030 |
Neg logit contributions | |
asis | -0.059 |
nests | -0.058 |
andel | -0.057 |
seas | -0.055 |
ymes | -0.055 |
Token | but |
Token ID | 475 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
ymes | +0.262 |
worm | +0.262 |
asis | +0.260 |
pillar | +0.257 |
crow | +0.254 |
Neg logit contributions | |
not | -0.161 |
and | -0.140 |
because | -0.126 |
" | -0.121 |
: | -0.116 |
Token | a |
Token ID | 257 |
Feature activation | +8.51e+00 |
Pos logit contributions | |
not | +0.021 |
and | +0.018 |
because | +0.016 |
but | +0.015 |
" | +0.015 |
Neg logit contributions | |
ymes | -0.044 |
asis | -0.043 |
nests | -0.043 |
Ta | -0.042 |
andel | -0.042 |
Token | small |
Token ID | 1402 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
asis | +0.137 |
ymes | +0.136 |
andel | +0.136 |
robat | +0.135 |
Ta | +0.134 |
Neg logit contributions | |
not | -0.119 |
and | -0.114 |
because | -0.102 |
but | -0.096 |
, | -0.095 |
Token | spe |
Token ID | 693 |
Feature activation | +6.67e+01 |
Pos logit contributions | |
andel | +0.214 |
asis | +0.214 |
ymes | +0.213 |
robat | +0.209 |
Ta | +0.205 |
Neg logit contributions | |
not | -0.269 |
and | -0.254 |
because | -0.234 |
but | -0.221 |
" | -0.217 |
Token | ck |
Token ID | 694 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
umm | +0.915 |
ival | +0.885 |
pill | +0.878 |
Ta | +0.877 |
ymes | +0.874 |
Neg logit contributions | |
not | -1.179 |
and | -1.126 |
because | -1.005 |
. | -0.985 |
, | -0.970 |
Token | in |
Token ID | 287 |
Feature activation | +8.70e+00 |
Pos logit contributions | |
asis | +0.321 |
ymes | +0.320 |
andel | +0.319 |
emaker | +0.319 |
crow | +0.318 |
Neg logit contributions | |
not | -0.327 |
and | -0.270 |
because | -0.266 |
" | -0.248 |
but | -0.245 |
Token | the |
Token ID | 262 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
andel | +0.173 |
ymes | +0.168 |
ocol | +0.166 |
asis | +0.165 |
Ta | +0.165 |
Neg logit contributions | |
not | -0.087 |
and | -0.077 |
because | -0.068 |
but | -0.061 |
" | -0.060 |
Token | sky |
Token ID | 6766 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
ymes | +0.195 |
robat | +0.191 |
ites | +0.187 |
emaker | +0.187 |
orns | +0.182 |
Neg logit contributions | |
and | -0.306 |
not | -0.301 |
because | -0.275 |
. | -0.267 |
, | -0.267 |
Token | . |
Token ID | 13 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
asis | +0.481 |
ymes | +0.457 |
nests | +0.457 |
pillar | +0.456 |
crow | +0.454 |
Neg logit contributions | |
not | -0.141 |
and | -0.075 |
because | -0.070 |
" | -0.061 |
but | -0.057 |
Token | kind |
Token ID | 1611 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
ymes | +0.041 |
asis | +0.040 |
andel | +0.039 |
ites | +0.039 |
robat | +0.039 |
Neg logit contributions | |
not | -0.030 |
and | -0.028 |
because | -0.026 |
but | -0.024 |
: | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
ymes | +0.362 |
keeping | +0.353 |
andel | +0.351 |
ites | +0.351 |
umm | +0.349 |
Neg logit contributions | |
not | -0.085 |
and | -0.054 |
because | -0.043 |
but | -0.036 |
they | -0.036 |
Token | Thank |
Token ID | 6952 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
not | +0.055 |
and | +0.052 |
because | +0.044 |
for | +0.042 |
, | +0.041 |
Neg logit contributions | |
umm | -0.081 |
Ta | -0.080 |
crow | -0.078 |
unn | -0.078 |
ocol | -0.077 |
Token | you |
Token ID | 345 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
ymes | +0.103 |
asis | +0.103 |
andel | +0.103 |
robat | +0.101 |
Ta | +0.101 |
Neg logit contributions | |
not | -0.074 |
and | -0.070 |
because | -0.062 |
but | -0.058 |
, | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
andel | +0.063 |
unn | +0.060 |
ymes | +0.060 |
umm | +0.058 |
pillar | +0.058 |
Neg logit contributions | |
not | -0.017 |
and | -0.011 |
because | -0.008 |
still | -0.008 |
they | -0.007 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.51e+01 |
Pos logit contributions | |
not | +0.049 |
and | +0.047 |
because | +0.041 |
but | +0.039 |
, | +0.038 |
Neg logit contributions | |
Ta | -0.057 |
umm | -0.056 |
ocol | -0.056 |
robat | -0.054 |
andel | -0.054 |
Token | ." |
Token ID | 526 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
asis | +1.191 |
ymes | +1.187 |
ites | +1.185 |
andel | +1.171 |
unn | +1.142 |
Neg logit contributions | |
not | -0.664 |
and | -0.616 |
because | -0.545 |
but | -0.537 |
" | -0.484 |
Token |
|
Token ID | 198 |
Feature activation | +6.41e+00 |
Pos logit contributions | |
pill | +0.028 |
orns | +0.028 |
pillar | +0.028 |
Ta | +0.028 |
ites | +0.028 |
Neg logit contributions | |
not | -0.016 |
and | -0.012 |
because | -0.012 |
for | -0.011 |
just | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +6.22e+00 |
Pos logit contributions | |
ymes | +0.142 |
Ta | +0.141 |
andel | +0.141 |
asis | +0.141 |
robat | +0.140 |
Neg logit contributions | |
not | -0.044 |
and | -0.038 |
because | -0.034 |
but | -0.028 |
, | -0.025 |
Token | Then |
Token ID | 6423 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
ymes | +0.102 |
asis | +0.101 |
andel | +0.101 |
robat | +0.100 |
Ta | +0.100 |
Neg logit contributions | |
not | -0.085 |
and | -0.081 |
because | -0.073 |
but | -0.068 |
, | -0.067 |
Token | she |
Token ID | 673 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
not | +0.053 |
and | +0.048 |
because | +0.040 |
but | +0.034 |
" | +0.030 |
Neg logit contributions | |
seas | -0.166 |
andel | -0.164 |
ymes | -0.162 |
Ta | -0.162 |
nests | -0.161 |
Token | monkeys |
Token ID | 26697 |
Feature activation | +6.75e+01 |
Pos logit contributions | |
ymes | +0.911 |
andel | +0.903 |
asis | +0.894 |
robat | +0.890 |
Ta | +0.887 |
Neg logit contributions | |
not | -0.282 |
and | -0.243 |
because | -0.200 |
but | -0.167 |
, | -0.159 |
Token | , |
Token ID | 11 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
asis | +1.539 |
ymes | +1.481 |
nests | +1.471 |
orns | +1.467 |
robat | +1.463 |
Neg logit contributions | |
not | -0.387 |
and | -0.272 |
because | -0.258 |
" | -0.211 |
but | -0.193 |
Token | elephants |
Token ID | 25368 |
Feature activation | +4.87e+01 |
Pos logit contributions | |
nests | +0.566 |
pige | +0.566 |
crow | +0.559 |
pill | +0.554 |
ymes | +0.553 |
Neg logit contributions | |
not | -0.271 |
and | -0.226 |
because | -0.214 |
: | -0.192 |
for | -0.181 |
Token | , |
Token ID | 11 |
Feature activation | +2.30e+01 |
Pos logit contributions | |
asis | +1.121 |
ites | +1.098 |
crow | +1.090 |
folk | +1.088 |
orns | +1.085 |
Neg logit contributions | |
not | -0.233 |
because | -0.127 |
and | -0.108 |
but | -0.074 |
" | -0.070 |
Token | gir |
Token ID | 37370 |
Feature activation | +5.76e+01 |
Pos logit contributions | |
nests | +0.479 |
pige | +0.477 |
oceans | +0.471 |
lakes | +0.470 |
rivers | +0.467 |
Neg logit contributions | |
not | -0.129 |
because | -0.089 |
and | -0.083 |
: | -0.069 |
for | -0.063 |
Token | aff |
Token ID | 2001 |
Feature activation | +6.43e+01 |
Pos logit contributions | |
ymes | +0.210 |
asis | +0.205 |
andel | +0.199 |
Ta | +0.193 |
robat | +0.189 |
Neg logit contributions | |
not | -1.513 |
and | -1.492 |
because | -1.404 |
, | -1.363 |
but | -1.358 |
Token | es |
Token ID | 274 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
ymes | +0.694 |
asis | +0.693 |
robat | +0.676 |
ites | +0.675 |
orns | +0.674 |
Neg logit contributions | |
not | -1.194 |
and | -1.119 |
because | -1.074 |
but | -1.035 |
" | -0.996 |
Token | , |
Token ID | 11 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
asis | +0.365 |
orns | +0.362 |
pillar | +0.358 |
robat | +0.357 |
nests | +0.356 |
Neg logit contributions | |
not | -0.084 |
because | -0.050 |
and | -0.034 |
but | -0.029 |
for | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +4.98e+00 |
Pos logit contributions | |
nests | +0.250 |
pill | +0.247 |
oceans | +0.245 |
pige | +0.245 |
asis | +0.244 |
Neg logit contributions | |
not | -0.102 |
because | -0.082 |
and | -0.075 |
but | -0.063 |
for | -0.062 |
Token | lions |
Token ID | 31420 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
ymes | +0.054 |
asis | +0.053 |
andel | +0.053 |
orns | +0.052 |
nests | +0.052 |
Neg logit contributions | |
not | -0.091 |
and | -0.086 |
because | -0.081 |
but | -0.077 |
, | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | +8.64e+00 |
Pos logit contributions | |
asis | +0.875 |
ymes | +0.855 |
robat | +0.848 |
orns | +0.847 |
ites | +0.842 |
Neg logit contributions | |
not | -0.190 |
and | -0.118 |
because | -0.110 |
but | -0.086 |
" | -0.074 |
Token | the |
Token ID | 262 |
Feature activation | +1.19e+01 |
Pos logit contributions | |
asis | +0.026 |
andel | +0.026 |
Ta | +0.025 |
ymes | +0.025 |
robat | +0.025 |
Neg logit contributions | |
not | -0.012 |
and | -0.012 |
because | -0.010 |
but | -0.009 |
, | -0.009 |
Token | animals |
Token ID | 4695 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
emaker | +0.165 |
andel | +0.163 |
Ta | +0.160 |
keeping | +0.157 |
asis | +0.157 |
Neg logit contributions | |
and | -0.202 |
not | -0.198 |
because | -0.174 |
but | -0.171 |
. | -0.171 |
Token | , |
Token ID | 11 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
asis | +0.385 |
ites | +0.376 |
robat | +0.372 |
ymes | +0.368 |
nests | +0.367 |
Neg logit contributions | |
not | -0.057 |
and | -0.019 |
because | -0.015 |
" | -0.010 |
but | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
not | +0.030 |
and | +0.026 |
: | +0.022 |
because | +0.021 |
. | +0.019 |
Neg logit contributions | |
seas | -0.092 |
pige | -0.092 |
andel | -0.090 |
nests | -0.090 |
asis | -0.090 |
Token | ac |
Token ID | 936 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
andel | +0.156 |
emaker | +0.155 |
Ta | +0.155 |
asis | +0.152 |
umm | +0.150 |
Neg logit contributions | |
not | -0.218 |
and | -0.218 |
because | -0.192 |
but | -0.190 |
" | -0.187 |
Token | rob |
Token ID | 22609 |
Feature activation | +6.32e+01 |
Pos logit contributions | |
andel | +0.242 |
Ta | +0.220 |
umm | +0.214 |
ocol | +0.193 |
ymes | +0.193 |
Neg logit contributions | |
and | -0.909 |
not | -0.880 |
, | -0.821 |
because | -0.821 |
. | -0.806 |
Token | ats |
Token ID | 1381 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
andel | +0.574 |
ymes | +0.561 |
Ta | +0.557 |
asis | +0.556 |
umm | +0.542 |
Neg logit contributions | |
not | -1.334 |
and | -1.289 |
because | -1.199 |
, | -1.155 |
but | -1.138 |
Token | and |
Token ID | 290 |
Feature activation | -7.85e+00 |
Pos logit contributions | |
asis | +0.244 |
robat | +0.243 |
ites | +0.241 |
folk | +0.241 |
andel | +0.236 |
Neg logit contributions | |
not | -0.053 |
and | -0.026 |
because | -0.025 |
but | -0.016 |
to | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
not | +0.079 |
and | +0.075 |
because | +0.064 |
but | +0.058 |
, | +0.057 |
Neg logit contributions | |
asis | -0.157 |
ymes | -0.156 |
andel | -0.156 |
robat | -0.155 |
Ta | -0.154 |
Token | clown |
Token ID | 25573 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
asis | +0.155 |
andel | +0.155 |
emaker | +0.155 |
Ta | +0.154 |
igsaw | +0.151 |
Neg logit contributions | |
and | -0.211 |
not | -0.209 |
but | -0.187 |
because | -0.184 |
. | -0.181 |
Token | s |
Token ID | 82 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
asis | +0.409 |
ites | +0.403 |
robat | +0.402 |
ymes | +0.400 |
andel | +0.391 |
Neg logit contributions | |
not | -0.264 |
and | -0.226 |
because | -0.208 |
but | -0.196 |
" | -0.183 |
Token | like |
Token ID | 588 |
Feature activation | +3.83e+01 |
Pos logit contributions | |
andel | +0.320 |
ymes | +0.318 |
asis | +0.315 |
robat | +0.314 |
Ta | +0.313 |
Neg logit contributions | |
not | -0.144 |
and | -0.134 |
because | -0.110 |
, | -0.099 |
but | -0.096 |
Token | to |
Token ID | 284 |
Feature activation | +3.98e+01 |
Pos logit contributions | |
ymes | +0.740 |
seas | +0.734 |
nests | +0.731 |
orns | +0.723 |
pige | +0.723 |
Neg logit contributions | |
not | -0.331 |
and | -0.294 |
because | -0.253 |
but | -0.232 |
: | -0.228 |
Token | collect |
Token ID | 2824 |
Feature activation | +5.18e+01 |
Pos logit contributions | |
asis | +0.658 |
andel | +0.632 |
nests | +0.631 |
robat | +0.630 |
ocol | +0.629 |
Neg logit contributions | |
not | -0.473 |
and | -0.455 |
because | -0.412 |
" | -0.384 |
but | -0.383 |
Token | things |
Token ID | 1243 |
Feature activation | +5.36e+01 |
Pos logit contributions | |
asis | +0.848 |
ymes | +0.846 |
andel | +0.846 |
robat | +0.835 |
Ta | +0.827 |
Neg logit contributions | |
not | -0.699 |
and | -0.663 |
because | -0.594 |
but | -0.554 |
, | -0.547 |
Token | . |
Token ID | 13 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
ites | +1.089 |
orns | +1.075 |
seas | +1.060 |
asis | +1.040 |
ite | +1.029 |
Neg logit contributions | |
not | -0.366 |
" | -0.277 |
and | -0.223 |
: | -0.200 |
because | -0.195 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +6.31e+01 |
Pos logit contributions | |
asis | +0.572 |
andel | +0.572 |
ymes | +0.568 |
robat | +0.565 |
Ta | +0.562 |
Neg logit contributions | |
not | -0.283 |
and | -0.258 |
because | -0.219 |
but | -0.196 |
, | -0.194 |
Token | L |
Token ID | 43 |
Feature activation | +4.08e+01 |
Pos logit contributions | |
asis | +1.474 |
ymes | +1.470 |
andel | +1.465 |
robat | +1.459 |
Ta | +1.445 |
Neg logit contributions | |
not | -0.409 |
and | -0.356 |
because | -0.280 |
but | -0.228 |
, | -0.215 |
Token | ily |
Token ID | 813 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
asis | +0.546 |
umm | +0.546 |
ymes | +0.541 |
andel | +0.532 |
robat | +0.532 |
Neg logit contributions | |
not | -0.693 |
and | -0.680 |
because | -0.604 |
, | -0.581 |
. | -0.579 |
Token | was |
Token ID | 373 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
pillar | +0.584 |
orns | +0.582 |
asis | +0.581 |
orn | +0.569 |
ites | +0.560 |
Neg logit contributions | |
not | -0.185 |
because | -0.090 |
but | -0.086 |
they | -0.081 |
" | -0.079 |
Token | hungry |
Token ID | 14720 |
Feature activation | +2.88e+01 |
Pos logit contributions | |
andel | +0.204 |
Ta | +0.201 |
ymes | +0.197 |
ocol | +0.196 |
asis | +0.196 |
Neg logit contributions | |
not | -0.106 |
and | -0.094 |
because | -0.088 |
but | -0.083 |
they | -0.079 |
Token | . |
Token ID | 13 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
andel | +0.621 |
asis | +0.615 |
seas | +0.613 |
umm | +0.595 |
nests | +0.587 |
Neg logit contributions | |
not | -0.174 |
they | -0.074 |
still | -0.065 |
" | -0.060 |
their | -0.048 |
Token | put |
Token ID | 1234 |
Feature activation | +5.85e+01 |
Pos logit contributions | |
ymes | +0.110 |
robat | +0.109 |
asis | +0.108 |
andel | +0.108 |
orns | +0.107 |
Neg logit contributions | |
not | -0.081 |
and | -0.076 |
because | -0.067 |
" | -0.065 |
but | -0.064 |
Token | flour |
Token ID | 10601 |
Feature activation | +8.30e+01 |
Pos logit contributions | |
ymes | +1.197 |
andel | +1.194 |
robat | +1.194 |
asis | +1.189 |
orns | +1.187 |
Neg logit contributions | |
not | -0.532 |
and | -0.451 |
because | -0.401 |
but | -0.352 |
" | -0.343 |
Token | , |
Token ID | 11 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
ites | +1.786 |
asis | +1.785 |
orns | +1.783 |
seas | +1.761 |
keeping | +1.750 |
Neg logit contributions | |
not | -0.563 |
" | -0.274 |
because | -0.263 |
: | -0.214 |
and | -0.184 |
Token | water |
Token ID | 1660 |
Feature activation | +3.88e+01 |
Pos logit contributions | |
seas | +0.272 |
nests | +0.260 |
andel | +0.256 |
ites | +0.254 |
ocol | +0.253 |
Neg logit contributions | |
not | -0.561 |
: | -0.506 |
because | -0.494 |
and | -0.488 |
" | -0.478 |
Token | , |
Token ID | 11 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
asis | +0.867 |
orns | +0.856 |
ites | +0.843 |
nests | +0.832 |
crow | +0.831 |
Neg logit contributions | |
not | -0.215 |
because | -0.111 |
" | -0.075 |
and | -0.074 |
but | -0.066 |
Token | yeast |
Token ID | 20146 |
Feature activation | +6.29e+01 |
Pos logit contributions | |
seas | +0.286 |
nests | +0.283 |
orns | +0.271 |
lakes | +0.268 |
pige | +0.267 |
Neg logit contributions | |
not | -0.251 |
: | -0.228 |
because | -0.208 |
" | -0.207 |
and | -0.197 |
Token | and |
Token ID | 290 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
asis | +1.419 |
orns | +1.380 |
seas | +1.356 |
ites | +1.350 |
pter | +1.336 |
Neg logit contributions | |
not | -0.317 |
" | -0.184 |
because | -0.182 |
and | -0.139 |
but | -0.123 |
Token | salt |
Token ID | 8268 |
Feature activation | +4.46e+01 |
Pos logit contributions | |
nests | +0.121 |
ocol | +0.120 |
ymes | +0.119 |
seas | +0.119 |
asis | +0.119 |
Neg logit contributions | |
not | -0.188 |
and | -0.176 |
because | -0.171 |
: | -0.162 |
but | -0.159 |
Token | in |
Token ID | 287 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
asis | +0.936 |
orns | +0.932 |
ocol | +0.897 |
ites | +0.891 |
seas | +0.890 |
Neg logit contributions | |
not | -0.271 |
because | -0.182 |
" | -0.154 |
but | -0.138 |
and | -0.131 |
Token | a |
Token ID | 257 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
ocol | +0.336 |
andel | +0.326 |
seas | +0.324 |
orns | +0.323 |
nests | +0.321 |
Neg logit contributions | |
not | -0.176 |
and | -0.149 |
because | -0.144 |
: | -0.134 |
" | -0.127 |
Token | big |
Token ID | 1263 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
ymes | +0.205 |
andel | +0.204 |
asis | +0.204 |
robat | +0.201 |
Ta | +0.200 |
Neg logit contributions | |
not | -0.260 |
and | -0.251 |
because | -0.228 |
but | -0.217 |
, | -0.216 |
Token | , |
Token ID | 11 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
andel | +0.158 |
Ta | +0.156 |
ymes | +0.156 |
robat | +0.156 |
asis | +0.154 |
Neg logit contributions | |
not | -0.050 |
and | -0.045 |
because | -0.034 |
but | -0.032 |
" | -0.031 |
Token | he |
Token ID | 339 |
Feature activation | +2.85e+01 |
Pos logit contributions | |
asis | +0.501 |
seas | +0.494 |
nests | +0.493 |
crow | +0.492 |
andel | +0.491 |
Neg logit contributions | |
not | -0.186 |
and | -0.152 |
because | -0.140 |
: | -0.120 |
. | -0.103 |
Token | spun |
Token ID | 26843 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
asis | +0.520 |
ymes | +0.497 |
ites | +0.494 |
seas | +0.492 |
pillar | +0.490 |
Neg logit contributions | |
not | -0.288 |
and | -0.257 |
because | -0.252 |
but | -0.229 |
" | -0.211 |
Token | himself |
Token ID | 2241 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
robat | +0.720 |
andel | +0.713 |
ymes | +0.709 |
seas | +0.708 |
asis | +0.706 |
Neg logit contributions | |
not | -0.303 |
and | -0.240 |
because | -0.212 |
" | -0.185 |
they | -0.183 |
Token | a |
Token ID | 257 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
asis | +0.359 |
andel | +0.353 |
ymes | +0.352 |
ites | +0.352 |
robat | +0.348 |
Neg logit contributions | |
not | -0.192 |
and | -0.160 |
because | -0.153 |
" | -0.144 |
they | -0.138 |
Token | coc |
Token ID | 8954 |
Feature activation | +6.27e+01 |
Pos logit contributions | |
orns | +0.392 |
ites | +0.381 |
unn | +0.379 |
keeping | +0.378 |
umm | +0.378 |
Neg logit contributions | |
not | -0.319 |
and | -0.319 |
but | -0.271 |
, | -0.269 |
because | -0.268 |
Token | oon |
Token ID | 2049 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
asis | +0.487 |
robat | +0.481 |
andel | +0.476 |
ymes | +0.471 |
orns | +0.451 |
Neg logit contributions | |
not | -1.388 |
and | -1.329 |
because | -1.259 |
but | -1.212 |
" | -1.195 |
Token | and |
Token ID | 290 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
robat | +0.336 |
asis | +0.331 |
ymes | +0.326 |
ites | +0.324 |
keeping | +0.323 |
Neg logit contributions | |
not | -0.119 |
and | -0.076 |
" | -0.070 |
because | -0.070 |
they | -0.063 |
Token | never |
Token ID | 1239 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
asis | +0.120 |
ymes | +0.119 |
robat | +0.118 |
andel | +0.118 |
Ta | +0.117 |
Neg logit contributions | |
not | -0.065 |
and | -0.061 |
because | -0.053 |
but | -0.048 |
, | -0.047 |
Token | came |
Token ID | 1625 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
asis | +0.235 |
ymes | +0.233 |
andel | +0.233 |
robat | +0.231 |
Ta | +0.230 |
Neg logit contributions | |
not | -0.144 |
and | -0.133 |
because | -0.114 |
but | -0.104 |
" | -0.104 |
Token | out |
Token ID | 503 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
andel | +0.336 |
ymes | +0.333 |
asis | +0.332 |
orns | +0.329 |
nests | +0.327 |
Neg logit contributions | |
not | -0.096 |
and | -0.085 |
because | -0.067 |
they | -0.056 |
but | -0.055 |
Token | John |
Token ID | 1757 |
Feature activation | +8.64e+00 |
Pos logit contributions | |
ymes | +0.337 |
Ta | +0.334 |
asis | +0.334 |
ites | +0.333 |
robat | +0.331 |
Neg logit contributions | |
not | -0.213 |
and | -0.184 |
because | -0.173 |
but | -0.161 |
" | -0.153 |
Token | chose |
Token ID | 7690 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
asis | +0.162 |
folk | +0.159 |
pter | +0.158 |
robat | +0.157 |
keeping | +0.157 |
Neg logit contributions | |
not | -0.087 |
because | -0.067 |
and | -0.064 |
but | -0.058 |
" | -0.056 |
Token | some |
Token ID | 617 |
Feature activation | +2.06e+01 |
Pos logit contributions | |
seas | +0.241 |
ymes | +0.239 |
orns | +0.236 |
ites | +0.235 |
nests | +0.235 |
Neg logit contributions | |
not | -0.085 |
and | -0.066 |
because | -0.059 |
but | -0.050 |
" | -0.046 |
Token | carrots |
Token ID | 34397 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
ymes | +0.275 |
andel | +0.275 |
asis | +0.269 |
ocol | +0.268 |
ites | +0.265 |
Neg logit contributions | |
not | -0.336 |
and | -0.305 |
because | -0.288 |
" | -0.268 |
but | -0.268 |
Token | and |
Token ID | 290 |
Feature activation | +6.54e+00 |
Pos logit contributions | |
worm | +0.728 |
asis | +0.725 |
orns | +0.720 |
ites | +0.719 |
ite | +0.707 |
Neg logit contributions | |
not | -0.220 |
" | -0.091 |
because | -0.087 |
and | -0.071 |
but | -0.061 |
Token | cuc |
Token ID | 38421 |
Feature activation | +6.27e+01 |
Pos logit contributions | |
asis | +0.111 |
nests | +0.109 |
seas | +0.109 |
orns | +0.108 |
andel | +0.108 |
Neg logit contributions | |
not | -0.076 |
and | -0.067 |
because | -0.062 |
but | -0.056 |
: | -0.056 |
Token | umbers |
Token ID | 17024 |
Feature activation | +3.97e+01 |
Pos logit contributions | |
asis | +0.359 |
ymes | +0.353 |
andel | +0.352 |
Ta | +0.339 |
robat | +0.335 |
Neg logit contributions | |
not | -1.497 |
and | -1.472 |
because | -1.374 |
, | -1.330 |
but | -1.329 |
Token | to |
Token ID | 284 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
asis | +0.832 |
orns | +0.815 |
ocol | +0.815 |
arrow | +0.815 |
pter | +0.815 |
Neg logit contributions | |
not | -0.244 |
because | -0.165 |
and | -0.146 |
but | -0.128 |
" | -0.111 |
Token | take |
Token ID | 1011 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
asis | +0.208 |
ocol | +0.205 |
andel | +0.205 |
robat | +0.201 |
ymes | +0.197 |
Neg logit contributions | |
not | -0.144 |
and | -0.138 |
because | -0.125 |
but | -0.115 |
" | -0.112 |
Token | home |
Token ID | 1363 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
andel | +0.360 |
asis | +0.359 |
ymes | +0.359 |
robat | +0.355 |
Ta | +0.352 |
Neg logit contributions | |
not | -0.172 |
and | -0.158 |
because | -0.136 |
but | -0.122 |
, | -0.118 |
Token | . |
Token ID | 13 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
andel | +0.573 |
asis | +0.569 |
ymes | +0.568 |
ocol | +0.564 |
keeping | +0.562 |
Neg logit contributions | |
not | -0.145 |
and | -0.104 |
because | -0.088 |
but | -0.072 |
" | -0.072 |
Token | important |
Token ID | 1593 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
andel | +0.600 |
asis | +0.593 |
robat | +0.591 |
ymes | +0.589 |
ites | +0.586 |
Neg logit contributions | |
not | -0.064 |
and | -0.010 |
because | +0.003 |
" | +0.011 |
but | +0.015 |
Token | to |
Token ID | 284 |
Feature activation | +3.07e+01 |
Pos logit contributions | |
keeping | +0.342 |
orns | +0.341 |
asis | +0.333 |
seas | +0.333 |
crow | +0.331 |
Neg logit contributions | |
not | -0.263 |
and | -0.222 |
because | -0.204 |
" | -0.203 |
they | -0.199 |
Token | be |
Token ID | 307 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
asis | +0.549 |
nests | +0.531 |
keeping | +0.526 |
handed | +0.522 |
robat | +0.519 |
Neg logit contributions | |
and | -0.311 |
not | -0.295 |
because | -0.276 |
" | -0.258 |
but | -0.258 |
Token | careful |
Token ID | 8161 |
Feature activation | +4.37e+01 |
Pos logit contributions | |
ymes | +0.461 |
nests | +0.455 |
ites | +0.446 |
handed | +0.446 |
orns | +0.441 |
Neg logit contributions | |
not | -0.461 |
and | -0.456 |
because | -0.429 |
: | -0.423 |
but | -0.419 |
Token | . |
Token ID | 13 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
ites | +0.941 |
keeping | +0.940 |
ymes | +0.934 |
emaker | +0.928 |
crow | +0.917 |
Neg logit contributions | |
not | -0.185 |
and | -0.123 |
" | -0.112 |
because | -0.107 |
: | -0.084 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +6.26e+01 |
Pos logit contributions | |
asis | +0.514 |
andel | +0.512 |
ymes | +0.507 |
robat | +0.507 |
Ta | +0.506 |
Neg logit contributions | |
not | -0.235 |
and | -0.213 |
because | -0.178 |
but | -0.160 |
, | -0.158 |
Token | Once |
Token ID | 7454 |
Feature activation | +4.73e+01 |
Pos logit contributions | |
asis | +1.395 |
ymes | +1.390 |
andel | +1.384 |
robat | +1.381 |
Ta | +1.365 |
Neg logit contributions | |
not | -0.475 |
and | -0.417 |
because | -0.345 |
but | -0.293 |
, | -0.278 |
Token | upon |
Token ID | 2402 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
andel | +0.792 |
ymes | +0.790 |
asis | +0.790 |
robat | +0.775 |
ites | +0.766 |
Neg logit contributions | |
not | -0.599 |
and | -0.563 |
because | -0.508 |
but | -0.470 |
, | -0.449 |
Token | a |
Token ID | 257 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
andel | +0.844 |
asis | +0.844 |
ymes | +0.837 |
robat | +0.835 |
umm | +0.828 |
Neg logit contributions | |
not | -0.145 |
and | -0.122 |
because | -0.076 |
but | -0.049 |
, | -0.045 |
Token | time |
Token ID | 640 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
asis | +0.408 |
andel | +0.405 |
ymes | +0.403 |
robat | +0.399 |
Ta | +0.393 |
Neg logit contributions | |
not | -0.337 |
and | -0.313 |
because | -0.288 |
" | -0.266 |
but | -0.266 |
Token | , |
Token ID | 11 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
asis | +0.522 |
ites | +0.516 |
unn | +0.512 |
andel | +0.512 |
ival | +0.509 |
Neg logit contributions | |
not | -0.129 |
and | -0.104 |
because | -0.087 |
for | -0.055 |
just | -0.055 |
Token | neck |
Token ID | 7393 |
Feature activation | +5.79e+01 |
Pos logit contributions | |
asis | +0.100 |
ymes | +0.096 |
nests | +0.096 |
umm | +0.096 |
andel | +0.095 |
Neg logit contributions | |
not | -0.071 |
and | -0.069 |
" | -0.060 |
because | -0.060 |
: | -0.058 |
Token | l |
Token ID | 75 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
asis | +1.364 |
andel | +1.353 |
orns | +1.344 |
robat | +1.342 |
ymes | +1.340 |
Neg logit contributions | |
not | -0.283 |
and | -0.180 |
because | -0.168 |
" | -0.129 |
but | -0.107 |
Token | aces |
Token ID | 2114 |
Feature activation | +4.63e+01 |
Pos logit contributions | |
asis | +0.677 |
robat | +0.672 |
ymes | +0.672 |
andel | +0.668 |
orns | +0.665 |
Neg logit contributions | |
not | -0.378 |
and | -0.327 |
because | -0.304 |
but | -0.278 |
" | -0.274 |
Token | , |
Token ID | 11 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
robat | +0.971 |
emaker | +0.956 |
orns | +0.953 |
asis | +0.949 |
ites | +0.949 |
Neg logit contributions | |
not | -0.338 |
and | -0.244 |
because | -0.236 |
" | -0.209 |
they | -0.192 |
Token | grape |
Token ID | 30777 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
nests | +0.296 |
andel | +0.295 |
asis | +0.294 |
seas | +0.294 |
oceans | +0.292 |
Neg logit contributions | |
not | -0.093 |
and | -0.071 |
because | -0.062 |
: | -0.054 |
, | -0.049 |
Token | brace |
Token ID | 22581 |
Feature activation | +6.24e+01 |
Pos logit contributions | |
orns | +0.836 |
ymes | +0.835 |
asis | +0.834 |
pillar | +0.833 |
robat | +0.832 |
Neg logit contributions | |
not | -0.380 |
and | -0.310 |
because | -0.284 |
but | -0.250 |
" | -0.232 |
Token | lets |
Token ID | 5289 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
asis | +0.522 |
ymes | +0.511 |
andel | +0.506 |
robat | +0.494 |
Ta | +0.492 |
Neg logit contributions | |
not | -1.361 |
and | -1.333 |
because | -1.238 |
, | -1.189 |
but | -1.188 |
Token | , |
Token ID | 11 |
Feature activation | +8.10e+00 |
Pos logit contributions | |
robat | +0.771 |
asis | +0.765 |
orns | +0.765 |
ites | +0.760 |
pter | +0.759 |
Neg logit contributions | |
not | -0.171 |
because | -0.083 |
and | -0.073 |
" | -0.055 |
they | -0.048 |
Token | and |
Token ID | 290 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
andel | +0.100 |
ymes | +0.100 |
asis | +0.098 |
robat | +0.097 |
Ta | +0.096 |
Neg logit contributions | |
not | -0.138 |
and | -0.129 |
because | -0.122 |
but | -0.113 |
, | -0.113 |
Token | grape |
Token ID | 30777 |
Feature activation | +3.50e+01 |
Pos logit contributions | |
ymes | +0.019 |
andel | +0.019 |
robat | +0.019 |
asis | +0.019 |
Ta | +0.019 |
Neg logit contributions | |
not | -0.020 |
and | -0.019 |
because | -0.017 |
but | -0.016 |
, | -0.016 |
Token | crown |
Token ID | 12389 |
Feature activation | +4.08e+01 |
Pos logit contributions | |
ymes | +0.705 |
asis | +0.696 |
robat | +0.694 |
andel | +0.693 |
orns | +0.693 |
Neg logit contributions | |
not | -0.327 |
and | -0.281 |
because | -0.251 |
but | -0.223 |
" | -0.209 |
Token | - |
Token ID | 532 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
asis | +0.672 |
orn | +0.647 |
orns | +0.626 |
robat | +0.623 |
pillar | +0.619 |
Neg logit contributions | |
not | -0.260 |
and | -0.190 |
because | -0.174 |
their | -0.165 |
but | -0.163 |
Token | it |
Token ID | 340 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
not | +0.082 |
and | +0.066 |
because | +0.062 |
: | +0.060 |
. | +0.054 |
Neg logit contributions | |
seas | -0.198 |
orn | -0.192 |
pillar | -0.191 |
orns | -0.189 |
nests | -0.189 |
Token | was |
Token ID | 373 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
orn | +0.290 |
asis | +0.290 |
pillar | +0.275 |
worm | +0.274 |
seas | +0.274 |
Neg logit contributions | |
not | -0.127 |
and | -0.108 |
because | -0.104 |
but | -0.097 |
" | -0.089 |
Token | bigger |
Token ID | 5749 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
not | +0.019 |
and | +0.019 |
because | +0.017 |
they | +0.016 |
but | +0.016 |
Neg logit contributions | |
seas | -0.044 |
nests | -0.042 |
andel | -0.042 |
ocol | -0.041 |
asis | -0.041 |
Token | and |
Token ID | 290 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
asis | +0.443 |
ymes | +0.442 |
andel | +0.440 |
robat | +0.437 |
orns | +0.432 |
Neg logit contributions | |
not | -0.174 |
and | -0.153 |
because | -0.129 |
but | -0.113 |
" | -0.110 |
Token | ju |
Token ID | 7544 |
Feature activation | +6.23e+01 |
Pos logit contributions | |
not | +0.053 |
and | +0.052 |
because | +0.047 |
: | +0.045 |
, | +0.044 |
Neg logit contributions | |
asis | -0.045 |
ymes | -0.045 |
seas | -0.045 |
Ta | -0.044 |
umm | -0.044 |
Token | ic |
Token ID | 291 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
andel | +0.523 |
Ta | +0.514 |
robat | +0.500 |
crow | +0.493 |
ymes | +0.490 |
Neg logit contributions | |
not | -1.327 |
and | -1.293 |
because | -1.182 |
. | -1.151 |
, | -1.147 |
Token | ier |
Token ID | 959 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
ymes | +0.303 |
andel | +0.302 |
asis | +0.302 |
robat | +0.301 |
emaker | +0.294 |
Neg logit contributions | |
not | -0.500 |
and | -0.474 |
because | -0.442 |
but | -0.429 |
" | -0.418 |
Token | than |
Token ID | 621 |
Feature activation | +6.21e+00 |
Pos logit contributions | |
keeping | +0.321 |
asis | +0.319 |
orns | +0.311 |
umm | +0.308 |
ymes | +0.305 |
Neg logit contributions | |
not | -0.160 |
and | -0.132 |
because | -0.119 |
" | -0.116 |
they | -0.114 |
Token | any |
Token ID | 597 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
asis | +0.111 |
andel | +0.110 |
ymes | +0.110 |
orns | +0.108 |
robat | +0.108 |
Neg logit contributions | |
not | -0.071 |
and | -0.067 |
because | -0.058 |
but | -0.054 |
, | -0.053 |
Token | he |
Token ID | 339 |
Feature activation | +5.04e+00 |
Pos logit contributions | |
andel | +0.212 |
Ta | +0.211 |
asis | +0.211 |
ymes | +0.210 |
robat | +0.209 |
Neg logit contributions | |
not | -0.200 |
and | -0.195 |
because | -0.174 |
but | -0.165 |
. | -0.165 |
Token | us |
Token ID | 514 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
not | +0.038 |
and | +0.037 |
because | +0.032 |
, | +0.030 |
but | +0.030 |
Neg logit contributions | |
asis | -0.050 |
andel | -0.050 |
ymes | -0.050 |
robat | -0.049 |
Ta | -0.049 |
Token | safe |
Token ID | 3338 |
Feature activation | +9.39e+00 |
Pos logit contributions | |
andel | +0.065 |
asis | +0.064 |
ymes | +0.064 |
robat | +0.064 |
Ta | +0.064 |
Neg logit contributions | |
not | -0.032 |
and | -0.030 |
because | -0.025 |
but | -0.022 |
, | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
keeping | +0.174 |
ymes | +0.173 |
asis | +0.171 |
ites | +0.166 |
nests | +0.165 |
Neg logit contributions | |
not | -0.097 |
" | -0.071 |
and | -0.071 |
because | -0.069 |
they | -0.068 |
Token | happy |
Token ID | 3772 |
Feature activation | +7.96e+00 |
Pos logit contributions | |
not | +0.158 |
and | +0.152 |
because | +0.136 |
but | +0.126 |
" | +0.125 |
Neg logit contributions | |
ymes | -0.210 |
asis | -0.209 |
Ta | -0.202 |
robat | -0.202 |
ites | -0.201 |
Token | . |
Token ID | 13 |
Feature activation | -7.00e+00 |
Pos logit contributions | |
ymes | +0.154 |
asis | +0.150 |
nests | +0.149 |
ites | +0.147 |
umm | +0.146 |
Neg logit contributions | |
not | -0.079 |
and | -0.064 |
because | -0.058 |
but | -0.055 |
" | -0.054 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.21e+01 |
Pos logit contributions | |
not | +0.104 |
and | +0.099 |
because | +0.089 |
, | +0.084 |
. | +0.083 |
Neg logit contributions | |
Ta | -0.098 |
ymes | -0.092 |
crow | -0.092 |
umm | -0.092 |
andel | -0.091 |
Token | ." |
Token ID | 526 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
ymes | +1.213 |
asis | +1.211 |
andel | +1.194 |
ites | +1.186 |
robat | +1.177 |
Neg logit contributions | |
not | -0.609 |
and | -0.568 |
because | -0.495 |
but | -0.460 |
" | -0.430 |
Token |
|
Token ID | 198 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
not | +0.010 |
and | +0.008 |
because | +0.008 |
for | +0.006 |
but | +0.006 |
Neg logit contributions | |
Ta | -0.024 |
ymes | -0.024 |
andel | -0.024 |
ites | -0.024 |
crow | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
ymes | +0.079 |
asis | +0.078 |
andel | +0.078 |
robat | +0.077 |
Ta | +0.077 |
Neg logit contributions | |
not | -0.020 |
and | -0.017 |
because | -0.014 |
but | -0.011 |
, | -0.010 |
Token | " |
Token ID | 1 |
Feature activation | +6.92e+00 |
Pos logit contributions | |
andel | +0.039 |
asis | +0.039 |
ymes | +0.039 |
robat | +0.038 |
Ta | +0.038 |
Neg logit contributions | |
not | -0.054 |
and | -0.052 |
because | -0.048 |
but | -0.045 |
, | -0.045 |
Token | A |
Token ID | 32 |
Feature activation | -4.20e+00 |
Pos logit contributions | |
ymes | +0.094 |
Ta | +0.092 |
robat | +0.091 |
asis | +0.090 |
andel | +0.090 |
Neg logit contributions | |
not | -0.115 |
and | -0.110 |
because | -0.102 |
, | -0.096 |
but | -0.095 |
Token | garden |
Token ID | 11376 |
Feature activation | +4.72e+01 |
Pos logit contributions | |
andel | +0.094 |
ocol | +0.091 |
umm | +0.090 |
Ta | +0.090 |
robat | +0.090 |
Neg logit contributions | |
not | -0.047 |
and | -0.043 |
because | -0.037 |
to | -0.033 |
: | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
asis | +1.067 |
seas | +1.037 |
nests | +1.027 |
orns | +1.025 |
ites | +1.014 |
Neg logit contributions | |
not | -0.275 |
because | -0.158 |
and | -0.141 |
but | -0.115 |
" | -0.114 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
andel | +0.443 |
asis | +0.440 |
Ta | +0.439 |
ites | +0.438 |
pillar | +0.437 |
Neg logit contributions | |
not | -0.231 |
and | -0.199 |
because | -0.171 |
for | -0.153 |
but | -0.152 |
Token | is |
Token ID | 318 |
Feature activation | +1.56e+01 |
Pos logit contributions | |
pillar | +0.540 |
asis | +0.535 |
ymes | +0.530 |
ites | +0.528 |
pill | +0.523 |
Neg logit contributions | |
not | -0.255 |
because | -0.186 |
but | -0.166 |
they | -0.157 |
and | -0.156 |
Token | the |
Token ID | 262 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
andel | +0.273 |
ymes | +0.272 |
asis | +0.271 |
nests | +0.268 |
Ta | +0.264 |
Neg logit contributions | |
and | -0.142 |
not | -0.138 |
because | -0.127 |
they | -0.117 |
but | -0.117 |
Token | seeker |
Token ID | 45993 |
Feature activation | +6.21e+01 |
Pos logit contributions | |
ymes | +0.419 |
asis | +0.418 |
andel | +0.418 |
robat | +0.413 |
Ta | +0.411 |
Neg logit contributions | |
not | -0.468 |
and | -0.447 |
because | -0.405 |
but | -0.385 |
, | -0.380 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
emaker | +1.489 |
pillar | +1.478 |
keeping | +1.457 |
robat | +1.446 |
andel | +1.446 |
Neg logit contributions | |
not | -0.275 |
and | -0.093 |
because | -0.085 |
they | -0.081 |
their | -0.081 |
Token | Ben |
Token ID | 3932 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
Ta | +0.218 |
ymes | +0.218 |
asis | +0.215 |
robat | +0.215 |
andel | +0.212 |
Neg logit contributions | |
and | -0.094 |
not | -0.092 |
because | -0.077 |
but | -0.071 |
: | -0.067 |
Token | is |
Token ID | 318 |
Feature activation | +9.78e+00 |
Pos logit contributions | |
asis | +0.388 |
robat | +0.378 |
ymes | +0.374 |
orns | +0.374 |
ites | +0.366 |
Neg logit contributions | |
not | -0.196 |
and | -0.159 |
because | -0.155 |
but | -0.148 |
" | -0.147 |
Token | the |
Token ID | 262 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
asis | +0.180 |
ymes | +0.178 |
nests | +0.176 |
crow | +0.173 |
robat | +0.172 |
Neg logit contributions | |
not | -0.089 |
and | -0.089 |
because | -0.077 |
but | -0.072 |
they | -0.068 |
Token | h |
Token ID | 289 |
Feature activation | +3.04e+01 |
Pos logit contributions | |
asis | +0.325 |
andel | +0.325 |
ymes | +0.325 |
robat | +0.319 |
Ta | +0.316 |
Neg logit contributions | |
not | -0.425 |
and | -0.406 |
because | -0.373 |
but | -0.354 |
, | -0.350 |
Token | of |
Token ID | 286 |
Feature activation | +6.57e+00 |
Pos logit contributions | |
andel | +0.281 |
ymes | +0.280 |
ites | +0.279 |
asis | +0.276 |
emaker | +0.274 |
Neg logit contributions | |
not | -0.069 |
and | -0.046 |
because | -0.040 |
" | -0.026 |
but | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
andel | +0.138 |
ymes | +0.138 |
asis | +0.137 |
robat | +0.136 |
ocol | +0.135 |
Neg logit contributions | |
not | -0.056 |
and | -0.050 |
because | -0.043 |
but | -0.037 |
, | -0.036 |
Token | frog |
Token ID | 21264 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
andel | +0.151 |
ymes | +0.150 |
Ta | +0.149 |
asis | +0.148 |
robat | +0.147 |
Neg logit contributions | |
and | -0.221 |
not | -0.218 |
because | -0.195 |
. | -0.191 |
, | -0.191 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
asis | +0.338 |
ymes | +0.335 |
andel | +0.334 |
robat | +0.332 |
ites | +0.328 |
Neg logit contributions | |
not | -0.123 |
and | -0.107 |
because | -0.090 |
but | -0.078 |
" | -0.075 |
Token | He |
Token ID | 679 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
not | +0.016 |
and | +0.014 |
because | +0.012 |
but | +0.011 |
, | +0.011 |
Neg logit contributions | |
andel | -0.028 |
asis | -0.028 |
Ta | -0.027 |
robat | -0.027 |
ites | -0.027 |
Token | spe |
Token ID | 693 |
Feature activation | +6.20e+01 |
Pos logit contributions | |
not | +0.029 |
and | +0.026 |
because | +0.024 |
but | +0.021 |
" | +0.021 |
Neg logit contributions | |
asis | -0.055 |
ymes | -0.055 |
robat | -0.054 |
andel | -0.054 |
Ta | -0.054 |
Token | ared |
Token ID | 1144 |
Feature activation | +8.51e+00 |
Pos logit contributions | |
ival | +0.942 |
umm | +0.932 |
Ta | +0.921 |
igsaw | +0.916 |
pillar | +0.899 |
Neg logit contributions | |
not | -0.965 |
and | -0.934 |
, | -0.785 |
. | -0.785 |
because | -0.770 |
Token | the |
Token ID | 262 |
Feature activation | +6.79e+00 |
Pos logit contributions | |
nests | +0.172 |
seas | +0.172 |
andel | +0.171 |
ymes | +0.171 |
oceans | +0.169 |
Neg logit contributions | |
not | -0.061 |
because | -0.044 |
and | -0.040 |
" | -0.032 |
they | -0.032 |
Token | lazy |
Token ID | 16931 |
Feature activation | +6.71e+00 |
Pos logit contributions | |
ymes | +0.086 |
andel | +0.085 |
robat | +0.085 |
Ta | +0.085 |
asis | +0.084 |
Neg logit contributions | |
not | -0.118 |
and | -0.117 |
because | -0.102 |
, | -0.101 |
. | -0.101 |
Token | frog |
Token ID | 21264 |
Feature activation | +9.01e+00 |
Pos logit contributions | |
ymes | +0.080 |
Ta | +0.080 |
andel | +0.078 |
asis | +0.078 |
robat | +0.078 |
Neg logit contributions | |
and | -0.121 |
not | -0.121 |
because | -0.110 |
, | -0.108 |
but | -0.106 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
asis | +0.174 |
ymes | +0.168 |
robat | +0.166 |
pillar | +0.166 |
andel | +0.166 |
Neg logit contributions | |
not | -0.089 |
and | -0.076 |
because | -0.071 |
" | -0.063 |
but | -0.062 |
Token | and |
Token ID | 290 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
keeping | +0.805 |
asis | +0.792 |
handed | +0.766 |
kingdom | +0.748 |
seas | +0.725 |
Neg logit contributions | |
not | -0.230 |
" | -0.174 |
: | -0.138 |
they | -0.125 |
their | -0.110 |
Token | play |
Token ID | 711 |
Feature activation | +2.85e+01 |
Pos logit contributions | |
asis | +0.341 |
keeping | +0.330 |
nests | +0.325 |
Ta | +0.325 |
ymes | +0.324 |
Neg logit contributions | |
not | -0.167 |
and | -0.163 |
because | -0.142 |
but | -0.130 |
: | -0.128 |
Token | with |
Token ID | 351 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
robat | +0.575 |
asis | +0.572 |
ymes | +0.562 |
seas | +0.552 |
nests | +0.550 |
Neg logit contributions | |
not | -0.240 |
and | -0.183 |
because | -0.176 |
: | -0.162 |
" | -0.150 |
Token | your |
Token ID | 534 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
ymes | +0.421 |
asis | +0.416 |
orns | +0.414 |
robat | +0.413 |
andel | +0.411 |
Neg logit contributions | |
not | -0.171 |
and | -0.152 |
because | -0.131 |
but | -0.117 |
" | -0.112 |
Token | or |
Token ID | 393 |
Feature activation | +7.13e+00 |
Pos logit contributions | |
andel | +0.407 |
Ta | +0.399 |
asis | +0.396 |
ymes | +0.394 |
robat | +0.391 |
Neg logit contributions | |
not | -0.369 |
and | -0.358 |
because | -0.314 |
, | -0.298 |
but | -0.298 |
Token | nam |
Token ID | 7402 |
Feature activation | +6.20e+01 |
Pos logit contributions | |
asis | +0.131 |
ymes | +0.131 |
robat | +0.128 |
andel | +0.127 |
nests | +0.127 |
Neg logit contributions | |
not | -0.076 |
and | -0.073 |
because | -0.064 |
: | -0.058 |
but | -0.057 |
Token | ents |
Token ID | 658 |
Feature activation | +4.31e+01 |
Pos logit contributions | |
asis | +0.744 |
crow | +0.718 |
robat | +0.714 |
ican | +0.680 |
andel | +0.656 |
Neg logit contributions | |
not | -1.223 |
and | -1.201 |
because | -1.069 |
to | -1.064 |
. | -1.040 |
Token | . |
Token ID | 13 |
Feature activation | +8.02e+00 |
Pos logit contributions | |
asis | +0.981 |
robat | +0.973 |
keeping | +0.973 |
ymes | +0.969 |
orns | +0.963 |
Neg logit contributions | |
not | -0.259 |
and | -0.161 |
because | -0.142 |
" | -0.137 |
but | -0.123 |
Token | Maybe |
Token ID | 6674 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
andel | +0.159 |
asis | +0.158 |
Ta | +0.158 |
ymes | +0.157 |
robat | +0.157 |
Neg logit contributions | |
not | -0.076 |
and | -0.069 |
because | -0.058 |
, | -0.052 |
but | -0.050 |
Token | you |
Token ID | 345 |
Feature activation | +9.93e+00 |
Pos logit contributions | |
seas | +0.050 |
pige | +0.048 |
ites | +0.047 |
nests | +0.047 |
asis | +0.046 |
Neg logit contributions | |
not | -0.023 |
and | -0.020 |
because | -0.018 |
: | -0.016 |
" | -0.015 |
Token | can |
Token ID | 460 |
Feature activation | +7.89e+00 |
Pos logit contributions | |
asis | +0.173 |
ymes | +0.170 |
robat | +0.167 |
ites | +0.166 |
ival | +0.164 |
Neg logit contributions | |
not | -0.116 |
and | -0.105 |
because | -0.097 |
but | -0.092 |
" | -0.091 |
Token | the |
Token ID | 262 |
Feature activation | +5.52e+00 |
Pos logit contributions | |
not | +0.083 |
and | +0.076 |
because | +0.066 |
" | +0.059 |
but | +0.059 |
Neg logit contributions | |
andel | -0.184 |
seas | -0.183 |
asis | -0.178 |
ocol | -0.177 |
crow | -0.176 |
Token | cars |
Token ID | 5006 |
Feature activation | +8.86e+00 |
Pos logit contributions | |
ymes | +0.077 |
robat | +0.077 |
asis | +0.077 |
orns | +0.076 |
andel | +0.076 |
Neg logit contributions | |
not | -0.091 |
and | -0.088 |
because | -0.078 |
, | -0.075 |
. | -0.075 |
Token | stopped |
Token ID | 5025 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
asis | +0.160 |
robat | +0.157 |
ymes | +0.156 |
ites | +0.156 |
andel | +0.155 |
Neg logit contributions | |
not | -0.102 |
and | -0.090 |
because | -0.084 |
but | -0.077 |
" | -0.075 |
Token | and |
Token ID | 290 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
not | +0.022 |
" | +0.013 |
: | +0.013 |
because | +0.013 |
and | +0.011 |
Neg logit contributions | |
oceans | -0.064 |
rivers | -0.063 |
nests | -0.063 |
lakes | -0.062 |
andel | -0.062 |
Token | the |
Token ID | 262 |
Feature activation | +3.33e+00 |
Pos logit contributions | |
not | +0.153 |
and | +0.141 |
because | +0.124 |
but | +0.110 |
: | +0.110 |
Neg logit contributions | |
asis | -0.304 |
Ta | -0.302 |
nests | -0.301 |
ymes | -0.300 |
andel | -0.299 |
Token | pedestrian |
Token ID | 22382 |
Feature activation | -4.14e+01 |
Pos logit contributions | |
asis | +0.045 |
ymes | +0.044 |
robat | +0.044 |
andel | +0.044 |
orns | +0.044 |
Neg logit contributions | |
not | -0.057 |
and | -0.055 |
because | -0.049 |
. | -0.047 |
but | -0.047 |
Token | light |
Token ID | 1657 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
not | +0.598 |
and | +0.560 |
because | +0.510 |
but | +0.476 |
, | +0.468 |
Neg logit contributions | |
andel | -0.643 |
ymes | -0.641 |
asis | -0.639 |
robat | -0.628 |
Ta | -0.621 |
Token | turned |
Token ID | 2900 |
Feature activation | -8.04e+00 |
Pos logit contributions | |
not | +0.017 |
and | +0.013 |
because | +0.012 |
but | +0.011 |
" | +0.010 |
Neg logit contributions | |
ymes | -0.041 |
asis | -0.040 |
andel | -0.040 |
robat | -0.040 |
umm | -0.040 |
Token | green |
Token ID | 4077 |
Feature activation | +8.17e+00 |
Pos logit contributions | |
not | +0.091 |
and | +0.083 |
because | +0.074 |
but | +0.068 |
" | +0.065 |
Neg logit contributions | |
andel | -0.148 |
ymes | -0.147 |
asis | -0.144 |
ites | -0.143 |
robat | -0.142 |
Token | . |
Token ID | 13 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
ymes | +0.108 |
andel | +0.107 |
asis | +0.107 |
robat | +0.105 |
umm | +0.103 |
Neg logit contributions | |
not | -0.137 |
and | -0.128 |
because | -0.119 |
but | -0.112 |
" | -0.110 |
Token | Then |
Token ID | 3244 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
not | +0.136 |
and | +0.119 |
because | +0.103 |
, | +0.092 |
but | +0.092 |
Neg logit contributions | |
andel | -0.247 |
Ta | -0.243 |
umm | -0.239 |
ival | -0.238 |
pillar | -0.237 |
Token | YOU |
Token ID | 7013 |
Feature activation | -2.67e+00 |
Pos logit contributions | |
not | +0.275 |
and | +0.256 |
because | +0.240 |
, | +0.229 |
but | +0.225 |
Neg logit contributions | |
ymes | -0.176 |
asis | -0.175 |
keeping | -0.173 |
robat | -0.173 |
Ta | -0.172 |
Token | STEP |
Token ID | 49154 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
not | +0.032 |
and | +0.030 |
because | +0.027 |
but | +0.026 |
they | +0.025 |
Neg logit contributions | |
asis | -0.046 |
andel | -0.046 |
robat | -0.045 |
ymes | -0.045 |
pillar | -0.044 |
Token | ON |
Token ID | 6177 |
Feature activation | -2.76e+01 |
Pos logit contributions | |
not | +0.286 |
and | +0.260 |
because | +0.227 |
they | +0.225 |
but | +0.222 |
Neg logit contributions | |
andel | -0.458 |
asis | -0.449 |
ymes | -0.447 |
robat | -0.442 |
crow | -0.441 |
Token | THE |
Token ID | 3336 |
Feature activation | -6.95e+00 |
Pos logit contributions | |
not | +0.251 |
and | +0.211 |
because | +0.182 |
but | +0.163 |
" | +0.157 |
Neg logit contributions | |
andel | -0.565 |
robat | -0.564 |
asis | -0.563 |
ymes | -0.562 |
crow | -0.550 |
Token | LE |
Token ID | 12509 |
Feature activation | -5.19e+00 |
Pos logit contributions | |
not | +0.103 |
and | +0.097 |
because | +0.088 |
but | +0.083 |
, | +0.080 |
Neg logit contributions | |
asis | -0.106 |
robat | -0.104 |
andel | -0.103 |
ymes | -0.103 |
ites | -0.101 |
Token | AF |
Token ID | 8579 |
Feature activation | -4.04e+01 |
Pos logit contributions | |
not | +0.090 |
and | +0.086 |
because | +0.079 |
, | +0.075 |
but | +0.074 |
Neg logit contributions | |
asis | -0.067 |
robat | -0.066 |
andel | -0.066 |
ymes | -0.065 |
umm | -0.064 |
Token | ?!" |
Token ID | 30823 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
not | +0.602 |
and | +0.579 |
because | +0.524 |
, | +0.494 |
but | +0.489 |
Neg logit contributions | |
asis | -0.613 |
ymes | -0.612 |
Ta | -0.609 |
robat | -0.604 |
andel | -0.600 |
Token |
|
Token ID | 198 |
Feature activation | -9.56e+00 |
Pos logit contributions | |
not | +0.122 |
and | +0.074 |
because | +0.069 |
for | +0.060 |
still | +0.057 |
Neg logit contributions | |
crow | -0.272 |
andel | -0.272 |
pillar | -0.270 |
robat | -0.268 |
folk | -0.265 |
Token |
|
Token ID | 198 |
Feature activation | -9.94e+00 |
Pos logit contributions | |
not | +0.078 |
and | +0.072 |
because | +0.061 |
but | +0.053 |
, | +0.050 |
Neg logit contributions | |
andel | -0.206 |
ymes | -0.206 |
asis | -0.205 |
robat | -0.203 |
Ta | -0.203 |
Token | The |
Token ID | 464 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
not | +0.130 |
and | +0.121 |
because | +0.106 |
" | +0.099 |
but | +0.099 |
Neg logit contributions | |
asis | -0.172 |
andel | -0.171 |
ymes | -0.169 |
robat | -0.168 |
umm | -0.167 |
Token | embarrassed |
Token ID | 21100 |
Feature activation | -9.98e+00 |
Pos logit contributions | |
not | +0.140 |
and | +0.133 |
because | +0.114 |
, | +0.111 |
. | +0.110 |
Neg logit contributions | |
asis | -0.188 |
robat | -0.182 |
Ta | -0.179 |
lor | -0.178 |
ymes | -0.178 |
Token | � |
Token ID | 6184 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
not | +0.156 |
and | +0.128 |
because | +0.117 |
their | +0.088 |
for | +0.088 |
Neg logit contributions | |
andel | -0.403 |
ival | -0.397 |
folk | -0.396 |
pillar | -0.387 |
ocol | -0.384 |
Token | � |
Token ID | 95 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
not | +0.331 |
and | +0.319 |
because | +0.295 |
but | +0.283 |
, | +0.279 |
Neg logit contributions | |
asis | -0.177 |
andel | -0.174 |
ymes | -0.171 |
robat | -0.171 |
Ta | -0.165 |
Token | € |
Token ID | 26391 |
Feature activation | +5.88e+00 |
Pos logit contributions | |
not | +0.405 |
and | +0.390 |
because | +0.359 |
but | +0.342 |
, | +0.340 |
Neg logit contributions | |
asis | -0.274 |
andel | -0.270 |
ymes | -0.269 |
robat | -0.269 |
Ta | -0.264 |
Token | � |
Token ID | 129 |
Feature activation | -7.79e+00 |
Pos logit contributions | |
asis | +0.077 |
ymes | +0.076 |
andel | +0.076 |
robat | +0.075 |
Ta | +0.074 |
Neg logit contributions | |
not | -0.099 |
and | -0.095 |
because | -0.087 |
but | -0.083 |
, | -0.082 |
Token | � |
Token ID | 241 |
Feature activation | -5.02e+00 |
Pos logit contributions | |
not | +0.133 |
and | +0.129 |
because | +0.118 |
but | +0.114 |
, | +0.112 |
Neg logit contributions | |
asis | -0.098 |
andel | -0.097 |
robat | -0.095 |
ymes | -0.094 |
Ta | -0.092 |
Token | Because |
Token ID | 8128 |
Feature activation | -3.88e+01 |
Pos logit contributions | |
not | +0.068 |
and | +0.063 |
, | +0.058 |
because | +0.058 |
for | +0.057 |
Neg logit contributions | |
robat | -0.074 |
Ta | -0.072 |
pillar | -0.072 |
asis | -0.071 |
ymes | -0.071 |
Token | the |
Token ID | 262 |
Feature activation | -9.10e+00 |
Pos logit contributions | |
not | +0.384 |
and | +0.344 |
because | +0.296 |
but | +0.275 |
: | +0.272 |
Neg logit contributions | |
ymes | -0.716 |
ites | -0.715 |
asis | -0.712 |
andel | -0.710 |
ocol | -0.709 |
Token | mill |
Token ID | 3939 |
Feature activation | +3.76e+00 |
Pos logit contributions | |
not | +0.162 |
and | +0.155 |
because | +0.143 |
but | +0.136 |
, | +0.134 |
Neg logit contributions | |
asis | -0.112 |
andel | -0.111 |
ymes | -0.110 |
robat | -0.109 |
Ta | -0.107 |
Token | is |
Token ID | 318 |
Feature activation | -2.68e+01 |
Pos logit contributions | |
asis | +0.074 |
ymes | +0.073 |
robat | +0.073 |
ites | +0.071 |
crow | +0.071 |
Neg logit contributions | |
not | -0.036 |
and | -0.032 |
because | -0.029 |
but | -0.025 |
" | -0.024 |
Token | very |
Token ID | 845 |
Feature activation | -9.84e+00 |
Pos logit contributions | |
and | +0.234 |
not | +0.233 |
because | +0.197 |
but | +0.195 |
they | +0.183 |
Neg logit contributions | |
andel | -0.458 |
asis | -0.456 |
ocol | -0.453 |
nests | -0.447 |
ymes | -0.443 |
Token | important |
Token ID | 1593 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
not | +0.140 |
and | +0.139 |
because | +0.125 |
but | +0.120 |
, | +0.114 |
Neg logit contributions | |
asis | -0.141 |
andel | -0.141 |
ocol | -0.137 |
ites | -0.135 |
ymes | -0.135 |
Token | The |
Token ID | 383 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
not | +0.088 |
and | +0.074 |
because | +0.065 |
for | +0.061 |
but | +0.056 |
Neg logit contributions | |
andel | -0.165 |
asis | -0.164 |
robat | -0.163 |
crow | -0.163 |
Ta | -0.163 |
Token | shorter |
Token ID | 12238 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
not | +0.023 |
and | +0.022 |
" | +0.020 |
, | +0.019 |
. | +0.019 |
Neg logit contributions | |
keeping | -0.028 |
robat | -0.028 |
lor | -0.027 |
andel | -0.027 |
ocol | -0.027 |
Token | one |
Token ID | 530 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
ymes | +0.175 |
andel | +0.174 |
asis | +0.174 |
Ta | +0.172 |
robat | +0.172 |
Neg logit contributions | |
not | -0.150 |
and | -0.144 |
because | -0.128 |
but | -0.120 |
, | -0.120 |
Token | replied |
Token ID | 8712 |
Feature activation | -8.23e+00 |
Pos logit contributions | |
asis | +0.044 |
ymes | +0.044 |
andel | +0.043 |
robat | +0.043 |
Ta | +0.043 |
Neg logit contributions | |
not | -0.021 |
and | -0.019 |
because | -0.017 |
but | -0.015 |
, | -0.014 |
Token | " |
Token ID | 366 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
not | +0.051 |
because | +0.035 |
and | +0.031 |
also | +0.028 |
but | +0.025 |
Neg logit contributions | |
crow | -0.161 |
andel | -0.158 |
ival | -0.157 |
ymes | -0.156 |
folk | -0.156 |
Token | because |
Token ID | 13893 |
Feature activation | -3.82e+01 |
Pos logit contributions | |
not | +0.041 |
and | +0.040 |
because | +0.036 |
but | +0.034 |
. | +0.033 |
Neg logit contributions | |
asis | -0.042 |
andel | -0.042 |
ymes | -0.041 |
robat | -0.041 |
ocol | -0.040 |
Token | it |
Token ID | 340 |
Feature activation | -8.30e-02 |
Pos logit contributions | |
not | +0.372 |
and | +0.338 |
because | +0.296 |
but | +0.265 |
: | +0.249 |
Neg logit contributions | |
ymes | -0.726 |
asis | -0.723 |
andel | -0.716 |
ites | -0.709 |
ival | -0.695 |
Token | feels |
Token ID | 5300 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
not | +0.001 |
and | +0.001 |
because | +0.001 |
but | +0.001 |
, | +0.001 |
Neg logit contributions | |
asis | -0.001 |
ymes | -0.001 |
robat | -0.001 |
ites | -0.001 |
andel | -0.001 |
Token | good |
Token ID | 922 |
Feature activation | +2.83e+00 |
Pos logit contributions | |
not | +0.118 |
and | +0.110 |
they | +0.099 |
: | +0.095 |
because | +0.095 |
Neg logit contributions | |
andel | -0.169 |
ymes | -0.165 |
asis | -0.165 |
nests | -0.162 |
risks | -0.161 |
Token | and |
Token ID | 290 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
unn | +0.056 |
keeping | +0.056 |
umm | +0.055 |
asis | +0.053 |
ocol | +0.053 |
Neg logit contributions | |
not | -0.022 |
still | -0.013 |
and | -0.013 |
" | -0.012 |
their | -0.012 |
Token | it |
Token ID | 340 |
Feature activation | -5.60e-01 |
Pos logit contributions | |
not | +0.231 |
and | +0.226 |
because | +0.198 |
but | +0.184 |
: | +0.182 |
Neg logit contributions | |
asis | -0.358 |
ymes | -0.356 |
ites | -0.349 |
nests | -0.344 |
Ta | -0.344 |
Token | the |
Token ID | 1169 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
asis | +0.134 |
andel | +0.133 |
ymes | +0.131 |
robat | +0.130 |
Ta | +0.130 |
Neg logit contributions | |
not | -0.208 |
and | -0.200 |
because | -0.185 |
but | -0.175 |
. | -0.174 |
Token | toys |
Token ID | 14958 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
not | +0.226 |
and | +0.219 |
because | +0.199 |
. | +0.188 |
, | +0.188 |
Neg logit contributions | |
asis | -0.178 |
Ta | -0.176 |
ymes | -0.176 |
robat | -0.175 |
andel | -0.175 |
Token | on |
Token ID | 319 |
Feature activation | -3.85e+00 |
Pos logit contributions | |
ymes | +0.029 |
asis | +0.029 |
emaker | +0.028 |
andel | +0.028 |
robat | +0.028 |
Neg logit contributions | |
not | -0.012 |
and | -0.010 |
because | -0.009 |
: | -0.008 |
" | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | -8.34e-01 |
Pos logit contributions | |
not | +0.036 |
and | +0.031 |
because | +0.027 |
but | +0.026 |
: | +0.024 |
Neg logit contributions | |
andel | -0.075 |
ymes | -0.074 |
ocol | -0.073 |
keeping | -0.072 |
robat | -0.072 |
Token | floor |
Token ID | 4314 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
not | +0.014 |
and | +0.014 |
because | +0.013 |
but | +0.012 |
, | +0.012 |
Neg logit contributions | |
andel | -0.011 |
asis | -0.011 |
ymes | -0.011 |
Ta | -0.011 |
robat | -0.011 |
Token | ) |
Token ID | 8 |
Feature activation | -3.81e+01 |
Pos logit contributions | |
ymes | +0.014 |
keeping | +0.014 |
andel | +0.013 |
handed | +0.013 |
crow | +0.013 |
Neg logit contributions | |
not | -0.004 |
and | -0.002 |
because | -0.002 |
but | -0.002 |
they | -0.001 |
Token | from |
Token ID | 422 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
not | +0.393 |
and | +0.358 |
because | +0.314 |
but | +0.291 |
, | +0.278 |
Neg logit contributions | |
asis | -0.718 |
ymes | -0.710 |
robat | -0.709 |
andel | -0.706 |
ites | -0.695 |
Token | taking |
Token ID | 2263 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
not | +0.036 |
and | +0.033 |
because | +0.027 |
but | +0.025 |
" | +0.024 |
Neg logit contributions | |
andel | -0.084 |
ymes | -0.082 |
ocol | -0.082 |
asis | -0.082 |
robat | -0.082 |
Token | over |
Token ID | 625 |
Feature activation | -7.41e+00 |
Pos logit contributions | |
not | +0.063 |
and | +0.063 |
because | +0.053 |
, | +0.050 |
. | +0.049 |
Neg logit contributions | |
asis | -0.110 |
Ta | -0.108 |
ymes | -0.107 |
robat | -0.107 |
andel | -0.107 |
Token | his |
Token ID | 465 |
Feature activation | -8.04e+00 |
Pos logit contributions | |
not | +0.055 |
and | +0.042 |
because | +0.036 |
" | +0.031 |
: | +0.031 |
Neg logit contributions | |
ymes | -0.157 |
keeping | -0.157 |
seas | -0.156 |
andel | -0.156 |
ocol | -0.156 |
Token | room |
Token ID | 2119 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
not | +0.128 |
and | +0.120 |
because | +0.111 |
but | +0.105 |
" | +0.103 |
Neg logit contributions | |
ymes | -0.111 |
asis | -0.111 |
andel | -0.110 |
robat | -0.108 |
ites | -0.106 |
Token | � |
Token ID | 6184 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
not | +0.164 |
and | +0.126 |
because | +0.115 |
but | +0.084 |
still | +0.079 |
Neg logit contributions | |
ival | -0.452 |
folk | -0.450 |
andel | -0.443 |
crow | -0.443 |
pillar | -0.441 |
Token | � |
Token ID | 95 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
not | +0.320 |
and | +0.309 |
because | +0.286 |
but | +0.274 |
, | +0.271 |
Neg logit contributions | |
asis | -0.174 |
andel | -0.171 |
ymes | -0.170 |
robat | -0.169 |
Ta | -0.164 |
Token | € |
Token ID | 26391 |
Feature activation | +5.10e+00 |
Pos logit contributions | |
not | +0.424 |
and | +0.408 |
because | +0.378 |
but | +0.360 |
, | +0.357 |
Neg logit contributions | |
asis | -0.259 |
ymes | -0.259 |
andel | -0.258 |
robat | -0.254 |
Ta | -0.250 |
Token | � |
Token ID | 129 |
Feature activation | -8.25e+00 |
Pos logit contributions | |
asis | +0.068 |
ymes | +0.068 |
andel | +0.067 |
robat | +0.067 |
Ta | +0.065 |
Neg logit contributions | |
not | -0.084 |
and | -0.080 |
because | -0.074 |
but | -0.070 |
, | -0.069 |
Token | � |
Token ID | 241 |
Feature activation | -5.39e+00 |
Pos logit contributions | |
not | +0.150 |
and | +0.145 |
because | +0.134 |
but | +0.129 |
, | +0.127 |
Neg logit contributions | |
asis | -0.095 |
andel | -0.094 |
robat | -0.093 |
ymes | -0.092 |
Ta | -0.089 |
Token | Because |
Token ID | 8128 |
Feature activation | -3.79e+01 |
Pos logit contributions | |
not | +0.075 |
and | +0.070 |
, | +0.064 |
for | +0.064 |
because | +0.064 |
Neg logit contributions | |
robat | -0.078 |
Ta | -0.076 |
pillar | -0.076 |
ymes | -0.075 |
asis | -0.074 |
Token | we |
Token ID | 356 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
not | +0.385 |
and | +0.349 |
because | +0.301 |
but | +0.279 |
: | +0.274 |
Neg logit contributions | |
ymes | -0.695 |
ites | -0.686 |
andel | -0.681 |
robat | -0.679 |
ocol | -0.676 |
Token | are |
Token ID | 389 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
not | +0.210 |
and | +0.191 |
because | +0.174 |
" | +0.170 |
but | +0.167 |
Neg logit contributions | |
robat | -0.291 |
asis | -0.290 |
ites | -0.289 |
ymes | -0.287 |
andel | -0.286 |
Token | too |
Token ID | 1165 |
Feature activation | -8.05e+00 |
Pos logit contributions | |
not | +0.175 |
and | +0.173 |
because | +0.143 |
but | +0.136 |
: | +0.127 |
Neg logit contributions | |
ymes | -0.374 |
andel | -0.373 |
ocol | -0.371 |
asis | -0.368 |
ites | -0.367 |
Token | big |
Token ID | 1263 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
not | +0.106 |
and | +0.099 |
because | +0.090 |
but | +0.089 |
for | +0.087 |
Neg logit contributions | |
andel | -0.124 |
ites | -0.120 |
ymes | -0.119 |
asis | -0.114 |
ocol | -0.114 |
Token | ! |
Token ID | 0 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
not | +0.056 |
still | +0.023 |
they | +0.022 |
also | +0.021 |
" | +0.021 |
Neg logit contributions | |
robat | -0.172 |
orns | -0.169 |
ites | -0.169 |
ymes | -0.169 |
keeping | -0.168 |
Token | who |
Token ID | 8727 |
Feature activation | -8.05e+00 |
Pos logit contributions | |
asis | +0.084 |
andel | +0.082 |
umm | +0.082 |
Ta | +0.078 |
ymes | +0.078 |
Neg logit contributions | |
not | -0.125 |
and | -0.124 |
because | -0.113 |
. | -0.107 |
but | -0.107 |
Token | was |
Token ID | 373 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
not | +0.109 |
and | +0.100 |
because | +0.095 |
but | +0.092 |
" | +0.088 |
Neg logit contributions | |
ymes | -0.128 |
ites | -0.124 |
asis | -0.123 |
robat | -0.122 |
Ta | -0.121 |
Token | throwing |
Token ID | 9644 |
Feature activation | -8.98e+00 |
Pos logit contributions | |
not | +0.219 |
and | +0.208 |
because | +0.188 |
but | +0.186 |
, | +0.158 |
Neg logit contributions | |
ival | -0.430 |
ites | -0.427 |
ymes | -0.425 |
crow | -0.424 |
asis | -0.422 |
Token | the |
Token ID | 262 |
Feature activation | -4.63e+00 |
Pos logit contributions | |
not | +0.092 |
and | +0.082 |
because | +0.073 |
but | +0.066 |
" | +0.063 |
Neg logit contributions | |
ymes | -0.175 |
andel | -0.173 |
robat | -0.172 |
asis | -0.171 |
orns | -0.169 |
Token | ball |
Token ID | 2613 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
not | +0.077 |
and | +0.074 |
because | +0.067 |
but | +0.064 |
, | +0.064 |
Neg logit contributions | |
asis | -0.063 |
andel | -0.063 |
ymes | -0.062 |
robat | -0.061 |
Ta | -0.061 |
Token | ) |
Token ID | 8 |
Feature activation | -3.76e+01 |
Pos logit contributions | |
ites | +0.078 |
asis | +0.077 |
crow | +0.076 |
pillar | +0.076 |
ite | +0.076 |
Neg logit contributions | |
not | -0.036 |
and | -0.027 |
because | -0.024 |
but | -0.024 |
" | -0.023 |
Token | was |
Token ID | 373 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
not | +0.369 |
and | +0.322 |
because | +0.284 |
but | +0.274 |
, | +0.252 |
Neg logit contributions | |
asis | -0.705 |
andel | -0.693 |
robat | -0.689 |
ymes | -0.689 |
crow | -0.686 |
Token | the |
Token ID | 262 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
and | +0.199 |
not | +0.199 |
because | +0.181 |
but | +0.176 |
, | +0.155 |
Neg logit contributions | |
asis | -0.411 |
seas | -0.406 |
ymes | -0.399 |
ocol | -0.398 |
keeping | -0.396 |
Token | mysterious |
Token ID | 11428 |
Feature activation | -5.73e+00 |
Pos logit contributions | |
not | +0.079 |
and | +0.076 |
because | +0.070 |
but | +0.065 |
, | +0.065 |
Neg logit contributions | |
ymes | -0.072 |
asis | -0.072 |
andel | -0.072 |
robat | -0.071 |
umm | -0.070 |
Token | person |
Token ID | 1048 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
not | +0.095 |
and | +0.086 |
because | +0.081 |
but | +0.076 |
" | +0.075 |
Neg logit contributions | |
andel | -0.074 |
ymes | -0.074 |
asis | -0.073 |
robat | -0.073 |
umm | -0.071 |
Token | on |
Token ID | 319 |
Feature activation | -9.50e+00 |
Pos logit contributions | |
not | +0.027 |
and | +0.021 |
because | +0.018 |
but | +0.017 |
" | +0.016 |
Neg logit contributions | |
asis | -0.068 |
ymes | -0.068 |
ites | -0.067 |
emaker | -0.067 |
pillar | -0.067 |
Token | do |
Token ID | 466 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
not | +0.189 |
and | +0.158 |
" | +0.156 |
making | +0.136 |
they | +0.136 |
Neg logit contributions | |
crow | -0.337 |
robat | -0.328 |
asis | -0.325 |
emaker | -0.324 |
andel | -0.322 |
Token | it |
Token ID | 340 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
and | +0.135 |
not | +0.135 |
because | +0.116 |
but | +0.111 |
" | +0.108 |
Neg logit contributions | |
ymes | -0.210 |
seas | -0.204 |
robat | -0.203 |
asis | -0.203 |
crow | -0.203 |
Token | . |
Token ID | 13 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
not | +0.035 |
" | +0.025 |
and | +0.024 |
: | +0.019 |
they | +0.019 |
Neg logit contributions | |
robat | -0.100 |
orns | -0.099 |
asis | -0.099 |
crow | -0.098 |
emaker | -0.097 |
Token | She |
Token ID | 1375 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
not | +0.199 |
and | +0.172 |
because | +0.144 |
, | +0.132 |
they | +0.131 |
Neg logit contributions | |
andel | -0.372 |
umm | -0.361 |
asis | -0.355 |
ites | -0.350 |
crow | -0.350 |
Token | sc |
Token ID | 629 |
Feature activation | -5.31e+00 |
Pos logit contributions | |
not | +0.133 |
and | +0.118 |
because | +0.104 |
but | +0.096 |
" | +0.095 |
Neg logit contributions | |
asis | -0.279 |
ymes | -0.277 |
andel | -0.276 |
robat | -0.275 |
pillar | -0.273 |
Token | run |
Token ID | 5143 |
Feature activation | -3.76e+01 |
Pos logit contributions | |
not | +0.088 |
and | +0.085 |
because | +0.077 |
, | +0.073 |
but | +0.073 |
Neg logit contributions | |
asis | -0.073 |
ymes | -0.072 |
robat | -0.071 |
andel | -0.070 |
umm | -0.069 |
Token | ched |
Token ID | 1740 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
not | +0.694 |
and | +0.662 |
because | +0.616 |
but | +0.587 |
, | +0.580 |
Neg logit contributions | |
ymes | -0.427 |
asis | -0.425 |
andel | -0.425 |
robat | -0.421 |
Ta | -0.413 |
Token | up |
Token ID | 510 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
not | +0.158 |
and | +0.138 |
because | +0.115 |
but | +0.100 |
, | +0.096 |
Neg logit contributions | |
andel | -0.421 |
ymes | -0.417 |
robat | -0.415 |
asis | -0.412 |
Ta | -0.410 |
Token | her |
Token ID | 607 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
not | +0.087 |
and | +0.048 |
because | +0.047 |
they | +0.040 |
" | +0.040 |
Neg logit contributions | |
andel | -0.291 |
seas | -0.280 |
ymes | -0.272 |
ocol | -0.272 |
crow | -0.269 |
Token | face |
Token ID | 1986 |
Feature activation | -9.74e+00 |
Pos logit contributions | |
not | +0.210 |
and | +0.183 |
because | +0.180 |
they | +0.171 |
" | +0.169 |
Neg logit contributions | |
andel | -0.159 |
ymes | -0.155 |
seas | -0.153 |
robat | -0.152 |
asis | -0.150 |
Token | . |
Token ID | 13 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
not | +0.048 |
they | +0.016 |
their | +0.014 |
because | +0.013 |
" | +0.010 |
Neg logit contributions | |
andel | -0.213 |
als | -0.211 |
pillar | -0.210 |
ymes | -0.207 |
seas | -0.205 |
Token | � |
Token ID | 6184 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
not | +0.057 |
and | +0.043 |
because | +0.038 |
but | +0.033 |
they | +0.031 |
Neg logit contributions | |
andel | -0.187 |
crow | -0.183 |
pillar | -0.182 |
ival | -0.181 |
ocol | -0.177 |
Token | � |
Token ID | 95 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
not | +0.248 |
and | +0.239 |
because | +0.225 |
, | +0.214 |
but | +0.212 |
Neg logit contributions | |
ymes | -0.150 |
andel | -0.145 |
Ta | -0.144 |
asis | -0.143 |
robat | -0.142 |
Token | € |
Token ID | 26391 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
not | +0.325 |
and | +0.313 |
because | +0.293 |
but | +0.275 |
" | +0.275 |
Neg logit contributions | |
ymes | -0.207 |
andel | -0.204 |
ites | -0.195 |
asis | -0.194 |
Ta | -0.192 |
Token | � |
Token ID | 129 |
Feature activation | -3.33e+00 |
Pos logit contributions | |
andel | +0.158 |
ymes | +0.157 |
asis | +0.154 |
Ta | +0.153 |
robat | +0.153 |
Neg logit contributions | |
not | -0.172 |
and | -0.164 |
because | -0.150 |
but | -0.141 |
, | -0.141 |
Token | � |
Token ID | 241 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
not | +0.058 |
and | +0.056 |
because | +0.052 |
but | +0.048 |
, | +0.048 |
Neg logit contributions | |
ymes | -0.042 |
asis | -0.042 |
andel | -0.042 |
robat | -0.041 |
Ta | -0.041 |
Token | Because |
Token ID | 8128 |
Feature activation | -3.75e+01 |
Pos logit contributions | |
not | +0.027 |
and | +0.025 |
because | +0.023 |
, | +0.022 |
for | +0.022 |
Neg logit contributions | |
robat | -0.028 |
Ta | -0.027 |
pillar | -0.027 |
asis | -0.027 |
ymes | -0.027 |
Token | I |
Token ID | 314 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
not | +0.377 |
and | +0.338 |
because | +0.289 |
but | +0.267 |
: | +0.259 |
Neg logit contributions | |
asis | -0.693 |
ymes | -0.693 |
ites | -0.690 |
ocol | -0.689 |
robat | -0.688 |
Token | want |
Token ID | 765 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
not | +0.235 |
" | +0.212 |
and | +0.211 |
because | +0.204 |
they | +0.202 |
Neg logit contributions | |
robat | -0.255 |
asis | -0.252 |
pillar | -0.249 |
Ta | -0.241 |
crow | -0.240 |
Token | my |
Token ID | 616 |
Feature activation | -7.22e+00 |
Pos logit contributions | |
not | +0.089 |
and | +0.078 |
because | +0.060 |
but | +0.049 |
, | +0.044 |
Neg logit contributions | |
ymes | -0.341 |
robat | -0.340 |
andel | -0.338 |
Ta | -0.337 |
seas | -0.337 |
Token | nap |
Token ID | 25422 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
not | +0.113 |
and | +0.107 |
because | +0.098 |
but | +0.092 |
" | +0.091 |
Neg logit contributions | |
asis | -0.100 |
andel | -0.099 |
ymes | -0.099 |
robat | -0.098 |
Ta | -0.095 |
Token | ! |
Token ID | 0 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
robat | +0.063 |
ymes | +0.063 |
asis | +0.062 |
seas | +0.060 |
keeping | +0.057 |
Neg logit contributions | |
not | -0.042 |
and | -0.035 |
" | -0.033 |
because | -0.033 |
they | -0.032 |
Token | was |
Token ID | 373 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
not | +0.068 |
and | +0.058 |
because | +0.054 |
but | +0.050 |
" | +0.048 |
Neg logit contributions | |
asis | -0.122 |
ymes | -0.121 |
ites | -0.120 |
andel | -0.119 |
pillar | -0.118 |
Token | the |
Token ID | 262 |
Feature activation | -7.93e+00 |
Pos logit contributions | |
not | +0.261 |
and | +0.246 |
because | +0.225 |
but | +0.209 |
they | +0.196 |
Neg logit contributions | |
andel | -0.483 |
nests | -0.472 |
ymes | -0.471 |
asis | -0.468 |
ocol | -0.465 |
Token | brightest |
Token ID | 33871 |
Feature activation | +4.22e-02 |
Pos logit contributions | |
not | +0.112 |
and | +0.107 |
because | +0.096 |
but | +0.091 |
, | +0.089 |
Neg logit contributions | |
ymes | -0.128 |
asis | -0.127 |
robat | -0.126 |
andel | -0.126 |
Ta | -0.125 |
Token | it |
Token ID | 340 |
Feature activation | -8.65e+00 |
Pos logit contributions | |
andel | +0.001 |
asis | +0.001 |
ymes | +0.001 |
umm | +0.001 |
seas | +0.001 |
Neg logit contributions | |
not | -0.000 |
and | -0.000 |
because | -0.000 |
" | -0.000 |
but | -0.000 |
Token | could |
Token ID | 714 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
not | +0.075 |
and | +0.062 |
because | +0.056 |
" | +0.053 |
: | +0.050 |
Neg logit contributions | |
asis | -0.150 |
robat | -0.146 |
pillar | -0.146 |
worm | -0.146 |
seas | -0.143 |
Token | possibly |
Token ID | 5457 |
Feature activation | -3.72e+01 |
Pos logit contributions | |
not | +0.202 |
and | +0.186 |
" | +0.184 |
because | +0.179 |
they | +0.171 |
Neg logit contributions | |
asis | -0.305 |
arrow | -0.288 |
nests | -0.282 |
andel | -0.281 |
worm | -0.280 |
Token | be |
Token ID | 307 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
not | +0.407 |
and | +0.380 |
because | +0.337 |
" | +0.315 |
but | +0.307 |
Neg logit contributions | |
asis | -0.677 |
andel | -0.657 |
ymes | -0.650 |
robat | -0.643 |
nests | -0.641 |
Token | . |
Token ID | 13 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
not | +0.135 |
and | +0.118 |
because | +0.101 |
but | +0.093 |
" | +0.091 |
Neg logit contributions | |
ymes | -0.341 |
asis | -0.341 |
andel | -0.337 |
ites | -0.331 |
orns | -0.331 |
Token | Ab |
Token ID | 2275 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
not | +0.255 |
and | +0.238 |
because | +0.208 |
but | +0.190 |
, | +0.187 |
Neg logit contributions | |
asis | -0.418 |
andel | -0.417 |
ymes | -0.412 |
robat | -0.409 |
Ta | -0.408 |
Token | bi |
Token ID | 8482 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
ymes | +0.016 |
andel | +0.016 |
asis | +0.016 |
robat | +0.016 |
Ta | +0.016 |
Neg logit contributions | |
not | -0.039 |
and | -0.038 |
because | -0.036 |
, | -0.034 |
but | -0.034 |
Token | had |
Token ID | 550 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
asis | +0.080 |
pillar | +0.079 |
ymes | +0.079 |
ites | +0.079 |
robat | +0.078 |
Neg logit contributions | |
not | -0.034 |
because | -0.027 |
and | -0.027 |
but | -0.025 |
" | -0.023 |
Token | sad |
Token ID | 6507 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
not | +0.068 |
and | +0.064 |
because | +0.056 |
but | +0.053 |
" | +0.053 |
Neg logit contributions | |
ymes | -0.086 |
andel | -0.086 |
asis | -0.086 |
Ta | -0.083 |
emaker | -0.083 |
Token | again |
Token ID | 757 |
Feature activation | -2.41e+00 |
Pos logit contributions | |
umm | +0.075 |
andel | +0.072 |
emaker | +0.070 |
pillar | +0.069 |
kingdom | +0.068 |
Neg logit contributions | |
not | -0.050 |
and | -0.037 |
they | -0.036 |
" | -0.035 |
their | -0.035 |
Token | â |
Token ID | 22940 |
Feature activation | -6.35e+00 |
Pos logit contributions | |
not | +0.015 |
" | +0.009 |
they | +0.008 |
and | +0.007 |
: | +0.006 |
Neg logit contributions | |
asis | -0.052 |
kingdom | -0.051 |
ymes | -0.050 |
keeping | -0.050 |
handed | -0.050 |
Token | € |
Token ID | 26391 |
Feature activation | +1.57e+01 |
Pos logit contributions | |
not | +0.127 |
and | +0.122 |
because | +0.114 |
but | +0.109 |
, | +0.108 |
Neg logit contributions | |
asis | -0.064 |
andel | -0.062 |
ymes | -0.062 |
robat | -0.062 |
Ta | -0.061 |
Token | • |
Token ID | 3581 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
asis | +0.203 |
ymes | +0.200 |
andel | +0.197 |
robat | +0.197 |
ites | +0.193 |
Neg logit contributions | |
not | -0.263 |
and | -0.253 |
because | -0.233 |
but | -0.222 |
, | -0.218 |
Token | because |
Token ID | 13893 |
Feature activation | -3.71e+01 |
Pos logit contributions | |
not | +0.134 |
and | +0.099 |
because | +0.084 |
they | +0.077 |
but | +0.072 |
Neg logit contributions | |
ymes | -0.412 |
asis | -0.411 |
robat | -0.411 |
emaker | -0.407 |
keeping | -0.406 |
Token | whenever |
Token ID | 8797 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
not | +0.310 |
and | +0.245 |
because | +0.202 |
but | +0.191 |
" | +0.181 |
Neg logit contributions | |
asis | -0.730 |
pillar | -0.722 |
emaker | -0.721 |
crow | -0.717 |
robat | -0.712 |
Token | he |
Token ID | 339 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
not | +0.100 |
and | +0.090 |
because | +0.073 |
: | +0.066 |
but | +0.065 |
Neg logit contributions | |
asis | -0.216 |
seas | -0.215 |
robat | -0.210 |
ocol | -0.210 |
andel | -0.210 |
Token | needed |
Token ID | 2622 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
not | +0.140 |
and | +0.116 |
because | +0.104 |
" | +0.100 |
but | +0.100 |
Neg logit contributions | |
asis | -0.261 |
ymes | -0.255 |
robat | -0.253 |
pillar | -0.252 |
Ta | -0.247 |
Token | a |
Token ID | 257 |
Feature activation | -8.68e+00 |
Pos logit contributions | |
not | +0.110 |
and | +0.096 |
because | +0.087 |
" | +0.078 |
but | +0.074 |
Neg logit contributions | |
seas | -0.230 |
ymes | -0.227 |
ocol | -0.226 |
keeping | -0.224 |
asis | -0.224 |
Token | reminder |
Token ID | 15438 |
Feature activation | -3.13e+00 |
Pos logit contributions | |
not | +0.123 |
and | +0.117 |
because | +0.106 |
but | +0.099 |
, | +0.098 |
Neg logit contributions | |
asis | -0.137 |
ymes | -0.136 |
andel | -0.136 |
robat | -0.135 |
Ta | -0.133 |
Token | okay |
Token ID | 8788 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
not | +0.215 |
and | +0.211 |
they | +0.187 |
" | +0.187 |
: | +0.186 |
Neg logit contributions | |
asis | -0.389 |
ymes | -0.383 |
nests | -0.376 |
andel | -0.369 |
seas | -0.369 |
Token | ". |
Token ID | 1911 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
not | +0.168 |
and | +0.124 |
" | +0.109 |
because | +0.107 |
making | +0.104 |
Neg logit contributions | |
keeping | -0.395 |
asis | -0.390 |
pter | -0.388 |
ymes | -0.385 |
perspective | -0.376 |
Token |
|
Token ID | 198 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
not | +0.252 |
and | +0.209 |
because | +0.184 |
for | +0.168 |
: | +0.160 |
Neg logit contributions | |
andel | -0.488 |
robat | -0.487 |
keeping | -0.485 |
Ta | -0.483 |
ival | -0.482 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
not | +0.111 |
and | +0.093 |
because | +0.082 |
but | +0.063 |
for | +0.061 |
Neg logit contributions | |
robat | -0.353 |
andel | -0.353 |
asis | -0.352 |
ymes | -0.352 |
Ta | -0.350 |
Token | Alice |
Token ID | 44484 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
not | +0.261 |
and | +0.248 |
because | +0.229 |
but | +0.214 |
, | +0.213 |
Neg logit contributions | |
asis | -0.228 |
ymes | -0.228 |
andel | -0.227 |
robat | -0.225 |
Ta | -0.223 |
Token | then |
Token ID | 788 |
Feature activation | -3.64e+01 |
Pos logit contributions | |
not | +0.103 |
because | +0.077 |
and | +0.072 |
but | +0.067 |
for | +0.065 |
Neg logit contributions | |
pillar | -0.223 |
asis | -0.222 |
ymes | -0.218 |
robat | -0.218 |
crow | -0.216 |
Token | hugged |
Token ID | 41130 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
not | +0.390 |
and | +0.322 |
because | +0.310 |
but | +0.280 |
" | +0.261 |
Neg logit contributions | |
crow | -0.643 |
andel | -0.636 |
pillar | -0.635 |
ival | -0.634 |
ymes | -0.633 |
Token | her |
Token ID | 607 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
not | +0.177 |
and | +0.122 |
because | +0.114 |
: | +0.102 |
they | +0.099 |
Neg logit contributions | |
andel | -0.398 |
crow | -0.382 |
robat | -0.381 |
ymes | -0.374 |
keeping | -0.374 |
Token | mum |
Token ID | 25682 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
not | +0.204 |
and | +0.184 |
because | +0.171 |
but | +0.157 |
they | +0.152 |
Neg logit contributions | |
andel | -0.259 |
ymes | -0.257 |
asis | -0.253 |
robat | -0.250 |
ites | -0.247 |
Token | and |
Token ID | 290 |
Feature activation | -3.05e+01 |
Pos logit contributions | |
not | +0.027 |
and | +0.007 |
because | +0.004 |
but | -0.002 |
" | -0.002 |
Neg logit contributions | |
andel | -0.189 |
asis | -0.186 |
robat | -0.186 |
ymes | -0.186 |
ites | -0.184 |
Token | felt |
Token ID | 2936 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
not | +0.333 |
and | +0.275 |
because | +0.267 |
: | +0.249 |
but | +0.241 |
Neg logit contributions | |
Ta | -0.490 |
carriage | -0.486 |
keeping | -0.486 |
seas | -0.486 |
ites | -0.485 |
Token | government |
Token ID | 1230 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
not | +0.042 |
and | +0.040 |
because | +0.037 |
but | +0.035 |
, | +0.035 |
Neg logit contributions | |
asis | -0.031 |
ymes | -0.030 |
andel | -0.030 |
robat | -0.030 |
Ta | -0.030 |
Token | gives |
Token ID | 3607 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
not | +0.119 |
and | +0.090 |
because | +0.081 |
" | +0.071 |
but | +0.070 |
Neg logit contributions | |
asis | -0.315 |
ites | -0.309 |
robat | -0.307 |
andel | -0.307 |
ymes | -0.306 |
Token | to |
Token ID | 284 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
not | +0.191 |
and | +0.182 |
because | +0.157 |
, | +0.144 |
but | +0.143 |
Neg logit contributions | |
asis | -0.322 |
andel | -0.320 |
ymes | -0.319 |
robat | -0.317 |
Ta | -0.316 |
Token | people |
Token ID | 661 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
not | +0.181 |
and | +0.170 |
because | +0.150 |
but | +0.140 |
, | +0.136 |
Neg logit contributions | |
andel | -0.285 |
ymes | -0.282 |
asis | -0.279 |
ocol | -0.273 |
robat | -0.273 |
Token | to |
Token ID | 284 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
ymes | +0.034 |
ites | +0.034 |
asis | +0.034 |
andel | +0.033 |
robat | +0.033 |
Neg logit contributions | |
not | -0.012 |
and | -0.009 |
because | -0.008 |
but | -0.007 |
" | -0.007 |
Token | certify |
Token ID | 46125 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
not | +0.192 |
and | +0.181 |
because | +0.163 |
but | +0.152 |
" | +0.148 |
Neg logit contributions | |
asis | -0.262 |
andel | -0.260 |
ocol | -0.258 |
ymes | -0.258 |
robat | -0.258 |
Token | what |
Token ID | 644 |
Feature activation | -6.24e+00 |
Pos logit contributions | |
not | +0.317 |
and | +0.285 |
because | +0.245 |
but | +0.218 |
they | +0.212 |
Neg logit contributions | |
ocol | -0.709 |
andel | -0.700 |
ymes | -0.693 |
asis | -0.690 |
robat | -0.670 |
Token | they |
Token ID | 484 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
not | +0.070 |
and | +0.065 |
because | +0.060 |
but | +0.055 |
, | +0.051 |
Neg logit contributions | |
ymes | -0.112 |
ites | -0.108 |
asis | -0.107 |
robat | -0.106 |
ival | -0.105 |
Token | do |
Token ID | 466 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
not | +0.169 |
and | +0.157 |
because | +0.142 |
" | +0.139 |
but | +0.137 |
Neg logit contributions | |
asis | -0.213 |
robat | -0.209 |
ymes | -0.203 |
Ta | -0.201 |
ites | -0.197 |
Token | . |
Token ID | 13 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
not | +0.092 |
because | +0.070 |
they | +0.069 |
" | +0.068 |
and | +0.068 |
Neg logit contributions | |
keeping | -0.185 |
asis | -0.180 |
pter | -0.179 |
robat | -0.176 |
ites | -0.175 |
Token | It |
Token ID | 632 |
Feature activation | -6.37e+00 |
Pos logit contributions | |
not | +0.221 |
and | +0.207 |
because | +0.183 |
, | +0.169 |
but | +0.169 |
Neg logit contributions | |
andel | -0.303 |
asis | -0.301 |
ymes | -0.301 |
Ta | -0.297 |
robat | -0.297 |
Token | and |
Token ID | 290 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
umm | +0.104 |
orns | +0.099 |
andel | +0.099 |
asis | +0.099 |
ymes | +0.098 |
Neg logit contributions | |
not | -0.025 |
and | -0.011 |
" | -0.011 |
because | -0.010 |
: | -0.009 |
Token | Jimmy |
Token ID | 12963 |
Feature activation | -6.79e+00 |
Pos logit contributions | |
and | +0.271 |
not | +0.268 |
because | +0.237 |
but | +0.226 |
: | +0.226 |
Neg logit contributions | |
ymes | -0.302 |
ocol | -0.299 |
asis | -0.298 |
umm | -0.295 |
robat | -0.292 |
Token | 's |
Token ID | 338 |
Feature activation | -8.80e+00 |
Pos logit contributions | |
not | +0.060 |
and | +0.048 |
because | +0.047 |
but | +0.044 |
" | +0.041 |
Neg logit contributions | |
ymes | -0.131 |
pillar | -0.130 |
asis | -0.130 |
robat | -0.128 |
arrow | -0.126 |
Token | face |
Token ID | 1986 |
Feature activation | -4.92e+00 |
Pos logit contributions | |
not | +0.139 |
and | +0.132 |
because | +0.123 |
but | +0.115 |
" | +0.114 |
Neg logit contributions | |
andel | -0.119 |
asis | -0.118 |
ymes | -0.117 |
umm | -0.115 |
ocol | -0.113 |
Token | sc |
Token ID | 629 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
not | +0.057 |
and | +0.049 |
but | +0.047 |
" | +0.047 |
for | +0.046 |
Neg logit contributions | |
arrow | -0.079 |
ymes | -0.077 |
asis | -0.075 |
pillar | -0.075 |
pill | -0.074 |
Token | run |
Token ID | 5143 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
not | +0.033 |
and | +0.032 |
because | +0.030 |
, | +0.028 |
. | +0.028 |
Neg logit contributions | |
ymes | -0.023 |
asis | -0.023 |
robat | -0.023 |
andel | -0.022 |
Ta | -0.022 |
Token | ched |
Token ID | 1740 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
not | +0.634 |
and | +0.607 |
because | +0.561 |
but | +0.534 |
, | +0.527 |
Neg logit contributions | |
ymes | -0.436 |
asis | -0.435 |
andel | -0.433 |
robat | -0.428 |
Ta | -0.421 |
Token | up |
Token ID | 510 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
not | +0.149 |
and | +0.110 |
because | +0.100 |
" | +0.091 |
: | +0.089 |
Neg logit contributions | |
ymes | -0.338 |
robat | -0.330 |
andel | -0.329 |
umm | -0.328 |
keeping | -0.326 |
Token | as |
Token ID | 355 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
not | +0.064 |
and | +0.033 |
because | +0.032 |
" | +0.030 |
: | +0.025 |
Neg logit contributions | |
andel | -0.228 |
seas | -0.228 |
nests | -0.227 |
ymes | -0.225 |
ocol | -0.224 |
Token | he |
Token ID | 339 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
not | +0.141 |
and | +0.138 |
because | +0.127 |
but | +0.115 |
: | +0.103 |
Neg logit contributions | |
seas | -0.293 |
ymes | -0.287 |
ocol | -0.286 |
andel | -0.286 |
ival | -0.278 |
Token | ate |
Token ID | 15063 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
not | +0.207 |
and | +0.184 |
because | +0.173 |
but | +0.163 |
" | +0.157 |
Neg logit contributions | |
asis | -0.315 |
ymes | -0.313 |
robat | -0.306 |
Ta | -0.303 |
pillar | -0.303 |
Token | old |
Token ID | 1468 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
not | +0.122 |
and | +0.119 |
" | +0.099 |
. | +0.097 |
, | +0.097 |
Neg logit contributions | |
ites | -0.183 |
orns | -0.181 |
asis | -0.181 |
robat | -0.179 |
ymes | -0.179 |
Token | man |
Token ID | 582 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
and | +0.048 |
not | +0.048 |
, | +0.041 |
because | +0.041 |
" | +0.040 |
Neg logit contributions | |
andel | -0.048 |
ymes | -0.047 |
umm | -0.047 |
Ta | -0.047 |
asis | -0.046 |
Token | replied |
Token ID | 8712 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
not | +0.014 |
and | +0.012 |
because | +0.011 |
but | +0.010 |
" | +0.010 |
Neg logit contributions | |
ymes | -0.021 |
asis | -0.020 |
ival | -0.020 |
robat | -0.020 |
Ta | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
not | +0.091 |
because | +0.058 |
and | +0.055 |
also | +0.052 |
still | +0.045 |
Neg logit contributions | |
crow | -0.263 |
andel | -0.263 |
ival | -0.261 |
ocol | -0.259 |
emaker | -0.256 |
Token | " |
Token ID | 366 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
not | +0.155 |
? | +0.136 |
and | +0.120 |
because | +0.120 |
their | +0.107 |
Neg logit contributions | |
folk | -0.338 |
eagle | -0.328 |
Dragon | -0.311 |
smith | -0.311 |
oceans | -0.310 |
Token | Because |
Token ID | 8128 |
Feature activation | -3.56e+01 |
Pos logit contributions | |
not | +0.095 |
and | +0.089 |
because | +0.079 |
but | +0.073 |
" | +0.071 |
Neg logit contributions | |
andel | -0.129 |
asis | -0.128 |
ymes | -0.126 |
robat | -0.125 |
ocol | -0.124 |
Token | it |
Token ID | 340 |
Feature activation | -4.88e+00 |
Pos logit contributions | |
not | +0.329 |
and | +0.298 |
because | +0.254 |
but | +0.232 |
: | +0.226 |
Neg logit contributions | |
ymes | -0.694 |
asis | -0.687 |
ocol | -0.686 |
andel | -0.685 |
robat | -0.676 |
Token | wasn |
Token ID | 2492 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
not | +0.055 |
and | +0.051 |
because | +0.046 |
but | +0.043 |
" | +0.042 |
Neg logit contributions | |
asis | -0.087 |
ymes | -0.087 |
robat | -0.084 |
pillar | -0.083 |
orns | -0.083 |
Token | 't |
Token ID | 470 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
not | +0.142 |
and | +0.141 |
because | +0.118 |
but | +0.111 |
, | +0.106 |
Neg logit contributions | |
andel | -0.305 |
asis | -0.299 |
Ta | -0.298 |
ymes | -0.296 |
robat | -0.294 |
Token | pe |
Token ID | 613 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
not | +0.195 |
and | +0.183 |
because | +0.154 |
: | +0.150 |
" | +0.144 |
Neg logit contributions | |
andel | -0.385 |
ymes | -0.380 |
asis | -0.380 |
robat | -0.375 |
ocol | -0.371 |
Token | eling |
Token ID | 10809 |
Feature activation | -8.88e+00 |
Pos logit contributions | |
Ta | +0.046 |
andel | +0.044 |
robat | +0.044 |
asis | +0.044 |
ymes | +0.044 |
Neg logit contributions | |
not | -0.088 |
and | -0.084 |
because | -0.078 |
, | -0.075 |
but | -0.075 |
Token | € |
Token ID | 26391 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
not | +0.335 |
and | +0.324 |
because | +0.302 |
but | +0.288 |
, | +0.286 |
Neg logit contributions | |
andel | -0.179 |
ymes | -0.179 |
asis | -0.177 |
robat | -0.172 |
Ta | -0.171 |
Token |
|
Token ID | 198 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
andel | +0.066 |
ymes | +0.066 |
asis | +0.066 |
robat | +0.065 |
Ta | +0.064 |
Neg logit contributions | |
not | -0.062 |
and | -0.059 |
because | -0.053 |
but | -0.050 |
, | -0.050 |
Token | |
Token ID | 220 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
not | +0.104 |
and | +0.093 |
because | +0.079 |
but | +0.065 |
, | +0.062 |
Neg logit contributions | |
asis | -0.328 |
andel | -0.327 |
robat | -0.326 |
ymes | -0.325 |
Ta | -0.325 |
Token |
|
Token ID | 198 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
not | +0.015 |
and | +0.013 |
because | +0.011 |
but | +0.010 |
, | +0.009 |
Neg logit contributions | |
andel | -0.041 |
asis | -0.041 |
ymes | -0.041 |
ites | -0.041 |
robat | -0.040 |
Token | From |
Token ID | 4863 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
not | +0.235 |
and | +0.223 |
because | +0.204 |
but | +0.190 |
, | +0.189 |
Neg logit contributions | |
asis | -0.233 |
andel | -0.232 |
ymes | -0.232 |
robat | -0.230 |
Ta | -0.228 |
Token | then |
Token ID | 788 |
Feature activation | -3.54e+01 |
Pos logit contributions | |
not | +0.160 |
and | +0.125 |
" | +0.111 |
because | +0.106 |
but | +0.100 |
Neg logit contributions | |
robat | -0.384 |
ites | -0.379 |
asis | -0.379 |
crow | -0.377 |
ican | -0.372 |
Token | on |
Token ID | 319 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
not | +0.361 |
because | +0.266 |
and | +0.266 |
but | +0.238 |
" | +0.216 |
Neg logit contributions | |
robat | -0.695 |
crow | -0.682 |
ites | -0.678 |
andel | -0.669 |
pillar | -0.656 |
Token | , |
Token ID | 11 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
not | +0.096 |
and | +0.065 |
because | +0.058 |
" | +0.043 |
to | +0.041 |
Neg logit contributions | |
crow | -0.293 |
robat | -0.285 |
igsaw | -0.285 |
ites | -0.284 |
ocol | -0.284 |
Token | Joe |
Token ID | 5689 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
not | +0.281 |
and | +0.259 |
because | +0.225 |
: | +0.205 |
but | +0.202 |
Neg logit contributions | |
andel | -0.476 |
asis | -0.475 |
robat | -0.471 |
ymes | -0.471 |
ites | -0.469 |
Token | wrote |
Token ID | 2630 |
Feature activation | -8.39e+00 |
Pos logit contributions | |
not | +0.136 |
because | +0.090 |
and | +0.087 |
but | +0.086 |
" | +0.077 |
Neg logit contributions | |
asis | -0.386 |
ites | -0.381 |
robat | -0.380 |
pillar | -0.378 |
orns | -0.376 |
Token | thank |
Token ID | 5875 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
not | +0.070 |
and | +0.055 |
because | +0.054 |
but | +0.044 |
they | +0.044 |
Neg logit contributions | |
ymes | -0.168 |
andel | -0.165 |
ival | -0.165 |
robat | -0.164 |
seas | -0.163 |
Token | ™ |
Token ID | 8151 |
Feature activation | +8.90e+00 |
Pos logit contributions | |
ymes | +0.011 |
andel | +0.011 |
asis | +0.011 |
robat | +0.010 |
Ta | +0.010 |
Neg logit contributions | |
not | -0.018 |
and | -0.018 |
because | -0.016 |
but | -0.015 |
, | -0.015 |
Token | t |
Token ID | 83 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
ites | +0.119 |
ival | +0.118 |
ite | +0.118 |
andel | +0.117 |
pillar | +0.117 |
Neg logit contributions | |
not | -0.138 |
and | -0.126 |
because | -0.115 |
but | -0.109 |
" | -0.107 |
Token | have |
Token ID | 423 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
not | +0.242 |
and | +0.205 |
" | +0.198 |
because | +0.187 |
they | +0.180 |
Neg logit contributions | |
asis | -0.422 |
robat | -0.420 |
crow | -0.406 |
pillar | -0.405 |
andel | -0.402 |
Token | the |
Token ID | 262 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
not | +0.190 |
and | +0.181 |
because | +0.151 |
but | +0.139 |
" | +0.135 |
Neg logit contributions | |
andel | -0.428 |
ymes | -0.425 |
robat | -0.422 |
seas | -0.422 |
orns | -0.420 |
Token | cross |
Token ID | 3272 |
Feature activation | -8.73e+00 |
Pos logit contributions | |
not | +0.246 |
and | +0.238 |
because | +0.221 |
but | +0.213 |
, | +0.212 |
Neg logit contributions | |
ymes | -0.113 |
andel | -0.112 |
asis | -0.111 |
robat | -0.110 |
Ta | -0.109 |
Token | then |
Token ID | 788 |
Feature activation | -3.54e+01 |
Pos logit contributions | |
not | +0.078 |
and | +0.064 |
because | +0.057 |
" | +0.052 |
but | +0.049 |
Neg logit contributions | |
asis | -0.175 |
robat | -0.173 |
crow | -0.172 |
ites | -0.172 |
ymes | -0.171 |
Token | why |
Token ID | 1521 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
not | +0.383 |
and | +0.341 |
because | +0.305 |
" | +0.277 |
but | +0.277 |
Neg logit contributions | |
asis | -0.628 |
crow | -0.614 |
robat | -0.602 |
andel | -0.595 |
ites | -0.595 |
Token | did |
Token ID | 750 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
not | +0.123 |
and | +0.120 |
because | +0.101 |
but | +0.095 |
: | +0.093 |
Neg logit contributions | |
asis | -0.225 |
ymes | -0.222 |
robat | -0.220 |
ocol | -0.220 |
andel | -0.219 |
Token | you |
Token ID | 345 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
and | +0.228 |
not | +0.225 |
because | +0.195 |
but | +0.189 |
" | +0.186 |
Neg logit contributions | |
asis | -0.295 |
ymes | -0.293 |
robat | -0.292 |
ites | -0.288 |
ocol | -0.288 |
Token | even |
Token ID | 772 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
not | +0.181 |
and | +0.162 |
" | +0.158 |
they | +0.150 |
because | +0.150 |
Neg logit contributions | |
asis | -0.287 |
robat | -0.283 |
ites | -0.276 |
pillar | -0.270 |
emaker | -0.270 |
Token | ask |
Token ID | 1265 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
not | +0.226 |
and | +0.215 |
because | +0.196 |
" | +0.187 |
but | +0.178 |
Neg logit contributions | |
asis | -0.279 |
ymes | -0.278 |
andel | -0.277 |
robat | -0.274 |
emaker | -0.271 |
Token | its |
Token ID | 663 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
not | +0.118 |
and | +0.108 |
because | +0.089 |
but | +0.078 |
, | +0.076 |
Neg logit contributions | |
asis | -0.310 |
ymes | -0.310 |
andel | -0.310 |
robat | -0.307 |
Ta | -0.304 |
Token | place |
Token ID | 1295 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
not | +0.165 |
and | +0.158 |
because | +0.144 |
but | +0.136 |
, | +0.135 |
Neg logit contributions | |
asis | -0.145 |
ymes | -0.144 |
andel | -0.144 |
robat | -0.142 |
Ta | -0.141 |
Token | . |
Token ID | 13 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
not | +0.013 |
and | +0.010 |
because | +0.008 |
" | +0.007 |
but | +0.006 |
Neg logit contributions | |
asis | -0.053 |
andel | -0.053 |
ymes | -0.053 |
keeping | -0.052 |
ites | -0.052 |
Token |
|
Token ID | 198 |
Feature activation | -9.72e+00 |
Pos logit contributions | |
not | +0.170 |
and | +0.153 |
because | +0.133 |
but | +0.118 |
, | +0.115 |
Neg logit contributions | |
Ta | -0.351 |
ymes | -0.349 |
andel | -0.349 |
asis | -0.345 |
ites | -0.345 |
Token |
|
Token ID | 198 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
not | +0.065 |
and | +0.057 |
because | +0.049 |
but | +0.040 |
, | +0.037 |
Neg logit contributions | |
ymes | -0.219 |
asis | -0.217 |
Ta | -0.217 |
robat | -0.217 |
andel | -0.216 |
Token | Because |
Token ID | 8128 |
Feature activation | -3.53e+01 |
Pos logit contributions | |
not | +0.176 |
and | +0.169 |
because | +0.155 |
but | +0.147 |
, | +0.146 |
Neg logit contributions | |
ymes | -0.138 |
asis | -0.137 |
andel | -0.137 |
robat | -0.135 |
Ta | -0.134 |
Token | of |
Token ID | 286 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
not | +0.329 |
and | +0.289 |
because | +0.254 |
but | +0.229 |
" | +0.217 |
Neg logit contributions | |
ymes | -0.696 |
andel | -0.668 |
ites | -0.663 |
emaker | -0.662 |
asis | -0.660 |
Token | the |
Token ID | 262 |
Feature activation | -5.29e+00 |
Pos logit contributions | |
not | +0.134 |
and | +0.119 |
because | +0.111 |
but | +0.098 |
to | +0.095 |
Neg logit contributions | |
ymes | -0.271 |
ocol | -0.264 |
nests | -0.260 |
orns | -0.260 |
andel | -0.260 |
Token | lady |
Token ID | 10846 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
not | +0.080 |
and | +0.078 |
because | +0.066 |
, | +0.065 |
. | +0.065 |
Neg logit contributions | |
andel | -0.084 |
robat | -0.084 |
ymes | -0.083 |
asis | -0.083 |
emaker | -0.082 |
Token | 's |
Token ID | 338 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
not | +0.017 |
and | +0.013 |
because | +0.013 |
but | +0.011 |
" | +0.011 |
Neg logit contributions | |
asis | -0.038 |
ymes | -0.037 |
ites | -0.037 |
pillar | -0.036 |
robat | -0.036 |
Token | compassion |
Token ID | 15213 |
Feature activation | -8.99e+00 |
Pos logit contributions | |
not | +0.206 |
and | +0.200 |
because | +0.177 |
, | +0.170 |
. | +0.168 |
Neg logit contributions | |
robat | -0.190 |
asis | -0.190 |
andel | -0.190 |
ymes | -0.189 |
Ta | -0.189 |
Token | just |
Token ID | 655 |
Feature activation | -2.91e+01 |
Pos logit contributions | |
not | +0.163 |
and | +0.151 |
because | +0.136 |
" | +0.128 |
but | +0.124 |
Neg logit contributions | |
asis | -0.272 |
robat | -0.265 |
andel | -0.265 |
ymes | -0.261 |
ocol | -0.257 |
Token | have |
Token ID | 423 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
not | +0.331 |
and | +0.301 |
because | +0.267 |
they | +0.250 |
but | +0.250 |
Neg logit contributions | |
asis | -0.499 |
ymes | -0.489 |
ocol | -0.487 |
andel | -0.487 |
crow | -0.482 |
Token | to |
Token ID | 284 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
not | +0.159 |
and | +0.144 |
because | +0.119 |
but | +0.106 |
" | +0.103 |
Neg logit contributions | |
andel | -0.460 |
seas | -0.459 |
ymes | -0.459 |
orns | -0.455 |
ites | -0.454 |
Token | eat |
Token ID | 4483 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
not | +0.259 |
and | +0.250 |
because | +0.226 |
" | +0.210 |
but | +0.208 |
Neg logit contributions | |
asis | -0.405 |
andel | -0.393 |
robat | -0.390 |
ymes | -0.387 |
Ta | -0.382 |
Token | you |
Token ID | 345 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
not | +0.206 |
and | +0.173 |
because | +0.157 |
" | +0.145 |
they | +0.145 |
Neg logit contributions | |
ocol | -0.302 |
seas | -0.302 |
andel | -0.301 |
asis | -0.301 |
robat | -0.300 |
Token | then |
Token ID | 788 |
Feature activation | -3.52e+01 |
Pos logit contributions | |
not | +0.158 |
and | +0.129 |
because | +0.113 |
but | +0.105 |
" | +0.105 |
Neg logit contributions | |
asis | -0.385 |
ymes | -0.375 |
robat | -0.370 |
orns | -0.369 |
ites | -0.367 |
Token | ! |
Token ID | 0 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
not | +0.388 |
and | +0.332 |
because | +0.298 |
but | +0.280 |
" | +0.275 |
Neg logit contributions | |
asis | -0.643 |
robat | -0.610 |
andel | -0.603 |
crow | -0.602 |
ites | -0.600 |
Token | â |
Token ID | 22940 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
not | +0.306 |
and | +0.281 |
because | +0.245 |
, | +0.223 |
but | +0.221 |
Neg logit contributions | |
andel | -0.501 |
asis | -0.499 |
ymes | -0.494 |
robat | -0.493 |
Ta | -0.493 |
Token | € |
Token ID | 26391 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
not | +0.351 |
and | +0.341 |
because | +0.317 |
, | +0.301 |
but | +0.301 |
Neg logit contributions | |
ymes | -0.203 |
andel | -0.202 |
asis | -0.195 |
Ta | -0.191 |
robat | -0.189 |
Token |
|
Token ID | 198 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
andel | +0.042 |
ymes | +0.042 |
asis | +0.041 |
Ta | +0.041 |
robat | +0.041 |
Neg logit contributions | |
not | -0.029 |
and | -0.027 |
because | -0.024 |
, | -0.022 |
but | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
not | +0.104 |
and | +0.094 |
because | +0.073 |
but | +0.061 |
, | +0.059 |
Neg logit contributions | |
ymes | -0.354 |
asis | -0.354 |
andel | -0.353 |
robat | -0.350 |
Ta | -0.348 |
Token | can |
Token ID | 460 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
not | +0.262 |
and | +0.245 |
because | +0.219 |
but | +0.202 |
" | +0.199 |
Neg logit contributions | |
asis | -0.386 |
andel | -0.381 |
ymes | -0.379 |
Ta | -0.379 |
robat | -0.378 |
Token | hide |
Token ID | 7808 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
not | +0.250 |
and | +0.238 |
because | +0.218 |
but | +0.206 |
" | +0.201 |
Neg logit contributions | |
asis | -0.409 |
robat | -0.394 |
ival | -0.391 |
andel | -0.391 |
ites | -0.391 |
Token | it |
Token ID | 340 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
not | +0.135 |
and | +0.109 |
because | +0.097 |
" | +0.090 |
they | +0.087 |
Neg logit contributions | |
ymes | -0.291 |
andel | -0.288 |
robat | -0.283 |
asis | -0.283 |
ites | -0.281 |
Token | away |
Token ID | 1497 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
not | +0.103 |
and | +0.079 |
they | +0.079 |
" | +0.078 |
because | +0.075 |
Neg logit contributions | |
asis | -0.188 |
ymes | -0.176 |
robat | -0.176 |
seas | -0.174 |
ites | -0.173 |
Token | until |
Token ID | 1566 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
not | +0.146 |
and | +0.105 |
" | +0.101 |
because | +0.098 |
they | +0.097 |
Neg logit contributions | |
asis | -0.321 |
keeping | -0.313 |
andel | -0.312 |
ymes | -0.307 |
crow | -0.304 |
Token | then |
Token ID | 788 |
Feature activation | -3.52e+01 |
Pos logit contributions | |
not | +0.301 |
and | +0.284 |
because | +0.248 |
" | +0.236 |
: | +0.236 |
Neg logit contributions | |
asis | -0.422 |
seas | -0.410 |
andel | -0.397 |
ocol | -0.395 |
umm | -0.393 |
Token | . |
Token ID | 13 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
not | +0.383 |
and | +0.358 |
because | +0.313 |
but | +0.284 |
" | +0.277 |
Neg logit contributions | |
asis | -0.651 |
andel | -0.640 |
ymes | -0.634 |
robat | -0.630 |
Ta | -0.622 |
Token | â |
Token ID | 22940 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
not | +0.322 |
and | +0.296 |
because | +0.261 |
, | +0.243 |
but | +0.238 |
Neg logit contributions | |
andel | -0.413 |
asis | -0.405 |
Ta | -0.402 |
umm | -0.399 |
robat | -0.398 |
Token | € |
Token ID | 26391 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
not | +0.391 |
and | +0.377 |
because | +0.351 |
but | +0.335 |
, | +0.332 |
Neg logit contributions | |
asis | -0.200 |
andel | -0.198 |
ymes | -0.197 |
robat | -0.195 |
Ta | -0.191 |
Token | Joe |
Token ID | 5689 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
asis | +0.029 |
ymes | +0.029 |
andel | +0.029 |
robat | +0.028 |
Ta | +0.028 |
Neg logit contributions | |
not | -0.028 |
and | -0.027 |
because | -0.024 |
but | -0.023 |
, | -0.023 |
Token | smiled |
Token ID | 13541 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
not | +0.183 |
and | +0.141 |
because | +0.139 |
but | +0.122 |
" | +0.119 |
Neg logit contributions | |
asis | -0.373 |
pillar | -0.363 |
robat | -0.360 |
crow | -0.356 |
ites | -0.355 |
Token | kind |
Token ID | 1611 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
ymes | +0.041 |
asis | +0.040 |
andel | +0.039 |
ites | +0.039 |
robat | +0.039 |
Neg logit contributions | |
not | -0.030 |
and | -0.028 |
because | -0.026 |
but | -0.024 |
: | -0.023 |
Token | . |
Token ID | 13 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
ymes | +0.362 |
keeping | +0.353 |
andel | +0.351 |
ites | +0.351 |
umm | +0.349 |
Neg logit contributions | |
not | -0.085 |
and | -0.054 |
because | -0.043 |
but | -0.036 |
they | -0.036 |
Token | Thank |
Token ID | 6952 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
not | +0.055 |
and | +0.052 |
because | +0.044 |
for | +0.042 |
, | +0.041 |
Neg logit contributions | |
umm | -0.081 |
Ta | -0.080 |
crow | -0.078 |
unn | -0.078 |
ocol | -0.077 |
Token | you |
Token ID | 345 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
ymes | +0.103 |
asis | +0.103 |
andel | +0.103 |
robat | +0.101 |
Ta | +0.101 |
Neg logit contributions | |
not | -0.074 |
and | -0.070 |
because | -0.062 |
but | -0.058 |
, | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
andel | +0.063 |
unn | +0.060 |
ymes | +0.060 |
umm | +0.058 |
pillar | +0.058 |
Neg logit contributions | |
not | -0.017 |
and | -0.011 |
because | -0.008 |
still | -0.008 |
they | -0.007 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.51e+01 |
Pos logit contributions | |
not | +0.049 |
and | +0.047 |
because | +0.041 |
but | +0.039 |
, | +0.038 |
Neg logit contributions | |
Ta | -0.057 |
umm | -0.056 |
ocol | -0.056 |
robat | -0.054 |
andel | -0.054 |
Token | ." |
Token ID | 526 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
asis | +1.191 |
ymes | +1.187 |
ites | +1.185 |
andel | +1.171 |
unn | +1.142 |
Neg logit contributions | |
not | -0.664 |
and | -0.616 |
because | -0.545 |
but | -0.537 |
" | -0.484 |
Token |
|
Token ID | 198 |
Feature activation | +6.41e+00 |
Pos logit contributions | |
pill | +0.028 |
orns | +0.028 |
pillar | +0.028 |
Ta | +0.028 |
ites | +0.028 |
Neg logit contributions | |
not | -0.016 |
and | -0.012 |
because | -0.012 |
for | -0.011 |
just | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +6.22e+00 |
Pos logit contributions | |
ymes | +0.142 |
Ta | +0.141 |
andel | +0.141 |
asis | +0.141 |
robat | +0.140 |
Neg logit contributions | |
not | -0.044 |
and | -0.038 |
because | -0.034 |
but | -0.028 |
, | -0.025 |
Token | Then |
Token ID | 6423 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
ymes | +0.102 |
asis | +0.101 |
andel | +0.101 |
robat | +0.100 |
Ta | +0.100 |
Neg logit contributions | |
not | -0.085 |
and | -0.081 |
because | -0.073 |
but | -0.068 |
, | -0.067 |
Token | she |
Token ID | 673 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
not | +0.053 |
and | +0.048 |
because | +0.040 |
but | +0.034 |
" | +0.030 |
Neg logit contributions | |
seas | -0.166 |
andel | -0.164 |
ymes | -0.162 |
Ta | -0.162 |
nests | -0.161 |
Token | soon |
Token ID | 2582 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
not | +0.038 |
and | +0.037 |
because | +0.033 |
but | +0.031 |
" | +0.030 |
Neg logit contributions | |
andel | -0.072 |
asis | -0.072 |
nests | -0.072 |
ymes | -0.070 |
Ta | -0.069 |
Token | nothing |
Token ID | 2147 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
not | +0.040 |
and | +0.034 |
because | +0.033 |
" | +0.032 |
: | +0.030 |
Neg logit contributions | |
asis | -0.059 |
nests | -0.058 |
andel | -0.057 |
seas | -0.055 |
ymes | -0.055 |
Token | but |
Token ID | 475 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
ymes | +0.262 |
worm | +0.262 |
asis | +0.260 |
pillar | +0.257 |
crow | +0.254 |
Neg logit contributions | |
not | -0.161 |
and | -0.140 |
because | -0.126 |
" | -0.121 |
: | -0.116 |
Token | a |
Token ID | 257 |
Feature activation | +8.51e+00 |
Pos logit contributions | |
not | +0.021 |
and | +0.018 |
because | +0.016 |
but | +0.015 |
" | +0.015 |
Neg logit contributions | |
ymes | -0.044 |
asis | -0.043 |
nests | -0.043 |
Ta | -0.042 |
andel | -0.042 |
Token | small |
Token ID | 1402 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
asis | +0.137 |
ymes | +0.136 |
andel | +0.136 |
robat | +0.135 |
Ta | +0.134 |
Neg logit contributions | |
not | -0.119 |
and | -0.114 |
because | -0.102 |
but | -0.096 |
, | -0.095 |
Token | spe |
Token ID | 693 |
Feature activation | +6.67e+01 |
Pos logit contributions | |
andel | +0.214 |
asis | +0.214 |
ymes | +0.213 |
robat | +0.209 |
Ta | +0.205 |
Neg logit contributions | |
not | -0.269 |
and | -0.254 |
because | -0.234 |
but | -0.221 |
" | -0.217 |
Token | ck |
Token ID | 694 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
umm | +0.915 |
ival | +0.885 |
pill | +0.878 |
Ta | +0.877 |
ymes | +0.874 |
Neg logit contributions | |
not | -1.179 |
and | -1.126 |
because | -1.005 |
. | -0.985 |
, | -0.970 |
Token | in |
Token ID | 287 |
Feature activation | +8.70e+00 |
Pos logit contributions | |
asis | +0.321 |
ymes | +0.320 |
andel | +0.319 |
emaker | +0.319 |
crow | +0.318 |
Neg logit contributions | |
not | -0.327 |
and | -0.270 |
because | -0.266 |
" | -0.248 |
but | -0.245 |
Token | the |
Token ID | 262 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
andel | +0.173 |
ymes | +0.168 |
ocol | +0.166 |
asis | +0.165 |
Ta | +0.165 |
Neg logit contributions | |
not | -0.087 |
and | -0.077 |
because | -0.068 |
but | -0.061 |
" | -0.060 |
Token | sky |
Token ID | 6766 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
ymes | +0.195 |
robat | +0.191 |
ites | +0.187 |
emaker | +0.187 |
orns | +0.182 |
Neg logit contributions | |
and | -0.306 |
not | -0.301 |
because | -0.275 |
. | -0.267 |
, | -0.267 |
Token | . |
Token ID | 13 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
asis | +0.481 |
ymes | +0.457 |
nests | +0.457 |
pillar | +0.456 |
crow | +0.454 |
Neg logit contributions | |
not | -0.141 |
and | -0.075 |
because | -0.070 |
" | -0.061 |
but | -0.057 |
Token | saw |
Token ID | 2497 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
ymes | +0.122 |
asis | +0.119 |
Ta | +0.118 |
seas | +0.117 |
ites | +0.116 |
Neg logit contributions | |
not | -0.058 |
and | -0.052 |
because | -0.050 |
but | -0.044 |
for | -0.043 |
Token | clown |
Token ID | 25573 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
asis | +0.136 |
robat | +0.134 |
andel | +0.134 |
ymes | +0.133 |
umm | +0.131 |
Neg logit contributions | |
not | -0.065 |
and | -0.063 |
because | -0.052 |
, | -0.047 |
but | -0.047 |
Token | s |
Token ID | 82 |
Feature activation | +5.96e+00 |
Pos logit contributions | |
asis | +0.528 |
ymes | +0.528 |
andel | +0.526 |
robat | +0.521 |
Ta | +0.515 |
Neg logit contributions | |
not | -0.326 |
and | -0.304 |
because | -0.268 |
but | -0.245 |
, | -0.240 |
Token | and |
Token ID | 290 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
asis | +0.140 |
nests | +0.139 |
ymes | +0.137 |
ites | +0.136 |
keeping | +0.135 |
Neg logit contributions | |
not | -0.023 |
because | -0.013 |
and | -0.007 |
but | -0.006 |
they | -0.005 |
Token | ac |
Token ID | 936 |
Feature activation | +4.23e+01 |
Pos logit contributions | |
not | +0.028 |
and | +0.026 |
because | +0.024 |
but | +0.023 |
, | +0.022 |
Neg logit contributions | |
ymes | -0.026 |
asis | -0.026 |
andel | -0.026 |
robat | -0.025 |
Ta | -0.025 |
Token | rob |
Token ID | 22609 |
Feature activation | +6.78e+01 |
Pos logit contributions | |
andel | +0.270 |
umm | +0.245 |
Ta | +0.225 |
ocol | +0.197 |
igsaw | +0.189 |
Neg logit contributions | |
and | -1.079 |
not | -1.029 |
. | -0.962 |
, | -0.962 |
because | -0.958 |
Token | ats |
Token ID | 1381 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
andel | +0.585 |
asis | +0.583 |
ymes | +0.579 |
robat | +0.562 |
Ta | +0.561 |
Neg logit contributions | |
not | -1.448 |
and | -1.401 |
because | -1.308 |
, | -1.252 |
but | -1.250 |
Token | and |
Token ID | 290 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
robat | +0.399 |
crow | +0.395 |
asis | +0.395 |
orns | +0.394 |
ymes | +0.394 |
Neg logit contributions | |
not | -0.069 |
because | -0.026 |
and | -0.022 |
but | -0.011 |
" | -0.003 |
Token | lions |
Token ID | 31420 |
Feature activation | +3.44e+01 |
Pos logit contributions | |
not | +0.029 |
and | +0.028 |
because | +0.026 |
but | +0.024 |
, | +0.024 |
Neg logit contributions | |
asis | -0.019 |
ymes | -0.019 |
andel | -0.019 |
robat | -0.018 |
Ta | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -9.09e-01 |
Pos logit contributions | |
asis | +0.870 |
ymes | +0.865 |
robat | +0.861 |
orns | +0.849 |
andel | +0.847 |
Neg logit contributions | |
not | -0.146 |
and | -0.084 |
because | -0.066 |
but | -0.037 |
" | -0.030 |
Token | elephants |
Token ID | 25368 |
Feature activation | +2.92e+01 |
Pos logit contributions | |
not | +0.017 |
and | +0.017 |
because | +0.016 |
but | +0.015 |
, | +0.015 |
Neg logit contributions | |
asis | -0.010 |
andel | -0.010 |
ymes | -0.010 |
robat | -0.010 |
umm | -0.010 |
Token | family |
Token ID | 1641 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
asis | +0.340 |
ymes | +0.339 |
andel | +0.339 |
robat | +0.335 |
Ta | +0.332 |
Neg logit contributions | |
not | -0.302 |
and | -0.288 |
because | -0.259 |
but | -0.242 |
, | -0.240 |
Token | and |
Token ID | 290 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
asis | +0.520 |
ymes | +0.517 |
robat | +0.506 |
ites | +0.499 |
andel | +0.494 |
Neg logit contributions | |
not | -0.207 |
and | -0.163 |
because | -0.146 |
but | -0.137 |
" | -0.133 |
Token | our |
Token ID | 674 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
not | +0.033 |
and | +0.031 |
because | +0.029 |
but | +0.028 |
: | +0.028 |
Neg logit contributions | |
ymes | -0.044 |
nests | -0.042 |
keeping | -0.042 |
asis | -0.042 |
Ta | -0.042 |
Token | friends |
Token ID | 2460 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
asis | +0.319 |
andel | +0.319 |
ymes | +0.318 |
robat | +0.314 |
Ta | +0.311 |
Neg logit contributions | |
not | -0.341 |
and | -0.327 |
because | -0.297 |
but | -0.279 |
, | -0.277 |
Token | . |
Token ID | 13 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
ymes | +0.412 |
asis | +0.407 |
robat | +0.401 |
ites | +0.393 |
ival | +0.385 |
Neg logit contributions | |
not | -0.221 |
and | -0.178 |
because | -0.170 |
but | -0.162 |
they | -0.157 |
Token | Amen |
Token ID | 34717 |
Feature activation | +7.18e+01 |
Pos logit contributions | |
Ta | +0.039 |
umm | +0.037 |
pter | +0.036 |
crow | +0.036 |
andel | +0.035 |
Neg logit contributions | |
not | -0.051 |
and | -0.048 |
because | -0.044 |
, | -0.042 |
but | -0.041 |
Token | ." |
Token ID | 526 |
Feature activation | +8.87e+00 |
Pos logit contributions | |
ymes | +1.372 |
asis | +1.370 |
andel | +1.343 |
ites | +1.341 |
robat | +1.325 |
Neg logit contributions | |
not | -0.712 |
and | -0.661 |
because | -0.581 |
but | -0.550 |
" | -0.514 |
Token |
|
Token ID | 198 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
pill | +0.153 |
pter | +0.153 |
Ta | +0.151 |
ymes | +0.151 |
pillar | +0.151 |
Neg logit contributions | |
not | -0.087 |
because | -0.069 |
and | -0.069 |
just | -0.062 |
for | -0.062 |
Token |
|
Token ID | 198 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
ymes | +0.305 |
Ta | +0.302 |
asis | +0.299 |
andel | +0.298 |
robat | +0.298 |
Neg logit contributions | |
not | -0.097 |
and | -0.085 |
because | -0.077 |
but | -0.063 |
, | -0.055 |
Token | Anna |
Token ID | 31160 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
ymes | +0.169 |
Ta | +0.162 |
robat | +0.157 |
asis | +0.157 |
ites | +0.155 |
Neg logit contributions | |
not | -0.243 |
and | -0.235 |
because | -0.224 |
but | -0.209 |
, | -0.206 |
Token | said |
Token ID | 531 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
ymes | +0.229 |
asis | +0.229 |
Ta | +0.228 |
pillar | +0.222 |
robat | +0.218 |
Neg logit contributions | |
not | -0.171 |
because | -0.152 |
and | -0.145 |
for | -0.143 |
but | -0.140 |
Token | make |
Token ID | 787 |
Feature activation | +9.06e+00 |
Pos logit contributions | |
not | +0.003 |
and | +0.003 |
because | +0.003 |
: | +0.003 |
but | +0.003 |
Neg logit contributions | |
Ta | -0.006 |
ites | -0.006 |
ymes | -0.006 |
nests | -0.006 |
keeping | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
asis | +0.207 |
andel | +0.205 |
robat | +0.205 |
ymes | +0.202 |
umm | +0.201 |
Neg logit contributions | |
not | -0.075 |
and | -0.067 |
because | -0.052 |
. | -0.047 |
, | -0.046 |
Token | whole |
Token ID | 2187 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
asis | +0.298 |
nests | +0.293 |
ymes | +0.287 |
seas | +0.280 |
bridge | +0.279 |
Neg logit contributions | |
not | -0.186 |
and | -0.181 |
because | -0.170 |
: | -0.170 |
" | -0.168 |
Token | again |
Token ID | 757 |
Feature activation | +6.28e+00 |
Pos logit contributions | |
ymes | +0.190 |
asis | +0.189 |
nests | +0.188 |
umm | +0.186 |
orns | +0.185 |
Neg logit contributions | |
not | -0.114 |
and | -0.098 |
" | -0.094 |
because | -0.090 |
they | -0.090 |
Token | . |
Token ID | 13 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
asis | +0.105 |
ymes | +0.103 |
ites | +0.103 |
nests | +0.100 |
keeping | +0.098 |
Neg logit contributions | |
not | -0.065 |
" | -0.052 |
and | -0.052 |
because | -0.051 |
: | -0.050 |
Token | Amen |
Token ID | 34717 |
Feature activation | +6.79e+01 |
Pos logit contributions | |
not | +0.002 |
and | +0.002 |
because | +0.002 |
for | +0.002 |
, | +0.002 |
Neg logit contributions | |
Ta | -0.003 |
ites | -0.003 |
umm | -0.003 |
asis | -0.003 |
andel | -0.003 |
Token | ." |
Token ID | 526 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
asis | +1.238 |
ites | +1.230 |
ymes | +1.206 |
pter | +1.187 |
ulture | +1.180 |
Neg logit contributions | |
not | -0.658 |
and | -0.594 |
because | -0.565 |
but | -0.560 |
" | -0.519 |
Token |
|
Token ID | 198 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
crow | +0.037 |
keeping | +0.037 |
ites | +0.037 |
pige | +0.037 |
folk | +0.036 |
Neg logit contributions | |
not | -0.019 |
and | -0.016 |
because | -0.015 |
for | -0.015 |
just | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
ymes | +0.087 |
asis | +0.087 |
andel | +0.086 |
Ta | +0.086 |
robat | +0.086 |
Neg logit contributions | |
not | -0.025 |
and | -0.022 |
because | -0.019 |
but | -0.015 |
, | -0.014 |
Token | Then |
Token ID | 6423 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
ymes | +0.034 |
asis | +0.033 |
andel | +0.033 |
robat | +0.033 |
Ta | +0.033 |
Neg logit contributions | |
not | -0.028 |
and | -0.026 |
because | -0.024 |
but | -0.022 |
, | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | -9.84e+00 |
Pos logit contributions | |
not | +0.094 |
and | +0.082 |
because | +0.070 |
but | +0.054 |
" | +0.045 |
Neg logit contributions | |
asis | -0.349 |
seas | -0.348 |
crow | -0.346 |
ymes | -0.346 |
ites | -0.345 |
Token | together |
Token ID | 1978 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
ymes | +0.546 |
robat | +0.541 |
nests | +0.541 |
oceans | +0.535 |
bridge | +0.534 |
Neg logit contributions | |
not | -0.158 |
also | -0.066 |
? | -0.061 |
because | -0.058 |
: | -0.053 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
robat | +0.286 |
ymes | +0.281 |
nests | +0.273 |
andel | +0.272 |
pter | +0.271 |
Neg logit contributions | |
not | -0.096 |
because | -0.048 |
and | -0.045 |
" | -0.044 |
they | -0.039 |
Token | They |
Token ID | 1119 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
ites | +0.258 |
pill | +0.258 |
andel | +0.257 |
Ta | +0.257 |
crow | +0.255 |
Neg logit contributions | |
not | -0.138 |
and | -0.119 |
because | -0.100 |
for | -0.096 |
, | -0.091 |
Token | named |
Token ID | 3706 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
robat | +0.253 |
asis | +0.247 |
ymes | +0.246 |
Ta | +0.246 |
ites | +0.242 |
Neg logit contributions | |
not | -0.138 |
and | -0.125 |
because | -0.114 |
but | -0.106 |
" | -0.105 |
Token | the |
Token ID | 262 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
asis | +0.484 |
ymes | +0.483 |
andel | +0.482 |
robat | +0.478 |
Ta | +0.474 |
Neg logit contributions | |
not | -0.196 |
and | -0.181 |
because | -0.151 |
but | -0.133 |
, | -0.130 |
Token | cat |
Token ID | 3797 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
andel | +0.283 |
asis | +0.282 |
ymes | +0.277 |
robat | +0.275 |
Ta | +0.274 |
Neg logit contributions | |
not | -0.392 |
and | -0.380 |
because | -0.340 |
" | -0.330 |
. | -0.329 |
Token | Box |
Token ID | 8315 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
nests | +0.594 |
crow | +0.594 |
pillar | +0.592 |
asis | +0.589 |
orns | +0.585 |
Neg logit contributions | |
not | -0.139 |
because | -0.064 |
and | -0.060 |
but | -0.050 |
still | -0.033 |
Token | . |
Token ID | 13 |
Feature activation | +5.28e+00 |
Pos logit contributions | |
ymes | +0.543 |
asis | +0.533 |
robat | +0.531 |
ites | +0.526 |
orns | +0.523 |
Neg logit contributions | |
not | -0.122 |
and | -0.083 |
because | -0.071 |
but | -0.057 |
" | -0.045 |
Token | They |
Token ID | 1119 |
Feature activation | +6.17e+00 |
Pos logit contributions | |
andel | +0.103 |
ites | +0.102 |
Ta | +0.101 |
robat | +0.100 |
crow | +0.100 |
Neg logit contributions | |
not | -0.050 |
and | -0.043 |
because | -0.037 |
for | -0.033 |
, | -0.032 |
Token | took |
Token ID | 1718 |
Feature activation | +5.71e+00 |
Pos logit contributions | |
robat | +0.109 |
ites | +0.107 |
ymes | +0.107 |
asis | +0.107 |
Ta | +0.104 |
Neg logit contributions | |
not | -0.065 |
and | -0.057 |
because | -0.055 |
but | -0.051 |
" | -0.049 |
Token | it |
Token ID | 340 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
asis | +0.114 |
umm | +0.104 |
robat | +0.102 |
lor | +0.100 |
actus | +0.100 |
Neg logit contributions | |
and | -0.079 |
not | -0.073 |
, | -0.069 |
to | -0.067 |
a | -0.066 |
Token | he |
Token ID | 339 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
asis | +0.444 |
seas | +0.432 |
ocol | +0.431 |
emaker | +0.430 |
ymes | +0.429 |
Neg logit contributions | |
not | -0.188 |
and | -0.183 |
because | -0.151 |
: | -0.137 |
. | -0.132 |
Token | was |
Token ID | 373 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
asis | +0.480 |
ymes | +0.458 |
pillar | +0.457 |
robat | +0.452 |
arrow | +0.451 |
Neg logit contributions | |
not | -0.189 |
and | -0.177 |
because | -0.162 |
but | -0.150 |
" | -0.137 |
Token | sleeping |
Token ID | 11029 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
asis | +0.298 |
andel | +0.293 |
ymes | +0.292 |
nests | +0.288 |
ocol | +0.287 |
Neg logit contributions | |
and | -0.124 |
not | -0.122 |
because | -0.105 |
but | -0.097 |
they | -0.094 |
Token | in |
Token ID | 287 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
seas | +0.519 |
asis | +0.518 |
ymes | +0.513 |
robat | +0.513 |
orns | +0.497 |
Neg logit contributions | |
not | -0.206 |
they | -0.124 |
" | -0.115 |
because | -0.110 |
: | -0.109 |
Token | his |
Token ID | 465 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
asis | +0.477 |
andel | +0.476 |
ymes | +0.472 |
robat | +0.471 |
keeping | +0.470 |
Neg logit contributions | |
not | -0.170 |
and | -0.145 |
because | -0.121 |
" | -0.107 |
: | -0.105 |
Token | shell |
Token ID | 7582 |
Feature activation | +3.59e+01 |
Pos logit contributions | |
ymes | +0.231 |
andel | +0.230 |
asis | +0.228 |
robat | +0.227 |
Ta | +0.225 |
Neg logit contributions | |
not | -0.271 |
and | -0.261 |
because | -0.238 |
but | -0.224 |
, | -0.224 |
Token | . |
Token ID | 13 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
asis | +0.842 |
seas | +0.817 |
robat | +0.815 |
orns | +0.810 |
ymes | +0.801 |
Neg logit contributions | |
not | -0.196 |
and | -0.105 |
they | -0.098 |
" | -0.094 |
because | -0.087 |
Token | She |
Token ID | 1375 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
andel | +0.228 |
asis | +0.226 |
Ta | +0.223 |
ymes | +0.223 |
robat | +0.222 |
Neg logit contributions | |
not | -0.108 |
and | -0.097 |
because | -0.082 |
, | -0.072 |
but | -0.072 |
Token | said |
Token ID | 531 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
asis | +0.249 |
ymes | +0.246 |
Ta | +0.241 |
seas | +0.240 |
nests | +0.238 |
Neg logit contributions | |
not | -0.136 |
and | -0.121 |
because | -0.114 |
but | -0.105 |
" | -0.102 |
Token | , |
Token ID | 11 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
ymes | +0.258 |
andel | +0.257 |
asis | +0.255 |
seas | +0.253 |
ocol | +0.253 |
Neg logit contributions | |
not | -0.052 |
and | -0.043 |
because | -0.034 |
but | -0.024 |
. | -0.017 |
Token | " |
Token ID | 366 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
andel | +0.049 |
folk | +0.049 |
oceans | +0.049 |
pillar | +0.049 |
lakes | +0.048 |
Neg logit contributions | |
not | -0.021 |
because | -0.014 |
and | -0.014 |
? | -0.013 |
just | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
orns | +1.137 |
seas | +1.134 |
asis | +1.127 |
ites | +1.109 |
nests | +1.076 |
Neg logit contributions | |
not | -0.347 |
" | -0.237 |
and | -0.230 |
because | -0.186 |
: | -0.161 |
Token | They |
Token ID | 1119 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
andel | +0.539 |
asis | +0.538 |
robat | +0.532 |
Ta | +0.531 |
ymes | +0.531 |
Neg logit contributions | |
not | -0.268 |
and | -0.238 |
because | -0.202 |
but | -0.181 |
, | -0.178 |
Token | collect |
Token ID | 2824 |
Feature activation | +3.67e+01 |
Pos logit contributions | |
asis | +0.512 |
robat | +0.504 |
Ta | +0.498 |
ymes | +0.495 |
ites | +0.495 |
Neg logit contributions | |
not | -0.301 |
and | -0.275 |
because | -0.251 |
but | -0.231 |
" | -0.224 |
Token | rocks |
Token ID | 12586 |
Feature activation | +4.63e+01 |
Pos logit contributions | |
asis | +0.439 |
umm | +0.429 |
robat | +0.429 |
Ta | +0.429 |
andel | +0.427 |
Neg logit contributions | |
and | -0.687 |
not | -0.679 |
because | -0.614 |
, | -0.605 |
but | -0.594 |
Token | , |
Token ID | 11 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
orns | +1.112 |
ites | +1.110 |
seas | +1.098 |
asis | +1.086 |
andel | +1.074 |
Neg logit contributions | |
not | -0.227 |
" | -0.092 |
because | -0.092 |
and | -0.076 |
but | -0.044 |
Token | shells |
Token ID | 19679 |
Feature activation | +4.45e+01 |
Pos logit contributions | |
asis | +0.189 |
ymes | +0.188 |
andel | +0.188 |
robat | +0.184 |
Ta | +0.181 |
Neg logit contributions | |
not | -0.323 |
and | -0.309 |
because | -0.288 |
but | -0.273 |
, | -0.272 |
Token | , |
Token ID | 11 |
Feature activation | +1.38e+01 |
Pos logit contributions | |
orns | +1.046 |
ites | +1.043 |
seas | +1.039 |
asis | +1.027 |
nests | +1.009 |
Neg logit contributions | |
not | -0.231 |
because | -0.114 |
" | -0.081 |
and | -0.070 |
but | -0.047 |
Token | leaves |
Token ID | 5667 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
seas | +0.244 |
nests | +0.238 |
orns | +0.238 |
oceans | +0.235 |
andel | +0.234 |
Neg logit contributions | |
not | -0.159 |
and | -0.129 |
because | -0.127 |
" | -0.121 |
: | -0.120 |
Token | , |
Token ID | 11 |
Feature activation | +9.95e+00 |
Pos logit contributions | |
orns | +0.643 |
nests | +0.628 |
ites | +0.628 |
andel | +0.625 |
seas | +0.622 |
Neg logit contributions | |
not | -0.142 |
because | -0.072 |
" | -0.051 |
and | -0.039 |
just | -0.032 |
Token | and |
Token ID | 290 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
seas | +0.226 |
nests | +0.223 |
oceans | +0.221 |
orns | +0.220 |
lakes | +0.217 |
Neg logit contributions | |
not | -0.063 |
because | -0.040 |
and | -0.036 |
" | -0.036 |
: | -0.036 |
Token | stickers |
Token ID | 28568 |
Feature activation | +3.63e+01 |
Pos logit contributions | |
ymes | +0.031 |
asis | +0.031 |
andel | +0.031 |
Ta | +0.030 |
robat | +0.030 |
Neg logit contributions | |
not | -0.044 |
and | -0.042 |
because | -0.040 |
but | -0.037 |
" | -0.037 |
Token | stuck |
Token ID | 7819 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
asis | +0.167 |
arrow | +0.164 |
ymes | +0.164 |
robat | +0.161 |
nests | +0.161 |
Neg logit contributions | |
not | -0.082 |
and | -0.077 |
because | -0.070 |
but | -0.064 |
" | -0.062 |
Token | out |
Token ID | 503 |
Feature activation | +6.53e+00 |
Pos logit contributions | |
seas | +0.314 |
ymes | +0.305 |
oceans | +0.304 |
isher | +0.300 |
rivers | +0.298 |
Neg logit contributions | |
not | -0.157 |
because | -0.121 |
and | -0.119 |
but | -0.101 |
they | -0.099 |
Token | and |
Token ID | 290 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
ymes | +0.100 |
andel | +0.095 |
ites | +0.094 |
nests | +0.093 |
seas | +0.092 |
Neg logit contributions | |
not | -0.082 |
and | -0.067 |
because | -0.066 |
" | -0.063 |
but | -0.063 |
Token | made |
Token ID | 925 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
and | +0.087 |
not | +0.083 |
because | +0.074 |
: | +0.071 |
but | +0.071 |
Neg logit contributions | |
seas | -0.125 |
nests | -0.123 |
asis | -0.122 |
andel | -0.121 |
ymes | -0.121 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
asis | +0.085 |
ymes | +0.085 |
andel | +0.084 |
robat | +0.084 |
Ta | +0.083 |
Neg logit contributions | |
not | -0.023 |
and | -0.021 |
because | -0.016 |
but | -0.013 |
, | -0.013 |
Token | nest |
Token ID | 16343 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
igsaw | +0.164 |
robat | +0.159 |
Ta | +0.155 |
ocol | +0.155 |
ival | +0.153 |
Neg logit contributions | |
not | -0.242 |
and | -0.234 |
. | -0.202 |
because | -0.201 |
but | -0.201 |
Token | look |
Token ID | 804 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
asis | +0.604 |
nests | +0.592 |
andel | +0.585 |
ymes | +0.583 |
arrow | +0.572 |
Neg logit contributions | |
not | -0.367 |
and | -0.343 |
because | -0.325 |
" | -0.307 |
: | -0.301 |
Token | messy |
Token ID | 24097 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
andel | +0.194 |
seas | +0.189 |
nests | +0.186 |
ocol | +0.184 |
ymes | +0.178 |
Neg logit contributions | |
not | -0.149 |
and | -0.134 |
: | -0.124 |
" | -0.124 |
because | -0.119 |
Token | . |
Token ID | 13 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
keeping | +0.357 |
umm | +0.347 |
seas | +0.333 |
ymes | +0.333 |
asis | +0.331 |
Neg logit contributions | |
not | -0.144 |
" | -0.088 |
told | -0.076 |
Their | -0.070 |
: | -0.070 |
Token | Tim |
Token ID | 5045 |
Feature activation | +9.94e+00 |
Pos logit contributions | |
not | +0.002 |
and | +0.002 |
because | +0.002 |
for | +0.002 |
but | +0.002 |
Neg logit contributions | |
andel | -0.004 |
crow | -0.004 |
umm | -0.004 |
nests | -0.004 |
pill | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
pillar | +0.229 |
ymes | +0.224 |
robat | +0.224 |
emaker | +0.221 |
orns | +0.220 |
Neg logit contributions | |
not | -0.056 |
they | -0.035 |
because | -0.033 |
their | -0.028 |
for | -0.028 |
Token | of |
Token ID | 286 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
not | +0.046 |
and | +0.034 |
" | +0.033 |
because | +0.033 |
they | +0.030 |
Neg logit contributions | |
andel | -0.067 |
ymes | -0.066 |
emaker | -0.065 |
asis | -0.065 |
crow | -0.065 |
Token | her |
Token ID | 607 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
not | +0.060 |
and | +0.053 |
because | +0.045 |
" | +0.040 |
but | +0.040 |
Neg logit contributions | |
ymes | -0.143 |
andel | -0.143 |
keeping | -0.142 |
orns | -0.141 |
robat | -0.141 |
Token | chamber |
Token ID | 11847 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
not | +0.070 |
and | +0.067 |
because | +0.063 |
but | +0.060 |
" | +0.060 |
Neg logit contributions | |
asis | -0.032 |
ymes | -0.031 |
andel | -0.031 |
robat | -0.030 |
umm | -0.029 |
Token | again |
Token ID | 757 |
Feature activation | -5.13e+00 |
Pos logit contributions | |
asis | +0.299 |
ymes | +0.289 |
robat | +0.288 |
handed | +0.287 |
keeping | +0.287 |
Neg logit contributions | |
not | -0.098 |
and | -0.073 |
because | -0.061 |
" | -0.057 |
they | -0.050 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
not | +0.036 |
" | +0.022 |
and | +0.021 |
because | +0.018 |
: | +0.017 |
Neg logit contributions | |
asis | -0.108 |
keeping | -0.108 |
nests | -0.105 |
kingdom | -0.105 |
handed | -0.103 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
not | +0.125 |
and | +0.114 |
because | +0.097 |
but | +0.094 |
, | +0.088 |
Neg logit contributions | |
andel | -0.244 |
umm | -0.242 |
asis | -0.241 |
handed | -0.239 |
keeping | -0.239 |
Token | The |
Token ID | 464 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
asis | +0.545 |
ymes | +0.544 |
andel | +0.540 |
robat | +0.539 |
Ta | +0.532 |
Neg logit contributions | |
not | -0.260 |
and | -0.235 |
because | -0.204 |
but | -0.182 |
, | -0.175 |
Token | clever |
Token ID | 14169 |
Feature activation | +4.54e+00 |
Pos logit contributions | |
and | +0.017 |
not | +0.017 |
because | +0.015 |
. | +0.014 |
, | +0.014 |
Neg logit contributions | |
robat | -0.024 |
ymes | -0.023 |
asis | -0.023 |
andel | -0.023 |
Ta | -0.023 |
Token | little |
Token ID | 1310 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
keeping | +0.074 |
robat | +0.074 |
Ta | +0.073 |
ymes | +0.073 |
asis | +0.073 |
Neg logit contributions | |
and | -0.070 |
, | -0.062 |
not | -0.061 |
. | -0.059 |
because | -0.058 |
Token | girl |
Token ID | 2576 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
and | +0.032 |
, | +0.029 |
because | +0.027 |
not | +0.027 |
. | +0.027 |
Neg logit contributions | |
asis | -0.031 |
Ta | -0.031 |
lor | -0.031 |
robat | -0.030 |
andel | -0.030 |
Token | was |
Token ID | 373 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
asis | +0.061 |
pillar | +0.061 |
seas | +0.059 |
nests | +0.059 |
crow | +0.058 |
Neg logit contributions | |
not | -0.036 |
because | -0.026 |
and | -0.025 |
but | -0.024 |
" | -0.024 |
Token | knew |
Token ID | 2993 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
not | +0.084 |
and | +0.071 |
because | +0.070 |
but | +0.065 |
" | +0.063 |
Neg logit contributions | |
asis | -0.155 |
Ta | -0.151 |
seas | -0.150 |
ival | -0.150 |
pillar | -0.149 |
Token | she |
Token ID | 673 |
Feature activation | -9.86e+00 |
Pos logit contributions | |
not | +0.090 |
and | +0.089 |
because | +0.077 |
" | +0.070 |
but | +0.069 |
Neg logit contributions | |
seas | -0.192 |
crow | -0.188 |
lor | -0.186 |
andel | -0.186 |
ocol | -0.185 |
Token | had |
Token ID | 550 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
not | +0.092 |
and | +0.079 |
because | +0.072 |
but | +0.071 |
" | +0.069 |
Neg logit contributions | |
pillar | -0.178 |
ymes | -0.176 |
asis | -0.175 |
ival | -0.169 |
keeping | -0.168 |
Token | to |
Token ID | 284 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
and | +0.101 |
not | +0.101 |
because | +0.090 |
but | +0.084 |
, | +0.078 |
Neg logit contributions | |
ymes | -0.226 |
seas | -0.224 |
keeping | -0.221 |
asis | -0.218 |
nests | -0.218 |
Token | take |
Token ID | 1011 |
Feature activation | -5.80e+00 |
Pos logit contributions | |
not | +0.137 |
and | +0.131 |
" | +0.123 |
because | +0.122 |
they | +0.115 |
Neg logit contributions | |
asis | -0.205 |
robat | -0.191 |
keeping | -0.190 |
andel | -0.190 |
nests | -0.187 |
Token | care |
Token ID | 1337 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
not | +0.050 |
and | +0.046 |
because | +0.038 |
but | +0.034 |
, | +0.032 |
Neg logit contributions | |
andel | -0.123 |
ymes | -0.123 |
asis | -0.123 |
robat | -0.122 |
Ta | -0.121 |
Token | of |
Token ID | 286 |
Feature activation | -8.43e+00 |
Pos logit contributions | |
andel | +0.023 |
emaker | +0.022 |
ymes | +0.022 |
ites | +0.022 |
crow | +0.021 |
Neg logit contributions | |
not | -0.024 |
and | -0.020 |
because | -0.020 |
" | -0.020 |
but | -0.019 |
Token | her |
Token ID | 607 |
Feature activation | -4.64e+00 |
Pos logit contributions | |
not | +0.075 |
and | +0.069 |
because | +0.059 |
: | +0.055 |
" | +0.053 |
Neg logit contributions | |
ymes | -0.158 |
robat | -0.156 |
andel | -0.155 |
ocol | -0.155 |
nests | -0.155 |
Token | laser |
Token ID | 12855 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
not | +0.094 |
and | +0.084 |
because | +0.080 |
" | +0.078 |
but | +0.078 |
Neg logit contributions | |
ymes | -0.042 |
andel | -0.040 |
robat | -0.040 |
ites | -0.039 |
seas | -0.039 |
Token | and |
Token ID | 290 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
asis | +0.080 |
ymes | +0.080 |
robat | +0.080 |
andel | +0.078 |
nests | +0.078 |
Neg logit contributions | |
not | -0.031 |
and | -0.025 |
because | -0.021 |
" | -0.020 |
: | -0.019 |
Token | she |
Token ID | 673 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
not | +0.182 |
and | +0.179 |
because | +0.162 |
: | +0.151 |
but | +0.148 |
Neg logit contributions | |
keeping | -0.372 |
nests | -0.359 |
asis | -0.356 |
ymes | -0.344 |
Ta | -0.344 |
Token | in |
Token ID | 287 |
Feature activation | -9.10e+00 |
Pos logit contributions | |
ymes | +0.148 |
asis | +0.146 |
crow | +0.145 |
pillar | +0.143 |
orns | +0.142 |
Neg logit contributions | |
not | -0.062 |
because | -0.050 |
and | -0.045 |
but | -0.042 |
" | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
not | +0.062 |
and | +0.056 |
because | +0.044 |
but | +0.037 |
, | +0.036 |
Neg logit contributions | |
ymes | -0.209 |
asis | -0.209 |
andel | -0.209 |
robat | -0.207 |
Ta | -0.206 |
Token | middle |
Token ID | 3504 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
not | +0.037 |
and | +0.037 |
because | +0.034 |
, | +0.032 |
. | +0.032 |
Neg logit contributions | |
ocol | -0.025 |
ites | -0.024 |
ymes | -0.024 |
andel | -0.024 |
emaker | -0.024 |
Token | of |
Token ID | 286 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
asis | +0.028 |
andel | +0.028 |
ymes | +0.027 |
robat | +0.027 |
ites | +0.027 |
Neg logit contributions | |
not | -0.019 |
and | -0.017 |
because | -0.016 |
but | -0.014 |
" | -0.014 |
Token | the |
Token ID | 262 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
not | +0.065 |
and | +0.059 |
because | +0.042 |
but | +0.033 |
, | +0.032 |
Neg logit contributions | |
asis | -0.277 |
robat | -0.274 |
ymes | -0.273 |
andel | -0.272 |
umm | -0.271 |
Token | path |
Token ID | 3108 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
and | +0.058 |
not | +0.057 |
because | +0.052 |
, | +0.051 |
. | +0.050 |
Neg logit contributions | |
ocol | -0.038 |
andel | -0.036 |
emaker | -0.036 |
ites | -0.036 |
isher | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
ites | +0.048 |
asis | +0.047 |
ymes | +0.047 |
crow | +0.047 |
keeping | +0.047 |
Neg logit contributions | |
not | -0.013 |
and | -0.008 |
because | -0.008 |
" | -0.006 |
but | -0.006 |
Token | |
Token ID | 220 |
Feature activation | +5.69e+00 |
Pos logit contributions | |
not | +0.146 |
and | +0.136 |
because | +0.115 |
but | +0.103 |
, | +0.101 |
Neg logit contributions | |
asis | -0.318 |
ymes | -0.317 |
andel | -0.316 |
robat | -0.314 |
Ta | -0.311 |
Token |
|
Token ID | 198 |
Feature activation | -7.72e+00 |
Pos logit contributions | |
ymes | +0.131 |
asis | +0.130 |
andel | +0.130 |
ites | +0.129 |
robat | +0.129 |
Neg logit contributions | |
not | -0.035 |
and | -0.031 |
because | -0.025 |
but | -0.020 |
, | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | -8.26e+00 |
Pos logit contributions | |
not | +0.044 |
and | +0.038 |
because | +0.029 |
but | +0.022 |
, | +0.021 |
Neg logit contributions | |
ymes | -0.185 |
asis | -0.185 |
andel | -0.184 |
robat | -0.183 |
Ta | -0.182 |
Token | L |
Token ID | 43 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
not | +0.116 |
and | +0.110 |
because | +0.099 |
but | +0.092 |
, | +0.091 |
Neg logit contributions | |
asis | -0.135 |
andel | -0.134 |
ymes | -0.134 |
robat | -0.133 |
Ta | -0.130 |
Token | climb |
Token ID | 12080 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
not | +0.063 |
and | +0.055 |
because | +0.053 |
" | +0.048 |
but | +0.048 |
Neg logit contributions | |
asis | -0.079 |
Ta | -0.079 |
ymes | -0.078 |
andel | -0.077 |
robat | -0.077 |
Token | the |
Token ID | 262 |
Feature activation | +7.08e-01 |
Pos logit contributions | |
andel | +0.048 |
asis | +0.048 |
ymes | +0.048 |
robat | +0.047 |
ites | +0.047 |
Neg logit contributions | |
not | -0.020 |
and | -0.018 |
because | -0.015 |
but | -0.013 |
, | -0.013 |
Token | tree |
Token ID | 5509 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
ymes | +0.009 |
Ta | +0.009 |
ocol | +0.009 |
robat | +0.008 |
andel | +0.008 |
Neg logit contributions | |
and | -0.013 |
not | -0.013 |
because | -0.012 |
, | -0.012 |
to | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
asis | +0.255 |
ymes | +0.251 |
andel | +0.251 |
nests | +0.251 |
ites | +0.249 |
Neg logit contributions | |
not | -0.049 |
and | -0.034 |
because | -0.026 |
but | -0.018 |
" | -0.015 |
Token | They |
Token ID | 1119 |
Feature activation | -9.32e+00 |
Pos logit contributions | |
not | +0.093 |
and | +0.080 |
because | +0.063 |
but | +0.052 |
, | +0.051 |
Neg logit contributions | |
andel | -0.309 |
asis | -0.304 |
ymes | -0.302 |
Ta | -0.300 |
umm | -0.300 |
Token | pick |
Token ID | 2298 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
not | +0.108 |
and | +0.101 |
because | +0.090 |
but | +0.082 |
, | +0.081 |
Neg logit contributions | |
asis | -0.169 |
andel | -0.168 |
ymes | -0.168 |
robat | -0.166 |
Ta | -0.165 |
Token | some |
Token ID | 617 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
ymes | +0.071 |
asis | +0.071 |
robat | +0.071 |
andel | +0.070 |
Ta | +0.070 |
Neg logit contributions | |
not | -0.041 |
and | -0.040 |
because | -0.034 |
, | -0.032 |
. | -0.031 |
Token | cher |
Token ID | 21382 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
andel | +0.003 |
asis | +0.003 |
ymes | +0.003 |
orns | +0.003 |
ites | +0.003 |
Neg logit contributions | |
not | -0.006 |
and | -0.006 |
because | -0.005 |
but | -0.005 |
" | -0.005 |
Token | ries |
Token ID | 1678 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
Ta | +0.223 |
andel | +0.219 |
ymes | +0.215 |
robat | +0.213 |
asis | +0.213 |
Neg logit contributions | |
and | -0.458 |
not | -0.458 |
because | -0.419 |
, | -0.408 |
. | -0.401 |
Token | and |
Token ID | 290 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
ites | +0.273 |
nests | +0.269 |
orns | +0.267 |
ite | +0.264 |
asis | +0.262 |
Neg logit contributions | |
not | -0.085 |
" | -0.045 |
because | -0.043 |
but | -0.033 |
? | -0.031 |
Token | put |
Token ID | 1234 |
Feature activation | +2.85e+00 |
Pos logit contributions | |
not | +0.200 |
and | +0.185 |
because | +0.168 |
but | +0.150 |
" | +0.147 |
Neg logit contributions | |
asis | -0.327 |
andel | -0.325 |
ymes | -0.324 |
Ta | -0.323 |
robat | -0.320 |
Token | Lucy |
Token ID | 22162 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
not | +0.112 |
and | +0.105 |
because | +0.091 |
, | +0.083 |
but | +0.083 |
Neg logit contributions | |
asis | -0.210 |
ymes | -0.209 |
andel | -0.207 |
robat | -0.207 |
Ta | -0.204 |
Token | . |
Token ID | 13 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
not | +0.018 |
but | +0.010 |
and | +0.010 |
because | +0.009 |
" | +0.009 |
Neg logit contributions | |
ymes | -0.058 |
pter | -0.057 |
asis | -0.056 |
keeping | -0.056 |
robat | -0.055 |
Token | She |
Token ID | 1375 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
not | +0.147 |
and | +0.131 |
because | +0.110 |
but | +0.097 |
, | +0.094 |
Neg logit contributions | |
andel | -0.320 |
ymes | -0.318 |
asis | -0.318 |
Ta | -0.314 |
umm | -0.314 |
Token | was |
Token ID | 373 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
not | +0.100 |
and | +0.092 |
but | +0.083 |
because | +0.081 |
for | +0.075 |
Neg logit contributions | |
asis | -0.212 |
Ta | -0.207 |
robat | -0.206 |
ymes | -0.205 |
pillar | -0.202 |
Token | only |
Token ID | 691 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
not | +0.144 |
and | +0.134 |
because | +0.105 |
but | +0.091 |
, | +0.088 |
Neg logit contributions | |
andel | -0.462 |
ymes | -0.458 |
asis | -0.458 |
Ta | -0.454 |
robat | -0.450 |
Token | three |
Token ID | 1115 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
not | +0.313 |
and | +0.304 |
because | +0.272 |
but | +0.254 |
, | +0.250 |
Neg logit contributions | |
asis | -0.417 |
ymes | -0.407 |
robat | -0.406 |
Ta | -0.399 |
andel | -0.399 |
Token | , |
Token ID | 11 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
ymes | +0.028 |
andel | +0.027 |
asis | +0.027 |
ites | +0.026 |
robat | +0.026 |
Neg logit contributions | |
not | -0.040 |
and | -0.037 |
because | -0.034 |
" | -0.033 |
but | -0.033 |
Token | with |
Token ID | 351 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
: | +0.081 |
not | +0.081 |
and | +0.057 |
. | +0.057 |
? | +0.055 |
Neg logit contributions | |
seas | -0.363 |
orns | -0.348 |
nests | -0.347 |
pter | -0.343 |
robat | -0.341 |
Token | curly |
Token ID | 45731 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
not | +0.108 |
and | +0.089 |
because | +0.075 |
, | +0.064 |
" | +0.064 |
Neg logit contributions | |
asis | -0.320 |
ymes | -0.308 |
robat | -0.306 |
ites | -0.304 |
andel | -0.301 |
Token | blonde |
Token ID | 21541 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
andel | +0.044 |
ymes | +0.043 |
asis | +0.043 |
robat | +0.043 |
Ta | +0.042 |
Neg logit contributions | |
not | -0.052 |
and | -0.050 |
because | -0.046 |
but | -0.043 |
, | -0.042 |
Token | hair |
Token ID | 4190 |
Feature activation | +7.63e+00 |
Pos logit contributions | |
asis | +0.230 |
ymes | +0.229 |
robat | +0.227 |
andel | +0.226 |
Ta | +0.222 |
Neg logit contributions | |
not | -0.256 |
and | -0.250 |
because | -0.225 |
, | -0.213 |
but | -0.211 |
Token |
|
Token ID | 198 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
not | +0.028 |
and | +0.024 |
because | +0.019 |
but | +0.015 |
, | +0.014 |
Neg logit contributions | |
asis | -0.107 |
ymes | -0.107 |
andel | -0.107 |
robat | -0.106 |
Ta | -0.105 |
Token | One |
Token ID | 3198 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
not | +0.074 |
and | +0.071 |
because | +0.064 |
but | +0.060 |
, | +0.060 |
Neg logit contributions | |
asis | -0.083 |
andel | -0.081 |
robat | -0.081 |
ymes | -0.081 |
Ta | -0.080 |
Token | day |
Token ID | 1110 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
not | +0.008 |
and | +0.007 |
because | +0.007 |
but | +0.006 |
" | +0.006 |
Neg logit contributions | |
asis | -0.006 |
andel | -0.006 |
ymes | -0.006 |
robat | -0.006 |
Ta | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
not | +0.007 |
and | +0.004 |
because | +0.004 |
still | +0.003 |
but | +0.003 |
Neg logit contributions | |
seas | -0.019 |
andel | -0.019 |
crow | -0.019 |
asis | -0.018 |
ocol | -0.018 |
Token | Tim |
Token ID | 5045 |
Feature activation | -5.85e+00 |
Pos logit contributions | |
not | +0.178 |
and | +0.162 |
: | +0.150 |
because | +0.128 |
. | +0.125 |
Neg logit contributions | |
seas | -0.295 |
andel | -0.270 |
robat | -0.270 |
asis | -0.269 |
orns | -0.269 |
Token | 's |
Token ID | 338 |
Feature activation | -7.96e+00 |
Pos logit contributions | |
not | +0.070 |
because | +0.056 |
and | +0.055 |
" | +0.053 |
but | +0.052 |
Neg logit contributions | |
asis | -0.099 |
pillar | -0.096 |
orns | -0.094 |
robat | -0.094 |
crow | -0.094 |
Token | mom |
Token ID | 1995 |
Feature activation | +2.42e+00 |
Pos logit contributions | |
not | +0.094 |
and | +0.089 |
because | +0.078 |
but | +0.071 |
, | +0.071 |
Neg logit contributions | |
asis | -0.146 |
ymes | -0.146 |
andel | -0.145 |
robat | -0.144 |
Ta | -0.143 |
Token | got |
Token ID | 1392 |
Feature activation | -9.02e+00 |
Pos logit contributions | |
pillar | +0.037 |
ival | +0.036 |
emaker | +0.036 |
asis | +0.036 |
crow | +0.035 |
Neg logit contributions | |
not | -0.028 |
because | -0.023 |
but | -0.021 |
and | -0.020 |
their | -0.020 |
Token | a |
Token ID | 257 |
Feature activation | -8.92e+00 |
Pos logit contributions | |
not | +0.074 |
and | +0.071 |
because | +0.060 |
but | +0.056 |
" | +0.053 |
Neg logit contributions | |
ymes | -0.183 |
andel | -0.182 |
asis | -0.178 |
Ta | -0.178 |
seas | -0.178 |
Token | terrible |
Token ID | 7818 |
Feature activation | -7.46e+00 |
Pos logit contributions | |
not | +0.127 |
and | +0.121 |
because | +0.108 |
but | +0.101 |
, | +0.101 |
Neg logit contributions | |
asis | -0.142 |
ymes | -0.141 |
andel | -0.141 |
robat | -0.140 |
Ta | -0.137 |
Token | pain |
Token ID | 2356 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
not | +0.126 |
and | +0.117 |
because | +0.108 |
but | +0.103 |
" | +0.103 |
Neg logit contributions | |
asis | -0.096 |
andel | -0.094 |
robat | -0.094 |
ymes | -0.093 |
umm | -0.089 |
Token | it |
Token ID | 340 |
Feature activation | -9.36e-01 |
Pos logit contributions | |
robat | +0.085 |
ymes | +0.084 |
seas | +0.084 |
orns | +0.084 |
isher | +0.083 |
Neg logit contributions | |
not | -0.044 |
and | -0.029 |
because | -0.027 |
: | -0.027 |
" | -0.026 |
Token | looked |
Token ID | 3114 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
not | +0.008 |
and | +0.007 |
" | +0.007 |
because | +0.007 |
: | +0.006 |
Neg logit contributions | |
asis | -0.017 |
robat | -0.016 |
seas | -0.016 |
ymes | -0.016 |
bridge | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
not | +0.074 |
: | +0.050 |
" | +0.050 |
they | +0.047 |
and | +0.047 |
Neg logit contributions | |
seas | -0.161 |
umm | -0.145 |
oceans | -0.143 |
bridge | -0.143 |
andel | -0.142 |
Token | He |
Token ID | 679 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
not | +0.167 |
and | +0.149 |
because | +0.122 |
, | +0.121 |
but | +0.120 |
Neg logit contributions | |
umm | -0.250 |
Ta | -0.238 |
andel | -0.235 |
igsaw | -0.234 |
keeping | -0.233 |
Token | learned |
Token ID | 4499 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
not | +0.113 |
because | +0.097 |
but | +0.095 |
and | +0.093 |
" | +0.088 |
Neg logit contributions | |
Ta | -0.193 |
asis | -0.187 |
seas | -0.187 |
ites | -0.184 |
pillar | -0.183 |
Token | that |
Token ID | 326 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
not | +0.047 |
and | +0.046 |
but | +0.044 |
because | +0.040 |
" | +0.039 |
Neg logit contributions | |
seas | -0.103 |
handed | -0.101 |
ival | -0.100 |
keeping | -0.098 |
lor | -0.097 |
Token | sometimes |
Token ID | 3360 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
not | +0.123 |
and | +0.113 |
because | +0.097 |
but | +0.087 |
" | +0.085 |
Neg logit contributions | |
asis | -0.261 |
ymes | -0.260 |
andel | -0.258 |
robat | -0.258 |
Ta | -0.255 |
Token | it |
Token ID | 340 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
not | +0.124 |
and | +0.114 |
: | +0.100 |
because | +0.100 |
" | +0.096 |
Neg logit contributions | |
ymes | -0.195 |
nests | -0.194 |
seas | -0.194 |
opter | -0.189 |
oceans | -0.188 |
Token | 's |
Token ID | 338 |
Feature activation | -5.34e+00 |
Pos logit contributions | |
ymes | +0.020 |
ites | +0.020 |
asis | +0.020 |
orns | +0.020 |
unn | +0.020 |
Neg logit contributions | |
not | -0.013 |
and | -0.012 |
because | -0.011 |
but | -0.011 |
" | -0.010 |
Token | good |
Token ID | 922 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
and | +0.063 |
: | +0.059 |
" | +0.057 |
not | +0.055 |
they | +0.054 |
Neg logit contributions | |
orns | -0.072 |
risks | -0.072 |
nests | -0.072 |
ymes | -0.071 |
riches | -0.070 |
Token | to |
Token ID | 284 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
orns | +0.093 |
keeping | +0.092 |
unn | +0.091 |
isher | +0.089 |
seas | +0.089 |
Neg logit contributions | |
not | -0.031 |
and | -0.020 |
" | -0.019 |
: | -0.018 |
because | -0.017 |
Token | his |
Token ID | 465 |
Feature activation | -7.17e+00 |
Pos logit contributions | |
not | +0.002 |
and | +0.002 |
because | +0.002 |
but | +0.001 |
" | +0.001 |
Neg logit contributions | |
andel | -0.006 |
ymes | -0.006 |
asis | -0.006 |
ocol | -0.006 |
robat | -0.006 |
Token | new |
Token ID | 649 |
Feature activation | -5.81e+00 |
Pos logit contributions | |
not | +0.120 |
and | +0.110 |
because | +0.105 |
they | +0.101 |
but | +0.099 |
Neg logit contributions | |
umm | -0.088 |
asis | -0.088 |
andel | -0.087 |
seas | -0.086 |
ocol | -0.085 |
Token | spicy |
Token ID | 26880 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
not | +0.115 |
and | +0.104 |
because | +0.100 |
they | +0.095 |
but | +0.095 |
Neg logit contributions | |
andel | -0.058 |
umm | -0.057 |
asis | -0.057 |
ymes | -0.054 |
nests | -0.054 |
Token | treat |
Token ID | 2190 |
Feature activation | -7.49e+00 |
Pos logit contributions | |
not | +0.038 |
and | +0.035 |
because | +0.033 |
but | +0.031 |
they | +0.031 |
Neg logit contributions | |
umm | -0.025 |
asis | -0.025 |
andel | -0.024 |
robat | -0.024 |
ymes | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
not | +0.051 |
and | +0.030 |
" | +0.028 |
because | +0.026 |
but | +0.020 |
Neg logit contributions | |
robat | -0.161 |
asis | -0.158 |
keeping | -0.158 |
umm | -0.158 |
seas | -0.153 |
Token | He |
Token ID | 679 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
not | +0.187 |
and | +0.170 |
because | +0.144 |
but | +0.138 |
for | +0.137 |
Neg logit contributions | |
umm | -0.300 |
igsaw | -0.290 |
andel | -0.287 |
Ta | -0.283 |
ival | -0.283 |
Token | quickly |
Token ID | 2952 |
Feature activation | -1.90e+01 |
Pos logit contributions | |
not | +0.147 |
because | +0.129 |
and | +0.122 |
but | +0.121 |
" | +0.113 |
Neg logit contributions | |
asis | -0.254 |
pillar | -0.248 |
Ta | -0.244 |
arrow | -0.242 |
pill | -0.240 |
Token | opened |
Token ID | 4721 |
Feature activation | -8.72e+00 |
Pos logit contributions | |
not | +0.233 |
and | +0.199 |
because | +0.197 |
but | +0.184 |
" | +0.178 |
Neg logit contributions | |
asis | -0.309 |
andel | -0.306 |
pillar | -0.303 |
Ta | -0.302 |
nests | -0.297 |
Token | the |
Token ID | 262 |
Feature activation | -2.54e+00 |
Pos logit contributions | |
not | +0.073 |
and | +0.059 |
because | +0.055 |
but | +0.047 |
" | +0.044 |
Neg logit contributions | |
andel | -0.180 |
seas | -0.177 |
ocol | -0.176 |
asis | -0.175 |
nests | -0.174 |
Token | brick |
Token ID | 17214 |
Feature activation | +7.99e+00 |
Pos logit contributions | |
not | +0.044 |
and | +0.042 |
because | +0.039 |
but | +0.037 |
, | +0.037 |
Neg logit contributions | |
ymes | -0.032 |
asis | -0.032 |
andel | -0.032 |
robat | -0.032 |
Ta | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
asis | +0.186 |
umm | +0.184 |
andel | +0.182 |
robat | +0.182 |
ites | +0.181 |
Neg logit contributions | |
not | -0.052 |
and | -0.033 |
because | -0.028 |
" | -0.023 |
but | -0.021 |
Token | taste |
Token ID | 6938 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
not | +0.130 |
and | +0.115 |
" | +0.106 |
because | +0.096 |
but | +0.095 |
Neg logit contributions | |
asis | -0.277 |
andel | -0.277 |
ocol | -0.271 |
arrow | -0.268 |
pillar | -0.268 |
Token | it |
Token ID | 340 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
asis | +0.036 |
ymes | +0.036 |
andel | +0.036 |
robat | +0.036 |
Ta | +0.036 |
Neg logit contributions | |
not | -0.017 |
and | -0.016 |
because | -0.013 |
but | -0.012 |
, | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
asis | +0.020 |
robat | +0.019 |
ymes | +0.019 |
umm | +0.019 |
orns | +0.018 |
Neg logit contributions | |
not | -0.009 |
" | -0.007 |
and | -0.006 |
they | -0.006 |
Their | -0.006 |
Token | It |
Token ID | 632 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
not | +0.165 |
and | +0.156 |
because | +0.138 |
but | +0.128 |
, | +0.126 |
Neg logit contributions | |
andel | -0.224 |
ymes | -0.222 |
asis | -0.222 |
Ta | -0.221 |
umm | -0.219 |
Token | is |
Token ID | 318 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
not | +0.005 |
and | +0.004 |
because | +0.004 |
but | +0.004 |
" | +0.004 |
Neg logit contributions | |
asis | -0.008 |
ymes | -0.008 |
orns | -0.008 |
robat | -0.008 |
pill | -0.008 |
Token | not |
Token ID | 407 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
and | +0.154 |
not | +0.133 |
because | +0.125 |
but | +0.124 |
, | +0.120 |
Neg logit contributions | |
ocol | -0.296 |
nests | -0.288 |
andel | -0.287 |
ymes | -0.286 |
mango | -0.281 |
Token | real |
Token ID | 1103 |
Feature activation | -8.78e+00 |
Pos logit contributions | |
not | +0.182 |
and | +0.174 |
because | +0.154 |
but | +0.145 |
" | +0.144 |
Neg logit contributions | |
ymes | -0.249 |
andel | -0.248 |
asis | -0.247 |
ocol | -0.241 |
robat | -0.239 |
Token | . |
Token ID | 13 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
not | +0.073 |
and | +0.051 |
because | +0.044 |
but | +0.039 |
" | +0.039 |
Neg logit contributions | |
ocol | -0.183 |
ymes | -0.183 |
andel | -0.181 |
orns | -0.180 |
robat | -0.180 |
Token | It |
Token ID | 632 |
Feature activation | -9.51e-02 |
Pos logit contributions | |
not | +0.166 |
and | +0.157 |
because | +0.138 |
but | +0.129 |
, | +0.128 |
Neg logit contributions | |
andel | -0.216 |
ymes | -0.215 |
Ta | -0.214 |
asis | -0.213 |
umm | -0.212 |
Token | is |
Token ID | 318 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
not | +0.001 |
and | +0.001 |
because | +0.001 |
but | +0.001 |
" | +0.001 |
Neg logit contributions | |
asis | -0.002 |
ymes | -0.002 |
pill | -0.002 |
orns | -0.002 |
robat | -0.002 |
Token | only |
Token ID | 691 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
and | +0.153 |
not | +0.139 |
because | +0.128 |
but | +0.126 |
, | +0.125 |
Neg logit contributions | |
ocol | -0.289 |
andel | -0.278 |
ymes | -0.277 |
nests | -0.277 |
seas | -0.273 |
Token | for |
Token ID | 329 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
not | +0.025 |
and | +0.021 |
because | +0.019 |
" | +0.018 |
but | +0.018 |
Neg logit contributions | |
asis | -0.050 |
ymes | -0.049 |
ites | -0.049 |
robat | -0.048 |
nests | -0.048 |
Token | a |
Token ID | 257 |
Feature activation | -7.85e+00 |
Pos logit contributions | |
not | +0.083 |
and | +0.079 |
because | +0.066 |
but | +0.060 |
" | +0.057 |
Neg logit contributions | |
ymes | -0.216 |
andel | -0.216 |
asis | -0.215 |
robat | -0.213 |
ocol | -0.213 |
Token | little |
Token ID | 1310 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
not | +0.102 |
and | +0.097 |
because | +0.086 |
but | +0.082 |
, | +0.082 |
Neg logit contributions | |
ymes | -0.136 |
orns | -0.134 |
asis | -0.133 |
andel | -0.133 |
robat | -0.132 |
Token | while |
Token ID | 981 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
not | +0.057 |
and | +0.054 |
because | +0.045 |
but | +0.041 |
, | +0.040 |
Neg logit contributions | |
ymes | -0.134 |
asis | -0.133 |
andel | -0.133 |
robat | -0.132 |
Ta | -0.132 |
Token | , |
Token ID | 11 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
not | +0.095 |
because | +0.062 |
and | +0.061 |
" | +0.059 |
still | +0.051 |
Neg logit contributions | |
ites | -0.225 |
andel | -0.223 |
asis | -0.222 |
oceans | -0.221 |
seas | -0.221 |
Token | and |
Token ID | 290 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
not | +0.118 |
: | +0.095 |
and | +0.093 |
because | +0.083 |
. | +0.075 |
Neg logit contributions | |
seas | -0.315 |
oceans | -0.308 |
pige | -0.307 |
andel | -0.306 |
nests | -0.303 |
Token | then |
Token ID | 788 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
not | +0.155 |
and | +0.144 |
because | +0.125 |
: | +0.110 |
but | +0.107 |
Neg logit contributions | |
asis | -0.405 |
nests | -0.404 |
Ta | -0.402 |
ites | -0.400 |
ymes | -0.399 |
Token | we |
Token ID | 356 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
not | +0.237 |
and | +0.218 |
because | +0.194 |
but | +0.172 |
" | +0.164 |
Neg logit contributions | |
asis | -0.473 |
ymes | -0.471 |
ites | -0.466 |
andel | -0.462 |
robat | -0.460 |
Token | can |
Token ID | 460 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
not | +0.098 |
and | +0.098 |
because | +0.077 |
, | +0.073 |
. | +0.072 |
Neg logit contributions | |
ymes | -0.221 |
andel | -0.220 |
umm | -0.218 |
Ta | -0.215 |
robat | -0.215 |
Token | go |
Token ID | 467 |
Feature activation | -4.98e+00 |
Pos logit contributions | |
not | +0.128 |
and | +0.119 |
because | +0.115 |
" | +0.108 |
but | +0.106 |
Neg logit contributions | |
asis | -0.195 |
robat | -0.184 |
arrow | -0.182 |
ites | -0.182 |
nests | -0.181 |
Token | see |
Token ID | 766 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
not | +0.047 |
" | +0.034 |
because | +0.034 |
and | +0.033 |
: | +0.030 |
Neg logit contributions | |
asis | -0.099 |
ites | -0.099 |
seas | -0.095 |
orns | -0.094 |
robat | -0.094 |
Token | finished |
Token ID | 5201 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
not | +0.045 |
and | +0.037 |
because | +0.036 |
but | +0.033 |
" | +0.032 |
Neg logit contributions | |
asis | -0.074 |
ites | -0.070 |
pillar | -0.070 |
robat | -0.070 |
ival | -0.070 |
Token | the |
Token ID | 262 |
Feature activation | -4.04e+00 |
Pos logit contributions | |
not | +0.110 |
and | +0.093 |
because | +0.089 |
but | +0.082 |
" | +0.072 |
Neg logit contributions | |
nests | -0.230 |
asis | -0.228 |
seas | -0.228 |
ocol | -0.226 |
oceans | -0.223 |
Token | path |
Token ID | 3108 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
not | +0.069 |
and | +0.067 |
for | +0.060 |
, | +0.059 |
because | +0.059 |
Neg logit contributions | |
ymes | -0.058 |
andel | -0.057 |
emaker | -0.057 |
ites | -0.056 |
orns | -0.055 |
Token | , |
Token ID | 11 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
not | +0.000 |
and | +0.000 |
because | +0.000 |
" | +0.000 |
but | +0.000 |
Neg logit contributions | |
asis | -0.001 |
folk | -0.001 |
andel | -0.001 |
ival | -0.001 |
seas | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
not | +0.147 |
and | +0.116 |
because | +0.107 |
: | +0.103 |
. | +0.084 |
Neg logit contributions | |
asis | -0.401 |
andel | -0.397 |
keeping | -0.397 |
nests | -0.395 |
folk | -0.395 |
Token | was |
Token ID | 373 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
not | +0.033 |
and | +0.029 |
because | +0.027 |
but | +0.024 |
" | +0.023 |
Neg logit contributions | |
asis | -0.079 |
pillar | -0.075 |
ymes | -0.075 |
robat | -0.074 |
nests | -0.074 |
Token | so |
Token ID | 523 |
Feature activation | -8.99e+00 |
Pos logit contributions | |
not | +0.196 |
and | +0.186 |
but | +0.159 |
because | +0.159 |
they | +0.158 |
Neg logit contributions | |
andel | -0.426 |
asis | -0.417 |
nests | -0.417 |
seas | -0.411 |
ocol | -0.408 |
Token | beautiful |
Token ID | 4950 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
not | +0.116 |
and | +0.112 |
because | +0.100 |
but | +0.094 |
, | +0.090 |
Neg logit contributions | |
asis | -0.149 |
andel | -0.149 |
ymes | -0.147 |
Ta | -0.146 |
umm | -0.144 |
Token | . |
Token ID | 13 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
not | +0.026 |
" | +0.015 |
and | +0.014 |
: | +0.013 |
because | +0.013 |
Neg logit contributions | |
asis | -0.058 |
umm | -0.058 |
seas | -0.057 |
pillar | -0.055 |
worm | -0.055 |
Token | The |
Token ID | 383 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
not | +0.186 |
and | +0.168 |
because | +0.144 |
but | +0.128 |
, | +0.128 |
Neg logit contributions | |
andel | -0.369 |
asis | -0.362 |
Ta | -0.361 |
umm | -0.360 |
ymes | -0.356 |
Token | animals |
Token ID | 4695 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
and | +0.149 |
not | +0.149 |
because | +0.124 |
, | +0.122 |
" | +0.120 |
Neg logit contributions | |
robat | -0.201 |
ites | -0.201 |
ymes | -0.201 |
lor | -0.200 |
orns | -0.198 |