Token | in |
Token ID | 287 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
icho | +0.315 |
llah | +0.311 |
Uri | +0.311 |
erity | +0.277 |
humans | +0.276 |
Neg logit contributions | |
kered | -0.380 |
Cly | -0.348 |
racted | -0.333 |
>>>>>>>> | -0.324 |
**************** | -0.313 |
Token | the |
Token ID | 262 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
kered | +0.382 |
Cly | +0.354 |
racted | +0.339 |
>>>>>>>> | +0.332 |
★★ | +0.322 |
Neg logit contributions | |
icho | -0.263 |
llah | -0.260 |
Uri | -0.259 |
erity | -0.228 |
humans | -0.227 |
Token | race |
Token ID | 3234 |
Feature activation | +5.20e-01 |
Pos logit contributions | |
kered | +0.009 |
Cly | +0.009 |
racted | +0.008 |
>>>>>>>> | +0.008 |
**************** | +0.008 |
Neg logit contributions | |
icho | -0.006 |
Uri | -0.006 |
llah | -0.006 |
humans | -0.005 |
erity | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -3.48e-02 |
Pos logit contributions | |
kered | +0.379 |
Cly | +0.346 |
racted | +0.329 |
>>>>>>>> | +0.320 |
**************** | +0.309 |
Neg logit contributions | |
icho | -0.362 |
Uri | -0.357 |
llah | -0.357 |
erity | -0.321 |
humans | -0.321 |
Token | v |
Token ID | 410 |
Feature activation | +7.41e-01 |
Pos logit contributions | |
icho | +0.024 |
llah | +0.024 |
Uri | +0.024 |
humans | +0.021 |
erity | +0.021 |
Neg logit contributions | |
kered | -0.026 |
Cly | -0.024 |
racted | -0.022 |
>>>>>>>> | -0.022 |
**************** | -0.021 |
Token | owing |
Token ID | 7855 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
kered | +0.437 |
Cly | +0.389 |
racted | +0.367 |
>>>>>>>> | +0.352 |
**************** | +0.337 |
Neg logit contributions | |
icho | -0.618 |
Uri | -0.613 |
llah | -0.612 |
humans | -0.560 |
erity | -0.559 |
Token | to |
Token ID | 284 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
kered | +2.642 |
Cly | +2.438 |
racted | +2.304 |
>>>>>>>> | +2.249 |
**************** | +2.177 |
Neg logit contributions | |
icho | -2.330 |
llah | -2.310 |
Uri | -2.300 |
humans | -2.066 |
ixel | -2.049 |
Token | take |
Token ID | 1011 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
icho | +0.273 |
Uri | +0.269 |
llah | +0.269 |
humans | +0.241 |
erity | +0.240 |
Neg logit contributions | |
kered | -0.312 |
Cly | -0.286 |
racted | -0.273 |
>>>>>>>> | -0.265 |
**************** | -0.256 |
Token | his |
Token ID | 465 |
Feature activation | +1.65e-01 |
Pos logit contributions | |
icho | +0.238 |
Uri | +0.236 |
llah | +0.234 |
erity | +0.209 |
humans | +0.209 |
Neg logit contributions | |
kered | -0.288 |
Cly | -0.264 |
racted | -0.253 |
>>>>>>>> | -0.245 |
★★ | -0.238 |
Token | campaign |
Token ID | 1923 |
Feature activation | -7.55e-02 |
Pos logit contributions | |
kered | +0.115 |
Cly | +0.105 |
racted | +0.100 |
>>>>>>>> | +0.097 |
**************** | +0.093 |
Neg logit contributions | |
icho | -0.120 |
llah | -0.118 |
Uri | -0.118 |
humans | -0.107 |
erity | -0.107 |
Token | all |
Token ID | 477 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
icho | +0.049 |
llah | +0.049 |
Uri | +0.048 |
humans | +0.043 |
erity | +0.043 |
Neg logit contributions | |
kered | -0.058 |
Cly | -0.054 |
racted | -0.051 |
>>>>>>>> | -0.050 |
**************** | -0.048 |
Token | com |
Token ID | 785 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
kered | +0.513 |
Cly | +0.464 |
racted | +0.438 |
>>>>>>>> | +0.423 |
**************** | +0.411 |
Neg logit contributions | |
icho | -0.640 |
Uri | -0.632 |
llah | -0.631 |
challeng | -0.589 |
metic | -0.577 |
Token | / |
Token ID | 14 |
Feature activation | +8.60e-01 |
Pos logit contributions | |
kered | +0.205 |
Cly | +0.185 |
racted | +0.175 |
>>>>>>>> | +0.169 |
**************** | +0.163 |
Neg logit contributions | |
icho | -0.246 |
llah | -0.243 |
Uri | -0.243 |
erity | -0.221 |
humans | -0.220 |
Token | watch |
Token ID | 8340 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
kered | +0.459 |
Cly | +0.403 |
racted | +0.378 |
>>>>>>>> | +0.360 |
★★ | +0.342 |
Neg logit contributions | |
icho | -0.766 |
Uri | -0.759 |
llah | -0.758 |
humans | -0.697 |
erity | -0.697 |
Token | ? |
Token ID | 30 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
icho | +0.182 |
Uri | +0.181 |
llah | +0.180 |
humans | +0.162 |
erity | +0.162 |
Neg logit contributions | |
kered | -0.182 |
Cly | -0.165 |
racted | -0.158 |
>>>>>>>> | -0.152 |
★★ | -0.147 |
Token | v |
Token ID | 85 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
kered | +0.190 |
Cly | +0.173 |
racted | +0.166 |
>>>>>>>> | +0.161 |
★★ | +0.155 |
Neg logit contributions | |
icho | -0.168 |
Uri | -0.166 |
llah | -0.166 |
humans | -0.148 |
erity | -0.148 |
Token | = |
Token ID | 28 |
Feature activation | +3.39e+00 |
Pos logit contributions | |
kered | +0.181 |
Cly | +0.154 |
racted | +0.144 |
>>>>>>>> | +0.136 |
★★ | +0.127 |
Neg logit contributions | |
llah | -0.351 |
icho | -0.350 |
Uri | -0.348 |
humans | -0.323 |
erity | -0.322 |
Token | 2 |
Token ID | 17 |
Feature activation | +9.36e-01 |
Pos logit contributions | |
kered | +2.365 |
Cly | +2.121 |
racted | +2.051 |
>>>>>>>> | +1.979 |
Changes | +1.925 |
Neg logit contributions | |
Uri | -2.422 |
icho | -2.420 |
llah | -2.369 |
erity | -2.168 |
challeng | -2.143 |
Token | g |
Token ID | 70 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
kered | +0.664 |
Cly | +0.600 |
racted | +0.574 |
>>>>>>>> | +0.556 |
**************** | +0.537 |
Neg logit contributions | |
icho | -0.668 |
Uri | -0.663 |
llah | -0.659 |
erity | -0.595 |
humans | -0.593 |
Token | 7 |
Token ID | 22 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
kered | +0.249 |
Cly | +0.224 |
racted | +0.213 |
>>>>>>>> | +0.206 |
**************** | +0.198 |
Neg logit contributions | |
icho | -0.279 |
Uri | -0.277 |
llah | -0.276 |
erity | -0.250 |
humans | -0.250 |
Token | p |
Token ID | 79 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
kered | +0.414 |
Cly | +0.374 |
racted | +0.358 |
>>>>>>>> | +0.346 |
**************** | +0.334 |
Neg logit contributions | |
icho | -0.421 |
Uri | -0.418 |
llah | -0.415 |
erity | -0.375 |
humans | -0.374 |
Token | k |
Token ID | 74 |
Feature activation | -4.68e-01 |
Pos logit contributions | |
icho | +0.332 |
llah | +0.328 |
Uri | +0.328 |
humans | +0.297 |
erity | +0.296 |
Neg logit contributions | |
kered | -0.295 |
Cly | -0.267 |
racted | -0.253 |
>>>>>>>> | -0.244 |
★★ | -0.235 |
Token | West |
Token ID | 2688 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
icho | +0.597 |
Uri | +0.591 |
llah | +0.589 |
humans | +0.524 |
erity | +0.524 |
Neg logit contributions | |
kered | -0.715 |
Cly | -0.653 |
racted | -0.627 |
>>>>>>>> | -0.609 |
★★ | -0.589 |
Token | Wing |
Token ID | 13405 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
kered | +0.176 |
Cly | +0.160 |
racted | +0.153 |
>>>>>>>> | +0.148 |
**************** | +0.143 |
Neg logit contributions | |
icho | -0.167 |
Uri | -0.165 |
llah | -0.165 |
humans | -0.148 |
erity | -0.148 |
Token | , |
Token ID | 11 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
kered | +0.221 |
Cly | +0.201 |
racted | +0.193 |
>>>>>>>> | +0.187 |
**************** | +0.180 |
Neg logit contributions | |
icho | -0.207 |
Uri | -0.204 |
llah | -0.204 |
humans | -0.183 |
erity | -0.183 |
Token | including |
Token ID | 1390 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
icho | +0.085 |
llah | +0.084 |
Uri | +0.084 |
erity | +0.075 |
humans | +0.075 |
Neg logit contributions | |
kered | -0.095 |
Cly | -0.087 |
racted | -0.083 |
>>>>>>>> | -0.081 |
**************** | -0.078 |
Token | Sebastian |
Token ID | 26190 |
Feature activation | +3.54e-01 |
Pos logit contributions | |
icho | +0.142 |
Uri | +0.140 |
llah | +0.140 |
humans | +0.125 |
erity | +0.125 |
Neg logit contributions | |
kered | -0.166 |
Cly | -0.152 |
racted | -0.145 |
>>>>>>>> | -0.141 |
★★ | -0.136 |
Token | Gork |
Token ID | 49882 |
Feature activation | +3.08e+00 |
Pos logit contributions | |
kered | +0.326 |
Cly | +0.305 |
racted | +0.294 |
>>>>>>>> | +0.286 |
**************** | +0.279 |
Neg logit contributions | |
icho | -0.179 |
llah | -0.173 |
Uri | -0.170 |
humans | -0.152 |
erity | -0.149 |
Token | a |
Token ID | 64 |
Feature activation | +2.84e-01 |
Pos logit contributions | |
kered | +2.125 |
Cly | +1.993 |
racted | +1.897 |
>>>>>>>> | +1.797 |
ダ | +1.794 |
Neg logit contributions | |
icho | -2.129 |
Uri | -2.123 |
llah | -2.050 |
challeng | -1.974 |
metic | -1.957 |
Token | , |
Token ID | 11 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
kered | +0.202 |
Cly | +0.183 |
racted | +0.175 |
>>>>>>>> | +0.169 |
★★ | +0.163 |
Neg logit contributions | |
icho | -0.203 |
Uri | -0.202 |
llah | -0.201 |
erity | -0.181 |
humans | -0.180 |
Token | have |
Token ID | 423 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
kered | +0.184 |
Cly | +0.168 |
racted | +0.160 |
>>>>>>>> | +0.155 |
★★ | +0.150 |
Neg logit contributions | |
icho | -0.175 |
Uri | -0.173 |
llah | -0.173 |
humans | -0.155 |
erity | -0.155 |
Token | received |
Token ID | 2722 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
kered | +0.013 |
Cly | +0.011 |
racted | +0.011 |
>>>>>>>> | +0.011 |
★★ | +0.010 |
Neg logit contributions | |
icho | -0.012 |
Uri | -0.012 |
llah | -0.012 |
humans | -0.011 |
erity | -0.011 |
Token | enormous |
Token ID | 9812 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
kered | +0.360 |
Cly | +0.329 |
racted | +0.315 |
>>>>>>>> | +0.306 |
★★ | +0.295 |
Neg logit contributions | |
icho | -0.316 |
Uri | -0.312 |
llah | -0.311 |
humans | -0.278 |
erity | -0.278 |
Token | , |
Token ID | 11 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
kered | +0.186 |
Cly | +0.170 |
racted | +0.162 |
>>>>>>>> | +0.157 |
**************** | +0.152 |
Neg logit contributions | |
icho | -0.174 |
Uri | -0.172 |
llah | -0.172 |
erity | -0.154 |
humans | -0.154 |
Token | therefore |
Token ID | 4361 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
kered | +0.249 |
Cly | +0.229 |
racted | +0.218 |
>>>>>>>> | +0.212 |
**************** | +0.205 |
Neg logit contributions | |
icho | -0.213 |
llah | -0.210 |
Uri | -0.210 |
erity | -0.188 |
humans | -0.187 |
Token | , |
Token ID | 11 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
icho | +0.173 |
Uri | +0.171 |
llah | +0.171 |
humans | +0.154 |
erity | +0.154 |
Neg logit contributions | |
kered | -0.162 |
Cly | -0.147 |
racted | -0.140 |
>>>>>>>> | -0.135 |
**************** | -0.130 |
Token | a |
Token ID | 257 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
kered | +0.126 |
Cly | +0.115 |
racted | +0.109 |
>>>>>>>> | +0.106 |
**************** | +0.102 |
Neg logit contributions | |
icho | -0.121 |
Uri | -0.120 |
llah | -0.120 |
erity | -0.108 |
humans | -0.107 |
Token | d |
Token ID | 288 |
Feature activation | -5.08e-01 |
Pos logit contributions | |
icho | +0.293 |
Uri | +0.289 |
llah | +0.287 |
erity | +0.255 |
humans | +0.255 |
Neg logit contributions | |
kered | -0.392 |
Cly | -0.360 |
racted | -0.346 |
>>>>>>>> | -0.337 |
**************** | -0.327 |
Token | osed |
Token ID | 1335 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
icho | +0.397 |
Uri | +0.393 |
llah | +0.392 |
humans | +0.357 |
erity | +0.356 |
Neg logit contributions | |
kered | -0.327 |
Cly | -0.293 |
racted | -0.279 |
>>>>>>>> | -0.268 |
**************** | -0.258 |
Token | loss |
Token ID | 2994 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
kered | +2.514 |
Cly | +2.312 |
racted | +2.201 |
>>>>>>>> | +2.145 |
**************** | +2.110 |
Neg logit contributions | |
icho | -1.815 |
Uri | -1.778 |
llah | -1.738 |
erity | -1.614 |
ixel | -1.605 |
Token | of |
Token ID | 286 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
kered | +0.119 |
Cly | +0.109 |
racted | +0.105 |
>>>>>>>> | +0.102 |
★★ | +0.098 |
Neg logit contributions | |
icho | -0.095 |
Uri | -0.094 |
llah | -0.093 |
humans | -0.083 |
erity | -0.083 |
Token | blood |
Token ID | 2910 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
icho | +0.160 |
llah | +0.158 |
Uri | +0.157 |
erity | +0.140 |
humans | +0.139 |
Neg logit contributions | |
kered | -0.233 |
Cly | -0.216 |
racted | -0.208 |
>>>>>>>> | -0.201 |
**************** | -0.196 |
Token | could |
Token ID | 714 |
Feature activation | -5.56e-02 |
Pos logit contributions | |
icho | +1.183 |
Uri | +1.170 |
llah | +1.166 |
humans | +1.044 |
alon | +1.042 |
Neg logit contributions | |
kered | -1.296 |
Cly | -1.183 |
racted | -1.125 |
>>>>>>>> | -1.103 |
★★ | -1.065 |
Token | remove |
Token ID | 4781 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
icho | +0.037 |
Uri | +0.037 |
llah | +0.037 |
humans | +0.033 |
erity | +0.033 |
Neg logit contributions | |
kered | -0.042 |
Cly | -0.038 |
racted | -0.037 |
>>>>>>>> | -0.036 |
★★ | -0.034 |
Token | � |
Token ID | 447 |
Feature activation | +5.85e-01 |
Pos logit contributions | |
icho | +0.008 |
Uri | +0.008 |
llah | +0.008 |
humans | +0.007 |
erity | +0.007 |
Neg logit contributions | |
kered | -0.009 |
Cly | -0.008 |
racted | -0.008 |
>>>>>>>> | -0.008 |
**************** | -0.007 |
Token | � |
Token ID | 251 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
kered | +0.386 |
Cly | +0.347 |
racted | +0.332 |
>>>>>>>> | +0.321 |
★★ | +0.309 |
Neg logit contributions | |
icho | -0.447 |
Uri | -0.439 |
llah | -0.437 |
humans | -0.401 |
erity | -0.398 |
Token |
|
Token ID | 198 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
kered | +0.027 |
Cly | +0.025 |
racted | +0.023 |
>>>>>>>> | +0.023 |
★★ | +0.022 |
Neg logit contributions | |
icho | -0.027 |
Uri | -0.027 |
llah | -0.027 |
humans | -0.024 |
erity | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
kered | +0.189 |
Cly | +0.172 |
racted | +0.164 |
>>>>>>>> | +0.159 |
**************** | +0.153 |
Neg logit contributions | |
icho | -0.190 |
Uri | -0.188 |
llah | -0.188 |
erity | -0.169 |
humans | -0.169 |
Token | Richard |
Token ID | 22245 |
Feature activation | -1.74e-01 |
Pos logit contributions | |
kered | +0.188 |
Cly | +0.169 |
racted | +0.161 |
>>>>>>>> | +0.155 |
★★ | +0.149 |
Neg logit contributions | |
icho | -0.210 |
Uri | -0.208 |
llah | -0.208 |
humans | -0.188 |
erity | -0.188 |
Token | Painter |
Token ID | 49102 |
Feature activation | +3.03e+00 |
Pos logit contributions | |
Uri | +0.124 |
icho | +0.123 |
llah | +0.123 |
erity | +0.110 |
humans | +0.109 |
Neg logit contributions | |
kered | -0.124 |
Cly | -0.110 |
racted | -0.107 |
>>>>>>>> | -0.104 |
★★ | -0.100 |
Token | , |
Token ID | 11 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
kered | +2.009 |
Cly | +1.838 |
racted | +1.718 |
>>>>>>>> | +1.662 |
★★ | +1.620 |
Neg logit contributions | |
icho | -2.300 |
Uri | -2.248 |
llah | -2.247 |
humans | -2.053 |
erity | -2.047 |
Token | the |
Token ID | 262 |
Feature activation | +8.23e-03 |
Pos logit contributions | |
kered | +0.176 |
Cly | +0.161 |
racted | +0.153 |
>>>>>>>> | +0.148 |
★★ | +0.143 |
Neg logit contributions | |
icho | -0.165 |
llah | -0.163 |
Uri | -0.163 |
erity | -0.146 |
humans | -0.146 |
Token | chief |
Token ID | 4039 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
kered | +0.006 |
Cly | +0.005 |
racted | +0.005 |
>>>>>>>> | +0.005 |
**************** | +0.005 |
Neg logit contributions | |
icho | -0.006 |
Uri | -0.006 |
llah | -0.006 |
humans | -0.005 |
erity | -0.005 |
Token | White |
Token ID | 2635 |
Feature activation | -4.34e-01 |
Pos logit contributions | |
kered | +0.142 |
Cly | +0.128 |
racted | +0.121 |
>>>>>>>> | +0.117 |
★★ | +0.112 |
Neg logit contributions | |
icho | -0.170 |
llah | -0.168 |
Uri | -0.168 |
humans | -0.152 |
erity | -0.152 |
Token | House |
Token ID | 2097 |
Feature activation | +1.28e-01 |
Pos logit contributions | |
icho | +0.375 |
Uri | +0.373 |
llah | +0.371 |
erity | +0.340 |
humans | +0.339 |
Neg logit contributions | |
kered | -0.242 |
Cly | -0.213 |
racted | -0.202 |
>>>>>>>> | -0.192 |
Changes | -0.182 |
Token | City |
Token ID | 2254 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
icho | +0.320 |
Uri | +0.318 |
llah | +0.315 |
erity | +0.279 |
humans | +0.278 |
Neg logit contributions | |
kered | -0.415 |
Cly | -0.380 |
racted | -0.367 |
>>>>>>>> | -0.356 |
★★ | -0.345 |
Token | Hall |
Token ID | 4789 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
icho | +0.668 |
Uri | +0.658 |
llah | +0.656 |
humans | +0.568 |
erity | +0.563 |
Neg logit contributions | |
kered | -1.120 |
Cly | -1.037 |
racted | -1.009 |
>>>>>>>> | -0.976 |
★★ | -0.951 |
Token | in |
Token ID | 287 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
icho | +0.557 |
Uri | +0.550 |
llah | +0.547 |
erity | +0.488 |
humans | +0.487 |
Neg logit contributions | |
kered | -0.643 |
Cly | -0.586 |
racted | -0.565 |
>>>>>>>> | -0.546 |
★★ | -0.529 |
Token | 2002 |
Token ID | 6244 |
Feature activation | +3.57e-01 |
Pos logit contributions | |
kered | +0.014 |
Cly | +0.012 |
racted | +0.012 |
>>>>>>>> | +0.012 |
**************** | +0.011 |
Neg logit contributions | |
icho | -0.013 |
Uri | -0.013 |
llah | -0.013 |
humans | -0.012 |
erity | -0.012 |
Token | v |
Token ID | 410 |
Feature activation | +9.02e-01 |
Pos logit contributions | |
kered | +0.269 |
Cly | +0.246 |
racted | +0.235 |
>>>>>>>> | +0.228 |
★★ | +0.220 |
Neg logit contributions | |
icho | -0.239 |
Uri | -0.236 |
llah | -0.236 |
erity | -0.211 |
humans | -0.211 |
Token | owing |
Token ID | 7855 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
kered | +0.523 |
Cly | +0.465 |
racted | +0.439 |
>>>>>>>> | +0.419 |
**************** | +0.401 |
Neg logit contributions | |
icho | -0.759 |
Uri | -0.754 |
llah | -0.752 |
erity | -0.693 |
humans | -0.692 |
Token | to |
Token ID | 284 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
kered | +2.243 |
Cly | +2.066 |
racted | +1.968 |
>>>>>>>> | +1.903 |
★★ | +1.846 |
Neg logit contributions | |
icho | -1.981 |
llah | -1.965 |
Uri | -1.959 |
humans | -1.764 |
ixel | -1.757 |
Token | end |
Token ID | 886 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
icho | +0.227 |
Uri | +0.224 |
llah | +0.224 |
humans | +0.201 |
erity | +0.201 |
Neg logit contributions | |
kered | -0.239 |
Cly | -0.217 |
racted | -0.208 |
>>>>>>>> | -0.201 |
**************** | -0.194 |
Token | homelessness |
Token ID | 28822 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
icho | +0.179 |
Uri | +0.177 |
llah | +0.176 |
erity | +0.154 |
humans | +0.154 |
Neg logit contributions | |
kered | -0.266 |
Cly | -0.245 |
racted | -0.236 |
>>>>>>>> | -0.230 |
★★ | -0.223 |
Token | as |
Token ID | 355 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
kered | +0.013 |
Cly | +0.012 |
racted | +0.012 |
>>>>>>>> | +0.011 |
★★ | +0.011 |
Neg logit contributions | |
icho | -0.012 |
Uri | -0.011 |
llah | -0.011 |
humans | -0.010 |
erity | -0.010 |
Token | we |
Token ID | 356 |
Feature activation | -7.04e-01 |
Pos logit contributions | |
icho | +0.125 |
llah | +0.123 |
Uri | +0.123 |
humans | +0.111 |
erity | +0.111 |
Neg logit contributions | |
kered | -0.125 |
Cly | -0.114 |
racted | -0.108 |
>>>>>>>> | -0.105 |
★★ | -0.101 |
Token | and |
Token ID | 290 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
kered | +0.478 |
Cly | +0.431 |
racted | +0.409 |
>>>>>>>> | +0.394 |
★★ | +0.379 |
Neg logit contributions | |
icho | -0.551 |
llah | -0.545 |
Uri | -0.545 |
humans | -0.494 |
erity | -0.493 |
Token | Creative |
Token ID | 17404 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
kered | +0.185 |
Cly | +0.168 |
racted | +0.158 |
>>>>>>>> | +0.151 |
★★ | +0.146 |
Neg logit contributions | |
icho | -0.228 |
llah | -0.226 |
Uri | -0.225 |
erity | -0.205 |
humans | -0.204 |
Token | Technology |
Token ID | 8987 |
Feature activation | -7.45e-02 |
Pos logit contributions | |
icho | +0.021 |
llah | +0.021 |
Uri | +0.021 |
ixel | +0.019 |
okia | +0.019 |
Neg logit contributions | |
kered | -0.015 |
Cly | -0.014 |
racted | -0.013 |
>>>>>>>> | -0.012 |
★★ | -0.012 |
Token | ( |
Token ID | 357 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
icho | +0.055 |
Uri | +0.054 |
llah | +0.054 |
erity | +0.049 |
humans | +0.049 |
Neg logit contributions | |
kered | -0.051 |
Cly | -0.047 |
racted | -0.044 |
>>>>>>>> | -0.043 |
★★ | -0.041 |
Token | F |
Token ID | 37 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
kered | +0.080 |
Cly | +0.070 |
racted | +0.066 |
>>>>>>>> | +0.063 |
★★ | +0.060 |
Neg logit contributions | |
icho | -0.131 |
Uri | -0.130 |
llah | -0.130 |
humans | -0.119 |
erity | -0.119 |
Token | ACT |
Token ID | 10659 |
Feature activation | +2.95e+00 |
Pos logit contributions | |
kered | +0.432 |
Cly | +0.395 |
racted | +0.378 |
>>>>>>>> | +0.366 |
**************** | +0.354 |
Neg logit contributions | |
icho | -0.401 |
Uri | -0.397 |
llah | -0.395 |
humans | -0.355 |
erity | -0.353 |
Token | ) |
Token ID | 8 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
kered | +1.904 |
Cly | +1.733 |
racted | +1.636 |
>>>>>>>> | +1.558 |
**************** | +1.521 |
Neg logit contributions | |
icho | -2.276 |
llah | -2.259 |
Uri | -2.244 |
humans | -2.038 |
erity | -2.027 |
Token | building |
Token ID | 2615 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
icho | +0.136 |
Uri | +0.135 |
llah | +0.135 |
humans | +0.122 |
erity | +0.122 |
Neg logit contributions | |
kered | -0.115 |
Cly | -0.104 |
racted | -0.098 |
>>>>>>>> | -0.094 |
**************** | -0.091 |
Token | in |
Token ID | 287 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
icho | +0.155 |
llah | +0.153 |
Uri | +0.153 |
erity | +0.137 |
humans | +0.137 |
Neg logit contributions | |
kered | -0.177 |
Cly | -0.163 |
racted | -0.155 |
>>>>>>>> | -0.150 |
**************** | -0.146 |
Token | Liverpool |
Token ID | 11761 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
kered | +0.143 |
Cly | +0.131 |
racted | +0.124 |
>>>>>>>> | +0.120 |
**************** | +0.117 |
Neg logit contributions | |
icho | -0.133 |
llah | -0.131 |
Uri | -0.131 |
humans | -0.118 |
erity | -0.118 |
Token | , |
Token ID | 11 |
Feature activation | -7.48e-02 |
Pos logit contributions | |
icho | +0.224 |
Uri | +0.221 |
llah | +0.221 |
erity | +0.199 |
humans | +0.199 |
Neg logit contributions | |
kered | -0.229 |
Cly | -0.208 |
racted | -0.198 |
>>>>>>>> | -0.192 |
**************** | -0.185 |
Token | told |
Token ID | 1297 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
kered | +0.666 |
Cly | +0.615 |
racted | +0.587 |
>>>>>>>> | +0.571 |
**************** | +0.555 |
Neg logit contributions | |
icho | -0.495 |
llah | -0.485 |
Uri | -0.485 |
erity | -0.429 |
humans | -0.429 |
Token | CF |
Token ID | 18551 |
Feature activation | -7.99e-01 |
Pos logit contributions | |
kered | +0.824 |
Cly | +0.763 |
racted | +0.725 |
>>>>>>>> | +0.707 |
**************** | +0.686 |
Neg logit contributions | |
icho | -0.610 |
llah | -0.600 |
Uri | -0.598 |
erity | -0.530 |
humans | -0.530 |
Token | 13 |
Token ID | 1485 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
icho | +0.645 |
Uri | +0.639 |
llah | +0.637 |
humans | +0.581 |
erity | +0.581 |
Neg logit contributions | |
kered | -0.492 |
Cly | -0.440 |
racted | -0.417 |
>>>>>>>> | -0.401 |
**************** | -0.383 |
Token | . |
Token ID | 13 |
Feature activation | +9.94e-01 |
Pos logit contributions | |
kered | +0.425 |
Cly | +0.389 |
racted | +0.370 |
>>>>>>>> | +0.358 |
**************** | +0.346 |
Neg logit contributions | |
icho | -0.398 |
Uri | -0.391 |
llah | -0.391 |
erity | -0.352 |
humans | -0.351 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
kered | +0.724 |
Cly | +0.660 |
racted | +0.630 |
>>>>>>>> | +0.608 |
**************** | +0.590 |
Neg logit contributions | |
icho | -0.691 |
Uri | -0.680 |
llah | -0.677 |
erity | -0.614 |
humans | -0.612 |
Token | Ever |
Token ID | 23921 |
Feature activation | +2.95e+00 |
Pos logit contributions | |
kered | +0.017 |
Cly | +0.015 |
racted | +0.015 |
>>>>>>>> | +0.014 |
★★ | +0.014 |
Neg logit contributions | |
icho | -0.018 |
Uri | -0.018 |
llah | -0.018 |
erity | -0.016 |
humans | -0.016 |
Token | been |
Token ID | 587 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
kered | +2.225 |
Cly | +2.014 |
racted | +1.897 |
>>>>>>>> | +1.842 |
Changes | +1.797 |
Neg logit contributions | |
icho | -1.984 |
llah | -1.959 |
Uri | -1.955 |
erity | -1.757 |
irit | -1.743 |
Token | stuck |
Token ID | 7819 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
kered | +0.572 |
Cly | +0.523 |
racted | +0.499 |
>>>>>>>> | +0.479 |
**************** | +0.465 |
Neg logit contributions | |
icho | -0.528 |
llah | -0.523 |
Uri | -0.517 |
erity | -0.469 |
humans | -0.467 |
Token | in |
Token ID | 287 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
icho | +0.636 |
Uri | +0.630 |
llah | +0.626 |
humans | +0.554 |
erity | +0.552 |
Neg logit contributions | |
kered | -0.815 |
Cly | -0.750 |
racted | -0.720 |
>>>>>>>> | -0.702 |
★★ | -0.680 |
Token | a |
Token ID | 257 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
kered | +0.132 |
Cly | +0.121 |
racted | +0.116 |
>>>>>>>> | +0.112 |
**************** | +0.109 |
Neg logit contributions | |
icho | -0.106 |
llah | -0.104 |
Uri | -0.104 |
erity | -0.093 |
humans | -0.092 |
Token | situation |
Token ID | 3074 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
kered | +0.290 |
Cly | +0.267 |
racted | +0.254 |
>>>>>>>> | +0.247 |
★★ | +0.239 |
Neg logit contributions | |
icho | -0.234 |
llah | -0.233 |
Uri | -0.229 |
erity | -0.208 |
humans | -0.206 |
Token | 's |
Token ID | 338 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
kered | +0.661 |
Cly | +0.604 |
racted | +0.569 |
>>>>>>>> | +0.551 |
★★ | +0.531 |
Neg logit contributions | |
icho | -0.711 |
llah | -0.702 |
Uri | -0.699 |
erity | -0.633 |
humans | -0.633 |
Token | cancellation |
Token ID | 25395 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
icho | +0.108 |
llah | +0.106 |
Uri | +0.106 |
humans | +0.095 |
erity | +0.094 |
Neg logit contributions | |
kered | -0.127 |
Cly | -0.116 |
racted | -0.111 |
>>>>>>>> | -0.108 |
★★ | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | +7.27e-02 |
Pos logit contributions | |
kered | +1.023 |
Cly | +0.933 |
racted | +0.888 |
>>>>>>>> | +0.862 |
**************** | +0.833 |
Neg logit contributions | |
icho | -0.988 |
llah | -0.974 |
Uri | -0.974 |
erity | -0.876 |
humans | -0.874 |
Token | Yog |
Token ID | 31604 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
kered | +0.055 |
Cly | +0.051 |
racted | +0.048 |
>>>>>>>> | +0.047 |
★★ | +0.045 |
Neg logit contributions | |
icho | -0.049 |
llah | -0.048 |
Uri | -0.048 |
humans | -0.043 |
erity | -0.043 |
Token | sc |
Token ID | 1416 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
kered | +1.161 |
Cly | +1.071 |
racted | +1.031 |
>>>>>>>> | +1.006 |
★★ | +0.975 |
Neg logit contributions | |
icho | -0.768 |
Uri | -0.757 |
llah | -0.755 |
humans | -0.662 |
erity | -0.661 |
Token | ast |
Token ID | 459 |
Feature activation | +2.93e+00 |
Pos logit contributions | |
kered | +1.226 |
Cly | +1.121 |
racted | +1.081 |
>>>>>>>> | +1.037 |
Changes | +1.004 |
Neg logit contributions | |
Uri | -0.963 |
icho | -0.958 |
llah | -0.954 |
humans | -0.841 |
challeng | -0.832 |
Token | 's |
Token ID | 338 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
kered | +2.080 |
Cly | +1.925 |
racted | +1.810 |
>>>>>>>> | +1.748 |
★★ | +1.700 |
Neg logit contributions | |
icho | -2.070 |
llah | -2.041 |
Uri | -2.020 |
erity | -1.822 |
humans | -1.820 |
Token | subsequent |
Token ID | 8840 |
Feature activation | +7.67e-01 |
Pos logit contributions | |
icho | +0.136 |
Uri | +0.134 |
llah | +0.134 |
humans | +0.120 |
erity | +0.120 |
Neg logit contributions | |
kered | -0.152 |
Cly | -0.139 |
racted | -0.133 |
>>>>>>>> | -0.129 |
★★ | -0.125 |
Token | offer |
Token ID | 2897 |
Feature activation | +2.61e-01 |
Pos logit contributions | |
kered | +0.555 |
Cly | +0.508 |
racted | +0.480 |
>>>>>>>> | +0.467 |
**************** | +0.451 |
Neg logit contributions | |
icho | -0.537 |
llah | -0.531 |
Uri | -0.528 |
humans | -0.477 |
erity | -0.476 |
Token | of |
Token ID | 286 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
kered | +0.205 |
Cly | +0.189 |
racted | +0.181 |
>>>>>>>> | +0.176 |
**************** | +0.170 |
Neg logit contributions | |
icho | -0.166 |
llah | -0.164 |
Uri | -0.164 |
humans | -0.145 |
erity | -0.145 |
Token | a |
Token ID | 257 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
kered | +0.026 |
Cly | +0.024 |
racted | +0.023 |
>>>>>>>> | +0.022 |
**************** | +0.022 |
Neg logit contributions | |
icho | -0.023 |
Uri | -0.023 |
llah | -0.023 |
humans | -0.020 |
erity | -0.020 |
Token | the |
Token ID | 262 |
Feature activation | -2.25e-02 |
Pos logit contributions | |
icho | +0.127 |
Uri | +0.126 |
llah | +0.125 |
erity | +0.112 |
humans | +0.112 |
Neg logit contributions | |
kered | -0.135 |
Cly | -0.123 |
racted | -0.118 |
>>>>>>>> | -0.114 |
**************** | -0.110 |
Token | smoother |
Token ID | 32686 |
Feature activation | +3.39e-02 |
Pos logit contributions | |
icho | +0.016 |
Uri | +0.016 |
llah | +0.016 |
erity | +0.014 |
humans | +0.014 |
Neg logit contributions | |
kered | -0.016 |
Cly | -0.015 |
racted | -0.014 |
>>>>>>>> | -0.014 |
★★ | -0.013 |
Token | - |
Token ID | 12 |
Feature activation | +7.13e-01 |
Pos logit contributions | |
kered | +0.023 |
Cly | +0.021 |
racted | +0.020 |
>>>>>>>> | +0.019 |
**************** | +0.019 |
Neg logit contributions | |
icho | -0.025 |
Uri | -0.025 |
llah | -0.024 |
humans | -0.022 |
erity | -0.022 |
Token | talking |
Token ID | 48186 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
kered | +0.472 |
Cly | +0.425 |
racted | +0.404 |
>>>>>>>> | +0.390 |
**************** | +0.374 |
Neg logit contributions | |
icho | -0.544 |
Uri | -0.539 |
llah | -0.538 |
erity | -0.487 |
humans | -0.487 |
Token | Todd |
Token ID | 14377 |
Feature activation | -4.87e-02 |
Pos logit contributions | |
icho | +0.127 |
Uri | +0.126 |
llah | +0.124 |
erity | +0.112 |
humans | +0.112 |
Neg logit contributions | |
kered | -0.126 |
Cly | -0.114 |
racted | -0.110 |
>>>>>>>> | -0.106 |
Changes | -0.102 |
Token | Akin |
Token ID | 48857 |
Feature activation | +2.90e+00 |
Pos logit contributions | |
icho | +0.034 |
llah | +0.034 |
Uri | +0.033 |
humans | +0.030 |
erity | +0.030 |
Neg logit contributions | |
kered | -0.035 |
Cly | -0.032 |
racted | -0.031 |
>>>>>>>> | -0.030 |
**************** | -0.029 |
Token | , |
Token ID | 11 |
Feature activation | +5.76e-01 |
Pos logit contributions | |
kered | +1.976 |
Cly | +1.797 |
racted | +1.682 |
>>>>>>>> | +1.639 |
**************** | +1.578 |
Neg logit contributions | |
icho | -2.143 |
Uri | -2.126 |
llah | -2.121 |
humans | -1.930 |
erity | -1.911 |
Token | Pence |
Token ID | 17339 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
kered | +0.433 |
Cly | +0.395 |
racted | +0.378 |
>>>>>>>> | +0.366 |
★★ | +0.354 |
Neg logit contributions | |
icho | -0.387 |
Uri | -0.383 |
llah | -0.382 |
humans | -0.342 |
erity | -0.341 |
Token | had |
Token ID | 550 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
kered | +0.673 |
Cly | +0.602 |
racted | +0.568 |
>>>>>>>> | +0.548 |
★★ | +0.525 |
Neg logit contributions | |
icho | -0.867 |
Uri | -0.859 |
llah | -0.857 |
humans | -0.782 |
erity | -0.780 |
Token | been |
Token ID | 587 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
kered | +0.314 |
Cly | +0.287 |
racted | +0.274 |
>>>>>>>> | +0.267 |
★★ | +0.258 |
Neg logit contributions | |
icho | -0.262 |
llah | -0.259 |
Uri | -0.258 |
humans | -0.230 |
erity | -0.230 |
Token | presented |
Token ID | 5545 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
kered | +0.234 |
Cly | +0.213 |
racted | +0.203 |
>>>>>>>> | +0.197 |
**************** | +0.191 |
Neg logit contributions | |
icho | -0.216 |
llah | -0.214 |
Uri | -0.213 |
erity | -0.192 |
humans | -0.191 |
Token | burning |
Token ID | 9482 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
kered | +0.109 |
Cly | +0.101 |
racted | +0.097 |
>>>>>>>> | +0.094 |
**************** | +0.092 |
Neg logit contributions | |
icho | -0.068 |
llah | -0.068 |
Uri | -0.067 |
erity | -0.059 |
humans | -0.058 |
Token | sugar |
Token ID | 7543 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
kered | +0.154 |
Cly | +0.142 |
racted | +0.135 |
>>>>>>>> | +0.132 |
**************** | +0.128 |
Neg logit contributions | |
icho | -0.121 |
llah | -0.119 |
Uri | -0.119 |
erity | -0.105 |
humans | -0.105 |
Token | ( |
Token ID | 357 |
Feature activation | +6.70e-01 |
Pos logit contributions | |
kered | +1.184 |
Cly | +1.076 |
racted | +1.027 |
>>>>>>>> | +0.995 |
★★ | +0.959 |
Neg logit contributions | |
icho | -1.171 |
Uri | -1.159 |
llah | -1.156 |
erity | -1.040 |
humans | -1.038 |
Token | gl |
Token ID | 4743 |
Feature activation | +8.98e-01 |
Pos logit contributions | |
kered | +0.519 |
Cly | +0.475 |
racted | +0.455 |
>>>>>>>> | +0.442 |
★★ | +0.430 |
Neg logit contributions | |
icho | -0.434 |
Uri | -0.431 |
llah | -0.430 |
erity | -0.381 |
humans | -0.377 |
Token | uc |
Token ID | 1229 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
kered | +0.485 |
Cly | +0.426 |
racted | +0.400 |
>>>>>>>> | +0.381 |
**************** | +0.363 |
Neg logit contributions | |
icho | -0.793 |
Uri | -0.788 |
llah | -0.786 |
humans | -0.723 |
erity | -0.722 |
Token | ose |
Token ID | 577 |
Feature activation | +2.89e+00 |
Pos logit contributions | |
kered | +0.979 |
Cly | +0.891 |
racted | +0.860 |
>>>>>>>> | +0.830 |
**************** | +0.807 |
Neg logit contributions | |
icho | -0.764 |
Uri | -0.761 |
llah | -0.759 |
humans | -0.672 |
erity | -0.672 |
Token | ) |
Token ID | 8 |
Feature activation | +7.67e-01 |
Pos logit contributions | |
kered | +2.002 |
Cly | +1.815 |
racted | +1.713 |
>>>>>>>> | +1.670 |
★★ | +1.617 |
Neg logit contributions | |
icho | -2.104 |
Uri | -2.096 |
llah | -2.086 |
erity | -1.882 |
humans | -1.877 |
Token | from |
Token ID | 422 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
kered | +0.572 |
Cly | +0.522 |
racted | +0.499 |
>>>>>>>> | +0.484 |
★★ | +0.467 |
Neg logit contributions | |
icho | -0.521 |
Uri | -0.514 |
llah | -0.514 |
humans | -0.460 |
erity | -0.459 |
Token | the |
Token ID | 262 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
kered | +0.189 |
Cly | +0.174 |
racted | +0.166 |
>>>>>>>> | +0.161 |
**************** | +0.156 |
Neg logit contributions | |
icho | -0.160 |
Uri | -0.159 |
llah | -0.158 |
erity | -0.141 |
humans | -0.141 |
Token | fed |
Token ID | 11672 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
icho | +0.107 |
Uri | +0.105 |
llah | +0.105 |
humans | +0.094 |
erity | +0.094 |
Neg logit contributions | |
kered | -0.127 |
Cly | -0.116 |
racted | -0.111 |
>>>>>>>> | -0.107 |
**************** | -0.104 |
Token | state |
Token ID | 1181 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
icho | +0.122 |
Uri | +0.121 |
llah | +0.121 |
humans | +0.110 |
erity | +0.110 |
Neg logit contributions | |
kered | -0.092 |
Cly | -0.082 |
racted | -0.078 |
>>>>>>>> | -0.075 |
★★ | -0.072 |
Token | switch |
Token ID | 5078 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
kered | +0.031 |
Cly | +0.027 |
racted | +0.025 |
>>>>>>>> | +0.024 |
**************** | +0.023 |
Neg logit contributions | |
icho | -0.054 |
llah | -0.054 |
Uri | -0.054 |
humans | -0.050 |
erity | -0.050 |
Token | , |
Token ID | 11 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
kered | +0.169 |
Cly | +0.152 |
racted | +0.145 |
>>>>>>>> | +0.140 |
★★ | +0.135 |
Neg logit contributions | |
icho | -0.183 |
Uri | -0.181 |
llah | -0.180 |
erity | -0.163 |
humans | -0.163 |
Token | just |
Token ID | 655 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
kered | +0.365 |
Cly | +0.333 |
racted | +0.317 |
>>>>>>>> | +0.306 |
**************** | +0.297 |
Neg logit contributions | |
icho | -0.341 |
llah | -0.337 |
Uri | -0.335 |
erity | -0.303 |
humans | -0.301 |
Token | leave |
Token ID | 2666 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
icho | +0.103 |
llah | +0.102 |
Uri | +0.102 |
humans | +0.092 |
erity | +0.092 |
Neg logit contributions | |
kered | -0.103 |
Cly | -0.094 |
racted | -0.089 |
>>>>>>>> | -0.086 |
**************** | -0.083 |
Token | everything |
Token ID | 2279 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
kered | +0.966 |
Cly | +0.896 |
racted | +0.867 |
>>>>>>>> | +0.842 |
**************** | +0.825 |
Neg logit contributions | |
icho | -0.562 |
llah | -0.552 |
Uri | -0.547 |
erity | -0.479 |
humans | -0.473 |
Token | alone |
Token ID | 3436 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
kered | +1.047 |
Cly | +0.960 |
racted | +0.918 |
>>>>>>>> | +0.888 |
**************** | +0.866 |
Neg logit contributions | |
icho | -0.881 |
llah | -0.868 |
Uri | -0.865 |
erity | -0.775 |
humans | -0.771 |
Token | ). |
Token ID | 737 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
kered | +1.842 |
Cly | +1.657 |
racted | +1.578 |
>>>>>>>> | +1.514 |
**************** | +1.488 |
Neg logit contributions | |
icho | -2.220 |
Uri | -2.192 |
llah | -2.188 |
erity | -1.993 |
humans | -1.987 |
Token | We |
Token ID | 775 |
Feature activation | +9.61e-02 |
Pos logit contributions | |
icho | +0.148 |
llah | +0.146 |
Uri | +0.145 |
erity | +0.129 |
humans | +0.129 |
Neg logit contributions | |
kered | -0.183 |
Cly | -0.169 |
racted | -0.161 |
>>>>>>>> | -0.157 |
**************** | -0.152 |
Token | also |
Token ID | 635 |
Feature activation | -2.16e-02 |
Pos logit contributions | |
kered | +0.071 |
Cly | +0.065 |
racted | +0.062 |
>>>>>>>> | +0.060 |
**************** | +0.058 |
Neg logit contributions | |
icho | -0.066 |
Uri | -0.065 |
llah | -0.065 |
humans | -0.058 |
erity | -0.058 |
Token | discussed |
Token ID | 6693 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
icho | +0.015 |
Uri | +0.015 |
llah | +0.015 |
humans | +0.013 |
erity | +0.013 |
Neg logit contributions | |
kered | -0.016 |
Cly | -0.015 |
racted | -0.014 |
>>>>>>>> | -0.014 |
**************** | -0.013 |
Token | lowering |
Token ID | 21683 |
Feature activation | -7.23e-01 |
Pos logit contributions | |
icho | +0.449 |
Uri | +0.444 |
llah | +0.443 |
humans | +0.393 |
erity | +0.393 |
Neg logit contributions | |
kered | -0.555 |
Cly | -0.509 |
racted | -0.488 |
>>>>>>>> | -0.474 |
★★ | -0.459 |
Token | this |
Token ID | 428 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
kered | +0.566 |
Cly | +0.514 |
racted | +0.490 |
>>>>>>>> | +0.474 |
**************** | +0.458 |
Neg logit contributions | |
icho | -0.571 |
Uri | -0.566 |
llah | -0.565 |
erity | -0.509 |
humans | -0.509 |
Token | ). |
Token ID | 737 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
kered | +0.279 |
Cly | +0.251 |
racted | +0.239 |
>>>>>>>> | +0.230 |
★★ | +0.222 |
Neg logit contributions | |
icho | -0.319 |
Uri | -0.316 |
llah | -0.316 |
humans | -0.286 |
erity | -0.285 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
kered | +0.186 |
Cly | +0.173 |
racted | +0.166 |
>>>>>>>> | +0.162 |
★★ | +0.158 |
Neg logit contributions | |
icho | -0.127 |
llah | -0.125 |
Uri | -0.123 |
erity | -0.109 |
humans | -0.108 |
Token |
|
Token ID | 198 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
icho | +0.118 |
Uri | +0.116 |
llah | +0.116 |
erity | +0.105 |
humans | +0.105 |
Neg logit contributions | |
kered | -0.119 |
Cly | -0.108 |
racted | -0.103 |
>>>>>>>> | -0.100 |
**************** | -0.096 |
Token | H |
Token ID | 39 |
Feature activation | +7.85e-02 |
Pos logit contributions | |
icho | +0.145 |
Uri | +0.144 |
llah | +0.143 |
humans | +0.131 |
erity | +0.130 |
Neg logit contributions | |
kered | -0.126 |
Cly | -0.113 |
racted | -0.107 |
>>>>>>>> | -0.103 |
★★ | -0.098 |
Token | azel |
Token ID | 41319 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
kered | +0.052 |
Cly | +0.047 |
racted | +0.044 |
>>>>>>>> | +0.043 |
★★ | +0.041 |
Neg logit contributions | |
icho | -0.060 |
Uri | -0.060 |
llah | -0.059 |
erity | -0.054 |
humans | -0.054 |
Token | nut |
Token ID | 14930 |
Feature activation | +8.14e-01 |
Pos logit contributions | |
kered | +2.065 |
Cly | +1.930 |
racted | +1.787 |
>>>>>>>> | +1.722 |
★★ | +1.704 |
Neg logit contributions | |
icho | -1.908 |
llah | -1.903 |
Uri | -1.873 |
ixel | -1.697 |
humans | -1.693 |
Token | Fl |
Token ID | 1610 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
kered | +0.583 |
Cly | +0.534 |
racted | +0.506 |
>>>>>>>> | +0.489 |
★★ | +0.474 |
Neg logit contributions | |
icho | -0.577 |
llah | -0.570 |
Uri | -0.567 |
humans | -0.513 |
erity | -0.510 |
Token | our |
Token ID | 454 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
icho | +0.275 |
Uri | +0.271 |
llah | +0.271 |
erity | +0.241 |
humans | +0.240 |
Neg logit contributions | |
kered | -0.338 |
Cly | -0.310 |
racted | -0.297 |
>>>>>>>> | -0.289 |
★★ | -0.280 |
Token | — |
Token ID | 960 |
Feature activation | -1.55e-03 |
Pos logit contributions | |
kered | +0.341 |
Cly | +0.314 |
racted | +0.303 |
>>>>>>>> | +0.295 |
**************** | +0.286 |
Neg logit contributions | |
icho | -0.226 |
Uri | -0.223 |
llah | -0.222 |
erity | -0.195 |
humans | -0.194 |
Token | This |
Token ID | 1212 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
icho | +0.001 |
llah | +0.001 |
Uri | +0.001 |
erity | +0.001 |
humans | +0.001 |
Neg logit contributions | |
kered | -0.001 |
Cly | -0.001 |
racted | -0.001 |
>>>>>>>> | -0.001 |
★★ | -0.001 |
Token | who |
Token ID | 508 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
kered | +0.524 |
Cly | +0.475 |
racted | +0.447 |
>>>>>>>> | +0.433 |
**************** | +0.417 |
Neg logit contributions | |
icho | -0.567 |
llah | -0.563 |
Uri | -0.560 |
humans | -0.508 |
erity | -0.508 |
Token | once |
Token ID | 1752 |
Feature activation | -2.36e-01 |
Pos logit contributions | |
icho | +0.305 |
Uri | +0.302 |
llah | +0.301 |
humans | +0.270 |
erity | +0.270 |
Neg logit contributions | |
kered | -0.326 |
Cly | -0.297 |
racted | -0.284 |
>>>>>>>> | -0.275 |
★★ | -0.266 |
Token | chased |
Token ID | 26172 |
Feature activation | -3.60e-01 |
Pos logit contributions | |
icho | +0.158 |
Uri | +0.157 |
llah | +0.156 |
humans | +0.140 |
erity | +0.139 |
Neg logit contributions | |
kered | -0.177 |
Cly | -0.162 |
racted | -0.155 |
>>>>>>>> | -0.150 |
★★ | -0.145 |
Token | our |
Token ID | 674 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
icho | +0.237 |
llah | +0.234 |
Uri | +0.234 |
erity | +0.208 |
humans | +0.208 |
Neg logit contributions | |
kered | -0.276 |
Cly | -0.253 |
racted | -0.242 |
>>>>>>>> | -0.235 |
**************** | -0.227 |
Token | current |
Token ID | 1459 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
icho | +0.119 |
llah | +0.117 |
Uri | +0.117 |
erity | +0.104 |
humans | +0.104 |
Neg logit contributions | |
kered | -0.144 |
Cly | -0.132 |
racted | -0.127 |
>>>>>>>> | -0.123 |
**************** | -0.119 |
Token | guest |
Token ID | 8319 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
kered | +0.374 |
Cly | +0.343 |
racted | +0.327 |
>>>>>>>> | +0.318 |
**************** | +0.307 |
Neg logit contributions | |
icho | -0.329 |
llah | -0.325 |
Uri | -0.324 |
erity | -0.289 |
humans | -0.289 |
Token | blogger |
Token ID | 23530 |
Feature activation | +7.19e-01 |
Pos logit contributions | |
kered | +1.944 |
Cly | +1.776 |
racted | +1.658 |
>>>>>>>> | +1.615 |
★★ | +1.568 |
Neg logit contributions | |
icho | -2.004 |
llah | -1.990 |
Uri | -1.951 |
erity | -1.798 |
humans | -1.789 |
Token | Richard |
Token ID | 6219 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
kered | +0.521 |
Cly | +0.478 |
racted | +0.452 |
>>>>>>>> | +0.439 |
**************** | +0.424 |
Neg logit contributions | |
icho | -0.503 |
llah | -0.497 |
Uri | -0.493 |
erity | -0.446 |
humans | -0.445 |
Token | Dawkins |
Token ID | 38922 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
icho | +0.311 |
Uri | +0.308 |
llah | +0.307 |
erity | +0.275 |
humans | +0.275 |
Neg logit contributions | |
kered | -0.336 |
Cly | -0.305 |
racted | -0.292 |
>>>>>>>> | -0.283 |
**************** | -0.273 |
Token | off |
Token ID | 572 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
kered | +0.832 |
Cly | +0.763 |
racted | +0.721 |
>>>>>>>> | +0.699 |
**************** | +0.681 |
Neg logit contributions | |
icho | -0.825 |
llah | -0.812 |
Uri | -0.808 |
humans | -0.730 |
erity | -0.729 |
Token | his |
Token ID | 465 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
icho | +0.266 |
Uri | +0.264 |
llah | +0.262 |
humans | +0.232 |
erity | +0.232 |
Neg logit contributions | |
kered | -0.347 |
Cly | -0.318 |
racted | -0.306 |
>>>>>>>> | -0.298 |
★★ | -0.288 |
Token | " |
Token ID | 366 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
kered | +0.257 |
Cly | +0.233 |
racted | +0.223 |
>>>>>>>> | +0.215 |
**************** | +0.208 |
Neg logit contributions | |
icho | -0.253 |
llah | -0.250 |
Uri | -0.250 |
humans | -0.225 |
erity | -0.225 |
Token | al |
Token ID | 282 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
kered | +0.413 |
Cly | +0.376 |
racted | +0.362 |
>>>>>>>> | +0.350 |
**************** | +0.339 |
Neg logit contributions | |
icho | -0.368 |
Uri | -0.365 |
llah | -0.364 |
erity | -0.325 |
humans | -0.323 |
Token | ready |
Token ID | 1493 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
kered | +0.892 |
Cly | +0.805 |
racted | +0.781 |
>>>>>>>> | +0.747 |
**************** | +0.723 |
Neg logit contributions | |
icho | -0.830 |
Uri | -0.826 |
llah | -0.822 |
humans | -0.742 |
alon | -0.734 |
Token | been |
Token ID | 587 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
kered | +0.154 |
Cly | +0.140 |
racted | +0.133 |
>>>>>>>> | +0.129 |
**************** | +0.125 |
Neg logit contributions | |
icho | -0.153 |
Uri | -0.152 |
llah | -0.152 |
humans | -0.136 |
erity | -0.136 |
Token | c |
Token ID | 269 |
Feature activation | +8.12e-02 |
Pos logit contributions | |
kered | +0.254 |
Cly | +0.229 |
racted | +0.219 |
>>>>>>>> | +0.211 |
**************** | +0.204 |
Neg logit contributions | |
icho | -0.274 |
llah | -0.271 |
Uri | -0.271 |
erity | -0.246 |
humans | -0.245 |
Token | ashed |
Token ID | 5263 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
kered | +0.059 |
Cly | +0.054 |
racted | +0.052 |
>>>>>>>> | +0.050 |
★★ | +0.048 |
Neg logit contributions | |
icho | -0.056 |
Uri | -0.055 |
llah | -0.055 |
humans | -0.050 |
erity | -0.050 |
Token | and |
Token ID | 290 |
Feature activation | -5.79e-03 |
Pos logit contributions | |
kered | +2.121 |
Cly | +1.916 |
racted | +1.845 |
>>>>>>>> | +1.785 |
**************** | +1.765 |
Neg logit contributions | |
icho | -1.833 |
Uri | -1.796 |
llah | -1.786 |
humans | -1.626 |
erity | -1.620 |
Token | the |
Token ID | 262 |
Feature activation | +7.06e-02 |
Pos logit contributions | |
icho | +0.004 |
Uri | +0.004 |
llah | +0.004 |
humans | +0.003 |
erity | +0.003 |
Neg logit contributions | |
kered | -0.004 |
Cly | -0.004 |
racted | -0.004 |
>>>>>>>> | -0.004 |
**************** | -0.004 |
Token | name |
Token ID | 1438 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
kered | +0.053 |
Cly | +0.049 |
racted | +0.046 |
>>>>>>>> | +0.045 |
**************** | +0.044 |
Neg logit contributions | |
icho | -0.047 |
Uri | -0.047 |
llah | -0.047 |
erity | -0.042 |
humans | -0.042 |
Token | on |
Token ID | 319 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
kered | +0.497 |
Cly | +0.454 |
racted | +0.433 |
>>>>>>>> | +0.421 |
**************** | +0.409 |
Neg logit contributions | |
icho | -0.429 |
Uri | -0.423 |
llah | -0.422 |
humans | -0.379 |
erity | -0.376 |
Token | the |
Token ID | 262 |
Feature activation | -4.47e-02 |
Pos logit contributions | |
kered | +0.111 |
Cly | +0.103 |
racted | +0.099 |
>>>>>>>> | +0.097 |
**************** | +0.094 |
Neg logit contributions | |
icho | -0.062 |
Uri | -0.061 |
llah | -0.061 |
erity | -0.053 |
humans | -0.053 |
Token | point |
Token ID | 966 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
icho | +0.387 |
Uri | +0.383 |
llah | +0.381 |
erity | +0.342 |
humans | +0.342 |
Neg logit contributions | |
kered | -0.414 |
Cly | -0.377 |
racted | -0.362 |
>>>>>>>> | -0.350 |
**************** | -0.338 |
Token | this |
Token ID | 428 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
kered | +0.122 |
Cly | +0.111 |
racted | +0.106 |
>>>>>>>> | +0.103 |
**************** | +0.099 |
Neg logit contributions | |
icho | -0.110 |
llah | -0.109 |
Uri | -0.109 |
erity | -0.097 |
humans | -0.097 |
Token | time |
Token ID | 640 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
icho | +0.986 |
Uri | +0.981 |
llah | +0.970 |
humans | +0.868 |
erity | +0.866 |
Neg logit contributions | |
kered | -1.125 |
Cly | -1.023 |
racted | -0.985 |
>>>>>>>> | -0.955 |
**************** | -0.921 |
Token | , |
Token ID | 11 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
icho | +0.232 |
Uri | +0.229 |
llah | +0.229 |
humans | +0.206 |
erity | +0.205 |
Neg logit contributions | |
kered | -0.237 |
Cly | -0.216 |
racted | -0.206 |
>>>>>>>> | -0.199 |
**************** | -0.192 |
Token | though |
Token ID | 996 |
Feature activation | +6.70e-01 |
Pos logit contributions | |
kered | +0.208 |
Cly | +0.192 |
racted | +0.182 |
>>>>>>>> | +0.177 |
**************** | +0.171 |
Neg logit contributions | |
icho | -0.181 |
llah | -0.179 |
Uri | -0.178 |
erity | -0.160 |
humans | -0.159 |
Token | , |
Token ID | 11 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
kered | +0.484 |
Cly | +0.442 |
racted | +0.420 |
>>>>>>>> | +0.407 |
★★ | +0.393 |
Neg logit contributions | |
icho | -0.470 |
llah | -0.465 |
Uri | -0.463 |
erity | -0.417 |
humans | -0.416 |
Token | making |
Token ID | 1642 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
kered | +2.072 |
Cly | +1.927 |
racted | +1.802 |
>>>>>>>> | +1.762 |
**************** | +1.707 |
Neg logit contributions | |
icho | -1.860 |
llah | -1.841 |
Uri | -1.799 |
erity | -1.650 |
irit | -1.633 |
Token | it |
Token ID | 340 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
kered | +0.358 |
Cly | +0.331 |
racted | +0.316 |
>>>>>>>> | +0.308 |
★★ | +0.298 |
Neg logit contributions | |
icho | -0.268 |
llah | -0.265 |
Uri | -0.263 |
erity | -0.234 |
humans | -0.233 |
Token | a |
Token ID | 257 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
kered | +0.401 |
Cly | +0.367 |
racted | +0.351 |
>>>>>>>> | +0.341 |
★★ | +0.330 |
Neg logit contributions | |
icho | -0.345 |
llah | -0.341 |
Uri | -0.341 |
humans | -0.304 |
erity | -0.303 |
Token | 15 |
Token ID | 1315 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
kered | +0.498 |
Cly | +0.458 |
racted | +0.436 |
>>>>>>>> | +0.424 |
★★ | +0.411 |
Neg logit contributions | |
icho | -0.409 |
llah | -0.406 |
Uri | -0.402 |
erity | -0.361 |
humans | -0.361 |
Token | - |
Token ID | 12 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
icho | +0.345 |
Uri | +0.342 |
llah | +0.341 |
erity | +0.311 |
humans | +0.310 |
Neg logit contributions | |
kered | -0.270 |
Cly | -0.242 |
racted | -0.229 |
>>>>>>>> | -0.220 |
★★ | -0.212 |
Token | , |
Token ID | 11 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
kered | +0.321 |
Cly | +0.293 |
racted | +0.281 |
>>>>>>>> | +0.273 |
**************** | +0.263 |
Neg logit contributions | |
icho | -0.273 |
Uri | -0.270 |
llah | -0.269 |
humans | -0.239 |
erity | -0.239 |
Token | where |
Token ID | 810 |
Feature activation | +5.45e-02 |
Pos logit contributions | |
kered | +0.458 |
Cly | +0.417 |
racted | +0.399 |
>>>>>>>> | +0.386 |
★★ | +0.373 |
Neg logit contributions | |
icho | -0.427 |
Uri | -0.422 |
llah | -0.422 |
humans | -0.378 |
erity | -0.378 |
Token | an |
Token ID | 281 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
kered | +0.044 |
Cly | +0.040 |
racted | +0.038 |
>>>>>>>> | +0.038 |
★★ | +0.036 |
Neg logit contributions | |
icho | -0.034 |
Uri | -0.033 |
llah | -0.033 |
erity | -0.030 |
humans | -0.030 |
Token | imitation |
Token ID | 40260 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
icho | +0.168 |
Uri | +0.166 |
llah | +0.165 |
erity | +0.148 |
humans | +0.148 |
Neg logit contributions | |
kered | -0.184 |
Cly | -0.168 |
racted | -0.161 |
>>>>>>>> | -0.156 |
★★ | -0.150 |
Token | Ver |
Token ID | 4643 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
kered | +0.259 |
Cly | +0.238 |
racted | +0.224 |
>>>>>>>> | +0.218 |
★★ | +0.211 |
Neg logit contributions | |
icho | -0.229 |
llah | -0.227 |
Uri | -0.225 |
erity | -0.203 |
humans | -0.202 |
Token | me |
Token ID | 1326 |
Feature activation | +2.74e+00 |
Pos logit contributions | |
icho | +0.398 |
Uri | +0.392 |
llah | +0.392 |
erity | +0.351 |
humans | +0.351 |
Neg logit contributions | |
kered | -0.426 |
Cly | -0.387 |
racted | -0.371 |
>>>>>>>> | -0.361 |
Changes | -0.347 |
Token | er |
Token ID | 263 |
Feature activation | -6.11e-01 |
Pos logit contributions | |
kered | +1.882 |
Cly | +1.687 |
racted | +1.613 |
>>>>>>>> | +1.546 |
★★ | +1.498 |
Neg logit contributions | |
icho | -2.008 |
Uri | -1.992 |
llah | -1.983 |
erity | -1.818 |
humans | -1.794 |
Token | hung |
Token ID | 9174 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
icho | +0.426 |
Uri | +0.421 |
llah | +0.419 |
erity | +0.376 |
humans | +0.376 |
Neg logit contributions | |
kered | -0.444 |
Cly | -0.403 |
racted | -0.388 |
>>>>>>>> | -0.374 |
**************** | -0.361 |
Token | on |
Token ID | 319 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
kered | +0.416 |
Cly | +0.380 |
racted | +0.364 |
>>>>>>>> | +0.352 |
**************** | +0.341 |
Neg logit contributions | |
icho | -0.367 |
Uri | -0.363 |
llah | -0.362 |
erity | -0.324 |
humans | -0.324 |
Token | the |
Token ID | 262 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
icho | +0.147 |
Uri | +0.146 |
llah | +0.145 |
humans | +0.128 |
erity | +0.128 |
Neg logit contributions | |
kered | -0.198 |
Cly | -0.182 |
racted | -0.175 |
>>>>>>>> | -0.170 |
**************** | -0.165 |
Token | wall |
Token ID | 3355 |
Feature activation | -9.70e-01 |
Pos logit contributions | |
kered | +0.188 |
Cly | +0.173 |
racted | +0.166 |
>>>>>>>> | +0.161 |
**************** | +0.156 |
Neg logit contributions | |
icho | -0.137 |
llah | -0.135 |
Uri | -0.135 |
humans | -0.119 |
erity | -0.119 |
Token | not |
Token ID | 407 |
Feature activation | +3.91e-01 |
Pos logit contributions | |
kered | +0.114 |
Cly | +0.105 |
racted | +0.100 |
>>>>>>>> | +0.097 |
**************** | +0.094 |
Neg logit contributions | |
icho | -0.092 |
llah | -0.090 |
Uri | -0.090 |
erity | -0.081 |
ixel | -0.080 |
Token | just |
Token ID | 655 |
Feature activation | +6.40e-01 |
Pos logit contributions | |
kered | +0.298 |
Cly | +0.276 |
racted | +0.262 |
>>>>>>>> | +0.253 |
★★ | +0.247 |
Neg logit contributions | |
icho | -0.257 |
llah | -0.255 |
Uri | -0.252 |
erity | -0.229 |
ixel | -0.226 |
Token | waiting |
Token ID | 4953 |
Feature activation | +2.14e-01 |
Pos logit contributions | |
kered | +0.505 |
Cly | +0.468 |
racted | +0.446 |
>>>>>>>> | +0.432 |
★★ | +0.420 |
Neg logit contributions | |
icho | -0.405 |
llah | -0.401 |
Uri | -0.396 |
erity | -0.356 |
humans | -0.352 |
Token | for |
Token ID | 329 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
kered | +0.171 |
Cly | +0.158 |
racted | +0.151 |
>>>>>>>> | +0.146 |
**************** | +0.142 |
Neg logit contributions | |
icho | -0.134 |
Uri | -0.132 |
llah | -0.132 |
erity | -0.117 |
humans | -0.117 |
Token | a |
Token ID | 257 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
kered | +1.241 |
Cly | +1.155 |
racted | +1.098 |
>>>>>>>> | +1.064 |
**************** | +1.030 |
Neg logit contributions | |
icho | -1.042 |
llah | -1.035 |
Uri | -1.011 |
erity | -0.918 |
ixel | -0.911 |
Token | surprise |
Token ID | 5975 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
kered | +0.889 |
Cly | +0.828 |
racted | +0.777 |
>>>>>>>> | +0.762 |
★★ | +0.735 |
Neg logit contributions | |
icho | -0.745 |
llah | -0.744 |
Uri | -0.729 |
erity | -0.665 |
ixel | -0.657 |
Token | — |
Token ID | 851 |
Feature activation | +3.90e-01 |
Pos logit contributions | |
kered | +1.946 |
Cly | +1.799 |
racted | +1.671 |
>>>>>>>> | +1.638 |
★★ | +1.589 |
Neg logit contributions | |
icho | -1.908 |
llah | -1.900 |
Uri | -1.872 |
erity | -1.717 |
ixel | -1.702 |
Token | you |
Token ID | 345 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
kered | +0.289 |
Cly | +0.265 |
racted | +0.253 |
>>>>>>>> | +0.245 |
★★ | +0.237 |
Neg logit contributions | |
icho | -0.265 |
llah | -0.262 |
Uri | -0.261 |
erity | -0.234 |
humans | -0.233 |
Token | � |
Token ID | 447 |
Feature activation | +8.61e-01 |
Pos logit contributions | |
kered | +0.791 |
Cly | +0.724 |
racted | +0.691 |
>>>>>>>> | +0.674 |
**************** | +0.653 |
Neg logit contributions | |
icho | -0.667 |
Uri | -0.658 |
llah | -0.653 |
humans | -0.583 |
erity | -0.578 |
Token | � |
Token ID | 247 |
Feature activation | +3.71e-01 |
Pos logit contributions | |
kered | +0.479 |
Cly | +0.418 |
racted | +0.402 |
>>>>>>>> | +0.388 |
**************** | +0.368 |
Neg logit contributions | |
icho | -0.748 |
Uri | -0.736 |
llah | -0.731 |
humans | -0.675 |
erity | -0.674 |
Token | re |
Token ID | 260 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
kered | +0.295 |
Cly | +0.270 |
racted | +0.259 |
>>>>>>>> | +0.252 |
**************** | +0.244 |
Neg logit contributions | |
icho | -0.234 |
Uri | -0.231 |
llah | -0.230 |
humans | -0.205 |
erity | -0.202 |
Token | ambitions |
Token ID | 22455 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
kered | +0.417 |
Cly | +0.382 |
racted | +0.363 |
>>>>>>>> | +0.353 |
**************** | +0.342 |
Neg logit contributions | |
icho | -0.365 |
llah | -0.360 |
Uri | -0.357 |
humans | -0.323 |
erity | -0.321 |
Token | were |
Token ID | 547 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
icho | +0.271 |
Uri | +0.269 |
llah | +0.268 |
erity | +0.240 |
humans | +0.240 |
Neg logit contributions | |
kered | -0.294 |
Cly | -0.268 |
racted | -0.256 |
>>>>>>>> | -0.248 |
★★ | -0.240 |
Token | not |
Token ID | 407 |
Feature activation | -1.59e-02 |
Pos logit contributions | |
kered | +0.394 |
Cly | +0.360 |
racted | +0.343 |
>>>>>>>> | +0.332 |
**************** | +0.321 |
Neg logit contributions | |
icho | -0.394 |
llah | -0.389 |
Uri | -0.387 |
humans | -0.350 |
erity | -0.349 |
Token | always |
Token ID | 1464 |
Feature activation | -2.19e-01 |
Pos logit contributions | |
icho | +0.011 |
llah | +0.011 |
Uri | +0.011 |
erity | +0.010 |
humans | +0.010 |
Neg logit contributions | |
kered | -0.011 |
Cly | -0.010 |
racted | -0.010 |
>>>>>>>> | -0.010 |
**************** | -0.009 |
Token | self |
Token ID | 2116 |
Feature activation | -5.49e-01 |
Pos logit contributions | |
icho | +0.146 |
llah | +0.144 |
Uri | +0.143 |
erity | +0.129 |
humans | +0.129 |
Neg logit contributions | |
kered | -0.165 |
Cly | -0.152 |
racted | -0.145 |
>>>>>>>> | -0.140 |
**************** | -0.136 |
Token | less |
Token ID | 1203 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
icho | +0.448 |
Uri | +0.444 |
llah | +0.441 |
erity | +0.405 |
humans | +0.404 |
Neg logit contributions | |
kered | -0.335 |
Cly | -0.299 |
racted | -0.280 |
>>>>>>>> | -0.273 |
**************** | -0.260 |
Token | ".[ |
Token ID | 42924 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
kered | +2.903 |
Cly | +2.761 |
racted | +2.657 |
>>>>>>>> | +2.621 |
**************** | +2.567 |
Neg logit contributions | |
icho | -0.938 |
llah | -0.894 |
Uri | -0.886 |
humans | -0.709 |
ixel | -0.709 |
Token | 39 |
Token ID | 2670 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
kered | +0.713 |
Cly | +0.641 |
racted | +0.608 |
>>>>>>>> | +0.587 |
★★ | +0.562 |
Neg logit contributions | |
icho | -0.862 |
Uri | -0.857 |
llah | -0.855 |
erity | -0.776 |
humans | -0.775 |
Token | ] |
Token ID | 60 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
icho | +0.198 |
Uri | +0.196 |
llah | +0.195 |
erity | +0.173 |
humans | +0.173 |
Neg logit contributions | |
kered | -0.250 |
Cly | -0.229 |
racted | -0.220 |
>>>>>>>> | -0.214 |
**************** | -0.207 |
Token |
|
Token ID | 198 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
icho | +0.086 |
Uri | +0.085 |
llah | +0.085 |
humans | +0.076 |
erity | +0.076 |
Neg logit contributions | |
kered | -0.092 |
Cly | -0.084 |
racted | -0.080 |
>>>>>>>> | -0.078 |
**************** | -0.075 |
Token |
|
Token ID | 198 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
icho | +0.207 |
Uri | +0.205 |
llah | +0.204 |
humans | +0.184 |
erity | +0.183 |
Neg logit contributions | |
kered | -0.215 |
Cly | -0.195 |
racted | -0.187 |
>>>>>>>> | -0.180 |
★★ | -0.174 |
Token | performance |
Token ID | 2854 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
kered | +0.642 |
Cly | +0.591 |
racted | +0.567 |
>>>>>>>> | +0.551 |
**************** | +0.535 |
Neg logit contributions | |
icho | -0.484 |
llah | -0.477 |
Uri | -0.477 |
erity | -0.423 |
humans | -0.423 |
Token | and |
Token ID | 290 |
Feature activation | +7.81e-01 |
Pos logit contributions | |
kered | +1.226 |
Cly | +1.116 |
racted | +1.065 |
>>>>>>>> | +1.033 |
**************** | +0.997 |
Neg logit contributions | |
icho | -1.188 |
Uri | -1.173 |
llah | -1.172 |
erity | -1.053 |
humans | -1.050 |
Token | capability |
Token ID | 12971 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
kered | +0.620 |
Cly | +0.568 |
racted | +0.544 |
>>>>>>>> | +0.529 |
**************** | +0.512 |
Neg logit contributions | |
icho | -0.494 |
Uri | -0.487 |
llah | -0.487 |
humans | -0.433 |
erity | -0.432 |
Token |
|
Token ID | 198 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
kered | +0.436 |
Cly | +0.398 |
racted | +0.381 |
>>>>>>>> | +0.369 |
★★ | +0.357 |
Neg logit contributions | |
icho | -0.388 |
Uri | -0.384 |
llah | -0.383 |
humans | -0.342 |
erity | -0.341 |
Token |
|
Token ID | 198 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
kered | +0.924 |
Cly | +0.845 |
racted | +0.796 |
>>>>>>>> | +0.776 |
**************** | +0.759 |
Neg logit contributions | |
icho | -1.016 |
llah | -1.005 |
Uri | -0.996 |
challeng | -0.941 |
metic | -0.919 |
Token | Smart |
Token ID | 25610 |
Feature activation | +2.69e+00 |
Pos logit contributions | |
kered | +0.828 |
Cly | +0.747 |
racted | +0.714 |
>>>>>>>> | +0.693 |
★★ | +0.671 |
Neg logit contributions | |
icho | -0.911 |
llah | -0.904 |
Uri | -0.903 |
erity | -0.814 |
humans | -0.808 |
Token | est |
Token ID | 395 |
Feature activation | +5.92e-02 |
Pos logit contributions | |
kered | +1.928 |
Cly | +1.755 |
racted | +1.665 |
>>>>>>>> | +1.599 |
★★ | +1.570 |
Neg logit contributions | |
icho | -1.903 |
llah | -1.890 |
Uri | -1.874 |
irit | -1.676 |
ixel | -1.675 |
Token | : |
Token ID | 25 |
Feature activation | +9.17e-01 |
Pos logit contributions | |
kered | +0.036 |
Cly | +0.032 |
racted | +0.031 |
>>>>>>>> | +0.029 |
**************** | +0.028 |
Neg logit contributions | |
icho | -0.048 |
Uri | -0.048 |
llah | -0.047 |
humans | -0.043 |
erity | -0.043 |
Token | Powered |
Token ID | 45090 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
kered | +0.668 |
Cly | +0.612 |
racted | +0.581 |
>>>>>>>> | +0.560 |
**************** | +0.545 |
Neg logit contributions | |
icho | -0.639 |
llah | -0.633 |
Uri | -0.627 |
erity | -0.566 |
humans | -0.563 |
Token | by |
Token ID | 416 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
kered | +1.096 |
Cly | +1.017 |
racted | +0.974 |
>>>>>>>> | +0.946 |
**************** | +0.926 |
Neg logit contributions | |
icho | -0.736 |
Uri | -0.722 |
llah | -0.721 |
erity | -0.633 |
humans | -0.627 |
Token | all |
Token ID | 477 |
Feature activation | +5.18e-01 |
Pos logit contributions | |
kered | +0.552 |
Cly | +0.506 |
racted | +0.483 |
>>>>>>>> | +0.467 |
**************** | +0.453 |
Neg logit contributions | |
icho | -0.493 |
Uri | -0.487 |
llah | -0.487 |
erity | -0.435 |
humans | -0.435 |
Token |
|
Token ID | 198 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
kered | +0.189 |
Cly | +0.172 |
racted | +0.164 |
>>>>>>>> | +0.159 |
**************** | +0.154 |
Neg logit contributions | |
icho | -0.193 |
llah | -0.190 |
Uri | -0.190 |
erity | -0.171 |
humans | -0.171 |
Token | OC |
Token ID | 4503 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
kered | +0.182 |
Cly | +0.165 |
racted | +0.157 |
>>>>>>>> | +0.153 |
**************** | +0.147 |
Neg logit contributions | |
icho | -0.196 |
Uri | -0.195 |
llah | -0.194 |
erity | -0.175 |
humans | -0.175 |
Token | : |
Token ID | 25 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
kered | +1.234 |
Cly | +1.124 |
racted | +1.074 |
>>>>>>>> | +1.042 |
**************** | +1.006 |
Neg logit contributions | |
icho | -1.156 |
Uri | -1.142 |
llah | -1.142 |
humans | -1.022 |
erity | -1.021 |
Token | MSI |
Token ID | 30781 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
kered | +0.198 |
Cly | +0.182 |
racted | +0.174 |
>>>>>>>> | +0.169 |
★★ | +0.164 |
Neg logit contributions | |
icho | -0.156 |
llah | -0.155 |
Uri | -0.153 |
humans | -0.137 |
erity | -0.136 |
Token | After |
Token ID | 2293 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
icho | +0.204 |
llah | +0.201 |
Uri | +0.201 |
humans | +0.178 |
erity | +0.178 |
Neg logit contributions | |
kered | -0.255 |
Cly | -0.234 |
racted | -0.224 |
>>>>>>>> | -0.218 |
**************** | -0.211 |
Token | burn |
Token ID | 10899 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
kered | +0.242 |
Cly | +0.219 |
racted | +0.206 |
>>>>>>>> | +0.198 |
Changes | +0.192 |
Neg logit contributions | |
icho | -0.304 |
Uri | -0.299 |
llah | -0.299 |
erity | -0.271 |
humans | -0.269 |
Token | er |
Token ID | 263 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
Uri | +2.347 |
icho | +2.331 |
llah | +2.311 |
erity | +2.120 |
humans | +2.105 |
Neg logit contributions | |
kered | -2.209 |
Cly | -1.993 |
racted | -1.898 |
>>>>>>>> | -1.856 |
Changes | -1.763 |
Token | , |
Token ID | 11 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
icho | +0.511 |
Uri | +0.506 |
llah | +0.504 |
erity | +0.453 |
humans | +0.453 |
Neg logit contributions | |
kered | -0.526 |
Cly | -0.478 |
racted | -0.457 |
>>>>>>>> | -0.442 |
**************** | -0.426 |
Token | Un |
Token ID | 791 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
icho | +0.219 |
llah | +0.217 |
Uri | +0.215 |
humans | +0.192 |
erity | +0.192 |
Neg logit contributions | |
kered | -0.249 |
Cly | -0.228 |
racted | -0.217 |
>>>>>>>> | -0.211 |
★★ | -0.205 |
Token | locked |
Token ID | 24162 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
kered | +0.302 |
Cly | +0.276 |
racted | +0.264 |
>>>>>>>> | +0.256 |
**************** | +0.247 |
Neg logit contributions | |
icho | -0.281 |
Uri | -0.276 |
llah | -0.276 |
humans | -0.248 |
erity | -0.248 |
Token | Digital |
Token ID | 27640 |
Feature activation | +7.55e-01 |
Pos logit contributions | |
icho | +1.302 |
Uri | +1.288 |
llah | +1.283 |
erity | +1.155 |
humans | +1.153 |
Neg logit contributions | |
kered | -1.378 |
Cly | -1.253 |
racted | -1.201 |
>>>>>>>> | -1.162 |
**************** | -1.120 |
Token | XV |
Token ID | 29922 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
icho | +1.110 |
Uri | +1.100 |
llah | +1.092 |
humans | +0.985 |
erity | +0.984 |
Neg logit contributions | |
kered | -1.151 |
Cly | -1.042 |
racted | -0.999 |
>>>>>>>> | -0.968 |
**************** | -0.933 |
Token | " |
Token ID | 1 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
icho | +0.314 |
Uri | +0.310 |
llah | +0.310 |
humans | +0.278 |
erity | +0.278 |
Neg logit contributions | |
kered | -0.332 |
Cly | -0.302 |
racted | -0.289 |
>>>>>>>> | -0.280 |
**************** | -0.270 |
Token | and |
Token ID | 290 |
Feature activation | -4.53e-01 |
Pos logit contributions | |
icho | +0.249 |
llah | +0.246 |
Uri | +0.246 |
erity | +0.221 |
humans | +0.220 |
Neg logit contributions | |
kered | -0.257 |
Cly | -0.234 |
racted | -0.223 |
>>>>>>>> | -0.216 |
**************** | -0.208 |
Token | " |
Token ID | 366 |
Feature activation | -3.74e-02 |
Pos logit contributions | |
icho | +0.299 |
Uri | +0.296 |
llah | +0.295 |
humans | +0.263 |
erity | +0.263 |
Neg logit contributions | |
kered | -0.345 |
Cly | -0.316 |
racted | -0.302 |
>>>>>>>> | -0.293 |
★★ | -0.284 |
Token | King |
Token ID | 15708 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
icho | +0.027 |
Uri | +0.027 |
llah | +0.027 |
erity | +0.024 |
humans | +0.024 |
Neg logit contributions | |
kered | -0.026 |
Cly | -0.024 |
racted | -0.023 |
>>>>>>>> | -0.022 |
**************** | -0.021 |
Token | dom |
Token ID | 3438 |
Feature activation | -3.16e+00 |
Pos logit contributions | |
icho | +0.117 |
llah | +0.116 |
Uri | +0.114 |
humans | +0.101 |
erity | +0.101 |
Neg logit contributions | |
kered | -0.158 |
Cly | -0.147 |
racted | -0.140 |
>>>>>>>> | -0.136 |
★★ | -0.132 |
Token | Hearts |
Token ID | 20592 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
icho | +1.878 |
Uri | +1.868 |
llah | +1.836 |
erity | +1.642 |
humans | +1.628 |
Neg logit contributions | |
kered | -2.617 |
Cly | -2.381 |
racted | -2.293 |
>>>>>>>> | -2.240 |
**************** | -2.178 |
Token | 3 |
Token ID | 513 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
icho | +1.331 |
Uri | +1.317 |
llah | +1.311 |
humans | +1.176 |
erity | +1.176 |
Neg logit contributions | |
kered | -1.429 |
Cly | -1.301 |
racted | -1.246 |
>>>>>>>> | -1.205 |
**************** | -1.163 |
Token | " |
Token ID | 1 |
Feature activation | -5.79e-01 |
Pos logit contributions | |
icho | +0.461 |
Uri | +0.456 |
llah | +0.452 |
humans | +0.408 |
erity | +0.406 |
Neg logit contributions | |
kered | -0.495 |
Cly | -0.449 |
racted | -0.430 |
>>>>>>>> | -0.415 |
**************** | -0.401 |
Token | were |
Token ID | 547 |
Feature activation | -8.13e-01 |
Pos logit contributions | |
icho | +0.423 |
Uri | +0.419 |
llah | +0.416 |
humans | +0.376 |
erity | +0.376 |
Neg logit contributions | |
kered | -0.402 |
Cly | -0.363 |
racted | -0.347 |
>>>>>>>> | -0.335 |
**************** | -0.322 |
Token | both |
Token ID | 1111 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
icho | +0.557 |
Uri | +0.550 |
llah | +0.549 |
humans | +0.492 |
erity | +0.492 |
Neg logit contributions | |
kered | -0.601 |
Cly | -0.548 |
racted | -0.524 |
>>>>>>>> | -0.508 |
★★ | -0.490 |
Token | now |
Token ID | 783 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
kered | +0.562 |
Cly | +0.510 |
racted | +0.488 |
>>>>>>>> | +0.472 |
**************** | +0.454 |
Neg logit contributions | |
icho | -0.561 |
Uri | -0.555 |
llah | -0.554 |
humans | -0.499 |
erity | -0.499 |
Token | ? |
Token ID | 30 |
Feature activation | -8.47e-03 |
Pos logit contributions | |
icho | +0.032 |
Uri | +0.032 |
llah | +0.032 |
humans | +0.029 |
erity | +0.029 |
Neg logit contributions | |
kered | -0.033 |
Cly | -0.030 |
racted | -0.029 |
>>>>>>>> | -0.028 |
**************** | -0.027 |
Token | Because |
Token ID | 4362 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
icho | +0.005 |
llah | +0.005 |
Uri | +0.005 |
erity | +0.005 |
humans | +0.005 |
Neg logit contributions | |
kered | -0.007 |
Cly | -0.006 |
racted | -0.006 |
>>>>>>>> | -0.006 |
★★ | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +7.83e-01 |
Pos logit contributions | |
kered | +0.873 |
Cly | +0.806 |
racted | +0.764 |
>>>>>>>> | +0.743 |
★★ | +0.721 |
Neg logit contributions | |
icho | -0.751 |
llah | -0.745 |
Uri | -0.734 |
erity | -0.661 |
humans | -0.655 |
Token | closed |
Token ID | 4838 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
kered | +0.598 |
Cly | +0.550 |
racted | +0.522 |
>>>>>>>> | +0.508 |
**************** | +0.492 |
Neg logit contributions | |
icho | -0.518 |
llah | -0.510 |
Uri | -0.509 |
erity | -0.456 |
humans | -0.454 |
Token | beta |
Token ID | 12159 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
icho | +0.400 |
Uri | +0.396 |
llah | +0.394 |
humans | +0.354 |
erity | +0.353 |
Neg logit contributions | |
kered | -0.420 |
Cly | -0.382 |
racted | -0.366 |
>>>>>>>> | -0.355 |
★★ | -0.342 |
Token | arrives |
Token ID | 14443 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
Uri | +1.934 |
icho | +1.927 |
llah | +1.892 |
humans | +1.706 |
alon | +1.692 |
Neg logit contributions | |
kered | -2.388 |
Cly | -2.164 |
racted | -2.104 |
>>>>>>>> | -2.039 |
★★ | -1.983 |
Token | tomorrow |
Token ID | 9439 |
Feature activation | +7.42e-02 |
Pos logit contributions | |
kered | +0.173 |
Cly | +0.158 |
racted | +0.151 |
>>>>>>>> | +0.146 |
**************** | +0.141 |
Neg logit contributions | |
icho | -0.163 |
Uri | -0.161 |
llah | -0.161 |
erity | -0.144 |
humans | -0.144 |
Token | and |
Token ID | 290 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
kered | +0.053 |
Cly | +0.048 |
racted | +0.046 |
>>>>>>>> | +0.045 |
**************** | +0.043 |
Neg logit contributions | |
icho | -0.053 |
llah | -0.052 |
Uri | -0.052 |
erity | -0.047 |
humans | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
kered | +0.132 |
Cly | +0.122 |
racted | +0.116 |
>>>>>>>> | +0.113 |
**************** | +0.109 |
Neg logit contributions | |
icho | -0.111 |
llah | -0.109 |
Uri | -0.108 |
erity | -0.097 |
humans | -0.096 |
Token | client |
Token ID | 5456 |
Feature activation | +5.09e-02 |
Pos logit contributions | |
kered | +0.402 |
Cly | +0.370 |
racted | +0.351 |
>>>>>>>> | +0.342 |
**************** | +0.330 |
Neg logit contributions | |
icho | -0.356 |
llah | -0.351 |
Uri | -0.350 |
erity | -0.314 |
humans | -0.312 |
Token | ' |
Token ID | 705 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
icho | +0.238 |
Uri | +0.236 |
llah | +0.235 |
humans | +0.209 |
erity | +0.208 |
Neg logit contributions | |
kered | -0.296 |
Cly | -0.271 |
racted | -0.260 |
>>>>>>>> | -0.253 |
★★ | -0.245 |
Token | a |
Token ID | 64 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
icho | +0.559 |
Uri | +0.551 |
llah | +0.550 |
humans | +0.485 |
erity | +0.485 |
Neg logit contributions | |
kered | -0.747 |
Cly | -0.687 |
racted | -0.660 |
>>>>>>>> | -0.642 |
★★ | -0.622 |
Token | > |
Token ID | 1875 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
Uri | +0.291 |
icho | +0.290 |
llah | +0.287 |
erity | +0.249 |
humans | +0.248 |
Neg logit contributions | |
kered | -0.459 |
Cly | -0.425 |
racted | -0.410 |
>>>>>>>> | -0.398 |
**************** | -0.388 |
Token | ( |
Token ID | 357 |
Feature activation | -9.75e-01 |
Pos logit contributions | |
icho | +0.215 |
Uri | +0.214 |
llah | +0.213 |
erity | +0.189 |
humans | +0.189 |
Neg logit contributions | |
kered | -0.231 |
Cly | -0.211 |
racted | -0.200 |
>>>>>>>> | -0.195 |
★★ | -0.190 |
Token | & |
Token ID | 1222 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
icho | +0.804 |
Uri | +0.798 |
llah | +0.796 |
humans | +0.727 |
erity | +0.726 |
Neg logit contributions | |
kered | -0.583 |
Cly | -0.520 |
racted | -0.491 |
>>>>>>>> | -0.472 |
★★ | -0.451 |
Token | self |
Token ID | 2116 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
Uri | +1.113 |
icho | +1.104 |
llah | +1.090 |
alon | +0.967 |
irit | +0.963 |
Neg logit contributions | |
kered | -1.245 |
Cly | -1.143 |
racted | -1.100 |
>>>>>>>> | -1.061 |
★★ | -1.033 |
Token | , |
Token ID | 837 |
Feature activation | -2.51e+00 |
Pos logit contributions | |
icho | +1.507 |
Uri | +1.501 |
llah | +1.471 |
ixel | +1.249 |
erity | +1.249 |
Neg logit contributions | |
kered | -2.786 |
Cly | -2.590 |
racted | -2.485 |
>>>>>>>> | -2.431 |
**************** | -2.379 |
Token | ord |
Token ID | 2760 |
Feature activation | -6.51e-01 |
Pos logit contributions | |
Uri | +1.700 |
icho | +1.676 |
llah | +1.653 |
ixel | +1.481 |
humans | +1.479 |
Neg logit contributions | |
kered | -1.863 |
Cly | -1.694 |
racted | -1.639 |
>>>>>>>> | -1.578 |
★★ | -1.534 |
Token | : |
Token ID | 1058 |
Feature activation | -6.57e-01 |
Pos logit contributions | |
icho | +0.438 |
Uri | +0.435 |
llah | +0.433 |
erity | +0.388 |
humans | +0.385 |
Neg logit contributions | |
kered | -0.489 |
Cly | -0.446 |
racted | -0.425 |
>>>>>>>> | -0.415 |
**************** | -0.401 |
Token | Order |
Token ID | 8284 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
Uri | +0.496 |
icho | +0.495 |
llah | +0.489 |
erity | +0.443 |
humans | +0.442 |
Neg logit contributions | |
kered | -0.439 |
Cly | -0.396 |
racted | -0.377 |
>>>>>>>> | -0.364 |
★★ | -0.350 |
Token | ing |
Token ID | 278 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
icho | +0.252 |
Uri | +0.250 |
llah | +0.247 |
erity | +0.227 |
humans | +0.226 |
Neg logit contributions | |
kered | -0.179 |
Cly | -0.161 |
racted | -0.150 |
>>>>>>>> | -0.145 |
★★ | -0.139 |
Token | . |
Token ID | 13 |
Feature activation | -3.20e-01 |
Pos logit contributions | |
icho | +0.263 |
Uri | +0.260 |
llah | +0.259 |
humans | +0.233 |
erity | +0.232 |
Neg logit contributions | |
kered | -0.281 |
Cly | -0.255 |
racted | -0.244 |
>>>>>>>> | -0.236 |
**************** | -0.228 |
Token | Meaning |
Token ID | 30563 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
icho | +0.219 |
llah | +0.216 |
Uri | +0.215 |
erity | +0.193 |
humans | +0.193 |
Neg logit contributions | |
kered | -0.236 |
Cly | -0.216 |
racted | -0.206 |
>>>>>>>> | -0.200 |
**************** | -0.193 |
Token | that |
Token ID | 326 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
icho | +1.266 |
Uri | +1.249 |
llah | +1.241 |
humans | +1.120 |
erity | +1.113 |
Neg logit contributions | |
kered | -1.400 |
Cly | -1.273 |
racted | -1.218 |
>>>>>>>> | -1.185 |
**************** | -1.142 |
Token | " |
Token ID | 366 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
icho | +0.556 |
llah | +0.549 |
Uri | +0.548 |
erity | +0.485 |
humans | +0.484 |
Neg logit contributions | |
kered | -0.707 |
Cly | -0.650 |
racted | -0.623 |
>>>>>>>> | -0.606 |
★★ | -0.587 |
Token | King |
Token ID | 15708 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
icho | +0.399 |
Uri | +0.394 |
llah | +0.393 |
erity | +0.352 |
humans | +0.352 |
Neg logit contributions | |
kered | -0.429 |
Cly | -0.391 |
racted | -0.374 |
>>>>>>>> | -0.362 |
★★ | -0.350 |
Token | dom |
Token ID | 3438 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
kered | +0.090 |
Cly | +0.083 |
racted | +0.080 |
>>>>>>>> | +0.077 |
**************** | +0.075 |
Neg logit contributions | |
icho | -0.067 |
llah | -0.066 |
Uri | -0.066 |
challeng | -0.058 |
erity | -0.058 |
Token | Hearts |
Token ID | 20592 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
icho | +1.816 |
Uri | +1.800 |
llah | +1.779 |
humans | +1.584 |
erity | +1.574 |
Neg logit contributions | |
kered | -2.434 |
Cly | -2.225 |
racted | -2.153 |
>>>>>>>> | -2.080 |
★★ | -2.027 |
Token | 3 |
Token ID | 513 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
icho | +1.131 |
Uri | +1.122 |
llah | +1.111 |
humans | +1.001 |
erity | +0.998 |
Neg logit contributions | |
kered | -1.232 |
Cly | -1.121 |
racted | -1.078 |
>>>>>>>> | -1.040 |
**************** | -1.004 |
Token | " |
Token ID | 1 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
icho | +0.132 |
Uri | +0.130 |
llah | +0.130 |
humans | +0.113 |
erity | +0.113 |
Neg logit contributions | |
kered | -0.202 |
Cly | -0.186 |
racted | -0.179 |
>>>>>>>> | -0.175 |
**************** | -0.169 |
Token | is |
Token ID | 318 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
kered | +0.014 |
Cly | +0.013 |
racted | +0.012 |
>>>>>>>> | +0.012 |
★★ | +0.011 |
Neg logit contributions | |
icho | -0.013 |
Uri | -0.012 |
llah | -0.012 |
humans | -0.011 |
erity | -0.011 |
Token | still |
Token ID | 991 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
icho | +0.415 |
Uri | +0.411 |
llah | +0.409 |
humans | +0.371 |
erity | +0.370 |
Neg logit contributions | |
kered | -0.380 |
Cly | -0.343 |
racted | -0.327 |
>>>>>>>> | -0.316 |
★★ | -0.304 |
Token | scrap |
Token ID | 15881 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
kered | +0.757 |
Cly | +0.694 |
racted | +0.663 |
>>>>>>>> | +0.644 |
**************** | +0.622 |
Neg logit contributions | |
icho | -0.644 |
llah | -0.636 |
Uri | -0.632 |
erity | -0.567 |
humans | -0.566 |
Token | . |
Token ID | 13 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
kered | +0.913 |
Cly | +0.833 |
racted | +0.798 |
>>>>>>>> | +0.773 |
★★ | +0.747 |
Neg logit contributions | |
icho | -0.817 |
Uri | -0.807 |
llah | -0.806 |
humans | -0.720 |
erity | -0.720 |
Token |
|
Token ID | 198 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
icho | +0.010 |
llah | +0.009 |
Uri | +0.009 |
humans | +0.008 |
erity | +0.008 |
Neg logit contributions | |
kered | -0.011 |
Cly | -0.010 |
racted | -0.010 |
>>>>>>>> | -0.010 |
**************** | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
icho | +0.085 |
Uri | +0.084 |
llah | +0.084 |
erity | +0.076 |
humans | +0.076 |
Neg logit contributions | |
kered | -0.085 |
Cly | -0.077 |
racted | -0.073 |
>>>>>>>> | -0.071 |
**************** | -0.069 |
Token | Article |
Token ID | 14906 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
icho | +0.099 |
Uri | +0.098 |
llah | +0.097 |
erity | +0.087 |
humans | +0.087 |
Neg logit contributions | |
kered | -0.106 |
Cly | -0.097 |
racted | -0.093 |
>>>>>>>> | -0.090 |
**************** | -0.087 |
Token | Continued |
Token ID | 22168 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
icho | +0.102 |
Uri | +0.101 |
llah | +0.101 |
erity | +0.089 |
humans | +0.089 |
Neg logit contributions | |
kered | -0.143 |
Cly | -0.133 |
racted | -0.128 |
>>>>>>>> | -0.124 |
**************** | -0.120 |
Token | Below |
Token ID | 10383 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
icho | +1.950 |
Uri | +1.940 |
llah | +1.924 |
humans | +1.721 |
erity | +1.709 |
Neg logit contributions | |
kered | -2.207 |
Cly | -1.991 |
racted | -1.920 |
>>>>>>>> | -1.859 |
★★ | -1.796 |
Token |
|
Token ID | 198 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
icho | +1.189 |
Uri | +1.186 |
llah | +1.173 |
humans | +1.056 |
erity | +1.045 |
Neg logit contributions | |
kered | -1.299 |
Cly | -1.171 |
racted | -1.132 |
>>>>>>>> | -1.089 |
★★ | -1.052 |
Token |
|
Token ID | 198 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
icho | +0.401 |
Uri | +0.397 |
llah | +0.396 |
erity | +0.356 |
humans | +0.356 |
Neg logit contributions | |
kered | -0.406 |
Cly | -0.369 |
racted | -0.352 |
>>>>>>>> | -0.341 |
**************** | -0.328 |
Token | The |
Token ID | 464 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
icho | +0.248 |
Uri | +0.245 |
llah | +0.245 |
humans | +0.218 |
erity | +0.218 |
Neg logit contributions | |
kered | -0.284 |
Cly | -0.259 |
racted | -0.248 |
>>>>>>>> | -0.241 |
★★ | -0.233 |
Token | T |
Token ID | 309 |
Feature activation | -4.68e-01 |
Pos logit contributions | |
icho | +0.192 |
Uri | +0.190 |
llah | +0.189 |
humans | +0.167 |
erity | +0.167 |
Neg logit contributions | |
kered | -0.255 |
Cly | -0.235 |
racted | -0.225 |
>>>>>>>> | -0.219 |
**************** | -0.212 |
Token | : |
Token ID | 25 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
kered | +0.616 |
Cly | +0.556 |
racted | +0.524 |
>>>>>>>> | +0.506 |
**************** | +0.489 |
Neg logit contributions | |
icho | -0.787 |
llah | -0.783 |
Uri | -0.777 |
erity | -0.710 |
humans | -0.709 |
Token |
|
Token ID | 198 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
kered | +0.244 |
Cly | +0.225 |
racted | +0.214 |
>>>>>>>> | +0.209 |
★★ | +0.202 |
Neg logit contributions | |
icho | -0.205 |
llah | -0.203 |
Uri | -0.201 |
erity | -0.180 |
humans | -0.179 |
Token |
|
Token ID | 198 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
kered | +0.244 |
Cly | +0.222 |
racted | +0.212 |
>>>>>>>> | +0.205 |
**************** | +0.198 |
Neg logit contributions | |
icho | -0.245 |
Uri | -0.242 |
llah | -0.242 |
erity | -0.218 |
humans | -0.217 |
Token | ' |
Token ID | 6 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
kered | +0.309 |
Cly | +0.280 |
racted | +0.267 |
>>>>>>>> | +0.259 |
★★ | +0.251 |
Neg logit contributions | |
icho | -0.325 |
Uri | -0.321 |
llah | -0.321 |
erity | -0.290 |
humans | -0.288 |
Token | King |
Token ID | 15708 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
kered | +0.242 |
Cly | +0.219 |
racted | +0.209 |
>>>>>>>> | +0.203 |
★★ | +0.196 |
Neg logit contributions | |
icho | -0.254 |
llah | -0.251 |
Uri | -0.251 |
erity | -0.226 |
humans | -0.225 |
Token | dom |
Token ID | 3438 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
kered | +0.204 |
Cly | +0.189 |
racted | +0.181 |
>>>>>>>> | +0.175 |
**************** | +0.171 |
Neg logit contributions | |
icho | -0.151 |
llah | -0.148 |
Uri | -0.148 |
erity | -0.131 |
challeng | -0.130 |
Token | Hearts |
Token ID | 20592 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
icho | +1.737 |
Uri | +1.725 |
llah | +1.702 |
humans | +1.519 |
erity | +1.503 |
Neg logit contributions | |
kered | -2.322 |
Cly | -2.119 |
racted | -2.054 |
>>>>>>>> | -1.988 |
★★ | -1.930 |
Token | 3 |
Token ID | 513 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
icho | +0.828 |
Uri | +0.820 |
llah | +0.814 |
humans | +0.726 |
erity | +0.725 |
Neg logit contributions | |
kered | -1.014 |
Cly | -0.927 |
racted | -0.893 |
>>>>>>>> | -0.865 |
**************** | -0.836 |
Token | ' |
Token ID | 6 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
icho | +0.247 |
Uri | +0.245 |
llah | +0.244 |
humans | +0.219 |
erity | +0.218 |
Neg logit contributions | |
kered | -0.274 |
Cly | -0.250 |
racted | -0.239 |
>>>>>>>> | -0.232 |
**************** | -0.224 |
Token | Xbox |
Token ID | 9445 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
kered | +0.095 |
Cly | +0.087 |
racted | +0.083 |
>>>>>>>> | +0.080 |
★★ | +0.077 |
Neg logit contributions | |
icho | -0.092 |
llah | -0.090 |
Uri | -0.090 |
erity | -0.081 |
humans | -0.081 |
Token | One |
Token ID | 1881 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
icho | +0.351 |
Uri | +0.348 |
llah | +0.345 |
erity | +0.307 |
humans | +0.307 |
Neg logit contributions | |
kered | -0.444 |
Cly | -0.406 |
racted | -0.391 |
>>>>>>>> | -0.380 |
**************** | -0.367 |
Token | may |
Token ID | 743 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
icho | +0.420 |
llah | +0.415 |
Uri | +0.415 |
humans | +0.371 |
erity | +0.371 |
Neg logit contributions | |
kered | -0.453 |
Cly | -0.413 |
racted | -0.394 |
>>>>>>>> | -0.382 |
**************** | -0.369 |
Token | be |
Token ID | 307 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
icho | +0.881 |
Uri | +0.876 |
llah | +0.870 |
humans | +0.780 |
erity | +0.775 |
Neg logit contributions | |
kered | -0.963 |
Cly | -0.880 |
racted | -0.846 |
>>>>>>>> | -0.819 |
★★ | -0.792 |
Token | effective |
Token ID | 4050 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
icho | +0.504 |
Uri | +0.498 |
llah | +0.496 |
humans | +0.443 |
erity | +0.442 |
Neg logit contributions | |
kered | -0.587 |
Cly | -0.537 |
racted | -0.514 |
>>>>>>>> | -0.499 |
★★ | -0.482 |
Token | for |
Token ID | 329 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
icho | +0.739 |
Uri | +0.731 |
llah | +0.729 |
humans | +0.647 |
erity | +0.645 |
Neg logit contributions | |
kered | -0.913 |
Cly | -0.836 |
racted | -0.804 |
>>>>>>>> | -0.779 |
★★ | -0.755 |
Token | the |
Token ID | 262 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
icho | +1.011 |
Uri | +0.999 |
llah | +0.996 |
humans | +0.878 |
erity | +0.877 |
Neg logit contributions | |
kered | -1.365 |
Cly | -1.254 |
racted | -1.208 |
>>>>>>>> | -1.173 |
★★ | -1.138 |
Token | treatment |
Token ID | 3513 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
icho | +0.270 |
Uri | +0.265 |
llah | +0.265 |
erity | +0.238 |
humans | +0.237 |
Neg logit contributions | |
kered | -0.311 |
Cly | -0.285 |
racted | -0.270 |
>>>>>>>> | -0.264 |
**************** | -0.254 |
Token | of |
Token ID | 286 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
icho | +1.549 |
Uri | +1.514 |
llah | +1.512 |
erity | +1.331 |
humans | +1.316 |
Neg logit contributions | |
kered | -2.481 |
Cly | -2.295 |
racted | -2.233 |
>>>>>>>> | -2.149 |
★★ | -2.105 |
Token | stress |
Token ID | 5503 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
kered | +0.115 |
Cly | +0.106 |
racted | +0.101 |
>>>>>>>> | +0.098 |
**************** | +0.094 |
Neg logit contributions | |
icho | -0.103 |
Uri | -0.101 |
llah | -0.101 |
erity | -0.091 |
humans | -0.090 |
Token | - |
Token ID | 12 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
icho | +0.325 |
Uri | +0.322 |
llah | +0.321 |
humans | +0.290 |
erity | +0.290 |
Neg logit contributions | |
kered | -0.296 |
Cly | -0.267 |
racted | -0.254 |
>>>>>>>> | -0.246 |
★★ | -0.236 |
Token | related |
Token ID | 5363 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
kered | +0.094 |
Cly | +0.085 |
racted | +0.081 |
>>>>>>>> | +0.078 |
**************** | +0.075 |
Neg logit contributions | |
icho | -0.096 |
Uri | -0.095 |
llah | -0.095 |
erity | -0.085 |
humans | -0.085 |
Token | disorders |
Token ID | 11916 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
icho | +0.329 |
Uri | +0.325 |
llah | +0.324 |
erity | +0.290 |
humans | +0.290 |
Neg logit contributions | |
kered | -0.367 |
Cly | -0.335 |
racted | -0.320 |
>>>>>>>> | -0.311 |
**************** | -0.300 |
Token | hour |
Token ID | 1711 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
kered | +0.289 |
Cly | +0.265 |
racted | +0.254 |
>>>>>>>> | +0.244 |
**************** | +0.237 |
Neg logit contributions | |
icho | -0.260 |
Uri | -0.256 |
llah | -0.256 |
humans | -0.229 |
erity | -0.229 |
Token | away |
Token ID | 1497 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
icho | +0.194 |
Uri | +0.192 |
llah | +0.192 |
humans | +0.173 |
erity | +0.172 |
Neg logit contributions | |
kered | -0.192 |
Cly | -0.175 |
racted | -0.166 |
>>>>>>>> | -0.161 |
★★ | -0.155 |
Token | ," |
Token ID | 553 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
kered | +0.270 |
Cly | +0.247 |
racted | +0.236 |
>>>>>>>> | +0.228 |
**************** | +0.221 |
Neg logit contributions | |
icho | -0.261 |
llah | -0.257 |
Uri | -0.257 |
erity | -0.232 |
humans | -0.232 |
Token | says |
Token ID | 1139 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
kered | +0.087 |
Cly | +0.080 |
racted | +0.077 |
>>>>>>>> | +0.075 |
★★ | +0.072 |
Neg logit contributions | |
icho | -0.065 |
llah | -0.064 |
Uri | -0.064 |
erity | -0.057 |
humans | -0.057 |
Token | A |
Token ID | 317 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
icho | +0.672 |
Uri | +0.668 |
llah | +0.664 |
humans | +0.593 |
erity | +0.592 |
Neg logit contributions | |
kered | -0.728 |
Cly | -0.659 |
racted | -0.633 |
>>>>>>>> | -0.614 |
**************** | -0.593 |
Token | du |
Token ID | 646 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
icho | +0.858 |
llah | +0.848 |
Uri | +0.848 |
humans | +0.763 |
erity | +0.762 |
Neg logit contributions | |
kered | -0.784 |
Cly | -0.710 |
racted | -0.676 |
>>>>>>>> | -0.654 |
★★ | -0.630 |
Token | . |
Token ID | 13 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
llah | +2.075 |
icho | +2.066 |
Uri | +2.057 |
alon | +1.845 |
irit | +1.825 |
Neg logit contributions | |
kered | -1.955 |
Cly | -1.765 |
racted | -1.681 |
>>>>>>>> | -1.642 |
★★ | -1.587 |
Token | He |
Token ID | 1544 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
kered | +0.504 |
Cly | +0.460 |
racted | +0.438 |
>>>>>>>> | +0.424 |
★★ | +0.410 |
Neg logit contributions | |
icho | -0.495 |
Uri | -0.487 |
llah | -0.487 |
erity | -0.438 |
humans | -0.438 |
Token | is |
Token ID | 318 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
kered | +0.125 |
Cly | +0.114 |
racted | +0.109 |
>>>>>>>> | +0.105 |
**************** | +0.102 |
Neg logit contributions | |
icho | -0.113 |
Uri | -0.112 |
llah | -0.112 |
erity | -0.100 |
humans | -0.100 |
Token | now |
Token ID | 783 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
icho | +0.385 |
llah | +0.380 |
Uri | +0.380 |
humans | +0.340 |
erity | +0.340 |
Neg logit contributions | |
kered | -0.433 |
Cly | -0.397 |
racted | -0.380 |
>>>>>>>> | -0.367 |
★★ | -0.356 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
icho | +0.361 |
llah | +0.356 |
Uri | +0.355 |
humans | +0.317 |
erity | +0.316 |
Neg logit contributions | |
kered | -0.434 |
Cly | -0.399 |
racted | -0.382 |
>>>>>>>> | -0.371 |
**************** | -0.359 |
Token | PNG |
Token ID | 36182 |
Feature activation | -6.72e-01 |
Pos logit contributions | |
icho | +0.075 |
llah | +0.074 |
Uri | +0.074 |
erity | +0.067 |
alon | +0.066 |
Neg logit contributions | |
kered | -0.088 |
Cly | -0.082 |
racted | -0.078 |
>>>>>>>> | -0.076 |
**************** | -0.074 |
Token | larger |
Token ID | 4025 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
icho | +0.346 |
Uri | +0.341 |
llah | +0.339 |
humans | +0.293 |
erity | +0.293 |
Neg logit contributions | |
kered | -0.610 |
Cly | -0.567 |
racted | -0.547 |
>>>>>>>> | -0.534 |
**************** | -0.519 |
Token | image |
Token ID | 2939 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
icho | +0.968 |
Uri | +0.962 |
llah | +0.953 |
humans | +0.822 |
erity | +0.814 |
Neg logit contributions | |
kered | -1.710 |
Cly | -1.585 |
racted | -1.530 |
>>>>>>>> | -1.491 |
★★ | -1.453 |
Token |
|
Token ID | 198 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
icho | +0.872 |
Uri | +0.864 |
llah | +0.860 |
humans | +0.773 |
erity | +0.773 |
Neg logit contributions | |
kered | -0.894 |
Cly | -0.812 |
racted | -0.776 |
>>>>>>>> | -0.750 |
★★ | -0.724 |
Token |
|
Token ID | 198 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
kered | +0.187 |
Cly | +0.170 |
racted | +0.161 |
>>>>>>>> | +0.157 |
**************** | +0.152 |
Neg logit contributions | |
icho | -0.191 |
llah | -0.189 |
Uri | -0.188 |
erity | -0.170 |
humans | -0.170 |
Token | larg |
Token ID | 15521 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
kered | +0.145 |
Cly | +0.132 |
>>>>>>>> | +0.130 |
racted | +0.127 |
Changes | +0.126 |
Neg logit contributions | |
llah | -0.140 |
Uri | -0.137 |
icho | -0.136 |
metic | -0.124 |
paran | -0.124 |
Token | er |
Token ID | 263 |
Feature activation | -9.17e-01 |
Pos logit contributions | |
icho | +2.023 |
Uri | +1.981 |
llah | +1.953 |
alon | +1.798 |
humans | +1.796 |
Neg logit contributions | |
kered | -1.919 |
Cly | -1.772 |
racted | -1.683 |
>>>>>>>> | -1.643 |
★★ | -1.586 |
Token | image |
Token ID | 2939 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
icho | +0.512 |
llah | +0.502 |
Uri | +0.500 |
erity | +0.442 |
humans | +0.437 |
Neg logit contributions | |
kered | -0.798 |
Cly | -0.738 |
racted | -0.712 |
>>>>>>>> | -0.693 |
**************** | -0.675 |
Token | T |
Token ID | 309 |
Feature activation | -6.98e-01 |
Pos logit contributions | |
icho | +0.774 |
llah | +0.765 |
Uri | +0.751 |
humans | +0.656 |
erity | +0.652 |
Neg logit contributions | |
kered | -1.338 |
Cly | -1.248 |
racted | -1.191 |
>>>>>>>> | -1.179 |
**************** | -1.140 |
Token | IFF |
Token ID | 29267 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
icho | +0.677 |
llah | +0.675 |
Uri | +0.670 |
erity | +0.627 |
humans | +0.624 |
Neg logit contributions | |
kered | -0.318 |
Cly | -0.269 |
racted | -0.252 |
>>>>>>>> | -0.237 |
**************** | -0.222 |
Token | original |
Token ID | 2656 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
kered | +1.144 |
Cly | +1.057 |
racted | +1.010 |
>>>>>>>> | +0.985 |
Changes | +0.970 |
Neg logit contributions | |
llah | -0.768 |
icho | -0.757 |
Uri | -0.728 |
erity | -0.656 |
humans | -0.647 |
Token | Nick |
Token ID | 8047 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
icho | +0.310 |
Uri | +0.307 |
llah | +0.306 |
erity | +0.275 |
humans | +0.274 |
Neg logit contributions | |
kered | -0.322 |
Cly | -0.292 |
racted | -0.280 |
>>>>>>>> | -0.271 |
★★ | -0.261 |
Token | Cousins |
Token ID | 32644 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
icho | +0.141 |
Uri | +0.139 |
llah | +0.139 |
humans | +0.124 |
erity | +0.124 |
Neg logit contributions | |
kered | -0.160 |
Cly | -0.147 |
racted | -0.141 |
>>>>>>>> | -0.136 |
**************** | -0.131 |
Token | and |
Token ID | 290 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
kered | +0.423 |
Cly | +0.382 |
racted | +0.363 |
>>>>>>>> | +0.351 |
**************** | +0.338 |
Neg logit contributions | |
icho | -0.474 |
Uri | -0.469 |
llah | -0.468 |
humans | -0.424 |
erity | -0.424 |
Token | Sam |
Token ID | 3409 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
kered | +0.116 |
Cly | +0.107 |
racted | +0.102 |
>>>>>>>> | +0.099 |
**************** | +0.096 |
Neg logit contributions | |
icho | -0.097 |
llah | -0.096 |
Uri | -0.096 |
humans | -0.085 |
erity | -0.085 |
Token | G |
Token ID | 402 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
icho | +0.212 |
llah | +0.209 |
Uri | +0.209 |
humans | +0.188 |
erity | +0.187 |
Neg logit contributions | |
kered | -0.232 |
Cly | -0.214 |
racted | -0.203 |
>>>>>>>> | -0.194 |
**************** | -0.188 |
Token | ag |
Token ID | 363 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
icho | +0.334 |
Uri | +0.331 |
llah | +0.331 |
humans | +0.300 |
erity | +0.300 |
Neg logit contributions | |
kered | -0.289 |
Cly | -0.260 |
racted | -0.248 |
>>>>>>>> | -0.238 |
**************** | -0.229 |
Token | ner |
Token ID | 1008 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
icho | +1.274 |
llah | +1.229 |
Uri | +1.178 |
alon | +1.040 |
irit | +1.011 |
Neg logit contributions | |
kered | -2.670 |
Cly | -2.502 |
racted | -2.446 |
>>>>>>>> | -2.364 |
★★ | -2.348 |
Token | gave |
Token ID | 2921 |
Feature activation | -6.29e-02 |
Pos logit contributions | |
icho | +1.320 |
Uri | +1.301 |
llah | +1.301 |
erity | +1.167 |
alon | +1.163 |
Neg logit contributions | |
kered | -1.315 |
Cly | -1.187 |
racted | -1.139 |
>>>>>>>> | -1.100 |
Changes | -1.073 |
Token | the |
Token ID | 262 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
icho | +0.035 |
Uri | +0.035 |
llah | +0.035 |
humans | +0.030 |
erity | +0.030 |
Neg logit contributions | |
kered | -0.054 |
Cly | -0.050 |
racted | -0.048 |
>>>>>>>> | -0.047 |
★★ | -0.046 |
Token | Flyers |
Token ID | 30652 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
kered | +0.293 |
Cly | +0.268 |
racted | +0.255 |
>>>>>>>> | +0.248 |
**************** | +0.240 |
Neg logit contributions | |
icho | -0.268 |
llah | -0.264 |
Uri | -0.264 |
erity | -0.236 |
humans | -0.236 |
Token | two |
Token ID | 734 |
Feature activation | +4.58e-01 |
Pos logit contributions | |
kered | +0.153 |
Cly | +0.140 |
racted | +0.135 |
>>>>>>>> | +0.131 |
★★ | +0.127 |
Neg logit contributions | |
icho | -0.118 |
llah | -0.116 |
Uri | -0.116 |
humans | -0.103 |
erity | -0.103 |
Token | oning |
Token ID | 12484 |
Feature activation | +6.16e-01 |
Pos logit contributions | |
kered | +0.019 |
Cly | +0.017 |
racted | +0.016 |
>>>>>>>> | +0.016 |
**************** | +0.015 |
Neg logit contributions | |
icho | -0.021 |
llah | -0.021 |
Uri | -0.021 |
erity | -0.019 |
alon | -0.019 |
Token | for |
Token ID | 329 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
kered | +0.429 |
Cly | +0.389 |
racted | +0.370 |
>>>>>>>> | +0.357 |
★★ | +0.346 |
Neg logit contributions | |
icho | -0.448 |
llah | -0.443 |
Uri | -0.443 |
humans | -0.399 |
erity | -0.399 |
Token | Quality |
Token ID | 14156 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
icho | +0.348 |
Uri | +0.344 |
llah | +0.344 |
humans | +0.310 |
erity | +0.309 |
Neg logit contributions | |
kered | -0.336 |
Cly | -0.305 |
racted | -0.291 |
>>>>>>>> | -0.281 |
★★ | -0.271 |
Token | and |
Token ID | 290 |
Feature activation | +9.84e-02 |
Pos logit contributions | |
icho | +0.107 |
Uri | +0.106 |
llah | +0.106 |
humans | +0.096 |
erity | +0.096 |
Neg logit contributions | |
kered | -0.093 |
Cly | -0.084 |
racted | -0.080 |
>>>>>>>> | -0.077 |
★★ | -0.074 |
Token | Aff |
Token ID | 6708 |
Feature activation | -7.18e-01 |
Pos logit contributions | |
kered | +0.068 |
Cly | +0.062 |
racted | +0.059 |
>>>>>>>> | +0.056 |
★★ | +0.055 |
Neg logit contributions | |
icho | -0.072 |
llah | -0.071 |
Uri | -0.071 |
humans | -0.064 |
erity | -0.064 |
Token | ord |
Token ID | 585 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
icho | +0.364 |
Uri | +0.359 |
llah | +0.358 |
erity | +0.307 |
humans | +0.307 |
Neg logit contributions | |
kered | -0.658 |
Cly | -0.611 |
racted | -0.589 |
>>>>>>>> | -0.575 |
★★ | -0.560 |
Token | ability |
Token ID | 1799 |
Feature activation | -6.31e-01 |
Pos logit contributions | |
icho | +2.078 |
llah | +2.067 |
Uri | +2.063 |
erity | +1.869 |
humans | +1.863 |
Neg logit contributions | |
kered | -1.879 |
Cly | -1.686 |
racted | -1.600 |
>>>>>>>> | -1.553 |
**************** | -1.492 |
Token | , |
Token ID | 11 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
icho | +0.447 |
Uri | +0.444 |
llah | +0.441 |
erity | +0.399 |
humans | +0.397 |
Neg logit contributions | |
kered | -0.451 |
Cly | -0.408 |
racted | -0.391 |
>>>>>>>> | -0.377 |
**************** | -0.364 |
Token | would |
Token ID | 561 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
kered | +0.212 |
Cly | +0.189 |
racted | +0.180 |
>>>>>>>> | +0.173 |
**************** | +0.166 |
Neg logit contributions | |
icho | -0.267 |
Uri | -0.265 |
llah | -0.264 |
erity | -0.240 |
humans | -0.240 |
Token | adjust |
Token ID | 4532 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
kered | +0.116 |
Cly | +0.105 |
racted | +0.100 |
>>>>>>>> | +0.097 |
**************** | +0.093 |
Neg logit contributions | |
icho | -0.125 |
Uri | -0.124 |
llah | -0.123 |
erity | -0.111 |
humans | -0.111 |
Token | building |
Token ID | 2615 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
icho | +0.101 |
Uri | +0.100 |
llah | +0.099 |
erity | +0.087 |
humans | +0.087 |
Neg logit contributions | |
kered | -0.152 |
Cly | -0.140 |
racted | -0.135 |
>>>>>>>> | -0.132 |
**************** | -0.128 |
Token |
|
Token ID | 198 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
kered | +0.172 |
Cly | +0.157 |
racted | +0.149 |
>>>>>>>> | +0.145 |
**************** | +0.140 |
Neg logit contributions | |
icho | -0.173 |
Uri | -0.170 |
llah | -0.170 |
erity | -0.153 |
humans | -0.153 |
Token | The |
Token ID | 464 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
kered | +0.146 |
Cly | +0.133 |
racted | +0.127 |
>>>>>>>> | +0.123 |
★★ | +0.119 |
Neg logit contributions | |
icho | -0.134 |
Uri | -0.133 |
llah | -0.132 |
erity | -0.118 |
humans | -0.118 |
Token | City |
Token ID | 2254 |
Feature activation | -6.47e-01 |
Pos logit contributions | |
icho | +0.306 |
Uri | +0.305 |
llah | +0.303 |
erity | +0.272 |
humans | +0.272 |
Neg logit contributions | |
kered | -0.318 |
Cly | -0.287 |
racted | -0.276 |
>>>>>>>> | -0.267 |
**************** | -0.258 |
Token | of |
Token ID | 286 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
icho | +0.412 |
Uri | +0.409 |
llah | +0.407 |
erity | +0.362 |
humans | +0.362 |
Neg logit contributions | |
kered | -0.509 |
Cly | -0.464 |
racted | -0.446 |
>>>>>>>> | -0.434 |
★★ | -0.420 |
Token | Wh |
Token ID | 854 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
icho | +0.316 |
Uri | +0.314 |
llah | +0.312 |
humans | +0.281 |
erity | +0.281 |
Neg logit contributions | |
kered | -0.320 |
Cly | -0.290 |
racted | -0.278 |
>>>>>>>> | -0.269 |
★★ | -0.259 |
Token | itt |
Token ID | 715 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
icho | +0.441 |
llah | +0.434 |
Uri | +0.433 |
erity | +0.386 |
humans | +0.386 |
Neg logit contributions | |
kered | -0.527 |
Cly | -0.484 |
racted | -0.462 |
>>>>>>>> | -0.451 |
★★ | -0.436 |
Token | les |
Token ID | 829 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
icho | +2.328 |
llah | +2.308 |
Uri | +2.290 |
alon | +2.111 |
irit | +2.099 |
Neg logit contributions | |
kered | -1.575 |
Cly | -1.403 |
racted | -1.323 |
>>>>>>>> | -1.291 |
★★ | -1.226 |
Token | ea |
Token ID | 18213 |
Feature activation | +6.14e-01 |
Pos logit contributions | |
icho | +0.229 |
Uri | +0.228 |
llah | +0.227 |
erity | +0.209 |
humans | +0.207 |
Neg logit contributions | |
kered | -0.202 |
Cly | -0.182 |
racted | -0.173 |
>>>>>>>> | -0.165 |
**************** | -0.161 |
Token | covers |
Token ID | 8698 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
kered | +0.451 |
Cly | +0.412 |
racted | +0.393 |
>>>>>>>> | +0.380 |
★★ | +0.367 |
Neg logit contributions | |
icho | -0.424 |
Uri | -0.419 |
llah | -0.418 |
erity | -0.375 |
humans | -0.375 |
Token | almost |
Token ID | 2048 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
kered | +0.103 |
Cly | +0.094 |
racted | +0.089 |
>>>>>>>> | +0.086 |
**************** | +0.083 |
Neg logit contributions | |
icho | -0.109 |
llah | -0.107 |
Uri | -0.107 |
humans | -0.097 |
erity | -0.097 |
Token | 500 |
Token ID | 5323 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
icho | +0.434 |
Uri | +0.430 |
llah | +0.428 |
humans | +0.388 |
erity | +0.387 |
Neg logit contributions | |
kered | -0.396 |
Cly | -0.357 |
racted | -0.341 |
>>>>>>>> | -0.329 |
**************** | -0.316 |
Token | Bloomberg |
Token ID | 15689 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
icho | +0.163 |
Uri | +0.162 |
llah | +0.161 |
humans | +0.143 |
erity | +0.143 |
Neg logit contributions | |
kered | -0.202 |
Cly | -0.185 |
racted | -0.178 |
>>>>>>>> | -0.172 |
★★ | -0.167 |
Token | Politics |
Token ID | 17554 |
Feature activation | -4.26e-01 |
Pos logit contributions | |
icho | +0.291 |
Uri | +0.289 |
llah | +0.287 |
erity | +0.261 |
humans | +0.260 |
Neg logit contributions | |
kered | -0.260 |
Cly | -0.233 |
racted | -0.222 |
>>>>>>>> | -0.214 |
★★ | -0.206 |
Token | and |
Token ID | 290 |
Feature activation | +7.82e-02 |
Pos logit contributions | |
Uri | +0.297 |
icho | +0.296 |
llah | +0.293 |
erity | +0.265 |
humans | +0.264 |
Neg logit contributions | |
kered | -0.310 |
Cly | -0.280 |
racted | -0.269 |
>>>>>>>> | -0.259 |
★★ | -0.250 |
Token | Saint |
Token ID | 9281 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
kered | +0.062 |
Cly | +0.057 |
racted | +0.054 |
>>>>>>>> | +0.053 |
★★ | +0.051 |
Neg logit contributions | |
icho | -0.050 |
llah | -0.049 |
Uri | -0.049 |
erity | -0.044 |
humans | -0.044 |
Token | An |
Token ID | 1052 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
kered | +0.320 |
Cly | +0.291 |
racted | +0.277 |
>>>>>>>> | +0.269 |
★★ | +0.259 |
Neg logit contributions | |
icho | -0.318 |
Uri | -0.314 |
llah | -0.314 |
humans | -0.282 |
erity | -0.282 |
Token | sel |
Token ID | 741 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
icho | +0.851 |
Uri | +0.845 |
llah | +0.840 |
alon | +0.770 |
irit | +0.770 |
Neg logit contributions | |
kered | -0.635 |
Cly | -0.566 |
racted | -0.535 |
>>>>>>>> | -0.523 |
★★ | -0.497 |
Token | m |
Token ID | 76 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
icho | +1.294 |
Uri | +1.287 |
llah | +1.277 |
alon | +1.081 |
humans | +1.069 |
Neg logit contributions | |
kered | -2.643 |
Cly | -2.406 |
racted | -2.354 |
>>>>>>>> | -2.282 |
Changes | -2.245 |
Token | College |
Token ID | 5535 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
kered | +0.194 |
Cly | +0.173 |
racted | +0.166 |
>>>>>>>> | +0.160 |
**************** | +0.154 |
Neg logit contributions | |
icho | -0.204 |
Uri | -0.202 |
llah | -0.201 |
erity | -0.182 |
humans | -0.182 |
Token | and |
Token ID | 290 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
Uri | +0.386 |
icho | +0.385 |
llah | +0.380 |
erity | +0.343 |
humans | +0.341 |
Neg logit contributions | |
kered | -0.426 |
Cly | -0.384 |
racted | -0.371 |
>>>>>>>> | -0.358 |
**************** | -0.347 |
Token | conducted |
Token ID | 5952 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
icho | +0.009 |
llah | +0.009 |
Uri | +0.009 |
humans | +0.008 |
erity | +0.008 |
Neg logit contributions | |
kered | -0.012 |
Cly | -0.011 |
racted | -0.010 |
>>>>>>>> | -0.010 |
★★ | -0.010 |
Token | by |
Token ID | 416 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
icho | +0.797 |
Uri | +0.791 |
llah | +0.786 |
humans | +0.700 |
erity | +0.699 |
Neg logit contributions | |
kered | -0.954 |
Cly | -0.871 |
racted | -0.837 |
>>>>>>>> | -0.813 |
**************** | -0.786 |
Token | Mn |
Token ID | 36030 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
kered | +0.203 |
Cly | +0.191 |
racted | +0.186 |
>>>>>>>> | +0.182 |
**************** | +0.178 |
Neg logit contributions | |
icho | -0.062 |
Uri | -0.060 |
llah | -0.060 |
humans | -0.047 |
erity | -0.047 |
Token | uchin |
Token ID | 43416 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
kered | +0.950 |
Cly | +0.870 |
racted | +0.832 |
>>>>>>>> | +0.804 |
**************** | +0.781 |
Neg logit contributions | |
icho | -0.816 |
Uri | -0.814 |
llah | -0.807 |
humans | -0.724 |
erity | -0.723 |
Token | , |
Token ID | 11 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
kered | +0.231 |
Cly | +0.208 |
racted | +0.201 |
>>>>>>>> | +0.193 |
Changes | +0.185 |
Neg logit contributions | |
icho | -0.245 |
Uri | -0.243 |
llah | -0.242 |
erity | -0.219 |
humans | -0.218 |
Token | that |
Token ID | 326 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
kered | +0.299 |
Cly | +0.271 |
racted | +0.259 |
>>>>>>>> | +0.250 |
★★ | +0.241 |
Neg logit contributions | |
icho | -0.299 |
Uri | -0.296 |
llah | -0.295 |
humans | -0.265 |
erity | -0.265 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
kered | +0.067 |
Cly | +0.061 |
racted | +0.059 |
>>>>>>>> | +0.057 |
★★ | +0.055 |
Neg logit contributions | |
icho | -0.051 |
Uri | -0.050 |
llah | -0.050 |
erity | -0.044 |
humans | -0.044 |
Token | debt |
Token ID | 5057 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
kered | +0.094 |
Cly | +0.085 |
racted | +0.081 |
>>>>>>>> | +0.078 |
★★ | +0.076 |
Neg logit contributions | |
icho | -0.100 |
Uri | -0.099 |
llah | -0.098 |
humans | -0.089 |
erity | -0.089 |
Token | ceiling |
Token ID | 13387 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
icho | +1.531 |
Uri | +1.514 |
llah | +1.451 |
humans | +1.313 |
erity | +1.299 |
Neg logit contributions | |
kered | -2.328 |
racted | -2.135 |
Cly | -2.115 |
>>>>>>>> | -2.008 |
**************** | -1.979 |
Token | would |
Token ID | 561 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
kered | +0.351 |
Cly | +0.318 |
racted | +0.304 |
>>>>>>>> | +0.293 |
**************** | +0.283 |
Neg logit contributions | |
icho | -0.364 |
Uri | -0.360 |
llah | -0.359 |
humans | -0.324 |
erity | -0.324 |
Token | be |
Token ID | 307 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
kered | +0.289 |
Cly | +0.262 |
racted | +0.250 |
>>>>>>>> | +0.242 |
★★ | +0.232 |
Neg logit contributions | |
icho | -0.309 |
Uri | -0.306 |
llah | -0.305 |
erity | -0.275 |
humans | -0.275 |
Token | raised |
Token ID | 4376 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
icho | +0.297 |
Uri | +0.294 |
llah | +0.294 |
humans | +0.263 |
erity | +0.262 |
Neg logit contributions | |
kered | -0.330 |
Cly | -0.302 |
racted | -0.288 |
>>>>>>>> | -0.280 |
**************** | -0.270 |
Token | . |
Token ID | 13 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
icho | +0.308 |
Uri | +0.305 |
llah | +0.303 |
humans | +0.270 |
erity | +0.270 |
Neg logit contributions | |
kered | -0.360 |
Cly | -0.328 |
racted | -0.316 |
>>>>>>>> | -0.306 |
**************** | -0.295 |
Token | last |
Token ID | 938 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
kered | +0.148 |
Cly | +0.136 |
racted | +0.129 |
>>>>>>>> | +0.125 |
**************** | +0.122 |
Neg logit contributions | |
icho | -0.134 |
Uri | -0.132 |
llah | -0.132 |
humans | -0.119 |
erity | -0.119 |
Token | . |
Token ID | 13 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
kered | +0.396 |
Cly | +0.367 |
racted | +0.349 |
>>>>>>>> | +0.341 |
**************** | +0.334 |
Neg logit contributions | |
icho | -0.283 |
llah | -0.277 |
Uri | -0.275 |
erity | -0.246 |
humans | -0.244 |
Token |
|
Token ID | 198 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
kered | +0.195 |
Cly | +0.180 |
racted | +0.171 |
>>>>>>>> | +0.167 |
**************** | +0.162 |
Neg logit contributions | |
icho | -0.163 |
llah | -0.160 |
Uri | -0.159 |
erity | -0.143 |
humans | -0.143 |
Token |
|
Token ID | 198 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
kered | +0.154 |
Cly | +0.141 |
racted | +0.134 |
>>>>>>>> | +0.130 |
**************** | +0.125 |
Neg logit contributions | |
icho | -0.157 |
llah | -0.155 |
Uri | -0.155 |
erity | -0.139 |
humans | -0.139 |
Token | Article |
Token ID | 14906 |
Feature activation | -9.88e-01 |
Pos logit contributions | |
kered | +0.152 |
Cly | +0.136 |
racted | +0.128 |
>>>>>>>> | +0.123 |
**************** | +0.118 |
Neg logit contributions | |
icho | -0.212 |
Uri | -0.210 |
llah | -0.210 |
erity | -0.192 |
humans | -0.192 |
Token | Continued |
Token ID | 22168 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
icho | +0.605 |
Uri | +0.598 |
llah | +0.596 |
humans | +0.526 |
erity | +0.526 |
Neg logit contributions | |
kered | -0.802 |
Cly | -0.737 |
racted | -0.708 |
>>>>>>>> | -0.688 |
★★ | -0.667 |
Token | Below |
Token ID | 10383 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
icho | +1.803 |
Uri | +1.797 |
llah | +1.782 |
humans | +1.590 |
alon | +1.572 |
Neg logit contributions | |
kered | -2.107 |
Cly | -1.897 |
racted | -1.837 |
>>>>>>>> | -1.777 |
★★ | -1.718 |
Token |
|
Token ID | 198 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
icho | +1.149 |
Uri | +1.149 |
llah | +1.135 |
humans | +1.023 |
erity | +1.009 |
Neg logit contributions | |
kered | -1.271 |
Cly | -1.145 |
racted | -1.108 |
>>>>>>>> | -1.066 |
★★ | -1.029 |
Token |
|
Token ID | 198 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
icho | +0.075 |
llah | +0.074 |
Uri | +0.074 |
erity | +0.067 |
humans | +0.067 |
Neg logit contributions | |
kered | -0.074 |
Cly | -0.067 |
racted | -0.064 |
>>>>>>>> | -0.062 |
**************** | -0.060 |
Token | T |
Token ID | 51 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
kered | +0.028 |
Cly | +0.026 |
racted | +0.025 |
>>>>>>>> | +0.024 |
**************** | +0.023 |
Neg logit contributions | |
icho | -0.027 |
Uri | -0.027 |
llah | -0.027 |
erity | -0.024 |
humans | -0.024 |
Token | od |
Token ID | 375 |
Feature activation | -1.97e-01 |
Pos logit contributions | |
kered | +0.162 |
Cly | +0.149 |
racted | +0.143 |
>>>>>>>> | +0.139 |
★★ | +0.135 |
Neg logit contributions | |
icho | -0.124 |
Uri | -0.122 |
llah | -0.122 |
humans | -0.108 |
erity | -0.108 |
Token | founder |
Token ID | 9119 |
Feature activation | -8.65e-01 |
Pos logit contributions | |
icho | +0.832 |
Uri | +0.824 |
llah | +0.821 |
humans | +0.737 |
erity | +0.735 |
Neg logit contributions | |
kered | -0.872 |
Cly | -0.790 |
racted | -0.758 |
>>>>>>>> | -0.735 |
★★ | -0.708 |
Token | Rev |
Token ID | 5416 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
icho | +0.608 |
Uri | +0.605 |
llah | +0.600 |
humans | +0.539 |
erity | +0.539 |
Neg logit contributions | |
kered | -0.624 |
Cly | -0.564 |
racted | -0.542 |
>>>>>>>> | -0.525 |
★★ | -0.506 |
Token | . |
Token ID | 13 |
Feature activation | -5.36e-02 |
Pos logit contributions | |
icho | +0.310 |
Uri | +0.306 |
llah | +0.306 |
erity | +0.273 |
humans | +0.273 |
Neg logit contributions | |
kered | -0.354 |
Cly | -0.324 |
racted | -0.310 |
>>>>>>>> | -0.299 |
**************** | -0.290 |
Token | Ted |
Token ID | 11396 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
icho | +0.040 |
llah | +0.039 |
Uri | +0.039 |
erity | +0.035 |
humans | +0.035 |
Neg logit contributions | |
kered | -0.037 |
Cly | -0.034 |
racted | -0.032 |
>>>>>>>> | -0.031 |
**************** | -0.030 |
Token | H |
Token ID | 367 |
Feature activation | -8.77e-01 |
Pos logit contributions | |
kered | +0.339 |
Cly | +0.310 |
racted | +0.292 |
>>>>>>>> | +0.282 |
**************** | +0.272 |
Neg logit contributions | |
icho | -0.352 |
llah | -0.348 |
Uri | -0.346 |
humans | -0.314 |
erity | -0.313 |
Token | agg |
Token ID | 9460 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
icho | +0.619 |
llah | +0.609 |
Uri | +0.608 |
humans | +0.545 |
erity | +0.544 |
Neg logit contributions | |
kered | -0.633 |
Cly | -0.575 |
racted | -0.548 |
>>>>>>>> | -0.534 |
★★ | -0.515 |
Token | ard |
Token ID | 446 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
icho | +2.159 |
llah | +2.116 |
Uri | +2.116 |
alon | +1.936 |
humans | +1.932 |
Neg logit contributions | |
kered | -1.742 |
Cly | -1.550 |
racted | -1.476 |
>>>>>>>> | -1.445 |
★★ | -1.380 |
Token | is |
Token ID | 318 |
Feature activation | -6.22e-02 |
Pos logit contributions | |
icho | +1.080 |
Uri | +1.071 |
llah | +1.065 |
humans | +0.949 |
erity | +0.948 |
Neg logit contributions | |
kered | -1.190 |
Cly | -1.078 |
racted | -1.043 |
>>>>>>>> | -1.010 |
★★ | -0.978 |
Token | prof |
Token ID | 1534 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
icho | +0.041 |
llah | +0.040 |
Uri | +0.040 |
erity | +0.036 |
humans | +0.036 |
Neg logit contributions | |
kered | -0.048 |
Cly | -0.044 |
racted | -0.042 |
>>>>>>>> | -0.041 |
**************** | -0.040 |
Token | iled |
Token ID | 3902 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
kered | +0.313 |
Cly | +0.278 |
racted | +0.263 |
>>>>>>>> | +0.251 |
**************** | +0.240 |
Neg logit contributions | |
icho | -0.450 |
Uri | -0.446 |
llah | -0.445 |
humans | -0.408 |
erity | -0.407 |
Token | in |
Token ID | 287 |
Feature activation | +4.77e-02 |
Pos logit contributions | |
kered | +0.731 |
Cly | +0.671 |
racted | +0.638 |
>>>>>>>> | +0.620 |
**************** | +0.603 |
Neg logit contributions | |
icho | -0.612 |
llah | -0.604 |
Uri | -0.602 |
erity | -0.537 |
humans | -0.537 |
Token | . |
Token ID | 13 |
Feature activation | +4.54e-01 |
Pos logit contributions | |
icho | +0.275 |
Uri | +0.271 |
llah | +0.270 |
humans | +0.238 |
erity | +0.237 |
Neg logit contributions | |
kered | -0.392 |
Cly | -0.359 |
racted | -0.343 |
>>>>>>>> | -0.338 |
Changes | -0.326 |
Token |
|
Token ID | 198 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
kered | +0.338 |
Cly | +0.311 |
racted | +0.296 |
>>>>>>>> | +0.288 |
**************** | +0.279 |
Neg logit contributions | |
icho | -0.308 |
llah | -0.304 |
Uri | -0.303 |
erity | -0.272 |
humans | -0.272 |
Token |
|
Token ID | 198 |
Feature activation | +3.74e-02 |
Pos logit contributions | |
kered | +0.153 |
Cly | +0.139 |
racted | +0.133 |
>>>>>>>> | +0.128 |
**************** | +0.124 |
Neg logit contributions | |
icho | -0.151 |
Uri | -0.149 |
llah | -0.149 |
erity | -0.134 |
humans | -0.134 |
Token | 6 |
Token ID | 21 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
kered | +0.027 |
Cly | +0.024 |
racted | +0.023 |
>>>>>>>> | +0.022 |
★★ | +0.021 |
Neg logit contributions | |
icho | -0.027 |
llah | -0.026 |
Uri | -0.026 |
humans | -0.024 |
erity | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
icho | +0.016 |
llah | +0.015 |
Uri | +0.015 |
erity | +0.014 |
humans | +0.014 |
Neg logit contributions | |
kered | -0.016 |
Cly | -0.015 |
racted | -0.014 |
>>>>>>>> | -0.013 |
**************** | -0.013 |
Token | Place |
Token ID | 8474 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
kered | +0.198 |
Cly | +0.183 |
racted | +0.175 |
>>>>>>>> | +0.170 |
**************** | +0.165 |
Neg logit contributions | |
icho | -0.157 |
llah | -0.155 |
Uri | -0.154 |
erity | -0.137 |
humans | -0.137 |
Token | the |
Token ID | 262 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
icho | +1.500 |
Uri | +1.478 |
llah | +1.468 |
humans | +1.279 |
alon | +1.278 |
Neg logit contributions | |
kered | -2.376 |
Cly | -2.185 |
racted | -2.110 |
>>>>>>>> | -2.071 |
Changes | -2.008 |
Token | pot |
Token ID | 1787 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
icho | +0.268 |
Uri | +0.265 |
llah | +0.264 |
humans | +0.236 |
erity | +0.236 |
Neg logit contributions | |
kered | -0.288 |
Cly | -0.262 |
racted | -0.251 |
>>>>>>>> | -0.243 |
★★ | -0.235 |
Token | with |
Token ID | 351 |
Feature activation | -1.97e-01 |
Pos logit contributions | |
kered | +0.255 |
Cly | +0.233 |
racted | +0.223 |
>>>>>>>> | +0.217 |
★★ | +0.209 |
Neg logit contributions | |
icho | -0.221 |
Uri | -0.219 |
llah | -0.218 |
humans | -0.195 |
erity | -0.195 |
Token | all |
Token ID | 477 |
Feature activation | -5.49e-03 |
Pos logit contributions | |
icho | +0.108 |
Uri | +0.107 |
llah | +0.106 |
erity | +0.093 |
humans | +0.092 |
Neg logit contributions | |
kered | -0.173 |
Cly | -0.160 |
racted | -0.154 |
>>>>>>>> | -0.150 |
**************** | -0.146 |
Token | the |
Token ID | 262 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
icho | +0.003 |
llah | +0.003 |
Uri | +0.003 |
erity | +0.003 |
humans | +0.003 |
Neg logit contributions | |
kered | -0.005 |
Cly | -0.004 |
racted | -0.004 |
>>>>>>>> | -0.004 |
**************** | -0.004 |
Token | craft |
Token ID | 5977 |
Feature activation | +7.52e-01 |
Pos logit contributions | |
icho | +0.685 |
Uri | +0.677 |
llah | +0.676 |
humans | +0.604 |
erity | +0.603 |
Neg logit contributions | |
kered | -0.772 |
Cly | -0.705 |
racted | -0.675 |
>>>>>>>> | -0.655 |
★★ | -0.632 |
Token | . |
Token ID | 13 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
kered | +0.552 |
Cly | +0.505 |
racted | +0.482 |
>>>>>>>> | +0.463 |
★★ | +0.450 |
Neg logit contributions | |
icho | -0.522 |
llah | -0.513 |
Uri | -0.512 |
erity | -0.460 |
humans | -0.458 |
Token | They |
Token ID | 1119 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
icho | +0.096 |
llah | +0.095 |
Uri | +0.094 |
erity | +0.083 |
humans | +0.083 |
Neg logit contributions | |
kered | -0.131 |
Cly | -0.122 |
racted | -0.116 |
>>>>>>>> | -0.113 |
★★ | -0.110 |
Token | can |
Token ID | 460 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
icho | +0.009 |
Uri | +0.009 |
llah | +0.009 |
humans | +0.008 |
erity | +0.008 |
Neg logit contributions | |
kered | -0.011 |
Cly | -0.010 |
racted | -0.009 |
>>>>>>>> | -0.009 |
★★ | -0.009 |
Token | go |
Token ID | 467 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
icho | +0.123 |
Uri | +0.122 |
llah | +0.122 |
humans | +0.109 |
erity | +0.109 |
Neg logit contributions | |
kered | -0.133 |
Cly | -0.121 |
racted | -0.116 |
>>>>>>>> | -0.113 |
★★ | -0.109 |
Token | round |
Token ID | 2835 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
icho | +0.317 |
Uri | +0.313 |
llah | +0.312 |
humans | +0.278 |
erity | +0.278 |
Neg logit contributions | |
kered | -0.371 |
Cly | -0.340 |
racted | -0.325 |
>>>>>>>> | -0.316 |
★★ | -0.305 |
Token | and |
Token ID | 290 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
icho | +1.776 |
Uri | +1.761 |
llah | +1.738 |
humans | +1.573 |
erity | +1.552 |
Neg logit contributions | |
kered | -2.076 |
Cly | -1.907 |
racted | -1.818 |
>>>>>>>> | -1.795 |
★★ | -1.723 |
Token | put |
Token ID | 1234 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
icho | +0.844 |
Uri | +0.836 |
llah | +0.832 |
erity | +0.754 |
humans | +0.754 |
Neg logit contributions | |
kered | -0.745 |
Cly | -0.672 |
racted | -0.640 |
>>>>>>>> | -0.619 |
★★ | -0.593 |
Token | in |
Token ID | 287 |
Feature activation | +2.85e-02 |
Pos logit contributions | |
icho | +0.642 |
Uri | +0.635 |
llah | +0.631 |
humans | +0.564 |
erity | +0.561 |
Neg logit contributions | |
kered | -0.776 |
Cly | -0.710 |
racted | -0.682 |
>>>>>>>> | -0.665 |
★★ | -0.642 |
Token | a |
Token ID | 257 |
Feature activation | -6.90e-01 |
Pos logit contributions | |
kered | +0.023 |
Cly | +0.021 |
racted | +0.020 |
>>>>>>>> | +0.020 |
★★ | +0.019 |
Neg logit contributions | |
icho | -0.018 |
llah | -0.017 |
Uri | -0.017 |
erity | -0.015 |
humans | -0.015 |
Token | good |
Token ID | 922 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
icho | +0.379 |
llah | +0.374 |
Uri | +0.373 |
erity | +0.325 |
humans | +0.325 |
Neg logit contributions | |
kered | -0.605 |
Cly | -0.559 |
racted | -0.538 |
>>>>>>>> | -0.525 |
★★ | -0.510 |
Token | considered |
Token ID | 3177 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
kered | +0.717 |
Cly | +0.666 |
racted | +0.634 |
>>>>>>>> | +0.616 |
**************** | +0.597 |
Neg logit contributions | |
icho | -0.538 |
llah | -0.531 |
Uri | -0.526 |
erity | -0.469 |
humans | -0.465 |
Token | one |
Token ID | 530 |
Feature activation | -3.87e-01 |
Pos logit contributions | |
kered | +0.419 |
Cly | +0.385 |
racted | +0.367 |
>>>>>>>> | +0.355 |
★★ | +0.344 |
Neg logit contributions | |
icho | -0.365 |
llah | -0.362 |
Uri | -0.360 |
erity | -0.322 |
humans | -0.321 |
Token | of |
Token ID | 286 |
Feature activation | +6.80e-02 |
Pos logit contributions | |
icho | +0.231 |
Uri | +0.228 |
llah | +0.227 |
humans | +0.200 |
erity | +0.200 |
Neg logit contributions | |
kered | -0.320 |
Cly | -0.294 |
racted | -0.283 |
>>>>>>>> | -0.276 |
**************** | -0.267 |
Token | the |
Token ID | 262 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
kered | +0.059 |
Cly | +0.054 |
racted | +0.052 |
>>>>>>>> | +0.051 |
★★ | +0.049 |
Neg logit contributions | |
icho | -0.038 |
llah | -0.038 |
Uri | -0.038 |
erity | -0.033 |
humans | -0.033 |
Token | main |
Token ID | 1388 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
icho | +0.240 |
llah | +0.237 |
Uri | +0.236 |
erity | +0.211 |
humans | +0.211 |
Neg logit contributions | |
kered | -0.281 |
Cly | -0.258 |
racted | -0.247 |
>>>>>>>> | -0.239 |
★★ | -0.231 |
Token | characters |
Token ID | 3435 |
Feature activation | -2.72e+00 |
Pos logit contributions | |
kered | +0.085 |
Cly | +0.077 |
racted | +0.074 |
>>>>>>>> | +0.071 |
**************** | +0.069 |
Neg logit contributions | |
icho | -0.083 |
Uri | -0.082 |
llah | -0.082 |
erity | -0.074 |
humans | -0.074 |
Token | , |
Token ID | 11 |
Feature activation | -5.62e-01 |
Pos logit contributions | |
icho | +1.693 |
Uri | +1.686 |
llah | +1.650 |
humans | +1.478 |
erity | +1.476 |
Neg logit contributions | |
kered | -2.153 |
Cly | -1.959 |
racted | -1.901 |
>>>>>>>> | -1.847 |
★★ | -1.795 |
Token | he |
Token ID | 339 |
Feature activation | -7.94e-01 |
Pos logit contributions | |
icho | +0.345 |
Uri | +0.341 |
llah | +0.340 |
humans | +0.300 |
erity | +0.300 |
Neg logit contributions | |
kered | -0.456 |
Cly | -0.419 |
racted | -0.402 |
>>>>>>>> | -0.391 |
★★ | -0.379 |
Token | rarely |
Token ID | 8365 |
Feature activation | -6.90e-02 |
Pos logit contributions | |
icho | +0.548 |
Uri | +0.544 |
llah | +0.540 |
humans | +0.486 |
erity | +0.484 |
Neg logit contributions | |
kered | -0.580 |
Cly | -0.527 |
racted | -0.506 |
>>>>>>>> | -0.491 |
★★ | -0.475 |
Token | interacted |
Token ID | 49236 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
icho | +0.046 |
Uri | +0.045 |
llah | +0.045 |
humans | +0.040 |
erity | +0.040 |
Neg logit contributions | |
kered | -0.053 |
Cly | -0.048 |
racted | -0.046 |
>>>>>>>> | -0.045 |
★★ | -0.043 |
Token | with |
Token ID | 351 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
kered | +0.186 |
Cly | +0.172 |
racted | +0.166 |
>>>>>>>> | +0.162 |
**************** | +0.157 |
Neg logit contributions | |
icho | -0.117 |
Uri | -0.115 |
llah | -0.115 |
erity | -0.100 |
humans | -0.100 |
Token | as |
Token ID | 355 |
Feature activation | +6.64e-01 |
Pos logit contributions | |
kered | +0.101 |
Cly | +0.092 |
racted | +0.088 |
>>>>>>>> | +0.085 |
★★ | +0.082 |
Neg logit contributions | |
icho | -0.102 |
Uri | -0.101 |
llah | -0.101 |
humans | -0.091 |
erity | -0.091 |
Token | light |
Token ID | 1657 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
kered | +0.516 |
Cly | +0.473 |
racted | +0.452 |
>>>>>>>> | +0.438 |
**************** | +0.425 |
Neg logit contributions | |
icho | -0.430 |
Uri | -0.425 |
llah | -0.424 |
erity | -0.377 |
humans | -0.377 |
Token | as |
Token ID | 355 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
kered | +0.427 |
Cly | +0.387 |
racted | +0.369 |
>>>>>>>> | +0.358 |
★★ | +0.344 |
Neg logit contributions | |
icho | -0.454 |
Uri | -0.448 |
llah | -0.448 |
humans | -0.404 |
erity | -0.404 |
Token | possible |
Token ID | 1744 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
kered | +0.430 |
Cly | +0.384 |
racted | +0.363 |
>>>>>>>> | +0.349 |
**************** | +0.334 |
Neg logit contributions | |
icho | -0.569 |
Uri | -0.563 |
llah | -0.563 |
erity | -0.513 |
humans | -0.513 |
Token | . |
Token ID | 13 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
kered | +0.391 |
Cly | +0.356 |
racted | +0.340 |
>>>>>>>> | +0.331 |
★★ | +0.319 |
Neg logit contributions | |
icho | -0.369 |
Uri | -0.366 |
llah | -0.366 |
humans | -0.328 |
erity | -0.327 |
Token |
|
Token ID | 198 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
kered | +0.300 |
Cly | +0.277 |
racted | +0.264 |
>>>>>>>> | +0.257 |
**************** | +0.249 |
Neg logit contributions | |
icho | -0.246 |
llah | -0.243 |
Uri | -0.242 |
erity | -0.215 |
humans | -0.215 |
Token |
|
Token ID | 198 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
kered | +1.016 |
Cly | +0.928 |
racted | +0.877 |
>>>>>>>> | +0.855 |
**************** | +0.832 |
Neg logit contributions | |
icho | -1.086 |
llah | -1.074 |
Uri | -1.067 |
challeng | -0.988 |
erity | -0.972 |
Token | At |
Token ID | 2953 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
kered | +0.836 |
Cly | +0.760 |
racted | +0.725 |
>>>>>>>> | +0.704 |
**************** | +0.681 |
Neg logit contributions | |
icho | -0.856 |
Uri | -0.847 |
llah | -0.845 |
erity | -0.761 |
humans | -0.758 |
Token | the |
Token ID | 262 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
kered | +0.089 |
Cly | +0.082 |
racted | +0.079 |
>>>>>>>> | +0.077 |
**************** | +0.074 |
Neg logit contributions | |
icho | -0.064 |
Uri | -0.063 |
llah | -0.063 |
humans | -0.055 |
erity | -0.055 |
Token | same |
Token ID | 976 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
kered | +0.269 |
Cly | +0.249 |
racted | +0.239 |
>>>>>>>> | +0.232 |
**************** | +0.225 |
Neg logit contributions | |
icho | -0.194 |
Uri | -0.190 |
llah | -0.190 |
humans | -0.168 |
erity | -0.167 |
Token | time |
Token ID | 640 |
Feature activation | +2.46e-03 |
Pos logit contributions | |
icho | +0.092 |
Uri | +0.090 |
llah | +0.090 |
humans | +0.076 |
erity | +0.076 |
Neg logit contributions | |
kered | -0.186 |
Cly | -0.173 |
racted | -0.168 |
>>>>>>>> | -0.164 |
**************** | -0.160 |
Token | much |
Token ID | 881 |
Feature activation | +3.09e-01 |
Pos logit contributions | |
kered | +0.305 |
Cly | +0.279 |
racted | +0.266 |
>>>>>>>> | +0.258 |
**************** | +0.250 |
Neg logit contributions | |
icho | -0.274 |
Uri | -0.271 |
llah | -0.270 |
humans | -0.242 |
erity | -0.241 |
Token | happier |
Token ID | 23030 |
Feature activation | +5.08e-01 |
Pos logit contributions | |
kered | +0.239 |
Cly | +0.219 |
racted | +0.210 |
>>>>>>>> | +0.204 |
**************** | +0.198 |
Neg logit contributions | |
icho | -0.201 |
Uri | -0.198 |
llah | -0.198 |
humans | -0.177 |
erity | -0.175 |
Token | for |
Token ID | 329 |
Feature activation | +9.99e-01 |
Pos logit contributions | |
kered | +0.395 |
Cly | +0.361 |
racted | +0.346 |
>>>>>>>> | +0.337 |
**************** | +0.326 |
Neg logit contributions | |
icho | -0.329 |
Uri | -0.325 |
llah | -0.324 |
humans | -0.288 |
erity | -0.288 |
Token | it |
Token ID | 340 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
kered | +0.832 |
Cly | +0.771 |
racted | +0.741 |
>>>>>>>> | +0.722 |
**************** | +0.700 |
Neg logit contributions | |
icho | -0.587 |
llah | -0.580 |
Uri | -0.577 |
humans | -0.508 |
erity | -0.506 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
kered | +0.313 |
Cly | +0.285 |
racted | +0.273 |
>>>>>>>> | +0.264 |
★★ | +0.255 |
Neg logit contributions | |
icho | -0.293 |
Uri | -0.290 |
llah | -0.289 |
humans | -0.259 |
erity | -0.259 |
Token | � |
Token ID | 126 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
kered | +0.133 |
Cly | +0.122 |
racted | +0.115 |
>>>>>>>> | +0.112 |
**************** | +0.108 |
Neg logit contributions | |
icho | -0.144 |
llah | -0.142 |
Uri | -0.142 |
humans | -0.129 |
erity | -0.128 |
Token | � |
Token ID | 242 |
Feature activation | +4.07e-01 |
Pos logit contributions | |
kered | +1.109 |
Cly | +1.009 |
racted | +0.968 |
>>>>>>>> | +0.941 |
★★ | +0.913 |
Neg logit contributions | |
icho | -1.022 |
llah | -1.007 |
Uri | -1.007 |
humans | -0.908 |
okia | -0.900 |
Token |
|
Token ID | 198 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
kered | +0.296 |
Cly | +0.271 |
racted | +0.258 |
>>>>>>>> | +0.251 |
★★ | +0.242 |
Neg logit contributions | |
icho | -0.282 |
llah | -0.278 |
Uri | -0.278 |
humans | -0.250 |
erity | -0.250 |
Token |
|
Token ID | 198 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
icho | +0.102 |
Uri | +0.101 |
llah | +0.101 |
humans | +0.091 |
erity | +0.091 |
Neg logit contributions | |
kered | -0.104 |
Cly | -0.095 |
racted | -0.091 |
>>>>>>>> | -0.088 |
★★ | -0.084 |
Token | Perhaps |
Token ID | 13710 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
icho | +0.157 |
Uri | +0.155 |
llah | +0.155 |
humans | +0.139 |
erity | +0.139 |
Neg logit contributions | |
kered | -0.161 |
Cly | -0.146 |
racted | -0.139 |
>>>>>>>> | -0.135 |
★★ | -0.130 |
Token | the |
Token ID | 262 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
kered | +0.409 |
Cly | +0.378 |
racted | +0.361 |
>>>>>>>> | +0.352 |
★★ | +0.341 |
Neg logit contributions | |
icho | -0.314 |
llah | -0.311 |
Uri | -0.309 |
humans | -0.275 |
erity | -0.274 |
Token | looks |
Token ID | 3073 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
icho | +0.507 |
Uri | +0.503 |
llah | +0.499 |
humans | +0.449 |
erity | +0.448 |
Neg logit contributions | |
kered | -0.546 |
Cly | -0.497 |
racted | -0.478 |
>>>>>>>> | -0.462 |
★★ | -0.445 |
Token | forward |
Token ID | 2651 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
kered | +0.249 |
Cly | +0.227 |
racted | +0.217 |
>>>>>>>> | +0.210 |
★★ | +0.204 |
Neg logit contributions | |
icho | -0.222 |
llah | -0.219 |
Uri | -0.219 |
humans | -0.196 |
erity | -0.195 |
Token | to |
Token ID | 284 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
kered | +0.129 |
Cly | +0.119 |
racted | +0.114 |
>>>>>>>> | +0.111 |
★★ | +0.108 |
Neg logit contributions | |
icho | -0.095 |
llah | -0.094 |
Uri | -0.094 |
humans | -0.083 |
erity | -0.083 |
Token | 2017 |
Token ID | 2177 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
kered | +0.214 |
Cly | +0.197 |
racted | +0.188 |
>>>>>>>> | +0.183 |
**************** | +0.178 |
Neg logit contributions | |
icho | -0.165 |
llah | -0.163 |
Uri | -0.162 |
erity | -0.144 |
humans | -0.143 |
Token | and |
Token ID | 290 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
kered | +0.208 |
Cly | +0.190 |
racted | +0.183 |
>>>>>>>> | +0.177 |
**************** | +0.171 |
Neg logit contributions | |
icho | -0.173 |
Uri | -0.170 |
llah | -0.170 |
humans | -0.151 |
erity | -0.151 |
Token | beyond |
Token ID | 3675 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
kered | +0.376 |
Cly | +0.343 |
racted | +0.326 |
>>>>>>>> | +0.317 |
**************** | +0.306 |
Neg logit contributions | |
icho | -0.351 |
llah | -0.346 |
Uri | -0.345 |
erity | -0.310 |
humans | -0.309 |
Token | . |
Token ID | 13 |
Feature activation | +2.28e-03 |
Pos logit contributions | |
kered | +1.590 |
Cly | +1.455 |
racted | +1.387 |
>>>>>>>> | +1.342 |
**************** | +1.304 |
Neg logit contributions | |
icho | -1.523 |
Uri | -1.505 |
llah | -1.497 |
erity | -1.350 |
humans | -1.342 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
kered | +0.002 |
Cly | +0.001 |
racted | +0.001 |
>>>>>>>> | +0.001 |
**************** | +0.001 |
Neg logit contributions | |
icho | -0.002 |
Uri | -0.002 |
llah | -0.002 |
humans | -0.001 |
erity | -0.001 |
Token | G |
Token ID | 38 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
kered | +0.155 |
Cly | +0.140 |
racted | +0.134 |
>>>>>>>> | +0.129 |
★★ | +0.124 |
Neg logit contributions | |
icho | -0.168 |
Uri | -0.166 |
llah | -0.166 |
erity | -0.150 |
humans | -0.150 |
Token | RAY |
Token ID | 30631 |
Feature activation | -5.50e-01 |
Pos logit contributions | |
kered | +0.296 |
Cly | +0.271 |
racted | +0.260 |
>>>>>>>> | +0.252 |
**************** | +0.244 |
Neg logit contributions | |
icho | -0.244 |
Uri | -0.242 |
llah | -0.241 |
humans | -0.214 |
erity | -0.214 |
Token | SON |
Token ID | 11782 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
icho | +0.420 |
Uri | +0.416 |
llah | +0.415 |
humans | +0.376 |
erity | +0.376 |
Neg logit contributions | |
kered | -0.364 |
Cly | -0.327 |
racted | -0.312 |
>>>>>>>> | -0.300 |
**************** | -0.288 |
Token | the |
Token ID | 262 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
icho | +0.152 |
Uri | +0.151 |
llah | +0.150 |
humans | +0.133 |
erity | +0.133 |
Neg logit contributions | |
kered | -0.194 |
Cly | -0.177 |
racted | -0.171 |
>>>>>>>> | -0.166 |
**************** | -0.161 |
Token | 31 |
Token ID | 3261 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
icho | +0.219 |
Uri | +0.217 |
llah | +0.216 |
humans | +0.194 |
erity | +0.194 |
Neg logit contributions | |
kered | -0.228 |
Cly | -0.207 |
racted | -0.198 |
>>>>>>>> | -0.192 |
★★ | -0.185 |
Token | - |
Token ID | 12 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
icho | +0.286 |
Uri | +0.284 |
llah | +0.282 |
erity | +0.259 |
humans | +0.258 |
Neg logit contributions | |
kered | -0.219 |
Cly | -0.195 |
racted | -0.184 |
>>>>>>>> | -0.178 |
**************** | -0.171 |
Token | year |
Token ID | 1941 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
kered | +0.092 |
Cly | +0.084 |
racted | +0.081 |
>>>>>>>> | +0.078 |
**************** | +0.076 |
Neg logit contributions | |
icho | -0.082 |
Uri | -0.081 |
llah | -0.081 |
erity | -0.072 |
humans | -0.072 |
Token | - |
Token ID | 12 |
Feature activation | -5.15e-01 |
Pos logit contributions | |
icho | +0.129 |
Uri | +0.129 |
llah | +0.127 |
humans | +0.116 |
erity | +0.116 |
Neg logit contributions | |
kered | -0.099 |
Cly | -0.088 |
racted | -0.084 |
>>>>>>>> | -0.080 |
**************** | -0.078 |
Token | old |
Token ID | 727 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
icho | +0.344 |
Uri | +0.340 |
llah | +0.339 |
humans | +0.305 |
erity | +0.303 |
Neg logit contributions | |
kered | -0.389 |
Cly | -0.355 |
racted | -0.340 |
>>>>>>>> | -0.329 |
★★ | -0.318 |
Token | left |
Token ID | 1364 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
kered | +1.159 |
Cly | +1.063 |
racted | +1.005 |
>>>>>>>> | +0.978 |
★★ | +0.942 |
Neg logit contributions | |
icho | -1.129 |
llah | -1.116 |
Uri | -1.103 |
humans | -1.000 |
erity | -0.999 |
Token | guard |
Token ID | 4860 |
Feature activation | -5.42e-01 |
Pos logit contributions | |
icho | +0.168 |
Uri | +0.167 |
llah | +0.167 |
humans | +0.152 |
erity | +0.152 |
Neg logit contributions | |
kered | -0.120 |
Cly | -0.107 |
racted | -0.101 |
>>>>>>>> | -0.097 |
★★ | -0.092 |
Token | is |
Token ID | 318 |
Feature activation | -9.63e-02 |
Pos logit contributions | |
icho | +0.373 |
Uri | +0.371 |
llah | +0.367 |
erity | +0.331 |
humans | +0.330 |
Neg logit contributions | |
kered | -0.397 |
Cly | -0.361 |
racted | -0.346 |
>>>>>>>> | -0.335 |
**************** | -0.323 |
Token | quietly |
Token ID | 12703 |
Feature activation | -8.41e-01 |
Pos logit contributions | |
icho | +0.067 |
llah | +0.067 |
Uri | +0.066 |
erity | +0.060 |
humans | +0.059 |
Neg logit contributions | |
kered | -0.070 |
Cly | -0.064 |
racted | -0.061 |
>>>>>>>> | -0.059 |
★★ | -0.057 |
Token | one |
Token ID | 530 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
icho | +0.551 |
llah | +0.545 |
Uri | +0.543 |
erity | +0.485 |
humans | +0.484 |
Neg logit contributions | |
kered | -0.649 |
Cly | -0.594 |
racted | -0.567 |
>>>>>>>> | -0.550 |
★★ | -0.534 |
Token | breakers |
Token ID | 49295 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
kered | +0.130 |
Cly | +0.117 |
racted | +0.111 |
>>>>>>>> | +0.107 |
★★ | +0.103 |
Neg logit contributions | |
icho | -0.146 |
Uri | -0.144 |
llah | -0.144 |
humans | -0.131 |
erity | -0.130 |
Token | and |
Token ID | 290 |
Feature activation | +3.39e-01 |
Pos logit contributions | |
kered | +1.096 |
Cly | +1.006 |
racted | +0.958 |
>>>>>>>> | +0.931 |
**************** | +0.900 |
Neg logit contributions | |
icho | -0.980 |
llah | -0.969 |
Uri | -0.967 |
humans | -0.868 |
erity | -0.868 |
Token | a |
Token ID | 257 |
Feature activation | +6.89e-02 |
Pos logit contributions | |
kered | +0.239 |
Cly | +0.218 |
racted | +0.207 |
>>>>>>>> | +0.200 |
**************** | +0.193 |
Neg logit contributions | |
icho | -0.243 |
llah | -0.241 |
Uri | -0.240 |
erity | -0.217 |
humans | -0.217 |
Token | nuclear |
Token ID | 4523 |
Feature activation | -5.11e-01 |
Pos logit contributions | |
kered | +0.050 |
Cly | +0.045 |
racted | +0.043 |
>>>>>>>> | +0.042 |
★★ | +0.041 |
Neg logit contributions | |
icho | -0.048 |
Uri | -0.048 |
llah | -0.047 |
erity | -0.043 |
humans | -0.043 |
Token | fre |
Token ID | 2030 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
icho | +0.369 |
Uri | +0.364 |
llah | +0.363 |
erity | +0.327 |
humans | +0.326 |
Neg logit contributions | |
kered | -0.359 |
Cly | -0.324 |
racted | -0.310 |
>>>>>>>> | -0.300 |
Changes | -0.290 |
Token | ighter |
Token ID | 4799 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
icho | +0.674 |
llah | +0.665 |
Uri | +0.663 |
erity | +0.611 |
irit | +0.608 |
Neg logit contributions | |
kered | -0.424 |
Cly | -0.375 |
racted | -0.350 |
>>>>>>>> | -0.338 |
★★ | -0.322 |
Token | , |
Token ID | 11 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
kered | +1.099 |
Cly | +1.002 |
racted | +0.955 |
>>>>>>>> | +0.926 |
**************** | +0.893 |
Neg logit contributions | |
icho | -1.067 |
Uri | -1.054 |
llah | -1.053 |
humans | -0.948 |
erity | -0.947 |
Token | has |
Token ID | 468 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
kered | +0.103 |
Cly | +0.094 |
racted | +0.090 |
>>>>>>>> | +0.087 |
★★ | +0.084 |
Neg logit contributions | |
icho | -0.092 |
Uri | -0.091 |
llah | -0.090 |
humans | -0.081 |
erity | -0.081 |
Token | increased |
Token ID | 3220 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
icho | +0.172 |
llah | +0.170 |
Uri | +0.170 |
erity | +0.152 |
humans | +0.152 |
Neg logit contributions | |
kered | -0.187 |
Cly | -0.171 |
racted | -0.163 |
>>>>>>>> | -0.158 |
**************** | -0.153 |
Token | Arctic |
Token ID | 15723 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
icho | +0.214 |
Uri | +0.211 |
llah | +0.211 |
erity | +0.188 |
humans | +0.188 |
Neg logit contributions | |
kered | -0.254 |
Cly | -0.232 |
racted | -0.223 |
>>>>>>>> | -0.216 |
★★ | -0.209 |
Token | navigation |
Token ID | 16408 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
kered | +0.027 |
Cly | +0.025 |
racted | +0.024 |
>>>>>>>> | +0.023 |
**************** | +0.022 |
Neg logit contributions | |
icho | -0.023 |
Uri | -0.023 |
llah | -0.023 |
erity | -0.020 |
humans | -0.020 |
Token | � |
Token ID | 247 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
kered | +0.040 |
Cly | +0.036 |
racted | +0.034 |
>>>>>>>> | +0.033 |
★★ | +0.031 |
Neg logit contributions | |
icho | -0.051 |
Uri | -0.051 |
llah | -0.051 |
humans | -0.046 |
erity | -0.046 |
Token | t |
Token ID | 83 |
Feature activation | -5.40e-01 |
Pos logit contributions | |
icho | +0.084 |
Uri | +0.083 |
llah | +0.082 |
humans | +0.071 |
erity | +0.071 |
Neg logit contributions | |
kered | -0.137 |
Cly | -0.127 |
racted | -0.122 |
>>>>>>>> | -0.119 |
**************** | -0.116 |
Token | been |
Token ID | 587 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
icho | +0.377 |
Uri | +0.374 |
llah | +0.372 |
erity | +0.334 |
humans | +0.334 |
Neg logit contributions | |
kered | -0.391 |
Cly | -0.356 |
racted | -0.341 |
>>>>>>>> | -0.330 |
★★ | -0.319 |
Token | succeeding |
Token ID | 34195 |
Feature activation | -7.31e-01 |
Pos logit contributions | |
icho | +0.288 |
llah | +0.285 |
Uri | +0.283 |
erity | +0.254 |
humans | +0.254 |
Neg logit contributions | |
kered | -0.325 |
Cly | -0.297 |
racted | -0.284 |
>>>>>>>> | -0.275 |
**************** | -0.266 |
Token | that |
Token ID | 326 |
Feature activation | -7.46e-01 |
Pos logit contributions | |
icho | +0.489 |
Uri | +0.483 |
llah | +0.482 |
humans | +0.430 |
erity | +0.430 |
Neg logit contributions | |
kered | -0.553 |
Cly | -0.504 |
racted | -0.483 |
>>>>>>>> | -0.468 |
**************** | -0.452 |
Token | well |
Token ID | 880 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
icho | +0.487 |
llah | +0.480 |
Uri | +0.478 |
humans | +0.429 |
erity | +0.429 |
Neg logit contributions | |
kered | -0.578 |
Cly | -0.530 |
racted | -0.504 |
>>>>>>>> | -0.494 |
**************** | -0.476 |
Token | , |
Token ID | 11 |
Feature activation | +4.64e-01 |
Pos logit contributions | |
kered | +0.126 |
Cly | +0.115 |
racted | +0.110 |
>>>>>>>> | +0.106 |
**************** | +0.103 |
Neg logit contributions | |
icho | -0.120 |
llah | -0.119 |
Uri | -0.119 |
humans | -0.106 |
erity | -0.106 |
Token | although |
Token ID | 3584 |
Feature activation | +8.71e-01 |
Pos logit contributions | |
kered | +0.332 |
Cly | +0.303 |
racted | +0.286 |
>>>>>>>> | +0.279 |
**************** | +0.270 |
Neg logit contributions | |
icho | -0.330 |
llah | -0.325 |
Uri | -0.323 |
erity | -0.291 |
humans | -0.291 |
Token | this |
Token ID | 428 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
kered | +0.705 |
Cly | +0.653 |
racted | +0.620 |
>>>>>>>> | +0.607 |
**************** | +0.588 |
Neg logit contributions | |
icho | -0.540 |
llah | -0.533 |
Uri | -0.523 |
erity | -0.468 |
humans | -0.466 |
Token | isn |
Token ID | 2125 |
Feature activation | -3.15e-01 |
Pos logit contributions | |
kered | +0.821 |
Cly | +0.753 |
racted | +0.713 |
>>>>>>>> | +0.698 |
★★ | +0.674 |
Neg logit contributions | |
icho | -0.761 |
llah | -0.749 |
Uri | -0.742 |
humans | -0.670 |
erity | -0.669 |
Token | � |
Token ID | 447 |
Feature activation | +5.55e-01 |
Pos logit contributions | |
icho | +0.266 |
Uri | +0.264 |
llah | +0.263 |
humans | +0.241 |
erity | +0.241 |
Neg logit contributions | |
kered | -0.183 |
Cly | -0.162 |
racted | -0.153 |
>>>>>>>> | -0.146 |
★★ | -0.140 |
Token | , |
Token ID | 11 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
icho | +0.106 |
Uri | +0.105 |
llah | +0.105 |
erity | +0.094 |
humans | +0.094 |
Neg logit contributions | |
kered | -0.113 |
Cly | -0.102 |
racted | -0.098 |
>>>>>>>> | -0.095 |
★★ | -0.092 |
Token | essentially |
Token ID | 6986 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
kered | +0.024 |
Cly | +0.021 |
racted | +0.020 |
>>>>>>>> | +0.020 |
**************** | +0.019 |
Neg logit contributions | |
icho | -0.023 |
llah | -0.022 |
Uri | -0.022 |
humans | -0.020 |
erity | -0.020 |
Token | that |
Token ID | 326 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
icho | +0.144 |
llah | +0.143 |
Uri | +0.142 |
erity | +0.127 |
humans | +0.127 |
Neg logit contributions | |
kered | -0.171 |
Cly | -0.157 |
racted | -0.149 |
>>>>>>>> | -0.145 |
**************** | -0.141 |
Token | his |
Token ID | 465 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
kered | +0.160 |
Cly | +0.147 |
racted | +0.140 |
>>>>>>>> | +0.136 |
**************** | +0.132 |
Neg logit contributions | |
icho | -0.129 |
llah | -0.128 |
Uri | -0.126 |
erity | -0.113 |
humans | -0.113 |
Token | ends |
Token ID | 5645 |
Feature activation | +1.46e-02 |
Pos logit contributions | |
kered | +0.394 |
Cly | +0.360 |
racted | +0.341 |
>>>>>>>> | +0.332 |
**************** | +0.322 |
Neg logit contributions | |
icho | -0.366 |
llah | -0.361 |
Uri | -0.358 |
erity | -0.323 |
humans | -0.323 |
Token | justify |
Token ID | 12051 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
kered | +0.012 |
Cly | +0.011 |
racted | +0.010 |
>>>>>>>> | +0.010 |
**************** | +0.010 |
Neg logit contributions | |
icho | -0.009 |
Uri | -0.009 |
llah | -0.009 |
erity | -0.008 |
humans | -0.008 |
Token | his |
Token ID | 465 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
icho | +0.189 |
Uri | +0.187 |
llah | +0.187 |
humans | +0.165 |
erity | +0.164 |
Neg logit contributions | |
kered | -0.257 |
Cly | -0.236 |
racted | -0.227 |
>>>>>>>> | -0.221 |
★★ | -0.215 |
Token | means |
Token ID | 1724 |
Feature activation | -3.67e-02 |
Pos logit contributions | |
icho | +0.280 |
Uri | +0.274 |
llah | +0.273 |
erity | +0.237 |
humans | +0.235 |
Neg logit contributions | |
kered | -0.478 |
Cly | -0.445 |
racted | -0.427 |
>>>>>>>> | -0.419 |
**************** | -0.408 |
Token | , |
Token ID | 11 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
icho | +0.025 |
Uri | +0.025 |
llah | +0.025 |
erity | +0.022 |
humans | +0.022 |
Neg logit contributions | |
kered | -0.027 |
Cly | -0.025 |
racted | -0.024 |
>>>>>>>> | -0.023 |
★★ | -0.022 |
Token | not |
Token ID | 407 |
Feature activation | -5.14e-01 |
Pos logit contributions | |
kered | +0.200 |
Cly | +0.182 |
racted | +0.173 |
>>>>>>>> | +0.168 |
**************** | +0.162 |
Neg logit contributions | |
icho | -0.197 |
llah | -0.195 |
Uri | -0.194 |
humans | -0.175 |
erity | -0.175 |
Token | a |
Token ID | 257 |
Feature activation | +4.36e-02 |
Pos logit contributions | |
icho | +0.349 |
Uri | +0.345 |
llah | +0.344 |
erity | +0.308 |
humans | +0.308 |
Neg logit contributions | |
kered | -0.384 |
Cly | -0.350 |
racted | -0.335 |
>>>>>>>> | -0.325 |
★★ | -0.314 |
Token | figures |
Token ID | 5538 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
icho | +0.273 |
Uri | +0.269 |
llah | +0.269 |
humans | +0.240 |
erity | +0.239 |
Neg logit contributions | |
kered | -0.318 |
Cly | -0.291 |
racted | -0.278 |
>>>>>>>> | -0.270 |
**************** | -0.261 |
Token | couldn |
Token ID | 3521 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
kered | +0.310 |
Cly | +0.282 |
racted | +0.270 |
>>>>>>>> | +0.262 |
★★ | +0.253 |
Neg logit contributions | |
icho | -0.279 |
Uri | -0.276 |
llah | -0.275 |
humans | -0.246 |
erity | -0.246 |
Token | � |
Token ID | 447 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
icho | +0.137 |
Uri | +0.136 |
llah | +0.136 |
humans | +0.126 |
erity | +0.126 |
Neg logit contributions | |
kered | -0.071 |
Cly | -0.062 |
racted | -0.058 |
>>>>>>>> | -0.054 |
★★ | -0.051 |
Token | � |
Token ID | 247 |
Feature activation | -3.92e-01 |
Pos logit contributions | |
icho | +0.460 |
Uri | +0.455 |
llah | +0.455 |
erity | +0.411 |
humans | +0.411 |
Neg logit contributions | |
kered | -0.418 |
Cly | -0.378 |
racted | -0.359 |
>>>>>>>> | -0.347 |
**************** | -0.333 |
Token | t |
Token ID | 83 |
Feature activation | +6.52e-02 |
Pos logit contributions | |
icho | +0.207 |
Uri | +0.204 |
llah | +0.204 |
erity | +0.176 |
humans | +0.176 |
Neg logit contributions | |
kered | -0.351 |
Cly | -0.325 |
racted | -0.314 |
>>>>>>>> | -0.306 |
★★ | -0.297 |
Token | come |
Token ID | 1282 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
kered | +0.045 |
Cly | +0.041 |
racted | +0.039 |
>>>>>>>> | +0.038 |
★★ | +0.037 |
Neg logit contributions | |
icho | -0.047 |
Uri | -0.047 |
llah | -0.047 |
alon | -0.042 |
humans | -0.042 |
Token | at |
Token ID | 379 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
kered | +0.236 |
Cly | +0.215 |
racted | +0.206 |
>>>>>>>> | +0.200 |
**************** | +0.194 |
Neg logit contributions | |
icho | -0.203 |
llah | -0.201 |
Uri | -0.200 |
humans | -0.179 |
erity | -0.178 |
Token | a |
Token ID | 257 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
icho | +0.008 |
Uri | +0.008 |
llah | +0.008 |
humans | +0.007 |
erity | +0.007 |
Neg logit contributions | |
kered | -0.010 |
Cly | -0.009 |
racted | -0.009 |
>>>>>>>> | -0.008 |
★★ | -0.008 |
Token | worse |
Token ID | 4785 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
kered | +0.332 |
Cly | +0.304 |
racted | +0.291 |
>>>>>>>> | +0.286 |
★★ | +0.276 |
Neg logit contributions | |
icho | -0.252 |
llah | -0.248 |
Uri | -0.247 |
humans | -0.220 |
ixel | -0.218 |
Token | time |
Token ID | 640 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
kered | +0.384 |
Cly | +0.357 |
racted | +0.345 |
>>>>>>>> | +0.337 |
★★ | +0.328 |
Neg logit contributions | |
icho | -0.195 |
llah | -0.192 |
Uri | -0.191 |
humans | -0.163 |
erity | -0.162 |
Token | as |
Token ID | 355 |
Feature activation | +2.72e-01 |
Pos logit contributions | |
icho | +0.345 |
Uri | +0.341 |
llah | +0.339 |
humans | +0.301 |
erity | +0.301 |
Neg logit contributions | |
kered | -0.435 |
Cly | -0.399 |
racted | -0.384 |
>>>>>>>> | -0.371 |
★★ | -0.359 |
Token | 2 |
Token ID | 17 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
kered | +0.199 |
Cly | +0.181 |
racted | +0.173 |
>>>>>>>> | +0.167 |
**************** | +0.162 |
Neg logit contributions | |
icho | -0.193 |
llah | -0.192 |
Uri | -0.192 |
erity | -0.172 |
humans | -0.172 |
Token | smartphone |
Token ID | 11745 |
Feature activation | +7.43e-02 |
Pos logit contributions | |
icho | +1.364 |
Uri | +1.344 |
llah | +1.327 |
humans | +1.212 |
okia | +1.196 |
Neg logit contributions | |
kered | -1.415 |
Cly | -1.289 |
racted | -1.229 |
>>>>>>>> | -1.199 |
★★ | -1.151 |
Token | after |
Token ID | 706 |
Feature activation | -9.67e-01 |
Pos logit contributions | |
kered | +0.054 |
Cly | +0.049 |
racted | +0.047 |
>>>>>>>> | +0.045 |
★★ | +0.043 |
Neg logit contributions | |
icho | -0.052 |
Uri | -0.052 |
llah | -0.051 |
humans | -0.046 |
erity | -0.046 |
Token | 20 |
Token ID | 1160 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
icho | +0.624 |
llah | +0.614 |
Uri | +0.611 |
erity | +0.547 |
humans | +0.544 |
Neg logit contributions | |
kered | -0.756 |
Cly | -0.694 |
racted | -0.663 |
>>>>>>>> | -0.644 |
**************** | -0.624 |
Token | Korean |
Token ID | 6983 |
Feature activation | -9.20e-01 |
Pos logit contributions | |
icho | +0.668 |
Uri | +0.660 |
llah | +0.659 |
humans | +0.585 |
erity | +0.584 |
Neg logit contributions | |
kered | -0.828 |
Cly | -0.758 |
racted | -0.728 |
>>>>>>>> | -0.707 |
**************** | -0.684 |
Token | consumers |
Token ID | 7008 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
icho | +0.633 |
llah | +0.628 |
Uri | +0.626 |
erity | +0.563 |
humans | +0.560 |
Neg logit contributions | |
kered | -0.676 |
Cly | -0.617 |
racted | -0.589 |
>>>>>>>> | -0.571 |
★★ | -0.551 |
Token | were |
Token ID | 547 |
Feature activation | -7.15e-01 |
Pos logit contributions | |
icho | +0.016 |
llah | +0.016 |
Uri | +0.016 |
humans | +0.015 |
erity | +0.015 |
Neg logit contributions | |
kered | -0.016 |
Cly | -0.015 |
racted | -0.014 |
>>>>>>>> | -0.014 |
**************** | -0.013 |
Token | hurt |
Token ID | 5938 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
icho | +0.508 |
Uri | +0.502 |
llah | +0.501 |
erity | +0.451 |
humans | +0.451 |
Neg logit contributions | |
kered | -0.511 |
Cly | -0.464 |
racted | -0.443 |
>>>>>>>> | -0.428 |
**************** | -0.413 |
Token | as |
Token ID | 355 |
Feature activation | -9.96e-01 |
Pos logit contributions | |
icho | +0.020 |
Uri | +0.019 |
llah | +0.019 |
erity | +0.017 |
humans | +0.017 |
Neg logit contributions | |
kered | -0.028 |
Cly | -0.025 |
racted | -0.024 |
>>>>>>>> | -0.024 |
**************** | -0.023 |
Token | they |
Token ID | 484 |
Feature activation | -7.73e-01 |
Pos logit contributions | |
icho | +0.593 |
llah | +0.584 |
Uri | +0.584 |
erity | +0.514 |
humans | +0.513 |
Neg logit contributions | |
kered | -0.827 |
Cly | -0.762 |
racted | -0.732 |
>>>>>>>> | -0.710 |
★★ | -0.689 |
Token | attempted |
Token ID | 7482 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
icho | +0.517 |
Uri | +0.512 |
llah | +0.510 |
erity | +0.456 |
humans | +0.454 |
Neg logit contributions | |
kered | -0.582 |
Cly | -0.532 |
racted | -0.510 |
>>>>>>>> | -0.495 |
★★ | -0.479 |
Token | M |
Token ID | 44 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
kered | +0.360 |
Cly | +0.326 |
racted | +0.310 |
>>>>>>>> | +0.301 |
★★ | +0.291 |
Neg logit contributions | |
icho | -0.399 |
Uri | -0.394 |
llah | -0.394 |
erity | -0.356 |
humans | -0.355 |
Token | arian |
Token ID | 3699 |
Feature activation | +8.43e-02 |
Pos logit contributions | |
icho | +0.105 |
Uri | +0.104 |
llah | +0.104 |
humans | +0.095 |
erity | +0.095 |
Neg logit contributions | |
kered | -0.065 |
Cly | -0.057 |
racted | -0.054 |
>>>>>>>> | -0.052 |
**************** | -0.049 |
Token | H |
Token ID | 367 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
kered | +0.065 |
Cly | +0.060 |
racted | +0.057 |
>>>>>>>> | +0.056 |
★★ | +0.054 |
Neg logit contributions | |
icho | -0.055 |
Uri | -0.054 |
llah | -0.054 |
humans | -0.048 |
erity | -0.048 |
Token | oss |
Token ID | 793 |
Feature activation | -4.16e-01 |
Pos logit contributions | |
icho | +0.192 |
Uri | +0.188 |
llah | +0.188 |
erity | +0.156 |
humans | +0.156 |
Neg logit contributions | |
kered | -0.434 |
Cly | -0.406 |
racted | -0.392 |
>>>>>>>> | -0.384 |
★★ | -0.375 |
Token | a |
Token ID | 64 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
icho | +0.252 |
Uri | +0.249 |
llah | +0.248 |
humans | +0.219 |
erity | +0.219 |
Neg logit contributions | |
kered | -0.341 |
Cly | -0.314 |
racted | -0.302 |
>>>>>>>> | -0.293 |
★★ | -0.284 |
Token | has |
Token ID | 468 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
icho | +0.104 |
Uri | +0.103 |
llah | +0.103 |
erity | +0.092 |
humans | +0.092 |
Neg logit contributions | |
kered | -0.106 |
Cly | -0.096 |
racted | -0.092 |
>>>>>>>> | -0.089 |
★★ | -0.086 |
Token | played |
Token ID | 2826 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
icho | +0.190 |
llah | +0.187 |
Uri | +0.187 |
erity | +0.168 |
humans | +0.168 |
Neg logit contributions | |
kered | -0.201 |
Cly | -0.184 |
racted | -0.175 |
>>>>>>>> | -0.170 |
★★ | -0.164 |
Token | for |
Token ID | 329 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
kered | +0.162 |
Cly | +0.148 |
racted | +0.142 |
>>>>>>>> | +0.137 |
★★ | +0.133 |
Neg logit contributions | |
icho | -0.145 |
Uri | -0.143 |
llah | -0.143 |
humans | -0.128 |
erity | -0.127 |
Token | five |
Token ID | 1936 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
kered | +0.111 |
Cly | +0.102 |
racted | +0.098 |
>>>>>>>> | +0.095 |
★★ | +0.092 |
Neg logit contributions | |
icho | -0.082 |
Uri | -0.081 |
llah | -0.081 |
humans | -0.071 |
erity | -0.071 |
Token | NHL |
Token ID | 9481 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
kered | +0.131 |
Cly | +0.119 |
racted | +0.113 |
>>>>>>>> | +0.110 |
★★ | +0.106 |
Neg logit contributions | |
icho | -0.136 |
llah | -0.134 |
Uri | -0.134 |
humans | -0.121 |
erity | -0.121 |
Token | teams |
Token ID | 3466 |
Feature activation | +6.69e-01 |
Pos logit contributions | |
kered | +0.154 |
Cly | +0.139 |
racted | +0.133 |
>>>>>>>> | +0.128 |
★★ | +0.123 |
Neg logit contributions | |
icho | -0.169 |
Uri | -0.168 |
llah | -0.167 |
humans | -0.151 |
erity | -0.151 |
Token | aligned |
Token ID | 41634 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
kered | +0.198 |
Cly | +0.162 |
racted | +0.144 |
>>>>>>>> | +0.134 |
★★ | +0.121 |
Neg logit contributions | |
icho | -0.607 |
Uri | -0.603 |
llah | -0.603 |
humans | -0.565 |
erity | -0.563 |
Token | countries |
Token ID | 2678 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
kered | +0.580 |
Cly | +0.534 |
racted | +0.511 |
>>>>>>>> | +0.498 |
**************** | +0.484 |
Neg logit contributions | |
icho | -0.444 |
llah | -0.436 |
Uri | -0.436 |
erity | -0.384 |
humans | -0.384 |
Token | must |
Token ID | 1276 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
kered | +0.157 |
Cly | +0.143 |
racted | +0.137 |
>>>>>>>> | +0.133 |
**************** | +0.129 |
Neg logit contributions | |
icho | -0.134 |
llah | -0.133 |
Uri | -0.132 |
humans | -0.118 |
erity | -0.118 |
Token | give |
Token ID | 1577 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
kered | +0.766 |
Cly | +0.698 |
racted | +0.664 |
>>>>>>>> | +0.646 |
**************** | +0.628 |
Neg logit contributions | |
icho | -0.689 |
llah | -0.678 |
Uri | -0.675 |
humans | -0.608 |
erity | -0.607 |
Token | priority |
Token ID | 8475 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
kered | +0.088 |
Cly | +0.081 |
racted | +0.076 |
>>>>>>>> | +0.075 |
★★ | +0.072 |
Neg logit contributions | |
icho | -0.077 |
llah | -0.076 |
Uri | -0.075 |
erity | -0.067 |
humans | -0.067 |
Token | to |
Token ID | 284 |
Feature activation | -6.94e-01 |
Pos logit contributions | |
kered | +0.362 |
Cly | +0.332 |
racted | +0.318 |
>>>>>>>> | +0.310 |
★★ | +0.300 |
Neg logit contributions | |
icho | -0.296 |
Uri | -0.292 |
llah | -0.291 |
humans | -0.259 |
erity | -0.258 |
Token | the |
Token ID | 262 |
Feature activation | -7.39e-01 |
Pos logit contributions | |
icho | +0.410 |
llah | +0.404 |
Uri | +0.403 |
erity | +0.354 |
humans | +0.354 |
Neg logit contributions | |
kered | -0.579 |
Cly | -0.534 |
racted | -0.512 |
>>>>>>>> | -0.499 |
**************** | -0.485 |
Token | abolition |
Token ID | 30480 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
icho | +0.463 |
llah | +0.455 |
Uri | +0.454 |
erity | +0.404 |
humans | +0.403 |
Neg logit contributions | |
kered | -0.591 |
Cly | -0.544 |
racted | -0.520 |
>>>>>>>> | -0.506 |
**************** | -0.492 |
Token | of |
Token ID | 286 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
kered | +0.094 |
Cly | +0.086 |
racted | +0.083 |
>>>>>>>> | +0.081 |
**************** | +0.078 |
Neg logit contributions | |
icho | -0.070 |
Uri | -0.069 |
llah | -0.069 |
humans | -0.061 |
erity | -0.061 |
Token | nuclear |
Token ID | 4523 |
Feature activation | +6.87e-02 |
Pos logit contributions | |
icho | +0.175 |
Uri | +0.173 |
llah | +0.173 |
humans | +0.153 |
erity | +0.153 |
Neg logit contributions | |
kered | -0.227 |
Cly | -0.209 |
racted | -0.200 |
>>>>>>>> | -0.195 |
★★ | -0.189 |
Token | weapons |
Token ID | 3777 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
kered | +0.041 |
Cly | +0.037 |
racted | +0.035 |
>>>>>>>> | +0.033 |
★★ | +0.032 |
Neg logit contributions | |
icho | -0.057 |
Uri | -0.056 |
llah | -0.056 |
humans | -0.051 |
erity | -0.051 |
Token | . |
Token ID | 13 |
Feature activation | +2.92e-02 |
Pos logit contributions | |
icho | +0.249 |
Uri | +0.246 |
llah | +0.246 |
humans | +0.220 |
erity | +0.220 |
Neg logit contributions | |
kered | -0.261 |
Cly | -0.238 |
racted | -0.227 |
>>>>>>>> | -0.220 |
**************** | -0.212 |
Token | Nin |
Token ID | 10516 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
kered | +0.020 |
Cly | +0.018 |
racted | +0.017 |
>>>>>>>> | +0.017 |
★★ | +0.016 |
Neg logit contributions | |
icho | -0.022 |
llah | -0.021 |
Uri | -0.021 |
erity | -0.019 |
humans | -0.019 |
Token | ety |
Token ID | 2963 |
Feature activation | +7.74e-02 |
Pos logit contributions | |
kered | +0.297 |
Cly | +0.275 |
racted | +0.264 |
>>>>>>>> | +0.257 |
**************** | +0.250 |
Neg logit contributions | |
icho | -0.203 |
Uri | -0.199 |
llah | -0.199 |
erity | -0.175 |
humans | -0.175 |
Token | percent |
Token ID | 1411 |
Feature activation | +5.16e-01 |
Pos logit contributions | |
kered | +0.052 |
Cly | +0.047 |
racted | +0.045 |
>>>>>>>> | +0.043 |
**************** | +0.041 |
Neg logit contributions | |
icho | -0.058 |
Uri | -0.058 |
llah | -0.058 |
humans | -0.052 |
erity | -0.052 |
Token | of |
Token ID | 286 |
Feature activation | -5.37e-01 |
Pos logit contributions | |
kered | +0.416 |
Cly | +0.382 |
racted | +0.367 |
>>>>>>>> | +0.357 |
★★ | +0.345 |
Neg logit contributions | |
icho | -0.318 |
Uri | -0.314 |
llah | -0.314 |
humans | -0.277 |
erity | -0.277 |
Token | the |
Token ID | 262 |
Feature activation | -6.66e-01 |
Pos logit contributions | |
icho | +0.328 |
Uri | +0.324 |
llah | +0.323 |
humans | +0.285 |
erity | +0.285 |
Neg logit contributions | |
kered | -0.437 |
Cly | -0.402 |
racted | -0.386 |
>>>>>>>> | -0.375 |
★★ | -0.364 |
Token | children |
Token ID | 1751 |
Feature activation | -9.71e-01 |
Pos logit contributions | |
icho | +0.340 |
llah | +0.334 |
Uri | +0.333 |
erity | +0.287 |
humans | +0.286 |
Neg logit contributions | |
kered | -0.609 |
Cly | -0.567 |
racted | -0.546 |
>>>>>>>> | -0.534 |
**************** | -0.519 |
Token | � |
Token ID | 447 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
icho | +0.628 |
Uri | +0.622 |
llah | +0.619 |
erity | +0.552 |
humans | +0.551 |
Neg logit contributions | |
kered | -0.754 |
Cly | -0.689 |
racted | -0.662 |
>>>>>>>> | -0.642 |
★★ | -0.621 |
Token | � |
Token ID | 247 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
kered | +0.274 |
Cly | +0.242 |
racted | +0.231 |
>>>>>>>> | +0.224 |
★★ | +0.213 |
Neg logit contributions | |
icho | -0.414 |
Uri | -0.408 |
llah | -0.404 |
humans | -0.374 |
erity | -0.373 |
Token | s |
Token ID | 82 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
kered | +0.416 |
Cly | +0.377 |
racted | +0.359 |
>>>>>>>> | +0.347 |
**************** | +0.334 |
Neg logit contributions | |
icho | -0.440 |
Uri | -0.435 |
llah | -0.434 |
erity | -0.392 |
humans | -0.392 |
Token | books |
Token ID | 3835 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
kered | +0.285 |
Cly | +0.262 |
racted | +0.249 |
>>>>>>>> | +0.242 |
**************** | +0.233 |
Neg logit contributions | |
icho | -0.264 |
llah | -0.260 |
Uri | -0.259 |
erity | -0.233 |
humans | -0.233 |
Token | , |
Token ID | 11 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
icho | +0.582 |
Uri | +0.580 |
llah | +0.571 |
humans | +0.515 |
erity | +0.510 |
Neg logit contributions | |
kered | -0.615 |
Cly | -0.555 |
racted | -0.532 |
>>>>>>>> | -0.517 |
★★ | -0.499 |
Token | including |
Token ID | 1390 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
icho | +0.132 |
llah | +0.131 |
Uri | +0.130 |
erity | +0.117 |
humans | +0.117 |
Neg logit contributions | |
kered | -0.137 |
Cly | -0.125 |
racted | -0.119 |
>>>>>>>> | -0.116 |
**************** | -0.111 |
Token | a |
Token ID | 257 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
icho | +0.241 |
llah | +0.238 |
Uri | +0.238 |
erity | +0.213 |
humans | +0.213 |
Neg logit contributions | |
kered | -0.270 |
Cly | -0.246 |
racted | -0.236 |
>>>>>>>> | -0.228 |
**************** | -0.221 |
Token | privacy |
Token ID | 6782 |
Feature activation | -4.86e-02 |
Pos logit contributions | |
icho | +0.148 |
Uri | +0.147 |
llah | +0.146 |
erity | +0.132 |
humans | +0.132 |
Neg logit contributions | |
kered | -0.146 |
Cly | -0.133 |
racted | -0.127 |
>>>>>>>> | -0.123 |
★★ | -0.118 |
Token | - |
Token ID | 12 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
icho | +0.037 |
Uri | +0.036 |
llah | +0.036 |
humans | +0.033 |
erity | +0.032 |
Neg logit contributions | |
kered | -0.032 |
Cly | -0.029 |
racted | -0.028 |
>>>>>>>> | -0.027 |
**************** | -0.026 |
Token | centric |
Token ID | 28577 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
icho | +0.314 |
Uri | +0.310 |
llah | +0.309 |
humans | +0.284 |
erity | +0.282 |
Neg logit contributions | |
kered | -0.235 |
Cly | -0.210 |
racted | -0.199 |
>>>>>>>> | -0.192 |
**************** | -0.183 |
Token | variant |
Token ID | 15304 |
Feature activation | -7.27e-01 |
Pos logit contributions | |
icho | +0.761 |
Uri | +0.758 |
llah | +0.747 |
erity | +0.670 |
humans | +0.669 |
Neg logit contributions | |
kered | -0.768 |
Cly | -0.693 |
racted | -0.666 |
>>>>>>>> | -0.648 |
**************** | -0.624 |
Token | called |
Token ID | 1444 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
icho | +0.499 |
Uri | +0.494 |
llah | +0.491 |
humans | +0.440 |
erity | +0.439 |
Neg logit contributions | |
kered | -0.536 |
Cly | -0.487 |
racted | -0.467 |
>>>>>>>> | -0.454 |
★★ | -0.438 |
Token | Focus |
Token ID | 17061 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
icho | +0.311 |
Uri | +0.308 |
llah | +0.307 |
humans | +0.276 |
erity | +0.276 |
Neg logit contributions | |
kered | -0.306 |
Cly | -0.277 |
racted | -0.265 |
>>>>>>>> | -0.256 |
★★ | -0.247 |
Token | and |
Token ID | 290 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
icho | +0.810 |
Uri | +0.806 |
llah | +0.795 |
alon | +0.723 |
humans | +0.720 |
Neg logit contributions | |
kered | -0.844 |
Cly | -0.763 |
racted | -0.726 |
>>>>>>>> | -0.709 |
**************** | -0.687 |
Token | speed |
Token ID | 2866 |
Feature activation | +6.68e-01 |
Pos logit contributions | |
kered | +0.490 |
Cly | +0.449 |
racted | +0.429 |
>>>>>>>> | +0.415 |
★★ | +0.401 |
Neg logit contributions | |
icho | -0.437 |
llah | -0.432 |
Uri | -0.430 |
humans | -0.385 |
erity | -0.385 |
Token | applied |
Token ID | 5625 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
kered | +0.185 |
Cly | +0.166 |
racted | +0.158 |
>>>>>>>> | +0.152 |
**************** | +0.146 |
Neg logit contributions | |
icho | -0.230 |
Uri | -0.228 |
llah | -0.226 |
humans | -0.206 |
erity | -0.206 |
Token | and |
Token ID | 290 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
kered | +0.081 |
Cly | +0.074 |
racted | +0.071 |
>>>>>>>> | +0.069 |
★★ | +0.066 |
Neg logit contributions | |
icho | -0.070 |
Uri | -0.070 |
llah | -0.069 |
erity | -0.062 |
humans | -0.062 |
Token | subsequently |
Token ID | 12412 |
Feature activation | +3.07e-01 |
Pos logit contributions | |
kered | +0.192 |
Cly | +0.176 |
racted | +0.168 |
>>>>>>>> | +0.163 |
★★ | +0.158 |
Neg logit contributions | |
icho | -0.167 |
Uri | -0.165 |
llah | -0.165 |
erity | -0.147 |
humans | -0.147 |
Token | un |
Token ID | 555 |
Feature activation | -8.10e-02 |
Pos logit contributions | |
kered | +0.219 |
Cly | +0.199 |
racted | +0.190 |
>>>>>>>> | +0.183 |
★★ | +0.177 |
Neg logit contributions | |
icho | -0.218 |
Uri | -0.216 |
llah | -0.215 |
humans | -0.194 |
erity | -0.194 |
Token | - |
Token ID | 12 |
Feature activation | -7.08e-01 |
Pos logit contributions | |
icho | +0.060 |
Uri | +0.059 |
llah | +0.059 |
humans | +0.054 |
erity | +0.053 |
Neg logit contributions | |
kered | -0.055 |
Cly | -0.050 |
racted | -0.048 |
>>>>>>>> | -0.046 |
★★ | -0.044 |
Token | app |
Token ID | 1324 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
icho | +0.499 |
Uri | +0.491 |
llah | +0.489 |
humans | +0.443 |
erity | +0.440 |
Neg logit contributions | |
kered | -0.507 |
Cly | -0.463 |
racted | -0.440 |
>>>>>>>> | -0.427 |
★★ | -0.412 |
Token | lied |
Token ID | 18511 |
Feature activation | -5.62e-01 |
Pos logit contributions | |
icho | +0.649 |
Uri | +0.643 |
llah | +0.640 |
alon | +0.575 |
ixel | +0.570 |
Neg logit contributions | |
kered | -0.808 |
Cly | -0.748 |
racted | -0.704 |
>>>>>>>> | -0.698 |
★★ | -0.677 |
Token | . |
Token ID | 13 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
icho | +0.373 |
Uri | +0.371 |
llah | +0.368 |
erity | +0.329 |
humans | +0.329 |
Neg logit contributions | |
kered | -0.423 |
Cly | -0.387 |
racted | -0.371 |
>>>>>>>> | -0.359 |
★★ | -0.347 |
Token | Un |
Token ID | 791 |
Feature activation | +8.35e-01 |
Pos logit contributions | |
kered | +0.375 |
Cly | +0.343 |
racted | +0.328 |
>>>>>>>> | +0.318 |
**************** | +0.307 |
Neg logit contributions | |
icho | -0.334 |
Uri | -0.330 |
llah | -0.330 |
erity | -0.295 |
humans | -0.295 |
Token | - |
Token ID | 12 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
kered | +0.562 |
Cly | +0.508 |
racted | +0.482 |
>>>>>>>> | +0.466 |
★★ | +0.448 |
Neg logit contributions | |
icho | -0.628 |
Uri | -0.620 |
llah | -0.619 |
humans | -0.562 |
erity | -0.561 |
Token | doing |
Token ID | 19631 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
icho | +0.390 |
Uri | +0.381 |
llah | +0.380 |
humans | +0.346 |
erity | +0.342 |
Neg logit contributions | |
kered | -0.432 |
Cly | -0.397 |
racted | -0.377 |
>>>>>>>> | -0.366 |
★★ | -0.352 |
Token | � |
Token ID | 247 |
Feature activation | +6.36e-02 |
Pos logit contributions | |
kered | +0.002 |
Cly | +0.002 |
racted | +0.002 |
>>>>>>>> | +0.002 |
★★ | +0.002 |
Neg logit contributions | |
icho | -0.003 |
Uri | -0.003 |
llah | -0.003 |
humans | -0.003 |
erity | -0.003 |
Token | s |
Token ID | 82 |
Feature activation | +9.82e-02 |
Pos logit contributions | |
kered | +0.044 |
Cly | +0.040 |
racted | +0.038 |
>>>>>>>> | +0.037 |
★★ | +0.036 |
Neg logit contributions | |
icho | -0.046 |
Uri | -0.046 |
llah | -0.045 |
erity | -0.041 |
humans | -0.041 |
Token | capit |
Token ID | 46964 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
kered | +0.075 |
Cly | +0.068 |
racted | +0.065 |
>>>>>>>> | +0.063 |
★★ | +0.061 |
Neg logit contributions | |
icho | -0.065 |
Uri | -0.064 |
llah | -0.064 |
humans | -0.057 |
erity | -0.057 |
Token | ulation |
Token ID | 1741 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
icho | +0.263 |
Uri | +0.259 |
llah | +0.259 |
erity | +0.227 |
humans | +0.227 |
Neg logit contributions | |
kered | -0.384 |
Cly | -0.354 |
racted | -0.340 |
>>>>>>>> | -0.332 |
★★ | -0.323 |
Token | to |
Token ID | 284 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
icho | +0.911 |
Uri | +0.905 |
llah | +0.890 |
erity | +0.801 |
humans | +0.792 |
Neg logit contributions | |
kered | -1.102 |
Cly | -1.005 |
racted | -0.979 |
>>>>>>>> | -0.945 |
★★ | -0.920 |
Token | Donald |
Token ID | 3759 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
icho | +0.266 |
Uri | +0.263 |
llah | +0.262 |
erity | +0.231 |
humans | +0.231 |
Neg logit contributions | |
kered | -0.364 |
Cly | -0.334 |
racted | -0.323 |
>>>>>>>> | -0.314 |
★★ | -0.304 |
Token | Trump |
Token ID | 1301 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
icho | +0.652 |
Uri | +0.647 |
llah | +0.645 |
erity | +0.559 |
humans | +0.557 |
Neg logit contributions | |
kered | -0.995 |
Cly | -0.916 |
racted | -0.895 |
>>>>>>>> | -0.868 |
Changes | -0.842 |
Token | is |
Token ID | 318 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
icho | +0.194 |
Uri | +0.192 |
llah | +0.192 |
erity | +0.174 |
humans | +0.174 |
Neg logit contributions | |
kered | -0.172 |
Cly | -0.155 |
racted | -0.149 |
>>>>>>>> | -0.143 |
Changes | -0.137 |
Token | complete |
Token ID | 1844 |
Feature activation | -6.41e-01 |
Pos logit contributions | |
kered | +0.093 |
Cly | +0.086 |
racted | +0.081 |
>>>>>>>> | +0.079 |
**************** | +0.077 |
Neg logit contributions | |
icho | -0.084 |
llah | -0.083 |
Uri | -0.083 |
humans | -0.074 |
erity | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
icho | +0.436 |
Uri | +0.432 |
llah | +0.430 |
erity | +0.385 |
humans | +0.384 |
Neg logit contributions | |
kered | -0.477 |
Cly | -0.433 |
racted | -0.417 |
>>>>>>>> | -0.403 |
★★ | -0.388 |
Token | As |
Token ID | 1081 |
Feature activation | -5.08e-01 |
Pos logit contributions | |
icho | +0.404 |
Uri | +0.399 |
llah | +0.399 |
humans | +0.355 |
erity | +0.354 |
Neg logit contributions | |
kered | -0.483 |
Cly | -0.442 |
racted | -0.423 |
>>>>>>>> | -0.411 |
**************** | -0.398 |
Token |
|
Token ID | 198 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
kered | +0.172 |
Cly | +0.157 |
racted | +0.149 |
>>>>>>>> | +0.145 |
**************** | +0.140 |
Neg logit contributions | |
icho | -0.173 |
Uri | -0.170 |
llah | -0.170 |
erity | -0.153 |
humans | -0.153 |
Token | The |
Token ID | 464 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
kered | +0.146 |
Cly | +0.133 |
racted | +0.127 |
>>>>>>>> | +0.123 |
★★ | +0.119 |
Neg logit contributions | |
icho | -0.134 |
Uri | -0.133 |
llah | -0.132 |
erity | -0.118 |
humans | -0.118 |
Token | City |
Token ID | 2254 |
Feature activation | -6.47e-01 |
Pos logit contributions | |
icho | +0.306 |
Uri | +0.305 |
llah | +0.303 |
erity | +0.272 |
humans | +0.272 |
Neg logit contributions | |
kered | -0.318 |
Cly | -0.287 |
racted | -0.276 |
>>>>>>>> | -0.267 |
**************** | -0.258 |
Token | of |
Token ID | 286 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
icho | +0.412 |
Uri | +0.409 |
llah | +0.407 |
erity | +0.362 |
humans | +0.362 |
Neg logit contributions | |
kered | -0.509 |
Cly | -0.464 |
racted | -0.446 |
>>>>>>>> | -0.434 |
★★ | -0.420 |
Token | Wh |
Token ID | 854 |
Feature activation | -6.80e-01 |
Pos logit contributions | |
icho | +0.316 |
Uri | +0.314 |
llah | +0.312 |
humans | +0.281 |
erity | +0.281 |
Neg logit contributions | |
kered | -0.320 |
Cly | -0.290 |
racted | -0.278 |
>>>>>>>> | -0.269 |
★★ | -0.259 |
Token | itt |
Token ID | 715 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
icho | +0.441 |
llah | +0.434 |
Uri | +0.433 |
erity | +0.386 |
humans | +0.386 |
Neg logit contributions | |
kered | -0.527 |
Cly | -0.484 |
racted | -0.462 |
>>>>>>>> | -0.451 |
★★ | -0.436 |
Token | les |
Token ID | 829 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
icho | +2.328 |
llah | +2.308 |
Uri | +2.290 |
alon | +2.111 |
irit | +2.099 |
Neg logit contributions | |
kered | -1.575 |
Cly | -1.403 |
racted | -1.323 |
>>>>>>>> | -1.291 |
★★ | -1.226 |
Token | ea |
Token ID | 18213 |
Feature activation | +6.14e-01 |
Pos logit contributions | |
icho | +0.229 |
Uri | +0.228 |
llah | +0.227 |
erity | +0.209 |
humans | +0.207 |
Neg logit contributions | |
kered | -0.202 |
Cly | -0.182 |
racted | -0.173 |
>>>>>>>> | -0.165 |
**************** | -0.161 |
Token | covers |
Token ID | 8698 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
kered | +0.451 |
Cly | +0.412 |
racted | +0.393 |
>>>>>>>> | +0.380 |
★★ | +0.367 |
Neg logit contributions | |
icho | -0.424 |
Uri | -0.419 |
llah | -0.418 |
erity | -0.375 |
humans | -0.375 |
Token | almost |
Token ID | 2048 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
kered | +0.103 |
Cly | +0.094 |
racted | +0.089 |
>>>>>>>> | +0.086 |
**************** | +0.083 |
Neg logit contributions | |
icho | -0.109 |
llah | -0.107 |
Uri | -0.107 |
humans | -0.097 |
erity | -0.097 |
Token | 500 |
Token ID | 5323 |
Feature activation | -4.10e-01 |
Pos logit contributions | |
icho | +0.434 |
Uri | +0.430 |
llah | +0.428 |
humans | +0.388 |
erity | +0.387 |
Neg logit contributions | |
kered | -0.396 |
Cly | -0.357 |
racted | -0.341 |
>>>>>>>> | -0.329 |
**************** | -0.316 |
Token | Mn |
Token ID | 36030 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
kered | +0.203 |
Cly | +0.191 |
racted | +0.186 |
>>>>>>>> | +0.182 |
**************** | +0.178 |
Neg logit contributions | |
icho | -0.062 |
Uri | -0.060 |
llah | -0.060 |
humans | -0.047 |
erity | -0.047 |
Token | uchin |
Token ID | 43416 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
kered | +0.950 |
Cly | +0.870 |
racted | +0.832 |
>>>>>>>> | +0.804 |
**************** | +0.781 |
Neg logit contributions | |
icho | -0.816 |
Uri | -0.814 |
llah | -0.807 |
humans | -0.724 |
erity | -0.723 |
Token | , |
Token ID | 11 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
kered | +0.231 |
Cly | +0.208 |
racted | +0.201 |
>>>>>>>> | +0.193 |
Changes | +0.185 |
Neg logit contributions | |
icho | -0.245 |
Uri | -0.243 |
llah | -0.242 |
erity | -0.219 |
humans | -0.218 |
Token | that |
Token ID | 326 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
kered | +0.299 |
Cly | +0.271 |
racted | +0.259 |
>>>>>>>> | +0.250 |
★★ | +0.241 |
Neg logit contributions | |
icho | -0.299 |
Uri | -0.296 |
llah | -0.295 |
humans | -0.265 |
erity | -0.265 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
kered | +0.067 |
Cly | +0.061 |
racted | +0.059 |
>>>>>>>> | +0.057 |
★★ | +0.055 |
Neg logit contributions | |
icho | -0.051 |
Uri | -0.050 |
llah | -0.050 |
erity | -0.044 |
humans | -0.044 |
Token | debt |
Token ID | 5057 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
kered | +0.094 |
Cly | +0.085 |
racted | +0.081 |
>>>>>>>> | +0.078 |
★★ | +0.076 |
Neg logit contributions | |
icho | -0.100 |
Uri | -0.099 |
llah | -0.098 |
humans | -0.089 |
erity | -0.089 |
Token | ceiling |
Token ID | 13387 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
icho | +1.531 |
Uri | +1.514 |
llah | +1.451 |
humans | +1.313 |
erity | +1.299 |
Neg logit contributions | |
kered | -2.328 |
racted | -2.135 |
Cly | -2.115 |
>>>>>>>> | -2.008 |
**************** | -1.979 |
Token | would |
Token ID | 561 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
kered | +0.351 |
Cly | +0.318 |
racted | +0.304 |
>>>>>>>> | +0.293 |
**************** | +0.283 |
Neg logit contributions | |
icho | -0.364 |
Uri | -0.360 |
llah | -0.359 |
humans | -0.324 |
erity | -0.324 |
Token | be |
Token ID | 307 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
kered | +0.289 |
Cly | +0.262 |
racted | +0.250 |
>>>>>>>> | +0.242 |
★★ | +0.232 |
Neg logit contributions | |
icho | -0.309 |
Uri | -0.306 |
llah | -0.305 |
erity | -0.275 |
humans | -0.275 |
Token | raised |
Token ID | 4376 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
icho | +0.297 |
Uri | +0.294 |
llah | +0.294 |
humans | +0.263 |
erity | +0.262 |
Neg logit contributions | |
kered | -0.330 |
Cly | -0.302 |
racted | -0.288 |
>>>>>>>> | -0.280 |
**************** | -0.270 |
Token | . |
Token ID | 13 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
icho | +0.308 |
Uri | +0.305 |
llah | +0.303 |
humans | +0.270 |
erity | +0.270 |
Neg logit contributions | |
kered | -0.360 |
Cly | -0.328 |
racted | -0.316 |
>>>>>>>> | -0.306 |
**************** | -0.295 |
Token | hour |
Token ID | 1711 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
kered | +0.289 |
Cly | +0.265 |
racted | +0.254 |
>>>>>>>> | +0.244 |
**************** | +0.237 |
Neg logit contributions | |
icho | -0.260 |
Uri | -0.256 |
llah | -0.256 |
humans | -0.229 |
erity | -0.229 |
Token | away |
Token ID | 1497 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
icho | +0.194 |
Uri | +0.192 |
llah | +0.192 |
humans | +0.173 |
erity | +0.172 |
Neg logit contributions | |
kered | -0.192 |
Cly | -0.175 |
racted | -0.166 |
>>>>>>>> | -0.161 |
★★ | -0.155 |
Token | ," |
Token ID | 553 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
kered | +0.270 |
Cly | +0.247 |
racted | +0.236 |
>>>>>>>> | +0.228 |
**************** | +0.221 |
Neg logit contributions | |
icho | -0.261 |
llah | -0.257 |
Uri | -0.257 |
erity | -0.232 |
humans | -0.232 |
Token | says |
Token ID | 1139 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
kered | +0.087 |
Cly | +0.080 |
racted | +0.077 |
>>>>>>>> | +0.075 |
★★ | +0.072 |
Neg logit contributions | |
icho | -0.065 |
llah | -0.064 |
Uri | -0.064 |
erity | -0.057 |
humans | -0.057 |
Token | A |
Token ID | 317 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
icho | +0.672 |
Uri | +0.668 |
llah | +0.664 |
humans | +0.593 |
erity | +0.592 |
Neg logit contributions | |
kered | -0.728 |
Cly | -0.659 |
racted | -0.633 |
>>>>>>>> | -0.614 |
**************** | -0.593 |
Token | du |
Token ID | 646 |
Feature activation | -2.83e+00 |
Pos logit contributions | |
icho | +0.858 |
llah | +0.848 |
Uri | +0.848 |
humans | +0.763 |
erity | +0.762 |
Neg logit contributions | |
kered | -0.784 |
Cly | -0.710 |
racted | -0.676 |
>>>>>>>> | -0.654 |
★★ | -0.630 |
Token | . |
Token ID | 13 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
llah | +2.075 |
icho | +2.066 |
Uri | +2.057 |
alon | +1.845 |
irit | +1.825 |
Neg logit contributions | |
kered | -1.955 |
Cly | -1.765 |
racted | -1.681 |
>>>>>>>> | -1.642 |
★★ | -1.587 |
Token | He |
Token ID | 1544 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
kered | +0.504 |
Cly | +0.460 |
racted | +0.438 |
>>>>>>>> | +0.424 |
★★ | +0.410 |
Neg logit contributions | |
icho | -0.495 |
Uri | -0.487 |
llah | -0.487 |
erity | -0.438 |
humans | -0.438 |
Token | is |
Token ID | 318 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
kered | +0.125 |
Cly | +0.114 |
racted | +0.109 |
>>>>>>>> | +0.105 |
**************** | +0.102 |
Neg logit contributions | |
icho | -0.113 |
Uri | -0.112 |
llah | -0.112 |
erity | -0.100 |
humans | -0.100 |
Token | now |
Token ID | 783 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
icho | +0.385 |
llah | +0.380 |
Uri | +0.380 |
humans | +0.340 |
erity | +0.340 |
Neg logit contributions | |
kered | -0.433 |
Cly | -0.397 |
racted | -0.380 |
>>>>>>>> | -0.367 |
★★ | -0.356 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
icho | +0.361 |
llah | +0.356 |
Uri | +0.355 |
humans | +0.317 |
erity | +0.316 |
Neg logit contributions | |
kered | -0.434 |
Cly | -0.399 |
racted | -0.382 |
>>>>>>>> | -0.371 |
**************** | -0.359 |
Token |
|
Token ID | 198 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
kered | +0.189 |
Cly | +0.172 |
racted | +0.164 |
>>>>>>>> | +0.159 |
**************** | +0.154 |
Neg logit contributions | |
icho | -0.193 |
llah | -0.190 |
Uri | -0.190 |
erity | -0.171 |
humans | -0.171 |
Token | OC |
Token ID | 4503 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
kered | +0.182 |
Cly | +0.165 |
racted | +0.157 |
>>>>>>>> | +0.153 |
**************** | +0.147 |
Neg logit contributions | |
icho | -0.196 |
Uri | -0.195 |
llah | -0.194 |
erity | -0.175 |
humans | -0.175 |
Token | : |
Token ID | 25 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
kered | +1.234 |
Cly | +1.124 |
racted | +1.074 |
>>>>>>>> | +1.042 |
**************** | +1.006 |
Neg logit contributions | |
icho | -1.156 |
Uri | -1.142 |
llah | -1.142 |
humans | -1.022 |
erity | -1.021 |
Token | MSI |
Token ID | 30781 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
kered | +0.198 |
Cly | +0.182 |
racted | +0.174 |
>>>>>>>> | +0.169 |
★★ | +0.164 |
Neg logit contributions | |
icho | -0.156 |
llah | -0.155 |
Uri | -0.153 |
humans | -0.137 |
erity | -0.136 |
Token | After |
Token ID | 2293 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
icho | +0.204 |
llah | +0.201 |
Uri | +0.201 |
humans | +0.178 |
erity | +0.178 |
Neg logit contributions | |
kered | -0.255 |
Cly | -0.234 |
racted | -0.224 |
>>>>>>>> | -0.218 |
**************** | -0.211 |
Token | burn |
Token ID | 10899 |
Feature activation | -3.23e+00 |
Pos logit contributions | |
kered | +0.242 |
Cly | +0.219 |
racted | +0.206 |
>>>>>>>> | +0.198 |
Changes | +0.192 |
Neg logit contributions | |
icho | -0.304 |
Uri | -0.299 |
llah | -0.299 |
erity | -0.271 |
humans | -0.269 |
Token | er |
Token ID | 263 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
Uri | +2.347 |
icho | +2.331 |
llah | +2.311 |
erity | +2.120 |
humans | +2.105 |
Neg logit contributions | |
kered | -2.209 |
Cly | -1.993 |
racted | -1.898 |
>>>>>>>> | -1.856 |
Changes | -1.763 |
Token | , |
Token ID | 11 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
icho | +0.511 |
Uri | +0.506 |
llah | +0.504 |
erity | +0.453 |
humans | +0.453 |
Neg logit contributions | |
kered | -0.526 |
Cly | -0.478 |
racted | -0.457 |
>>>>>>>> | -0.442 |
**************** | -0.426 |
Token | Un |
Token ID | 791 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
icho | +0.219 |
llah | +0.217 |
Uri | +0.215 |
humans | +0.192 |
erity | +0.192 |
Neg logit contributions | |
kered | -0.249 |
Cly | -0.228 |
racted | -0.217 |
>>>>>>>> | -0.211 |
★★ | -0.205 |
Token | locked |
Token ID | 24162 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
kered | +0.302 |
Cly | +0.276 |
racted | +0.264 |
>>>>>>>> | +0.256 |
**************** | +0.247 |
Neg logit contributions | |
icho | -0.281 |
Uri | -0.276 |
llah | -0.276 |
humans | -0.248 |
erity | -0.248 |
Token | Digital |
Token ID | 27640 |
Feature activation | +7.55e-01 |
Pos logit contributions | |
icho | +1.302 |
Uri | +1.288 |
llah | +1.283 |
erity | +1.155 |
humans | +1.153 |
Neg logit contributions | |
kered | -1.378 |
Cly | -1.253 |
racted | -1.201 |
>>>>>>>> | -1.162 |
**************** | -1.120 |
Token | may |
Token ID | 743 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
icho | +0.420 |
llah | +0.415 |
Uri | +0.415 |
humans | +0.371 |
erity | +0.371 |
Neg logit contributions | |
kered | -0.453 |
Cly | -0.413 |
racted | -0.394 |
>>>>>>>> | -0.382 |
**************** | -0.369 |
Token | be |
Token ID | 307 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
icho | +0.881 |
Uri | +0.876 |
llah | +0.870 |
humans | +0.780 |
erity | +0.775 |
Neg logit contributions | |
kered | -0.963 |
Cly | -0.880 |
racted | -0.846 |
>>>>>>>> | -0.819 |
★★ | -0.792 |
Token | effective |
Token ID | 4050 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
icho | +0.504 |
Uri | +0.498 |
llah | +0.496 |
humans | +0.443 |
erity | +0.442 |
Neg logit contributions | |
kered | -0.587 |
Cly | -0.537 |
racted | -0.514 |
>>>>>>>> | -0.499 |
★★ | -0.482 |
Token | for |
Token ID | 329 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
icho | +0.739 |
Uri | +0.731 |
llah | +0.729 |
humans | +0.647 |
erity | +0.645 |
Neg logit contributions | |
kered | -0.913 |
Cly | -0.836 |
racted | -0.804 |
>>>>>>>> | -0.779 |
★★ | -0.755 |
Token | the |
Token ID | 262 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
icho | +1.011 |
Uri | +0.999 |
llah | +0.996 |
humans | +0.878 |
erity | +0.877 |
Neg logit contributions | |
kered | -1.365 |
Cly | -1.254 |
racted | -1.208 |
>>>>>>>> | -1.173 |
★★ | -1.138 |
Token | treatment |
Token ID | 3513 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
icho | +0.270 |
Uri | +0.265 |
llah | +0.265 |
erity | +0.238 |
humans | +0.237 |
Neg logit contributions | |
kered | -0.311 |
Cly | -0.285 |
racted | -0.270 |
>>>>>>>> | -0.264 |
**************** | -0.254 |
Token | of |
Token ID | 286 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
icho | +1.549 |
Uri | +1.514 |
llah | +1.512 |
erity | +1.331 |
humans | +1.316 |
Neg logit contributions | |
kered | -2.481 |
Cly | -2.295 |
racted | -2.233 |
>>>>>>>> | -2.149 |
★★ | -2.105 |
Token | stress |
Token ID | 5503 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
kered | +0.115 |
Cly | +0.106 |
racted | +0.101 |
>>>>>>>> | +0.098 |
**************** | +0.094 |
Neg logit contributions | |
icho | -0.103 |
Uri | -0.101 |
llah | -0.101 |
erity | -0.091 |
humans | -0.090 |
Token | - |
Token ID | 12 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
icho | +0.325 |
Uri | +0.322 |
llah | +0.321 |
humans | +0.290 |
erity | +0.290 |
Neg logit contributions | |
kered | -0.296 |
Cly | -0.267 |
racted | -0.254 |
>>>>>>>> | -0.246 |
★★ | -0.236 |
Token | related |
Token ID | 5363 |
Feature activation | -4.88e-01 |
Pos logit contributions | |
kered | +0.094 |
Cly | +0.085 |
racted | +0.081 |
>>>>>>>> | +0.078 |
**************** | +0.075 |
Neg logit contributions | |
icho | -0.096 |
Uri | -0.095 |
llah | -0.095 |
erity | -0.085 |
humans | -0.085 |
Token | disorders |
Token ID | 11916 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
icho | +0.329 |
Uri | +0.325 |
llah | +0.324 |
erity | +0.290 |
humans | +0.290 |
Neg logit contributions | |
kered | -0.367 |
Cly | -0.335 |
racted | -0.320 |
>>>>>>>> | -0.311 |
**************** | -0.300 |