Token | Gender |
Token ID | 20247 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
osate | +0.469 |
� | +0.352 |
ongyang | +0.351 |
insula | +0.346 |
withd | +0.344 |
Neg logit contributions | |
Carbuncle | -0.365 |
hemy | -0.345 |
ndra | -0.336 |
ongs | -0.321 |
dh | -0.319 |
Token | flu |
Token ID | 35522 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
osate | +0.320 |
� | +0.235 |
ongyang | +0.232 |
insula | +0.229 |
withd | +0.226 |
Neg logit contributions | |
Carbuncle | -0.295 |
hemy | -0.283 |
ndra | -0.275 |
ongs | -0.265 |
dh | -0.264 |
Token | id |
Token ID | 312 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
osate | +0.892 |
ongyang | +0.645 |
insula | +0.635 |
enes | +0.629 |
� | +0.626 |
Neg logit contributions | |
Carbuncle | -0.892 |
hemy | -0.837 |
ndra | -0.813 |
ongs | -0.783 |
bars | -0.782 |
Token | or |
Token ID | 393 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
osate | +0.162 |
� | +0.121 |
ongyang | +0.121 |
insula | +0.120 |
withd | +0.118 |
Neg logit contributions | |
Carbuncle | -0.123 |
hemy | -0.117 |
ndra | -0.113 |
ongs | -0.110 |
dh | -0.109 |
Token | gender |
Token ID | 5279 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
osate | +0.353 |
� | +0.258 |
ongyang | +0.256 |
insula | +0.253 |
withd | +0.248 |
Neg logit contributions | |
Carbuncle | -0.333 |
hemy | -0.322 |
ndra | -0.310 |
ongs | -0.300 |
dh | -0.299 |
Token | que |
Token ID | 4188 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
osate | +0.335 |
� | +0.232 |
ongyang | +0.230 |
insula | +0.228 |
withd | +0.224 |
Neg logit contributions | |
Carbuncle | -0.386 |
hemy | -0.373 |
ndra | -0.362 |
ongs | -0.352 |
dh | -0.350 |
Token | er |
Token ID | 263 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
osate | +2.591 |
ongyang | +2.044 |
enes | +2.020 |
satisf | +2.018 |
� | +2.017 |
Neg logit contributions | |
Carbuncle | -1.410 |
hemy | -1.280 |
ndra | -1.219 |
bars | -1.163 |
ongs | -1.162 |
Token | people |
Token ID | 661 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
Carbuncle | +0.300 |
hemy | +0.286 |
ndra | +0.276 |
ongs | +0.267 |
bars | +0.266 |
Neg logit contributions | |
osate | -0.467 |
� | -0.356 |
ongyang | -0.356 |
insula | -0.353 |
withd | -0.348 |
Token | internally |
Token ID | 20947 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
osate | +0.289 |
� | +0.215 |
ongyang | +0.215 |
insula | +0.212 |
withd | +0.209 |
Neg logit contributions | |
Carbuncle | -0.234 |
hemy | -0.221 |
ndra | -0.216 |
ongs | -0.207 |
dh | -0.205 |
Token | understand |
Token ID | 1833 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
osate | +0.963 |
� | +0.690 |
ongyang | +0.688 |
insula | +0.677 |
withd | +0.669 |
Neg logit contributions | |
Carbuncle | -0.970 |
hemy | -0.923 |
ndra | -0.902 |
ongs | -0.869 |
dh | -0.864 |
Token | their |
Token ID | 511 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
osate | +0.520 |
� | +0.390 |
ongyang | +0.387 |
insula | +0.382 |
withd | +0.378 |
Neg logit contributions | |
Carbuncle | -0.406 |
hemy | -0.384 |
ndra | -0.373 |
ongs | -0.360 |
bars | -0.358 |
Token | heavy |
Token ID | 4334 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
osate | +0.389 |
ongyang | +0.295 |
� | +0.294 |
insula | +0.290 |
withd | +0.288 |
Neg logit contributions | |
Carbuncle | -0.265 |
hemy | -0.246 |
ndra | -0.243 |
ongs | -0.229 |
dh | -0.228 |
Token | - |
Token ID | 12 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
osate | +0.205 |
ongyang | +0.143 |
� | +0.141 |
insula | +0.141 |
withd | +0.136 |
Neg logit contributions | |
Carbuncle | -0.226 |
ndra | -0.213 |
hemy | -0.212 |
bars | -0.205 |
dh | -0.202 |
Token | lift |
Token ID | 26282 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
osate | +0.383 |
ongyang | +0.241 |
� | +0.239 |
insula | +0.233 |
withd | +0.228 |
Neg logit contributions | |
Carbuncle | -0.589 |
hemy | -0.565 |
ndra | -0.562 |
dh | -0.546 |
ongs | -0.539 |
Token | rocket |
Token ID | 10701 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
osate | +1.282 |
ongyang | +0.933 |
� | +0.931 |
insula | +0.921 |
withd | +0.907 |
Neg logit contributions | |
Carbuncle | -1.116 |
hemy | -1.047 |
ndra | -1.035 |
ongs | -0.988 |
bars | -0.986 |
Token | and |
Token ID | 290 |
Feature activation | +4.32e-01 |
Pos logit contributions | |
osate | +1.138 |
ongyang | +0.862 |
� | +0.861 |
insula | +0.849 |
withd | +0.841 |
Neg logit contributions | |
Carbuncle | -0.787 |
hemy | -0.737 |
ndra | -0.721 |
ongs | -0.686 |
dh | -0.681 |
Token | Orion |
Token ID | 26153 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
osate | +0.434 |
ongyang | +0.323 |
� | +0.321 |
insula | +0.318 |
withd | +0.313 |
Neg logit contributions | |
Carbuncle | -0.330 |
hemy | -0.306 |
ndra | -0.304 |
ongs | -0.289 |
bars | -0.289 |
Token | spacecraft |
Token ID | 16807 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
osate | +2.079 |
ongyang | +1.517 |
� | +1.515 |
insula | +1.494 |
withd | +1.477 |
Neg logit contributions | |
Carbuncle | -1.854 |
hemy | -1.751 |
ndra | -1.715 |
ongs | -1.647 |
bars | -1.634 |
Token | . |
Token ID | 13 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
osate | +1.247 |
ongyang | +0.958 |
� | +0.956 |
insula | +0.945 |
withd | +0.938 |
Neg logit contributions | |
Carbuncle | -0.766 |
hemy | -0.712 |
ndra | -0.696 |
ongs | -0.660 |
dh | -0.654 |
Token | � |
Token ID | 564 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
osate | +0.034 |
ongyang | +0.025 |
� | +0.025 |
insula | +0.025 |
withd | +0.025 |
Neg logit contributions | |
Carbuncle | -0.027 |
hemy | -0.025 |
ndra | -0.025 |
ongs | -0.024 |
dh | -0.023 |
Token | � |
Token ID | 250 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
Carbuncle | +0.260 |
hemy | +0.245 |
ndra | +0.238 |
ongs | +0.227 |
dh | +0.226 |
Neg logit contributions | |
osate | -0.370 |
� | -0.281 |
ongyang | -0.280 |
insula | -0.276 |
withd | -0.275 |
Token | That |
Token ID | 2504 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
osate | +0.291 |
ongyang | +0.216 |
� | +0.215 |
insula | +0.213 |
withd | +0.212 |
Neg logit contributions | |
Carbuncle | -0.233 |
hemy | -0.221 |
ndra | -0.216 |
ongs | -0.206 |
dh | -0.206 |
Token | size |
Token ID | 7857 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
Carbuncle | +0.016 |
hemy | +0.015 |
ndra | +0.014 |
dh | +0.014 |
ongs | +0.014 |
Neg logit contributions | |
osate | -0.022 |
ongyang | -0.016 |
� | -0.016 |
insula | -0.016 |
withd | -0.016 |
Token | : |
Token ID | 25 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
Carbuncle | +0.145 |
hemy | +0.137 |
ndra | +0.133 |
bars | +0.129 |
dh | +0.128 |
Neg logit contributions | |
osate | -0.178 |
ongyang | -0.131 |
� | -0.131 |
insula | -0.129 |
withd | -0.127 |
Token | Pro |
Token ID | 1041 |
Feature activation | +5.21e-02 |
Pos logit contributions | |
Carbuncle | +0.115 |
hemy | +0.108 |
ndra | +0.105 |
dh | +0.100 |
ongs | +0.100 |
Neg logit contributions | |
osate | -0.151 |
ongyang | -0.113 |
� | -0.113 |
insula | -0.111 |
withd | -0.110 |
Token | pe |
Token ID | 431 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
osate | +0.052 |
ongyang | +0.039 |
� | +0.039 |
insula | +0.039 |
withd | +0.038 |
Neg logit contributions | |
Carbuncle | -0.040 |
hemy | -0.037 |
ndra | -0.036 |
dh | -0.035 |
bars | -0.035 |
Token | ller |
Token ID | 6051 |
Feature activation | +6.89e-01 |
Pos logit contributions | |
osate | +0.660 |
� | +0.524 |
withd | +0.522 |
insula | +0.518 |
ongyang | +0.515 |
Neg logit contributions | |
Carbuncle | -0.285 |
hemy | -0.266 |
ndra | -0.254 |
ongs | -0.238 |
dh | -0.237 |
Token | Blade |
Token ID | 47520 |
Feature activation | +2.18e+00 |
Pos logit contributions | |
osate | +0.723 |
ongyang | +0.552 |
� | +0.550 |
insula | +0.541 |
withd | +0.532 |
Neg logit contributions | |
Carbuncle | -0.491 |
hemy | -0.462 |
ndra | -0.446 |
bars | -0.428 |
ongs | -0.425 |
Token | / |
Token ID | 1220 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
osate | +2.143 |
ongyang | +1.597 |
� | +1.596 |
insula | +1.573 |
withd | +1.551 |
Neg logit contributions | |
Carbuncle | -1.695 |
hemy | -1.604 |
ndra | -1.556 |
ongs | -1.491 |
dh | -1.486 |
Token | 8 |
Token ID | 807 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
osate | +0.126 |
ongyang | +0.095 |
� | +0.095 |
insula | +0.094 |
withd | +0.093 |
Neg logit contributions | |
Carbuncle | -0.092 |
hemy | -0.086 |
ndra | -0.084 |
ongs | -0.080 |
dh | -0.080 |
Token | cm |
Token ID | 11215 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
osate | +0.240 |
ongyang | +0.181 |
� | +0.180 |
insula | +0.179 |
withd | +0.176 |
Neg logit contributions | |
Carbuncle | -0.170 |
hemy | -0.159 |
ndra | -0.155 |
ongs | -0.149 |
dh | -0.148 |
Token |
|
Token ID | 198 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
osate | +0.167 |
ongyang | +0.126 |
� | +0.126 |
insula | +0.124 |
withd | +0.123 |
Neg logit contributions | |
Carbuncle | -0.119 |
hemy | -0.112 |
ndra | -0.109 |
dh | -0.104 |
bars | -0.104 |
Token |
|
Token ID | 198 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
osate | +0.114 |
� | +0.083 |
ongyang | +0.082 |
insula | +0.080 |
satisf | +0.080 |
Neg logit contributions | |
Carbuncle | -0.114 |
hemy | -0.108 |
ndra | -0.105 |
ongs | -0.102 |
bars | -0.100 |
Token | worth |
Token ID | 2861 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
osate | +0.355 |
ongyang | +0.265 |
� | +0.264 |
insula | +0.261 |
withd | +0.258 |
Neg logit contributions | |
Carbuncle | -0.273 |
hemy | -0.257 |
ndra | -0.251 |
ongs | -0.241 |
bars | -0.239 |
Token | millions |
Token ID | 5242 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
osate | +0.223 |
ongyang | +0.172 |
� | +0.172 |
insula | +0.170 |
withd | +0.168 |
Neg logit contributions | |
Carbuncle | -0.135 |
hemy | -0.126 |
ndra | -0.122 |
ongs | -0.116 |
bars | -0.115 |
Token | of |
Token ID | 286 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
osate | +0.323 |
ongyang | +0.247 |
� | +0.246 |
insula | +0.244 |
withd | +0.241 |
Neg logit contributions | |
Carbuncle | -0.213 |
hemy | -0.200 |
ndra | -0.195 |
ongs | -0.187 |
bars | -0.185 |
Token | dollars |
Token ID | 5054 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
osate | +0.425 |
� | +0.333 |
ongyang | +0.332 |
insula | +0.328 |
withd | +0.327 |
Neg logit contributions | |
Carbuncle | -0.235 |
hemy | -0.219 |
ndra | -0.212 |
ongs | -0.200 |
dh | -0.198 |
Token | . |
Token ID | 13 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
osate | +0.766 |
ongyang | +0.579 |
� | +0.578 |
insula | +0.572 |
withd | +0.565 |
Neg logit contributions | |
Carbuncle | -0.540 |
hemy | -0.508 |
ndra | -0.494 |
ongs | -0.474 |
bars | -0.470 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
osate | +0.131 |
� | +0.099 |
ongyang | +0.098 |
insula | +0.097 |
withd | +0.096 |
Neg logit contributions | |
Carbuncle | -0.099 |
hemy | -0.093 |
ndra | -0.091 |
ongs | -0.087 |
dh | -0.086 |
Token | should |
Token ID | 815 |
Feature activation | +7.63e-01 |
Pos logit contributions | |
osate | +2.134 |
� | +1.614 |
ongyang | +1.606 |
satisf | +1.582 |
insula | +1.580 |
Neg logit contributions | |
Carbuncle | -1.635 |
hemy | -1.546 |
ndra | -1.496 |
ongs | -1.437 |
dh | -1.423 |
Token | not |
Token ID | 407 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
osate | +0.661 |
� | +0.470 |
ongyang | +0.469 |
insula | +0.462 |
withd | +0.455 |
Neg logit contributions | |
Carbuncle | -0.680 |
hemy | -0.649 |
ndra | -0.635 |
ongs | -0.612 |
dh | -0.608 |
Token | benefit |
Token ID | 4414 |
Feature activation | +8.52e-03 |
Pos logit contributions | |
osate | +0.515 |
� | +0.364 |
ongyang | +0.363 |
insula | +0.357 |
Fug | +0.352 |
Neg logit contributions | |
Carbuncle | -0.549 |
hemy | -0.523 |
ndra | -0.512 |
ongs | -0.494 |
dh | -0.491 |
Token | simply |
Token ID | 2391 |
Feature activation | +6.18e-01 |
Pos logit contributions | |
osate | +0.009 |
ongyang | +0.007 |
� | +0.007 |
insula | +0.007 |
withd | +0.007 |
Neg logit contributions | |
Carbuncle | -0.006 |
hemy | -0.006 |
ndra | -0.005 |
ongs | -0.005 |
bars | -0.005 |
Token | because |
Token ID | 780 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
osate | +0.622 |
� | +0.468 |
ongyang | +0.468 |
insula | +0.461 |
withd | +0.457 |
Neg logit contributions | |
Carbuncle | -0.465 |
hemy | -0.439 |
ndra | -0.426 |
ongs | -0.409 |
bars | -0.405 |
Token | C |
Token ID | 34 |
Feature activation | +8.18e-01 |
Pos logit contributions | |
Carbuncle | +0.040 |
hemy | +0.038 |
ndra | +0.037 |
dh | +0.035 |
ongs | +0.035 |
Neg logit contributions | |
osate | -0.049 |
ongyang | -0.036 |
� | -0.035 |
insula | -0.035 |
withd | -0.035 |
Token | AS |
Token ID | 1921 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
osate | +0.811 |
� | +0.609 |
ongyang | +0.607 |
insula | +0.599 |
withd | +0.595 |
Neg logit contributions | |
Carbuncle | -0.624 |
hemy | -0.591 |
ndra | -0.573 |
ongs | -0.550 |
dh | -0.545 |
Token | INO |
Token ID | 46016 |
Feature activation | -5.26e-02 |
Pos logit contributions | |
Carbuncle | +0.215 |
hemy | +0.201 |
ndra | +0.195 |
ongs | +0.186 |
dh | +0.185 |
Neg logit contributions | |
osate | -0.320 |
ongyang | -0.245 |
� | -0.243 |
insula | -0.240 |
withd | -0.239 |
Token | RO |
Token ID | 15107 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
Carbuncle | +0.039 |
hemy | +0.037 |
ndra | +0.036 |
ongs | +0.034 |
dh | +0.034 |
Neg logit contributions | |
osate | -0.053 |
ongyang | -0.040 |
� | -0.040 |
insula | -0.040 |
withd | -0.039 |
Token | Y |
Token ID | 56 |
Feature activation | +4.68e-01 |
Pos logit contributions | |
osate | +0.349 |
ongyang | +0.271 |
� | +0.269 |
insula | +0.267 |
withd | +0.265 |
Neg logit contributions | |
Carbuncle | -0.206 |
hemy | -0.192 |
ndra | -0.186 |
ongs | -0.176 |
dh | -0.176 |
Token | ALE |
Token ID | 21358 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
osate | +0.470 |
ongyang | +0.355 |
insula | +0.351 |
� | +0.349 |
withd | +0.346 |
Neg logit contributions | |
Carbuncle | -0.356 |
hemy | -0.328 |
ndra | -0.322 |
ongs | -0.309 |
bars | -0.308 |
Token | " |
Token ID | 1 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
osate | +2.142 |
� | +1.624 |
ongyang | +1.611 |
insula | +1.591 |
Fug | +1.582 |
Neg logit contributions | |
Carbuncle | -1.597 |
hemy | -1.511 |
ndra | -1.466 |
ongs | -1.401 |
dh | -1.386 |
Token | - |
Token ID | 532 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
osate | +0.220 |
ongyang | +0.163 |
� | +0.162 |
insula | +0.161 |
satisf | +0.159 |
Neg logit contributions | |
Carbuncle | -0.171 |
hemy | -0.161 |
ndra | -0.156 |
ongs | -0.151 |
dh | -0.151 |
Token | starring |
Token ID | 20495 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
osate | +0.286 |
ongyang | +0.215 |
� | +0.214 |
insula | +0.212 |
withd | +0.209 |
Neg logit contributions | |
Carbuncle | -0.217 |
hemy | -0.204 |
ndra | -0.199 |
ongs | -0.191 |
bars | -0.189 |
Token | Barry |
Token ID | 14488 |
Feature activation | -7.28e-02 |
Pos logit contributions | |
osate | +0.701 |
ongyang | +0.518 |
� | +0.516 |
insula | +0.510 |
withd | +0.502 |
Neg logit contributions | |
Carbuncle | -0.594 |
hemy | -0.557 |
ndra | -0.543 |
ongs | -0.524 |
bars | -0.521 |
Token | Nelson |
Token ID | 12996 |
Feature activation | +8.37e-02 |
Pos logit contributions | |
Carbuncle | +0.053 |
hemy | +0.050 |
ndra | +0.049 |
dh | +0.047 |
ongs | +0.047 |
Neg logit contributions | |
osate | -0.074 |
ongyang | -0.057 |
� | -0.056 |
insula | -0.056 |
withd | -0.055 |
Token | hole |
Token ID | 13207 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
Carbuncle | +0.193 |
hemy | +0.179 |
ndra | +0.173 |
ongs | +0.164 |
bars | +0.163 |
Neg logit contributions | |
osate | -0.290 |
ongyang | -0.223 |
� | -0.222 |
insula | -0.220 |
satisf | -0.218 |
Token | images |
Token ID | 4263 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
osate | +0.598 |
ongyang | +0.450 |
� | +0.450 |
insula | +0.447 |
withd | +0.441 |
Neg logit contributions | |
Carbuncle | -0.410 |
hemy | -0.387 |
ndra | -0.372 |
bars | -0.367 |
ongs | -0.366 |
Token | for |
Token ID | 329 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
osate | +0.850 |
ongyang | +0.581 |
� | +0.579 |
insula | +0.571 |
withd | +0.557 |
Neg logit contributions | |
Carbuncle | -1.014 |
hemy | -0.965 |
ndra | -0.945 |
ongs | -0.921 |
bars | -0.915 |
Token | a |
Token ID | 257 |
Feature activation | +9.26e-02 |
Pos logit contributions | |
osate | +0.282 |
� | +0.214 |
insula | +0.213 |
ongyang | +0.213 |
withd | +0.209 |
Neg logit contributions | |
Carbuncle | -0.187 |
hemy | -0.174 |
ndra | -0.170 |
bars | -0.163 |
ongs | -0.163 |
Token | typical |
Token ID | 7226 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
osate | +0.094 |
� | +0.070 |
ongyang | +0.070 |
insula | +0.070 |
withd | +0.068 |
Neg logit contributions | |
Carbuncle | -0.070 |
hemy | -0.065 |
ndra | -0.064 |
ongs | -0.061 |
dh | -0.061 |
Token | Canon |
Token ID | 19507 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
Carbuncle | +0.102 |
hemy | +0.096 |
ndra | +0.094 |
ongs | +0.090 |
dh | +0.090 |
Neg logit contributions | |
osate | -0.129 |
� | -0.096 |
ongyang | -0.096 |
insula | -0.095 |
withd | -0.093 |
Token | 16 |
Token ID | 1467 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
osate | +2.040 |
� | +1.519 |
ongyang | +1.515 |
insula | +1.501 |
withd | +1.481 |
Neg logit contributions | |
Carbuncle | -1.643 |
hemy | -1.550 |
ndra | -1.510 |
ongs | -1.450 |
dh | -1.439 |
Token | - |
Token ID | 12 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
osate | +0.396 |
ongyang | +0.297 |
insula | +0.296 |
� | +0.296 |
withd | +0.292 |
Neg logit contributions | |
Carbuncle | -0.281 |
hemy | -0.265 |
ndra | -0.257 |
ongs | -0.249 |
bars | -0.248 |
Token | 35 |
Token ID | 2327 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
osate | +0.281 |
ongyang | +0.216 |
� | +0.216 |
insula | +0.215 |
withd | +0.213 |
Neg logit contributions | |
Carbuncle | -0.160 |
hemy | -0.149 |
ndra | -0.146 |
dh | -0.139 |
ongs | -0.138 |
Token | f |
Token ID | 277 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
osate | +0.153 |
insula | +0.115 |
ongyang | +0.114 |
� | +0.114 |
withd | +0.112 |
Neg logit contributions | |
Carbuncle | -0.115 |
hemy | -0.108 |
ndra | -0.105 |
ongs | -0.102 |
bars | -0.102 |
Token | / |
Token ID | 14 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
osate | +0.589 |
� | +0.424 |
ongyang | +0.422 |
insula | +0.413 |
satisf | +0.411 |
Neg logit contributions | |
Carbuncle | -0.595 |
hemy | -0.567 |
ndra | -0.551 |
ongs | -0.531 |
bars | -0.527 |
Token | t |
Token ID | 256 |
Feature activation | -6.09e-01 |
Pos logit contributions | |
Carbuncle | +0.003 |
hemy | +0.003 |
ndra | +0.003 |
ongs | +0.003 |
bars | +0.003 |
Neg logit contributions | |
osate | -0.004 |
ongyang | -0.003 |
� | -0.003 |
insula | -0.003 |
withd | -0.003 |
Token | rolled |
Token ID | 8375 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
Carbuncle | +0.405 |
hemy | +0.379 |
ndra | +0.368 |
ongs | +0.350 |
dh | +0.347 |
Neg logit contributions | |
osate | -0.663 |
� | -0.513 |
ongyang | -0.512 |
insula | -0.505 |
withd | -0.503 |
Token | , |
Token ID | 11 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
osate | +0.940 |
ongyang | +0.701 |
� | +0.700 |
insula | +0.691 |
withd | +0.682 |
Neg logit contributions | |
Carbuncle | -0.741 |
hemy | -0.703 |
ndra | -0.680 |
ongs | -0.656 |
dh | -0.651 |
Token | dog |
Token ID | 3290 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
osate | +0.406 |
ongyang | +0.302 |
� | +0.301 |
insula | +0.297 |
withd | +0.293 |
Neg logit contributions | |
Carbuncle | -0.326 |
hemy | -0.307 |
ndra | -0.299 |
ongs | -0.287 |
bars | -0.286 |
Token | p |
Token ID | 79 |
Feature activation | +8.04e-01 |
Pos logit contributions | |
osate | +0.400 |
� | +0.308 |
ongyang | +0.306 |
insula | +0.301 |
Fug | +0.300 |
Neg logit contributions | |
Carbuncle | -0.276 |
hemy | -0.261 |
ndra | -0.252 |
ongs | -0.239 |
dh | -0.235 |
Token | iled |
Token ID | 3902 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
osate | +0.598 |
ongyang | +0.404 |
insula | +0.397 |
� | +0.393 |
satisf | +0.385 |
Neg logit contributions | |
Carbuncle | -0.816 |
hemy | -0.771 |
ndra | -0.752 |
bars | -0.724 |
ongs | -0.723 |
Token | on |
Token ID | 319 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
osate | +1.998 |
� | +1.495 |
ongyang | +1.490 |
insula | +1.469 |
withd | +1.459 |
Neg logit contributions | |
Carbuncle | -1.586 |
hemy | -1.499 |
ndra | -1.460 |
ongs | -1.396 |
dh | -1.386 |
Token | , |
Token ID | 11 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
osate | +0.387 |
� | +0.301 |
ongyang | +0.301 |
insula | +0.297 |
withd | +0.295 |
Neg logit contributions | |
Carbuncle | -0.220 |
hemy | -0.205 |
ndra | -0.198 |
ongs | -0.188 |
dh | -0.186 |
Token | dumped |
Token ID | 24105 |
Feature activation | -4.62e-04 |
Pos logit contributions | |
osate | +0.547 |
ongyang | +0.407 |
� | +0.407 |
insula | +0.402 |
withd | +0.397 |
Neg logit contributions | |
Carbuncle | -0.434 |
hemy | -0.410 |
ndra | -0.399 |
ongs | -0.382 |
bars | -0.381 |
Token | on |
Token ID | 319 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
Carbuncle | +0.000 |
hemy | +0.000 |
ndra | +0.000 |
ongs | +0.000 |
dh | +0.000 |
Neg logit contributions | |
osate | -0.000 |
� | -0.000 |
ongyang | -0.000 |
insula | -0.000 |
withd | -0.000 |
Token | with |
Token ID | 351 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
Carbuncle | +0.024 |
hemy | +0.023 |
ndra | +0.022 |
ongs | +0.021 |
bars | +0.021 |
Neg logit contributions | |
osate | -0.032 |
� | -0.024 |
ongyang | -0.024 |
insula | -0.024 |
withd | -0.024 |
Token | have |
Token ID | 423 |
Feature activation | +7.09e-01 |
Pos logit contributions | |
osate | +0.303 |
� | +0.222 |
ongyang | +0.222 |
insula | +0.219 |
withd | +0.215 |
Neg logit contributions | |
Carbuncle | -0.269 |
hemy | -0.254 |
ndra | -0.249 |
ongs | -0.238 |
bars | -0.237 |
Token | to |
Token ID | 284 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
osate | +0.735 |
� | +0.559 |
ongyang | +0.558 |
insula | +0.551 |
withd | +0.547 |
Neg logit contributions | |
Carbuncle | -0.511 |
hemy | -0.480 |
ndra | -0.467 |
ongs | -0.445 |
dh | -0.442 |
Token | get |
Token ID | 651 |
Feature activation | +4.69e-01 |
Pos logit contributions | |
osate | +0.445 |
ongyang | +0.323 |
� | +0.322 |
insula | +0.317 |
withd | +0.311 |
Neg logit contributions | |
Carbuncle | -0.416 |
hemy | -0.393 |
ndra | -0.385 |
ongs | -0.371 |
bars | -0.369 |
Token | a |
Token ID | 257 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
osate | +0.476 |
ongyang | +0.356 |
� | +0.355 |
insula | +0.353 |
withd | +0.348 |
Neg logit contributions | |
Carbuncle | -0.351 |
hemy | -0.330 |
ndra | -0.322 |
bars | -0.310 |
ongs | -0.308 |
Token | prost |
Token ID | 11825 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
osate | +0.238 |
ongyang | +0.178 |
� | +0.177 |
insula | +0.176 |
withd | +0.173 |
Neg logit contributions | |
Carbuncle | -0.178 |
hemy | -0.168 |
ndra | -0.162 |
bars | -0.157 |
dh | -0.156 |
Token | hetic |
Token ID | 6587 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
osate | +1.073 |
� | +0.810 |
ongyang | +0.804 |
withd | +0.798 |
insula | +0.791 |
Neg logit contributions | |
Carbuncle | -0.807 |
hemy | -0.773 |
ndra | -0.741 |
ongs | -0.717 |
dh | -0.716 |
Token | penis |
Token ID | 16360 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
osate | +1.965 |
� | +1.460 |
ongyang | +1.457 |
insula | +1.436 |
withd | +1.425 |
Neg logit contributions | |
Carbuncle | -1.614 |
hemy | -1.526 |
ndra | -1.487 |
ongs | -1.425 |
dh | -1.415 |
Token | and |
Token ID | 290 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
osate | +1.090 |
ongyang | +0.820 |
� | +0.814 |
insula | +0.809 |
withd | +0.798 |
Neg logit contributions | |
Carbuncle | -0.813 |
hemy | -0.765 |
ndra | -0.746 |
bars | -0.716 |
ongs | -0.715 |
Token | God |
Token ID | 1793 |
Feature activation | +6.28e-01 |
Pos logit contributions | |
osate | +0.589 |
ongyang | +0.440 |
� | +0.439 |
insula | +0.435 |
withd | +0.428 |
Neg logit contributions | |
Carbuncle | -0.455 |
hemy | -0.427 |
ndra | -0.418 |
ongs | -0.400 |
bars | -0.400 |
Token | help |
Token ID | 1037 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
osate | +0.614 |
ongyang | +0.458 |
� | +0.458 |
insula | +0.453 |
withd | +0.447 |
Neg logit contributions | |
Carbuncle | -0.487 |
hemy | -0.462 |
ndra | -0.451 |
ongs | -0.432 |
dh | -0.429 |
Token | me |
Token ID | 502 |
Feature activation | +6.63e-01 |
Pos logit contributions | |
osate | +0.824 |
ongyang | +0.637 |
� | +0.636 |
insula | +0.628 |
withd | +0.624 |
Neg logit contributions | |
Carbuncle | -0.511 |
hemy | -0.476 |
ndra | -0.461 |
ongs | -0.439 |
bars | -0.437 |
Token | one |
Token ID | 530 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
osate | +0.368 |
ongyang | +0.270 |
� | +0.270 |
insula | +0.267 |
withd | +0.264 |
Neg logit contributions | |
Carbuncle | -0.324 |
hemy | -0.306 |
ndra | -0.298 |
ongs | -0.287 |
bars | -0.286 |
Token | touchdown |
Token ID | 10242 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
osate | +0.419 |
� | +0.316 |
ongyang | +0.316 |
insula | +0.311 |
withd | +0.309 |
Neg logit contributions | |
Carbuncle | -0.308 |
hemy | -0.291 |
ndra | -0.283 |
ongs | -0.270 |
dh | -0.268 |
Token | .) |
Token ID | 2014 |
Feature activation | +7.21e-01 |
Pos logit contributions | |
osate | +0.385 |
� | +0.295 |
ongyang | +0.294 |
insula | +0.290 |
withd | +0.288 |
Neg logit contributions | |
Carbuncle | -0.261 |
hemy | -0.246 |
ndra | -0.238 |
ongs | -0.227 |
dh | -0.225 |
Token |
|
Token ID | 198 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
osate | +0.712 |
ongyang | +0.532 |
� | +0.531 |
insula | +0.525 |
withd | +0.521 |
Neg logit contributions | |
Carbuncle | -0.557 |
hemy | -0.524 |
ndra | -0.511 |
ongs | -0.489 |
dh | -0.486 |
Token |
|
Token ID | 198 |
Feature activation | +7.42e-01 |
Pos logit contributions | |
osate | +0.654 |
� | +0.476 |
ongyang | +0.461 |
Fug | +0.458 |
satisf | +0.456 |
Neg logit contributions | |
Carbuncle | -0.697 |
hemy | -0.666 |
ndra | -0.645 |
ongs | -0.625 |
bars | -0.617 |
Token | Mc |
Token ID | 9742 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
osate | +0.714 |
ongyang | +0.527 |
� | +0.523 |
withd | +0.520 |
insula | +0.520 |
Neg logit contributions | |
Carbuncle | -0.589 |
hemy | -0.562 |
ndra | -0.547 |
dh | -0.526 |
ongs | -0.523 |
Token | F |
Token ID | 37 |
Feature activation | +5.70e-01 |
Pos logit contributions | |
osate | +2.255 |
� | +1.761 |
ongyang | +1.750 |
insula | +1.733 |
satisf | +1.720 |
Neg logit contributions | |
Carbuncle | -1.312 |
hemy | -1.225 |
ndra | -1.181 |
ongs | -1.124 |
bars | -1.107 |
Token | adden |
Token ID | 38014 |
Feature activation | +6.21e-01 |
Pos logit contributions | |
osate | +0.447 |
ongyang | +0.311 |
� | +0.306 |
insula | +0.301 |
satisf | +0.298 |
Neg logit contributions | |
Carbuncle | -0.554 |
hemy | -0.524 |
ndra | -0.514 |
ongs | -0.494 |
bars | -0.493 |
Token | � |
Token ID | 447 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
osate | +0.599 |
� | +0.446 |
ongyang | +0.445 |
insula | +0.439 |
withd | +0.435 |
Neg logit contributions | |
Carbuncle | -0.491 |
hemy | -0.465 |
ndra | -0.453 |
ongs | -0.434 |
dh | -0.431 |
Token | � |
Token ID | 247 |
Feature activation | +3.62e-01 |
Pos logit contributions | |
osate | +0.251 |
� | +0.190 |
ongyang | +0.189 |
insula | +0.187 |
satisf | +0.185 |
Neg logit contributions | |
Carbuncle | -0.181 |
hemy | -0.170 |
ndra | -0.166 |
ongs | -0.158 |
dh | -0.157 |
Token | s |
Token ID | 82 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
osate | +0.355 |
ongyang | +0.265 |
� | +0.265 |
insula | +0.262 |
withd | +0.259 |
Neg logit contributions | |
Carbuncle | -0.281 |
hemy | -0.265 |
ndra | -0.259 |
ongs | -0.247 |
dh | -0.246 |
Token | traffic |
Token ID | 4979 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
osate | +0.180 |
� | +0.137 |
ongyang | +0.137 |
insula | +0.135 |
withd | +0.134 |
Neg logit contributions | |
Carbuncle | -0.126 |
hemy | -0.119 |
ndra | -0.115 |
ongs | -0.110 |
bars | -0.110 |
Token | control |
Token ID | 1630 |
Feature activation | +4.97e-01 |
Pos logit contributions | |
osate | +0.165 |
ongyang | +0.131 |
� | +0.130 |
insula | +0.129 |
withd | +0.128 |
Neg logit contributions | |
Carbuncle | -0.077 |
hemy | -0.071 |
ndra | -0.067 |
bars | -0.064 |
dh | -0.064 |
Token | and |
Token ID | 290 |
Feature activation | +7.88e-01 |
Pos logit contributions | |
osate | +0.508 |
ongyang | +0.384 |
� | +0.383 |
insula | +0.378 |
withd | +0.375 |
Neg logit contributions | |
Carbuncle | -0.366 |
hemy | -0.344 |
ndra | -0.334 |
ongs | -0.320 |
bars | -0.319 |
Token | surveillance |
Token ID | 8452 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
osate | +0.812 |
� | +0.617 |
ongyang | +0.616 |
insula | +0.607 |
withd | +0.603 |
Neg logit contributions | |
Carbuncle | -0.572 |
hemy | -0.538 |
ndra | -0.523 |
ongs | -0.499 |
dh | -0.496 |
Token | . |
Token ID | 13 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
osate | +0.280 |
ongyang | +0.216 |
� | +0.216 |
insula | +0.213 |
withd | +0.212 |
Neg logit contributions | |
Carbuncle | -0.169 |
hemy | -0.158 |
ndra | -0.153 |
ongs | -0.146 |
bars | -0.145 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
osate | +0.468 |
ongyang | +0.349 |
� | +0.346 |
insula | +0.342 |
withd | +0.341 |
Neg logit contributions | |
Carbuncle | -0.383 |
hemy | -0.361 |
ndra | -0.353 |
ongs | -0.337 |
dh | -0.336 |
Token | � |
Token ID | 447 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
osate | +1.893 |
� | +1.398 |
ongyang | +1.391 |
insula | +1.369 |
withd | +1.362 |
Neg logit contributions | |
Carbuncle | -1.667 |
hemy | -1.582 |
ndra | -1.541 |
ongs | -1.480 |
dh | -1.468 |
Token | � |
Token ID | 247 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
osate | +0.212 |
� | +0.160 |
ongyang | +0.160 |
insula | +0.157 |
withd | +0.156 |
Neg logit contributions | |
Carbuncle | -0.154 |
hemy | -0.145 |
ndra | -0.141 |
ongs | -0.135 |
dh | -0.134 |
Token | s |
Token ID | 82 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
osate | +0.496 |
� | +0.377 |
ongyang | +0.377 |
insula | +0.372 |
withd | +0.369 |
Neg logit contributions | |
Carbuncle | -0.338 |
hemy | -0.317 |
ndra | -0.309 |
ongs | -0.294 |
dh | -0.293 |
Token | office |
Token ID | 2607 |
Feature activation | +7.17e-01 |
Pos logit contributions | |
osate | +0.446 |
� | +0.340 |
ongyang | +0.340 |
insula | +0.335 |
withd | +0.333 |
Neg logit contributions | |
Carbuncle | -0.299 |
hemy | -0.280 |
ndra | -0.273 |
ongs | -0.260 |
dh | -0.258 |
Token | later |
Token ID | 1568 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
osate | +0.677 |
ongyang | +0.494 |
� | +0.492 |
insula | +0.487 |
withd | +0.480 |
Neg logit contributions | |
Carbuncle | -0.588 |
hemy | -0.555 |
ndra | -0.544 |
bars | -0.521 |
ongs | -0.520 |
Token | , |
Token ID | 11 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
osate | +0.032 |
ongyang | +0.024 |
� | +0.024 |
insula | +0.024 |
withd | +0.024 |
Neg logit contributions | |
Carbuncle | -0.020 |
hemy | -0.019 |
ndra | -0.018 |
ongs | -0.018 |
dh | -0.017 |
Token | without |
Token ID | 1231 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
osate | +0.203 |
� | +0.151 |
ongyang | +0.151 |
insula | +0.150 |
withd | +0.147 |
Neg logit contributions | |
Carbuncle | -0.159 |
hemy | -0.149 |
ndra | -0.145 |
ongs | -0.140 |
bars | -0.140 |
Token | a |
Token ID | 257 |
Feature activation | +6.94e-02 |
Pos logit contributions | |
osate | +0.403 |
� | +0.304 |
ongyang | +0.304 |
insula | +0.300 |
withd | +0.295 |
Neg logit contributions | |
Carbuncle | -0.293 |
hemy | -0.272 |
ndra | -0.267 |
bars | -0.256 |
ongs | -0.255 |
Token | single |
Token ID | 2060 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
osate | +0.079 |
� | +0.062 |
ongyang | +0.062 |
insula | +0.061 |
withd | +0.061 |
Neg logit contributions | |
Carbuncle | -0.043 |
hemy | -0.040 |
ndra | -0.039 |
ongs | -0.036 |
bars | -0.036 |
Token | rad |
Token ID | 2511 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
Carbuncle | +0.169 |
hemy | +0.155 |
ndra | +0.155 |
bars | +0.147 |
dh | +0.146 |
Neg logit contributions | |
osate | -0.215 |
� | -0.161 |
ongyang | -0.159 |
insula | -0.158 |
withd | -0.155 |
Token | iological |
Token ID | 15071 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
osate | +0.298 |
� | +0.202 |
ongyang | +0.197 |
insula | +0.196 |
withd | +0.195 |
Neg logit contributions | |
Carbuncle | -0.400 |
hemy | -0.383 |
ndra | -0.375 |
ongs | -0.364 |
dh | -0.362 |
Token | incident |
Token ID | 4519 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
osate | +2.040 |
� | +1.542 |
ongyang | +1.538 |
insula | +1.519 |
withd | +1.506 |
Neg logit contributions | |
Carbuncle | -1.503 |
hemy | -1.411 |
ndra | -1.377 |
ongs | -1.312 |
dh | -1.304 |
Token | , |
Token ID | 11 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
osate | +0.543 |
� | +0.418 |
ongyang | +0.417 |
insula | +0.411 |
withd | +0.406 |
Neg logit contributions | |
Carbuncle | -0.338 |
hemy | -0.315 |
ndra | -0.309 |
ongs | -0.293 |
bars | -0.293 |
Token | over |
Token ID | 625 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
osate | +0.423 |
� | +0.318 |
ongyang | +0.316 |
insula | +0.313 |
withd | +0.308 |
Neg logit contributions | |
Carbuncle | -0.329 |
hemy | -0.309 |
ndra | -0.302 |
ongs | -0.290 |
bars | -0.289 |
Token | a |
Token ID | 257 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
osate | +0.299 |
� | +0.226 |
ongyang | +0.225 |
insula | +0.223 |
withd | +0.221 |
Neg logit contributions | |
Carbuncle | -0.225 |
hemy | -0.211 |
ndra | -0.206 |
ongs | -0.198 |
bars | -0.197 |
Token | period |
Token ID | 2278 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
Carbuncle | +0.023 |
hemy | +0.022 |
ndra | +0.021 |
ongs | +0.021 |
bars | +0.020 |
Neg logit contributions | |
osate | -0.031 |
� | -0.023 |
ongyang | -0.023 |
insula | -0.023 |
withd | -0.023 |
Token | Gender |
Token ID | 41394 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Carbuncle | +0.180 |
hemy | +0.172 |
ndra | +0.169 |
dh | +0.162 |
ongs | +0.161 |
Neg logit contributions | |
osate | -0.218 |
ongyang | -0.161 |
� | -0.159 |
withd | -0.159 |
insula | -0.158 |
Token | flu |
Token ID | 35522 |
Feature activation | +6.95e-01 |
Pos logit contributions | |
osate | +0.424 |
ongyang | +0.329 |
� | +0.328 |
insula | +0.324 |
withd | +0.321 |
Neg logit contributions | |
Carbuncle | -0.254 |
hemy | -0.237 |
ndra | -0.230 |
ongs | -0.220 |
dh | -0.219 |
Token | id |
Token ID | 312 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
osate | +0.657 |
� | +0.489 |
ongyang | +0.485 |
insula | +0.477 |
withd | +0.474 |
Neg logit contributions | |
Carbuncle | -0.562 |
hemy | -0.535 |
ndra | -0.521 |
ongs | -0.499 |
dh | -0.498 |
Token | or |
Token ID | 393 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
osate | +0.028 |
� | +0.021 |
ongyang | +0.021 |
insula | +0.021 |
withd | +0.020 |
Neg logit contributions | |
Carbuncle | -0.022 |
hemy | -0.022 |
ndra | -0.021 |
ongs | -0.020 |
dh | -0.020 |
Token | Gender |
Token ID | 20247 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
osate | +0.187 |
� | +0.139 |
ongyang | +0.138 |
insula | +0.137 |
withd | +0.134 |
Neg logit contributions | |
Carbuncle | -0.156 |
hemy | -0.149 |
ndra | -0.144 |
ongs | -0.139 |
dh | -0.138 |
Token | que |
Token ID | 4188 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
osate | +0.216 |
� | +0.150 |
ongyang | +0.150 |
insula | +0.148 |
withd | +0.145 |
Neg logit contributions | |
Carbuncle | -0.250 |
hemy | -0.239 |
ndra | -0.234 |
ongs | -0.227 |
dh | -0.226 |
Token | er |
Token ID | 263 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
osate | +2.273 |
ongyang | +1.788 |
� | +1.775 |
satisf | +1.765 |
enes | +1.765 |
Neg logit contributions | |
Carbuncle | -1.232 |
hemy | -1.126 |
ndra | -1.067 |
ongs | -1.024 |
bars | -1.018 |
Token | : |
Token ID | 25 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
Carbuncle | +0.421 |
hemy | +0.402 |
ndra | +0.389 |
ongs | +0.381 |
bars | +0.376 |
Neg logit contributions | |
osate | -0.542 |
ongyang | -0.404 |
� | -0.404 |
insula | -0.401 |
withd | -0.397 |
Token | Gender |
Token ID | 20247 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
osate | +0.469 |
� | +0.352 |
ongyang | +0.351 |
insula | +0.346 |
withd | +0.344 |
Neg logit contributions | |
Carbuncle | -0.365 |
hemy | -0.345 |
ndra | -0.336 |
ongs | -0.321 |
dh | -0.319 |
Token | flu |
Token ID | 35522 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
osate | +0.320 |
� | +0.235 |
ongyang | +0.232 |
insula | +0.229 |
withd | +0.226 |
Neg logit contributions | |
Carbuncle | -0.295 |
hemy | -0.283 |
ndra | -0.275 |
ongs | -0.265 |
dh | -0.264 |
Token | id |
Token ID | 312 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
osate | +0.892 |
ongyang | +0.645 |
insula | +0.635 |
enes | +0.629 |
� | +0.626 |
Neg logit contributions | |
Carbuncle | -0.892 |
hemy | -0.837 |
ndra | -0.813 |
ongs | -0.783 |
bars | -0.782 |
Token | church |
Token ID | 4928 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
Carbuncle | +0.039 |
hemy | +0.037 |
ndra | +0.035 |
ongs | +0.034 |
dh | +0.034 |
Neg logit contributions | |
osate | -0.053 |
� | -0.040 |
ongyang | -0.040 |
insula | -0.039 |
withd | -0.039 |
Token | 's |
Token ID | 338 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
osate | +0.430 |
� | +0.325 |
ongyang | +0.324 |
insula | +0.320 |
withd | +0.317 |
Neg logit contributions | |
Carbuncle | -0.316 |
hemy | -0.298 |
ndra | -0.290 |
ongs | -0.277 |
dh | -0.275 |
Token | official |
Token ID | 1743 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
Carbuncle | +0.326 |
hemy | +0.307 |
ndra | +0.298 |
ongs | +0.285 |
dh | +0.283 |
Neg logit contributions | |
osate | -0.449 |
� | -0.340 |
ongyang | -0.339 |
insula | -0.335 |
withd | -0.332 |
Token | policy |
Token ID | 2450 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
Carbuncle | +0.093 |
hemy | +0.087 |
ndra | +0.085 |
ongs | +0.081 |
dh | +0.081 |
Neg logit contributions | |
osate | -0.116 |
� | -0.087 |
ongyang | -0.087 |
insula | -0.085 |
withd | -0.085 |
Token | hand |
Token ID | 1021 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
osate | +0.024 |
� | +0.018 |
ongyang | +0.018 |
insula | +0.018 |
withd | +0.018 |
Neg logit contributions | |
Carbuncle | -0.020 |
hemy | -0.019 |
ndra | -0.018 |
bars | -0.017 |
ongs | -0.017 |
Token | book |
Token ID | 2070 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
osate | +0.346 |
� | +0.242 |
ongyang | +0.241 |
insula | +0.237 |
withd | +0.235 |
Neg logit contributions | |
Carbuncle | -0.388 |
hemy | -0.370 |
ndra | -0.362 |
ongs | -0.350 |
dh | -0.349 |
Token | and |
Token ID | 290 |
Feature activation | +4.62e-02 |
Pos logit contributions | |
osate | +1.904 |
� | +1.414 |
ongyang | +1.410 |
insula | +1.387 |
withd | +1.383 |
Neg logit contributions | |
Carbuncle | -1.603 |
hemy | -1.514 |
ndra | -1.479 |
ongs | -1.415 |
dh | -1.404 |
Token | asked |
Token ID | 1965 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
osate | +0.044 |
ongyang | +0.032 |
� | +0.032 |
insula | +0.031 |
withd | +0.031 |
Neg logit contributions | |
Carbuncle | -0.038 |
hemy | -0.036 |
ndra | -0.035 |
ongs | -0.034 |
bars | -0.034 |
Token | me |
Token ID | 502 |
Feature activation | +7.04e-02 |
Pos logit contributions | |
osate | +0.487 |
ongyang | +0.369 |
� | +0.369 |
insula | +0.364 |
withd | +0.361 |
Neg logit contributions | |
Carbuncle | -0.346 |
hemy | -0.326 |
ndra | -0.316 |
ongs | -0.303 |
bars | -0.301 |
Token | to |
Token ID | 284 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
osate | +0.074 |
ongyang | +0.056 |
� | +0.055 |
insula | +0.055 |
withd | +0.054 |
Neg logit contributions | |
Carbuncle | -0.050 |
hemy | -0.048 |
ndra | -0.046 |
bars | -0.044 |
ongs | -0.044 |
Token | read |
Token ID | 1100 |
Feature activation | +7.28e-01 |
Pos logit contributions | |
osate | +0.230 |
� | +0.168 |
ongyang | +0.168 |
insula | +0.166 |
withd | +0.164 |
Neg logit contributions | |
Carbuncle | -0.206 |
hemy | -0.195 |
ndra | -0.191 |
ongs | -0.183 |
dh | -0.182 |
Token | were |
Token ID | 547 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
osate | +0.811 |
� | +0.607 |
ongyang | +0.606 |
insula | +0.598 |
withd | +0.593 |
Neg logit contributions | |
Carbuncle | -0.633 |
hemy | -0.598 |
ndra | -0.582 |
ongs | -0.557 |
dh | -0.553 |
Token | not |
Token ID | 407 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
osate | +0.108 |
� | +0.080 |
ongyang | +0.080 |
insula | +0.079 |
withd | +0.078 |
Neg logit contributions | |
Carbuncle | -0.085 |
hemy | -0.080 |
ndra | -0.079 |
bars | -0.075 |
ongs | -0.075 |
Token | successful |
Token ID | 4388 |
Feature activation | +3.25e-02 |
Pos logit contributions | |
osate | +0.150 |
� | +0.112 |
ongyang | +0.111 |
insula | +0.110 |
withd | +0.108 |
Neg logit contributions | |
Carbuncle | -0.121 |
hemy | -0.114 |
ndra | -0.112 |
bars | -0.106 |
ongs | -0.106 |
Token | . |
Token ID | 13 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
osate | +0.036 |
ongyang | +0.028 |
� | +0.028 |
insula | +0.027 |
Fug | +0.027 |
Neg logit contributions | |
Carbuncle | -0.021 |
hemy | -0.020 |
ndra | -0.019 |
ongs | -0.018 |
bars | -0.018 |
Token | Had |
Token ID | 11161 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
osate | +0.040 |
� | +0.030 |
ongyang | +0.030 |
insula | +0.030 |
withd | +0.030 |
Neg logit contributions | |
Carbuncle | -0.031 |
hemy | -0.029 |
ndra | -0.028 |
ongs | -0.027 |
dh | -0.027 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
osate | +0.348 |
� | +0.242 |
ongyang | +0.242 |
insula | +0.237 |
withd | +0.234 |
Neg logit contributions | |
Carbuncle | -0.401 |
hemy | -0.383 |
ndra | -0.376 |
ongs | -0.362 |
bars | -0.360 |
Token | gotten |
Token ID | 7891 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
osate | +1.830 |
� | +1.345 |
ongyang | +1.336 |
insula | +1.316 |
withd | +1.310 |
Neg logit contributions | |
Carbuncle | -1.659 |
hemy | -1.576 |
ndra | -1.533 |
ongs | -1.476 |
dh | -1.463 |
Token | his |
Token ID | 465 |
Feature activation | +5.65e-01 |
Pos logit contributions | |
osate | +0.340 |
� | +0.254 |
ongyang | +0.254 |
insula | +0.250 |
withd | +0.248 |
Neg logit contributions | |
Carbuncle | -0.264 |
hemy | -0.249 |
ndra | -0.244 |
ongs | -0.232 |
bars | -0.231 |
Token | way |
Token ID | 835 |
Feature activation | +5.94e-02 |
Pos logit contributions | |
osate | +0.553 |
ongyang | +0.412 |
� | +0.411 |
insula | +0.407 |
withd | +0.402 |
Neg logit contributions | |
Carbuncle | -0.442 |
hemy | -0.415 |
ndra | -0.408 |
bars | -0.389 |
ongs | -0.389 |
Token | , |
Token ID | 11 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
osate | +0.061 |
ongyang | +0.046 |
� | +0.045 |
insula | +0.045 |
withd | +0.044 |
Neg logit contributions | |
Carbuncle | -0.044 |
hemy | -0.041 |
ndra | -0.041 |
bars | -0.039 |
ongs | -0.038 |
Token | they |
Token ID | 484 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
osate | +0.171 |
ongyang | +0.126 |
� | +0.126 |
insula | +0.124 |
withd | +0.122 |
Neg logit contributions | |
Carbuncle | -0.148 |
hemy | -0.140 |
ndra | -0.137 |
ongs | -0.131 |
bars | -0.131 |
Token | a |
Token ID | 257 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
osate | +0.050 |
ongyang | +0.038 |
� | +0.038 |
insula | +0.037 |
withd | +0.037 |
Neg logit contributions | |
Carbuncle | -0.036 |
hemy | -0.033 |
ndra | -0.032 |
bars | -0.031 |
ongs | -0.031 |
Token | risk |
Token ID | 2526 |
Feature activation | +5.61e-01 |
Pos logit contributions | |
osate | +0.059 |
ongyang | +0.044 |
� | +0.044 |
insula | +0.044 |
withd | +0.043 |
Neg logit contributions | |
Carbuncle | -0.043 |
hemy | -0.040 |
ndra | -0.039 |
ongs | -0.037 |
bars | -0.037 |
Token | - |
Token ID | 12 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
osate | +0.571 |
ongyang | +0.434 |
� | +0.433 |
insula | +0.427 |
withd | +0.423 |
Neg logit contributions | |
Carbuncle | -0.414 |
hemy | -0.388 |
ndra | -0.378 |
dh | -0.362 |
bars | -0.361 |
Token | taking |
Token ID | 26103 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
osate | +0.656 |
ongyang | +0.515 |
� | +0.512 |
insula | +0.505 |
withd | +0.503 |
Neg logit contributions | |
Carbuncle | -0.363 |
hemy | -0.333 |
ndra | -0.323 |
dh | -0.311 |
bars | -0.305 |
Token | aut |
Token ID | 1960 |
Feature activation | +2.79e-01 |
Pos logit contributions | |
osate | +0.217 |
� | +0.162 |
ongyang | +0.162 |
insula | +0.159 |
withd | +0.158 |
Neg logit contributions | |
Carbuncle | -0.170 |
hemy | -0.159 |
ndra | -0.155 |
bars | -0.148 |
ongs | -0.148 |
Token | ocrat |
Token ID | 35128 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
osate | +0.285 |
� | +0.217 |
ongyang | +0.215 |
insula | +0.212 |
withd | +0.211 |
Neg logit contributions | |
Carbuncle | -0.203 |
hemy | -0.192 |
ndra | -0.188 |
ongs | -0.179 |
dh | -0.178 |
Token | governed |
Token ID | 21825 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
osate | +2.015 |
� | +1.529 |
ongyang | +1.525 |
insula | +1.505 |
withd | +1.494 |
Neg logit contributions | |
Carbuncle | -1.441 |
hemy | -1.358 |
ndra | -1.319 |
ongs | -1.259 |
dh | -1.249 |
Token | by |
Token ID | 416 |
Feature activation | -5.41e-02 |
Pos logit contributions | |
osate | +0.160 |
� | +0.119 |
ongyang | +0.119 |
insula | +0.117 |
Fug | +0.115 |
Neg logit contributions | |
Carbuncle | -0.120 |
hemy | -0.113 |
ndra | -0.110 |
ongs | -0.106 |
bars | -0.106 |
Token | real |
Token ID | 1103 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Carbuncle | +0.039 |
hemy | +0.037 |
ndra | +0.036 |
bars | +0.034 |
ongs | +0.034 |
Neg logit contributions | |
osate | -0.056 |
ongyang | -0.043 |
� | -0.043 |
insula | -0.042 |
withd | -0.042 |
Token | polit |
Token ID | 34470 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
osate | +0.120 |
� | +0.090 |
ongyang | +0.090 |
insula | +0.089 |
withd | +0.089 |
Neg logit contributions | |
Carbuncle | -0.086 |
hemy | -0.082 |
ndra | -0.080 |
ongs | -0.076 |
bars | -0.075 |
Token | ik |
Token ID | 1134 |
Feature activation | -3.49e-02 |
Pos logit contributions | |
osate | +1.267 |
� | +0.925 |
ongyang | +0.924 |
insula | +0.907 |
satisf | +0.899 |
Neg logit contributions | |
Carbuncle | -1.176 |
hemy | -1.113 |
ndra | -1.083 |
ongs | -1.039 |
dh | -1.034 |
Token | my |
Token ID | 616 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
Carbuncle | +0.094 |
hemy | +0.088 |
ndra | +0.086 |
ongs | +0.082 |
bars | +0.081 |
Neg logit contributions | |
osate | -0.134 |
ongyang | -0.102 |
� | -0.102 |
insula | -0.100 |
withd | -0.100 |
Token | last |
Token ID | 938 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
osate | +0.317 |
� | +0.241 |
ongyang | +0.241 |
insula | +0.238 |
withd | +0.236 |
Neg logit contributions | |
Carbuncle | -0.224 |
hemy | -0.210 |
ndra | -0.205 |
ongs | -0.196 |
dh | -0.194 |
Token | sights |
Token ID | 21343 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
osate | +0.358 |
� | +0.279 |
ongyang | +0.278 |
insula | +0.275 |
satisf | +0.274 |
Neg logit contributions | |
Carbuncle | -0.204 |
hemy | -0.192 |
ndra | -0.184 |
ongs | -0.174 |
dh | -0.173 |
Token | of |
Token ID | 286 |
Feature activation | +6.37e-02 |
Pos logit contributions | |
Carbuncle | +0.823 |
hemy | +0.767 |
ndra | +0.754 |
ongs | +0.729 |
dh | +0.719 |
Neg logit contributions | |
osate | -1.135 |
ongyang | -0.854 |
� | -0.849 |
insula | -0.841 |
withd | -0.831 |
Token | this |
Token ID | 428 |
Feature activation | +5.50e-02 |
Pos logit contributions | |
osate | +0.066 |
� | +0.050 |
ongyang | +0.050 |
insula | +0.049 |
withd | +0.049 |
Neg logit contributions | |
Carbuncle | -0.046 |
hemy | -0.043 |
ndra | -0.042 |
ongs | -0.040 |
bars | -0.040 |
Token | indef |
Token ID | 16536 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
osate | +0.056 |
� | +0.043 |
ongyang | +0.042 |
insula | +0.042 |
withd | +0.041 |
Neg logit contributions | |
Carbuncle | -0.041 |
hemy | -0.038 |
ndra | -0.037 |
ongs | -0.035 |
bars | -0.035 |
Token | at |
Token ID | 265 |
Feature activation | +8.67e-02 |
Pos logit contributions | |
osate | +1.909 |
� | +1.432 |
ongyang | +1.424 |
insula | +1.404 |
withd | +1.396 |
Neg logit contributions | |
Carbuncle | -1.512 |
hemy | -1.433 |
ndra | -1.396 |
ongs | -1.339 |
dh | -1.327 |
Token | ig |
Token ID | 328 |
Feature activation | +6.72e-01 |
Pos logit contributions | |
osate | +0.082 |
� | +0.060 |
ongyang | +0.060 |
withd | +0.059 |
insula | +0.059 |
Neg logit contributions | |
Carbuncle | -0.071 |
hemy | -0.067 |
ndra | -0.066 |
ongs | -0.063 |
dh | -0.063 |
Token | able |
Token ID | 540 |
Feature activation | +6.16e-01 |
Pos logit contributions | |
osate | +0.631 |
� | +0.466 |
ongyang | +0.465 |
insula | +0.458 |
satisf | +0.453 |
Neg logit contributions | |
Carbuncle | -0.547 |
hemy | -0.519 |
ndra | -0.504 |
ongs | -0.484 |
dh | -0.480 |
Token | optim |
Token ID | 6436 |
Feature activation | +8.42e-01 |
Pos logit contributions | |
osate | +0.629 |
� | +0.477 |
ongyang | +0.475 |
insula | +0.469 |
withd | +0.466 |
Neg logit contributions | |
Carbuncle | -0.452 |
hemy | -0.426 |
ndra | -0.413 |
ongs | -0.395 |
dh | -0.392 |
Token | ist |
Token ID | 396 |
Feature activation | +7.45e-01 |
Pos logit contributions | |
osate | +0.774 |
� | +0.566 |
ongyang | +0.565 |
insula | +0.556 |
withd | +0.552 |
Neg logit contributions | |
Carbuncle | -0.703 |
hemy | -0.667 |
ndra | -0.651 |
ongs | -0.625 |
dh | -0.621 |
Token | strengthening |
Token ID | 24175 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
osate | +0.423 |
� | +0.325 |
ongyang | +0.325 |
insula | +0.320 |
withd | +0.317 |
Neg logit contributions | |
Carbuncle | -0.271 |
hemy | -0.250 |
ndra | -0.245 |
ongs | -0.233 |
bars | -0.233 |
Token | of |
Token ID | 286 |
Feature activation | +6.77e-02 |
Pos logit contributions | |
osate | +0.147 |
� | +0.112 |
ongyang | +0.111 |
insula | +0.110 |
withd | +0.109 |
Neg logit contributions | |
Carbuncle | -0.107 |
hemy | -0.100 |
ndra | -0.097 |
ongs | -0.093 |
bars | -0.093 |
Token | a |
Token ID | 257 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
osate | +0.068 |
� | +0.052 |
ongyang | +0.052 |
insula | +0.051 |
withd | +0.050 |
Neg logit contributions | |
Carbuncle | -0.051 |
hemy | -0.047 |
ndra | -0.046 |
bars | -0.045 |
ongs | -0.044 |
Token | subt |
Token ID | 13284 |
Feature activation | +4.68e-01 |
Pos logit contributions | |
osate | +0.310 |
ongyang | +0.234 |
� | +0.234 |
insula | +0.230 |
withd | +0.228 |
Neg logit contributions | |
Carbuncle | -0.229 |
hemy | -0.214 |
ndra | -0.209 |
ongs | -0.199 |
bars | -0.199 |
Token | rop |
Token ID | 1773 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
osate | +0.465 |
� | +0.351 |
ongyang | +0.349 |
insula | +0.344 |
withd | +0.342 |
Neg logit contributions | |
Carbuncle | -0.356 |
hemy | -0.337 |
ndra | -0.328 |
ongs | -0.314 |
dh | -0.311 |
Token | ical |
Token ID | 605 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
osate | +0.220 |
� | +0.132 |
ongyang | +0.131 |
insula | +0.128 |
withd | +0.126 |
Neg logit contributions | |
Carbuncle | -0.405 |
hemy | -0.390 |
ndra | -0.383 |
ongs | -0.372 |
dh | -0.370 |
Token | ridge |
Token ID | 32525 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
osate | +2.013 |
� | +1.532 |
ongyang | +1.527 |
insula | +1.509 |
withd | +1.499 |
Neg logit contributions | |
Carbuncle | -1.404 |
hemy | -1.322 |
ndra | -1.283 |
ongs | -1.225 |
dh | -1.214 |
Token | . |
Token ID | 13 |
Feature activation | +7.69e-01 |
Pos logit contributions | |
osate | +0.565 |
� | +0.425 |
ongyang | +0.425 |
insula | +0.418 |
withd | +0.414 |
Neg logit contributions | |
Carbuncle | -0.423 |
hemy | -0.399 |
ndra | -0.388 |
ongs | -0.371 |
dh | -0.369 |
Token | A |
Token ID | 317 |
Feature activation | +6.02e-01 |
Pos logit contributions | |
osate | +0.735 |
ongyang | +0.547 |
� | +0.542 |
withd | +0.538 |
insula | +0.537 |
Neg logit contributions | |
Carbuncle | -0.620 |
hemy | -0.579 |
ndra | -0.571 |
ongs | -0.545 |
dh | -0.542 |
Token | strong |
Token ID | 1913 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
osate | +0.606 |
� | +0.456 |
ongyang | +0.456 |
insula | +0.449 |
withd | +0.446 |
Neg logit contributions | |
Carbuncle | -0.452 |
hemy | -0.426 |
ndra | -0.415 |
ongs | -0.396 |
dh | -0.393 |
Token | ridge |
Token ID | 32525 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
osate | +0.340 |
� | +0.250 |
ongyang | +0.249 |
insula | +0.244 |
withd | +0.243 |
Neg logit contributions | |
Carbuncle | -0.296 |
hemy | -0.278 |
ndra | -0.274 |
bars | -0.261 |
ongs | -0.260 |
Token | head |
Token ID | 1182 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
osate | +0.127 |
ongyang | +0.093 |
� | +0.092 |
insula | +0.092 |
withd | +0.091 |
Neg logit contributions | |
Carbuncle | -0.101 |
hemy | -0.093 |
ndra | -0.090 |
bars | -0.088 |
dh | -0.088 |
Token | ) |
Token ID | 8 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
osate | +0.288 |
ongyang | +0.216 |
� | +0.215 |
insula | +0.213 |
withd | +0.211 |
Neg logit contributions | |
Carbuncle | -0.216 |
hemy | -0.203 |
ndra | -0.197 |
ongs | -0.189 |
dh | -0.189 |
Token | and |
Token ID | 290 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
osate | +0.403 |
� | +0.297 |
ongyang | +0.297 |
insula | +0.293 |
withd | +0.288 |
Neg logit contributions | |
Carbuncle | -0.324 |
hemy | -0.303 |
ndra | -0.295 |
bars | -0.286 |
ongs | -0.286 |
Token | fl |
Token ID | 781 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
osate | +0.521 |
ongyang | +0.393 |
� | +0.391 |
insula | +0.387 |
withd | +0.381 |
Neg logit contributions | |
Carbuncle | -0.373 |
hemy | -0.346 |
ndra | -0.337 |
bars | -0.325 |
ongs | -0.323 |
Token | ot |
Token ID | 313 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
osate | +0.257 |
� | +0.185 |
ongyang | +0.185 |
insula | +0.182 |
withd | +0.180 |
Neg logit contributions | |
Carbuncle | -0.253 |
hemy | -0.241 |
ndra | -0.235 |
ongs | -0.226 |
dh | -0.225 |
Token | illa |
Token ID | 5049 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
osate | +0.608 |
� | +0.456 |
ongyang | +0.455 |
insula | +0.448 |
withd | +0.446 |
Neg logit contributions | |
Carbuncle | -0.451 |
hemy | -0.429 |
ndra | -0.419 |
ongs | -0.402 |
bars | -0.398 |
Token | ( |
Token ID | 357 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
osate | +1.957 |
� | +1.479 |
ongyang | +1.474 |
insula | +1.454 |
withd | +1.444 |
Neg logit contributions | |
Carbuncle | -1.451 |
hemy | -1.369 |
ndra | -1.331 |
ongs | -1.271 |
dh | -1.261 |
Token | four |
Token ID | 14337 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
osate | +0.127 |
ongyang | +0.096 |
� | +0.095 |
insula | +0.094 |
withd | +0.094 |
Neg logit contributions | |
Carbuncle | -0.092 |
hemy | -0.087 |
ndra | -0.085 |
dh | -0.081 |
ongs | -0.081 |
Token | people |
Token ID | 661 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
osate | +0.160 |
ongyang | +0.121 |
� | +0.121 |
insula | +0.120 |
withd | +0.118 |
Neg logit contributions | |
Carbuncle | -0.108 |
hemy | -0.101 |
ndra | -0.098 |
ongs | -0.094 |
bars | -0.094 |
Token | on |
Token ID | 319 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
osate | +0.338 |
ongyang | +0.257 |
� | +0.256 |
insula | +0.254 |
withd | +0.251 |
Neg logit contributions | |
Carbuncle | -0.224 |
hemy | -0.210 |
ndra | -0.204 |
ongs | -0.195 |
bars | -0.193 |
Token | board |
Token ID | 3096 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
osate | +0.301 |
ongyang | +0.237 |
� | +0.235 |
insula | +0.234 |
withd | +0.232 |
Neg logit contributions | |
Carbuncle | -0.154 |
hemy | -0.140 |
ndra | -0.135 |
bars | -0.129 |
ongs | -0.128 |
Token | His |
Token ID | 6653 |
Feature activation | +5.61e-01 |
Pos logit contributions | |
osate | +0.279 |
ongyang | +0.214 |
� | +0.212 |
withd | +0.211 |
insula | +0.211 |
Neg logit contributions | |
Carbuncle | -0.173 |
hemy | -0.163 |
ndra | -0.160 |
dh | -0.151 |
ongs | -0.150 |
Token | comments |
Token ID | 3651 |
Feature activation | +4.14e-02 |
Pos logit contributions | |
osate | +0.577 |
� | +0.437 |
ongyang | +0.436 |
insula | +0.431 |
withd | +0.428 |
Neg logit contributions | |
Carbuncle | -0.408 |
hemy | -0.384 |
ndra | -0.374 |
ongs | -0.356 |
dh | -0.354 |
Token | seemed |
Token ID | 3947 |
Feature activation | +2.37e-01 |
Pos logit contributions | |
osate | +0.040 |
ongyang | +0.029 |
� | +0.029 |
insula | +0.029 |
withd | +0.029 |
Neg logit contributions | |
Carbuncle | -0.033 |
hemy | -0.031 |
ndra | -0.031 |
ongs | -0.029 |
bars | -0.029 |
Token | to |
Token ID | 284 |
Feature activation | +4.32e-01 |
Pos logit contributions | |
osate | +0.244 |
� | +0.184 |
ongyang | +0.184 |
insula | +0.181 |
withd | +0.180 |
Neg logit contributions | |
Carbuncle | -0.173 |
hemy | -0.163 |
ndra | -0.158 |
bars | -0.151 |
ongs | -0.151 |
Token | put |
Token ID | 1234 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
osate | +0.400 |
ongyang | +0.290 |
� | +0.290 |
insula | +0.286 |
withd | +0.282 |
Neg logit contributions | |
Carbuncle | -0.362 |
hemy | -0.342 |
ndra | -0.335 |
ongs | -0.324 |
bars | -0.322 |
Token | McDonnell |
Token ID | 39441 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
osate | +0.176 |
ongyang | +0.133 |
� | +0.133 |
insula | +0.131 |
withd | +0.130 |
Neg logit contributions | |
Carbuncle | -0.125 |
hemy | -0.117 |
ndra | -0.114 |
ongs | -0.109 |
bars | -0.108 |
Token | in |
Token ID | 287 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
osate | +1.942 |
� | +1.471 |
ongyang | +1.464 |
insula | +1.444 |
satisf | +1.434 |
Neg logit contributions | |
Carbuncle | -1.445 |
hemy | -1.362 |
ndra | -1.324 |
ongs | -1.264 |
dh | -1.256 |
Token | line |
Token ID | 1627 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
osate | +0.362 |
� | +0.278 |
ongyang | +0.277 |
insula | +0.274 |
withd | +0.271 |
Neg logit contributions | |
Carbuncle | -0.230 |
hemy | -0.215 |
ndra | -0.209 |
bars | -0.200 |
ongs | -0.199 |
Token | with |
Token ID | 351 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
osate | +0.292 |
ongyang | +0.215 |
� | +0.214 |
insula | +0.212 |
Fug | +0.209 |
Neg logit contributions | |
Carbuncle | -0.235 |
hemy | -0.224 |
ndra | -0.217 |
ongs | -0.210 |
bars | -0.210 |
Token | the |
Token ID | 262 |
Feature activation | +5.46e-01 |
Pos logit contributions | |
osate | +0.430 |
� | +0.322 |
ongyang | +0.322 |
insula | +0.317 |
withd | +0.315 |
Neg logit contributions | |
Carbuncle | -0.332 |
hemy | -0.314 |
ndra | -0.305 |
ongs | -0.292 |
dh | -0.290 |
Token | police |
Token ID | 1644 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
osate | +0.545 |
� | +0.410 |
ongyang | +0.409 |
insula | +0.404 |
withd | +0.400 |
Neg logit contributions | |
Carbuncle | -0.413 |
hemy | -0.390 |
ndra | -0.380 |
ongs | -0.363 |
dh | -0.360 |
Token | setup |
Token ID | 9058 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
Carbuncle | +0.899 |
hemy | +0.839 |
ndra | +0.823 |
bars | +0.791 |
ongs | +0.787 |
Neg logit contributions | |
osate | -1.181 |
ongyang | -0.886 |
� | -0.881 |
insula | -0.871 |
withd | -0.858 |
Token | with |
Token ID | 351 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
Carbuncle | +0.411 |
hemy | +0.382 |
ndra | +0.375 |
bars | +0.359 |
ongs | +0.358 |
Neg logit contributions | |
osate | -0.567 |
ongyang | -0.425 |
� | -0.424 |
insula | -0.420 |
withd | -0.413 |
Token | Pro |
Token ID | 1041 |
Feature activation | -5.67e-02 |
Pos logit contributions | |
Carbuncle | +0.363 |
hemy | +0.337 |
ndra | +0.328 |
bars | +0.318 |
dh | +0.315 |
Neg logit contributions | |
osate | -0.491 |
ongyang | -0.371 |
� | -0.369 |
insula | -0.366 |
withd | -0.358 |
Token | pe |
Token ID | 431 |
Feature activation | +6.44e-01 |
Pos logit contributions | |
Carbuncle | +0.053 |
hemy | +0.050 |
ndra | +0.049 |
dh | +0.048 |
ongs | +0.048 |
Neg logit contributions | |
osate | -0.047 |
ongyang | -0.033 |
� | -0.032 |
insula | -0.032 |
withd | -0.032 |
Token | ller |
Token ID | 6051 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
osate | +0.724 |
ongyang | +0.574 |
� | +0.564 |
insula | +0.558 |
satisf | +0.557 |
Neg logit contributions | |
Carbuncle | -0.408 |
hemy | -0.370 |
ndra | -0.355 |
ongs | -0.338 |
bars | -0.337 |
Token | Blade |
Token ID | 47520 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
osate | +0.421 |
ongyang | +0.294 |
� | +0.292 |
insula | +0.289 |
withd | +0.286 |
Neg logit contributions | |
Carbuncle | -0.469 |
hemy | -0.446 |
ndra | -0.436 |
bars | -0.421 |
ongs | -0.421 |
Token | Technology |
Token ID | 8987 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
osate | +1.927 |
� | +1.455 |
ongyang | +1.449 |
insula | +1.429 |
withd | +1.422 |
Neg logit contributions | |
Carbuncle | -1.454 |
hemy | -1.373 |
ndra | -1.336 |
ongs | -1.276 |
dh | -1.266 |
Token | generate |
Token ID | 7716 |
Feature activation | +3.62e-02 |
Pos logit contributions | |
Carbuncle | +0.196 |
hemy | +0.183 |
ndra | +0.178 |
ongs | +0.171 |
bars | +0.171 |
Neg logit contributions | |
osate | -0.268 |
ongyang | -0.201 |
� | -0.200 |
insula | -0.198 |
withd | -0.195 |
Token | massive |
Token ID | 4858 |
Feature activation | -2.52e-01 |
Pos logit contributions | |
osate | +0.037 |
� | +0.028 |
ongyang | +0.028 |
insula | +0.027 |
withd | +0.027 |
Neg logit contributions | |
Carbuncle | -0.027 |
hemy | -0.025 |
ndra | -0.024 |
ongs | -0.024 |
bars | -0.023 |
Token | airflow |
Token ID | 45771 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
Carbuncle | +0.192 |
hemy | +0.181 |
ndra | +0.175 |
ongs | +0.169 |
bars | +0.169 |
Neg logit contributions | |
osate | -0.252 |
� | -0.188 |
ongyang | -0.188 |
insula | -0.186 |
withd | -0.184 |
Token | for |
Token ID | 329 |
Feature activation | -4.91e-02 |
Pos logit contributions | |
osate | +0.429 |
� | +0.320 |
ongyang | +0.320 |
insula | +0.315 |
withd | +0.313 |
Neg logit contributions | |
Carbuncle | -0.334 |
hemy | -0.315 |
ndra | -0.307 |
ongs | -0.294 |
dh | -0.292 |
Token | CPUs |
Token ID | 32340 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
Carbuncle | +0.276 |
hemy | +0.258 |
ndra | +0.251 |
ongs | +0.241 |
bars | +0.240 |
Neg logit contributions | |
osate | -0.372 |
� | -0.280 |
ongyang | -0.280 |
insula | -0.276 |
withd | -0.273 |
Token | and |
Token ID | 290 |
Feature activation | -7.67e-01 |
Pos logit contributions | |
Carbuncle | +0.429 |
hemy | +0.405 |
ndra | +0.394 |
ongs | +0.380 |
bars | +0.377 |
Neg logit contributions | |
osate | -0.588 |
� | -0.442 |
ongyang | -0.441 |
insula | -0.437 |
withd | -0.429 |
Token | memory |
Token ID | 4088 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
Carbuncle | +0.605 |
hemy | +0.570 |
ndra | +0.556 |
bars | +0.536 |
ongs | +0.535 |
Neg logit contributions | |
osate | -0.745 |
� | -0.553 |
ongyang | -0.552 |
insula | -0.546 |
withd | -0.534 |
Token | ( |
Token ID | 357 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
Carbuncle | +1.166 |
hemy | +1.100 |
ndra | +1.051 |
bars | +1.044 |
dh | +1.021 |
Neg logit contributions | |
osate | -1.782 |
ongyang | -1.354 |
insula | -1.339 |
� | -1.333 |
withd | -1.310 |
Token | Intel |
Token ID | 24123 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
Carbuncle | +1.017 |
hemy | +0.965 |
ndra | +0.941 |
dh | +0.904 |
ongs | +0.892 |
Neg logit contributions | |
osate | -1.432 |
ongyang | -1.082 |
� | -1.071 |
withd | -1.058 |
insula | -1.055 |
Token | VT |
Token ID | 32751 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
osate | +0.176 |
ongyang | +0.132 |
� | +0.132 |
insula | +0.130 |
withd | +0.129 |
Neg logit contributions | |
Carbuncle | -0.134 |
hemy | -0.127 |
ndra | -0.123 |
ongs | -0.118 |
dh | -0.117 |
Token | - |
Token ID | 12 |
Feature activation | -9.59e-01 |
Pos logit contributions | |
Carbuncle | +2.008 |
hemy | +1.877 |
ndra | +1.848 |
dh | +1.764 |
bars | +1.762 |
Neg logit contributions | |
osate | -2.824 |
ongyang | -2.146 |
� | -2.138 |
insula | -2.094 |
satisf | -2.082 |
Token | x |
Token ID | 87 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
Carbuncle | +0.702 |
hemy | +0.656 |
ndra | +0.627 |
ongs | +0.608 |
bars | +0.588 |
Neg logit contributions | |
osate | -0.982 |
� | -0.754 |
ongyang | -0.742 |
insula | -0.741 |
satisf | -0.735 |
Token | , |
Token ID | 11 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
Carbuncle | +0.402 |
hemy | +0.382 |
ndra | +0.371 |
ongs | +0.354 |
bars | +0.354 |
Neg logit contributions | |
osate | -0.555 |
� | -0.418 |
ongyang | -0.417 |
insula | -0.413 |
withd | -0.408 |
Token | AMD |
Token ID | 10324 |
Feature activation | +8.07e-01 |
Pos logit contributions | |
Carbuncle | +0.614 |
hemy | +0.579 |
ndra | +0.566 |
ongs | +0.535 |
bars | +0.535 |
Neg logit contributions | |
osate | -0.802 |
ongyang | -0.608 |
� | -0.602 |
insula | -0.593 |
withd | -0.588 |
Token | - |
Token ID | 12 |
Feature activation | -7.95e-01 |
Pos logit contributions | |
osate | +0.807 |
� | +0.611 |
ongyang | +0.605 |
insula | +0.599 |
Fug | +0.597 |
Neg logit contributions | |
Carbuncle | -0.603 |
hemy | -0.571 |
ndra | -0.556 |
ongs | -0.533 |
dh | -0.528 |
Token | , |
Token ID | 11 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
osate | +0.194 |
ongyang | +0.145 |
� | +0.145 |
insula | +0.143 |
withd | +0.141 |
Neg logit contributions | |
Carbuncle | -0.150 |
hemy | -0.142 |
ndra | -0.138 |
ongs | -0.133 |
bars | -0.132 |
Token | who |
Token ID | 508 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
osate | +0.183 |
� | +0.138 |
ongyang | +0.137 |
insula | +0.136 |
withd | +0.135 |
Neg logit contributions | |
Carbuncle | -0.136 |
hemy | -0.129 |
ndra | -0.125 |
ongs | -0.119 |
dh | -0.118 |
Token | lives |
Token ID | 3160 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Carbuncle | +0.070 |
hemy | +0.065 |
ndra | +0.063 |
ongs | +0.060 |
bars | +0.060 |
Neg logit contributions | |
osate | -0.109 |
� | -0.084 |
ongyang | -0.084 |
insula | -0.083 |
withd | -0.081 |
Token | in |
Token ID | 287 |
Feature activation | -1.78e-03 |
Pos logit contributions | |
Carbuncle | +0.149 |
hemy | +0.139 |
ndra | +0.135 |
bars | +0.130 |
ongs | +0.129 |
Neg logit contributions | |
osate | -0.220 |
ongyang | -0.167 |
� | -0.166 |
insula | -0.164 |
Fug | -0.162 |
Token | Lomb |
Token ID | 28503 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
Carbuncle | +0.001 |
hemy | +0.001 |
ndra | +0.001 |
bars | +0.001 |
ongs | +0.001 |
Neg logit contributions | |
osate | -0.002 |
� | -0.001 |
ongyang | -0.001 |
insula | -0.001 |
withd | -0.001 |
Token | ard |
Token ID | 446 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
Carbuncle | +0.184 |
hemy | +0.168 |
ndra | +0.159 |
ongs | +0.148 |
dh | +0.146 |
Neg logit contributions | |
osate | -0.543 |
� | -0.443 |
ongyang | -0.440 |
insula | -0.436 |
withd | -0.435 |
Token | , |
Token ID | 11 |
Feature activation | +8.04e-02 |
Pos logit contributions | |
Carbuncle | +1.682 |
hemy | +1.580 |
ndra | +1.534 |
ongs | +1.473 |
bars | +1.471 |
Neg logit contributions | |
osate | -2.816 |
� | -2.193 |
ongyang | -2.189 |
withd | -2.141 |
insula | -2.133 |
Token | was |
Token ID | 373 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
osate | +0.077 |
� | +0.057 |
ongyang | +0.057 |
insula | +0.056 |
withd | +0.055 |
Neg logit contributions | |
Carbuncle | -0.064 |
hemy | -0.061 |
ndra | -0.059 |
ongs | -0.057 |
bars | -0.057 |
Token | by |
Token ID | 416 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
osate | +0.015 |
� | +0.011 |
ongyang | +0.011 |
insula | +0.011 |
withd | +0.011 |
Neg logit contributions | |
Carbuncle | -0.012 |
hemy | -0.011 |
ndra | -0.011 |
ongs | -0.010 |
dh | -0.010 |
Token | chance |
Token ID | 2863 |
Feature activation | -9.73e-01 |
Pos logit contributions | |
Carbuncle | +0.106 |
hemy | +0.099 |
ndra | +0.096 |
ongs | +0.092 |
bars | +0.092 |
Neg logit contributions | |
osate | -0.163 |
� | -0.125 |
ongyang | -0.125 |
insula | -0.124 |
withd | -0.123 |
Token | at |
Token ID | 379 |
Feature activation | -4.69e-02 |
Pos logit contributions | |
Carbuncle | +0.720 |
hemy | +0.676 |
ndra | +0.659 |
ongs | +0.630 |
bars | +0.626 |
Neg logit contributions | |
osate | -0.992 |
ongyang | -0.750 |
� | -0.750 |
insula | -0.738 |
withd | -0.727 |
Token | ling |
Token ID | 1359 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
Carbuncle | +0.000 |
hemy | +0.000 |
ndra | +0.000 |
ongs | +0.000 |
dh | +0.000 |
Neg logit contributions | |
osate | -0.000 |
� | -0.000 |
ongyang | -0.000 |
insula | -0.000 |
Fug | -0.000 |
Token | through |
Token ID | 832 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
Carbuncle | +0.026 |
hemy | +0.024 |
ndra | +0.023 |
ongs | +0.022 |
bars | +0.022 |
Neg logit contributions | |
osate | -0.033 |
� | -0.025 |
ongyang | -0.025 |
insula | -0.024 |
withd | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
Carbuncle | +0.270 |
hemy | +0.254 |
ndra | +0.248 |
ongs | +0.237 |
dh | +0.235 |
Neg logit contributions | |
osate | -0.351 |
� | -0.263 |
ongyang | -0.263 |
insula | -0.259 |
withd | -0.257 |
Token | Tampa |
Token ID | 15528 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Carbuncle | +0.145 |
hemy | +0.137 |
ndra | +0.133 |
ongs | +0.126 |
dh | +0.125 |
Neg logit contributions | |
osate | -0.216 |
� | -0.166 |
ongyang | -0.165 |
insula | -0.163 |
withd | -0.162 |
Token | Bay |
Token ID | 4696 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Carbuncle | +0.737 |
hemy | +0.682 |
ndra | +0.662 |
ongs | +0.628 |
bars | +0.623 |
Neg logit contributions | |
osate | -1.309 |
� | -1.021 |
ongyang | -1.015 |
insula | -1.004 |
withd | -1.000 |
Token | Lightning |
Token ID | 12469 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
Carbuncle | +0.808 |
hemy | +0.740 |
ndra | +0.713 |
ongs | +0.667 |
bars | +0.659 |
Neg logit contributions | |
osate | -1.874 |
� | -1.499 |
ongyang | -1.494 |
insula | -1.477 |
withd | -1.469 |
Token | , |
Token ID | 11 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
Carbuncle | +1.738 |
hemy | +1.627 |
ndra | +1.580 |
ongs | +1.522 |
bars | +1.517 |
Neg logit contributions | |
osate | -2.381 |
� | -1.789 |
ongyang | -1.788 |
insula | -1.767 |
withd | -1.745 |
Token | prevailing |
Token ID | 26602 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
Carbuncle | +0.167 |
hemy | +0.156 |
ndra | +0.152 |
ongs | +0.146 |
bars | +0.146 |
Neg logit contributions | |
osate | -0.222 |
ongyang | -0.166 |
� | -0.166 |
insula | -0.165 |
withd | -0.162 |
Token | through |
Token ID | 832 |
Feature activation | -3.73e-01 |
Pos logit contributions | |
Carbuncle | +0.364 |
hemy | +0.335 |
ndra | +0.326 |
bars | +0.318 |
ongs | +0.316 |
Neg logit contributions | |
osate | -0.493 |
ongyang | -0.371 |
� | -0.366 |
insula | -0.366 |
withd | -0.354 |
Token | a |
Token ID | 257 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
Carbuncle | +0.281 |
hemy | +0.264 |
ndra | +0.257 |
ongs | +0.247 |
bars | +0.245 |
Neg logit contributions | |
osate | -0.375 |
� | -0.281 |
ongyang | -0.281 |
insula | -0.278 |
withd | -0.275 |
Token | dramatic |
Token ID | 10092 |
Feature activation | +9.11e-03 |
Pos logit contributions | |
Carbuncle | +0.179 |
hemy | +0.169 |
ndra | +0.164 |
ongs | +0.157 |
dh | +0.156 |
Neg logit contributions | |
osate | -0.234 |
� | -0.175 |
ongyang | -0.175 |
insula | -0.173 |
withd | -0.171 |
Token | , |
Token ID | 11 |
Feature activation | -5.40e-01 |
Pos logit contributions | |
Carbuncle | +0.117 |
hemy | +0.110 |
ndra | +0.107 |
bars | +0.103 |
ongs | +0.103 |
Neg logit contributions | |
osate | -0.161 |
ongyang | -0.121 |
� | -0.121 |
insula | -0.120 |
withd | -0.118 |
Token | On |
Token ID | 1550 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
Carbuncle | +0.366 |
hemy | +0.342 |
ndra | +0.332 |
ongs | +0.319 |
bars | +0.317 |
Neg logit contributions | |
osate | -0.582 |
� | -0.447 |
ongyang | -0.446 |
insula | -0.443 |
withd | -0.436 |
Token | stad |
Token ID | 24107 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
Carbuncle | +0.066 |
hemy | +0.061 |
ndra | +0.056 |
ongs | +0.054 |
bars | +0.054 |
Neg logit contributions | |
osate | -0.129 |
ongyang | -0.102 |
� | -0.101 |
insula | -0.101 |
satisf | -0.101 |
Token | joined |
Token ID | 5399 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
osate | +0.361 |
� | +0.265 |
ongyang | +0.265 |
insula | +0.261 |
withd | +0.257 |
Neg logit contributions | |
Carbuncle | -0.319 |
hemy | -0.301 |
ndra | -0.295 |
ongs | -0.283 |
bars | -0.281 |
Token | Toronto |
Token ID | 6586 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
osate | +0.248 |
� | +0.188 |
ongyang | +0.188 |
insula | +0.186 |
withd | +0.184 |
Neg logit contributions | |
Carbuncle | -0.172 |
hemy | -0.161 |
ndra | -0.157 |
ongs | -0.150 |
dh | -0.148 |
Token | FC |
Token ID | 10029 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
Carbuncle | +0.213 |
hemy | +0.189 |
ndra | +0.178 |
ongs | +0.161 |
dh | +0.159 |
Neg logit contributions | |
osate | -0.765 |
� | -0.628 |
ongyang | -0.626 |
insula | -0.621 |
withd | -0.618 |
Token | as |
Token ID | 355 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
Carbuncle | +1.691 |
hemy | +1.584 |
ndra | +1.547 |
bars | +1.481 |
ongs | +1.479 |
Neg logit contributions | |
osate | -2.388 |
ongyang | -1.803 |
� | -1.803 |
insula | -1.790 |
withd | -1.767 |
Token | chief |
Token ID | 4039 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
Carbuncle | +0.486 |
hemy | +0.452 |
ndra | +0.439 |
ongs | +0.416 |
dh | +0.414 |
Neg logit contributions | |
osate | -0.811 |
ongyang | -0.627 |
� | -0.626 |
insula | -0.620 |
withd | -0.614 |
Token | scout |
Token ID | 24490 |
Feature activation | -1.95e-04 |
Pos logit contributions | |
Carbuncle | +0.345 |
hemy | +0.325 |
ndra | +0.318 |
bars | +0.310 |
ongs | +0.309 |
Neg logit contributions | |
osate | -0.333 |
ongyang | -0.236 |
� | -0.236 |
insula | -0.233 |
withd | -0.227 |
Token | and |
Token ID | 290 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
Carbuncle | +0.000 |
hemy | +0.000 |
ndra | +0.000 |
ongs | +0.000 |
dh | +0.000 |
Neg logit contributions | |
osate | -0.000 |
ongyang | -0.000 |
� | -0.000 |
insula | -0.000 |
withd | -0.000 |
Token | manager |
Token ID | 4706 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
Carbuncle | +0.088 |
hemy | +0.083 |
ndra | +0.081 |
ongs | +0.077 |
dh | +0.077 |
Neg logit contributions | |
osate | -0.109 |
� | -0.081 |
ongyang | -0.081 |
insula | -0.080 |
withd | -0.079 |
Token |
|
Token ID | 198 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
osate | +0.408 |
� | +0.294 |
ongyang | +0.286 |
Fug | +0.286 |
insula | +0.282 |
Neg logit contributions | |
Carbuncle | -0.440 |
hemy | -0.420 |
ndra | -0.405 |
ongs | -0.393 |
bars | -0.388 |
Token | Subscribe |
Token ID | 27125 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
osate | +0.317 |
� | +0.204 |
ongyang | +0.198 |
insula | +0.194 |
Fug | +0.192 |
Neg logit contributions | |
Carbuncle | -0.524 |
hemy | -0.503 |
ndra | -0.492 |
ongs | -0.477 |
bars | -0.473 |
Token | to |
Token ID | 284 |
Feature activation | -3.59e-02 |
Pos logit contributions | |
osate | +0.694 |
� | +0.523 |
ongyang | +0.517 |
insula | +0.514 |
Fug | +0.513 |
Neg logit contributions | |
Carbuncle | -0.553 |
hemy | -0.525 |
ndra | -0.509 |
ongs | -0.490 |
dh | -0.481 |
Token | our |
Token ID | 674 |
Feature activation | +6.98e-02 |
Pos logit contributions | |
Carbuncle | +0.033 |
hemy | +0.031 |
ndra | +0.030 |
ongs | +0.030 |
dh | +0.029 |
Neg logit contributions | |
osate | -0.030 |
ongyang | -0.021 |
� | -0.021 |
Fug | -0.021 |
insula | -0.021 |
Token | free |
Token ID | 1479 |
Feature activation | -7.26e-01 |
Pos logit contributions | |
osate | +0.065 |
� | +0.048 |
ongyang | +0.048 |
Fug | +0.047 |
insula | +0.047 |
Neg logit contributions | |
Carbuncle | -0.057 |
hemy | -0.054 |
ndra | -0.053 |
ongs | -0.051 |
dh | -0.050 |
Token | newsletters |
Token ID | 16983 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
Carbuncle | +0.452 |
hemy | +0.421 |
ndra | +0.407 |
ongs | +0.390 |
bars | +0.388 |
Neg logit contributions | |
osate | -0.820 |
� | -0.638 |
ongyang | -0.636 |
withd | -0.633 |
insula | -0.632 |
Token | . |
Token ID | 13 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
Carbuncle | +1.390 |
hemy | +1.298 |
ndra | +1.257 |
ongs | +1.186 |
dh | +1.181 |
Neg logit contributions | |
osate | -2.543 |
� | -1.986 |
ongyang | -1.980 |
withd | -1.966 |
insula | -1.959 |
Token |
|
Token ID | 198 |
Feature activation | +9.59e-01 |
Pos logit contributions | |
osate | +0.417 |
� | +0.301 |
ongyang | +0.299 |
insula | +0.295 |
Fug | +0.293 |
Neg logit contributions | |
Carbuncle | -0.409 |
hemy | -0.390 |
ndra | -0.380 |
ongs | -0.366 |
dh | -0.363 |
Token |
|
Token ID | 198 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
osate | +0.813 |
� | +0.586 |
ongyang | +0.574 |
Fug | +0.571 |
satisf | +0.566 |
Neg logit contributions | |
Carbuncle | -0.862 |
hemy | -0.823 |
ndra | -0.796 |
ongs | -0.770 |
bars | -0.762 |
Token | If |
Token ID | 1532 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
osate | +0.917 |
ongyang | +0.680 |
� | +0.678 |
insula | +0.670 |
withd | +0.670 |
Neg logit contributions | |
Carbuncle | -0.743 |
hemy | -0.706 |
ndra | -0.690 |
ongs | -0.659 |
dh | -0.659 |
Token | you |
Token ID | 345 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
osate | +0.399 |
� | +0.306 |
ongyang | +0.304 |
insula | +0.302 |
withd | +0.299 |
Neg logit contributions | |
Carbuncle | -0.271 |
hemy | -0.255 |
ndra | -0.249 |
bars | -0.236 |
ongs | -0.236 |
Token | story |
Token ID | 1621 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
Carbuncle | +0.431 |
hemy | +0.406 |
ndra | +0.396 |
ongs | +0.380 |
bars | +0.377 |
Neg logit contributions | |
osate | -0.523 |
ongyang | -0.387 |
� | -0.386 |
insula | -0.381 |
withd | -0.377 |
Token | . |
Token ID | 13 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
Carbuncle | +0.113 |
hemy | +0.106 |
ndra | +0.103 |
ongs | +0.099 |
bars | +0.098 |
Neg logit contributions | |
osate | -0.177 |
ongyang | -0.136 |
� | -0.135 |
insula | -0.134 |
withd | -0.132 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
Carbuncle | +0.261 |
hemy | +0.245 |
ndra | +0.240 |
ongs | +0.229 |
dh | +0.228 |
Neg logit contributions | |
osate | -0.330 |
ongyang | -0.247 |
� | -0.246 |
insula | -0.242 |
withd | -0.241 |
Token | Looking |
Token ID | 15784 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
osate | +0.369 |
ongyang | +0.274 |
� | +0.273 |
withd | +0.272 |
insula | +0.271 |
Neg logit contributions | |
Carbuncle | -0.290 |
hemy | -0.276 |
ndra | -0.271 |
dh | -0.259 |
ongs | -0.258 |
Token | for |
Token ID | 329 |
Feature activation | -6.16e-02 |
Pos logit contributions | |
osate | +0.278 |
� | +0.207 |
ongyang | +0.206 |
insula | +0.203 |
withd | +0.202 |
Neg logit contributions | |
Carbuncle | -0.228 |
hemy | -0.216 |
ndra | -0.211 |
ongs | -0.203 |
bars | -0.201 |
Token | news |
Token ID | 1705 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
Carbuncle | +0.041 |
hemy | +0.038 |
ndra | +0.037 |
ongs | +0.035 |
dh | +0.035 |
Neg logit contributions | |
osate | -0.068 |
� | -0.052 |
ongyang | -0.052 |
insula | -0.052 |
withd | -0.051 |
Token | you |
Token ID | 345 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
Carbuncle | +1.563 |
hemy | +1.463 |
ndra | +1.421 |
ongs | +1.351 |
dh | +1.341 |
Neg logit contributions | |
osate | -2.365 |
� | -1.811 |
ongyang | -1.807 |
insula | -1.782 |
withd | -1.770 |
Token | can |
Token ID | 460 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
Carbuncle | +0.138 |
hemy | +0.130 |
ndra | +0.127 |
ongs | +0.122 |
dh | +0.120 |
Neg logit contributions | |
osate | -0.157 |
ongyang | -0.116 |
� | -0.115 |
Fug | -0.115 |
satisf | -0.114 |
Token | trust |
Token ID | 3774 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
osate | +0.226 |
ongyang | +0.158 |
satisf | +0.156 |
Fug | +0.156 |
� | +0.156 |
Neg logit contributions | |
Carbuncle | -0.282 |
hemy | -0.269 |
ndra | -0.259 |
ongs | -0.255 |
dh | -0.247 |
Token | ? |
Token ID | 30 |
Feature activation | -7.51e-02 |
Pos logit contributions | |
Carbuncle | +0.185 |
hemy | +0.175 |
ndra | +0.170 |
ongs | +0.165 |
bars | +0.162 |
Neg logit contributions | |
osate | -0.202 |
� | -0.149 |
ongyang | -0.147 |
insula | -0.145 |
Fug | -0.145 |
Token |
|
Token ID | 198 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
Carbuncle | +0.067 |
hemy | +0.064 |
ndra | +0.062 |
ongs | +0.060 |
bars | +0.060 |
Neg logit contributions | |
osate | -0.064 |
� | -0.046 |
ongyang | -0.046 |
Fug | -0.045 |
insula | -0.045 |
Token | first |
Token ID | 717 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
Carbuncle | +0.434 |
hemy | +0.408 |
ndra | +0.395 |
ongs | +0.375 |
dh | +0.372 |
Neg logit contributions | |
osate | -0.599 |
ongyang | -0.454 |
� | -0.454 |
satisf | -0.446 |
Fug | -0.445 |
Token | to |
Token ID | 284 |
Feature activation | -5.35e-01 |
Pos logit contributions | |
Carbuncle | +0.831 |
hemy | +0.783 |
ndra | +0.752 |
ongs | +0.724 |
dh | +0.718 |
Neg logit contributions | |
osate | -1.064 |
ongyang | -0.801 |
� | -0.799 |
insula | -0.793 |
satisf | -0.788 |
Token | hear |
Token ID | 3285 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
Carbuncle | +0.474 |
hemy | +0.450 |
ndra | +0.441 |
ongs | +0.426 |
dh | +0.425 |
Neg logit contributions | |
osate | -0.466 |
� | -0.332 |
ongyang | -0.330 |
insula | -0.327 |
withd | -0.322 |
Token | about |
Token ID | 546 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
Carbuncle | +0.551 |
hemy | +0.521 |
ndra | +0.507 |
ongs | +0.481 |
dh | +0.475 |
Neg logit contributions | |
osate | -0.668 |
� | -0.505 |
ongyang | -0.502 |
satisf | -0.495 |
Fug | -0.495 |
Token | Nation |
Token ID | 8741 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
Carbuncle | +0.998 |
hemy | +0.951 |
ndra | +0.925 |
ongs | +0.889 |
bars | +0.886 |
Neg logit contributions | |
osate | -1.167 |
� | -0.869 |
ongyang | -0.857 |
insula | -0.854 |
withd | -0.849 |
Token | Travels |
Token ID | 48899 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
Carbuncle | +0.361 |
hemy | +0.339 |
ndra | +0.324 |
ongs | +0.300 |
bars | +0.295 |
Neg logit contributions | |
osate | -0.672 |
� | -0.537 |
ongyang | -0.530 |
Fug | -0.525 |
satisf | -0.523 |
Token | destinations |
Token ID | 23982 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
Carbuncle | +1.425 |
hemy | +1.316 |
ndra | +1.273 |
bars | +1.233 |
ongs | +1.229 |
Neg logit contributions | |
osate | -2.468 |
ongyang | -1.903 |
� | -1.902 |
withd | -1.872 |
insula | -1.872 |
Token | , |
Token ID | 11 |
Feature activation | -5.33e-01 |
Pos logit contributions | |
Carbuncle | +0.965 |
hemy | +0.914 |
ndra | +0.890 |
ongs | +0.853 |
dh | +0.846 |
Neg logit contributions | |
osate | -1.137 |
� | -0.844 |
ongyang | -0.840 |
insula | -0.831 |
Fug | -0.824 |
Token | and |
Token ID | 290 |
Feature activation | -3.62e-01 |
Pos logit contributions | |
Carbuncle | +0.459 |
hemy | +0.439 |
ndra | +0.432 |
ongs | +0.410 |
dh | +0.405 |
Neg logit contributions | |
osate | -0.470 |
� | -0.343 |
ongyang | -0.338 |
Fug | -0.336 |
insula | -0.335 |
Token | explore |
Token ID | 7301 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
Carbuncle | +0.270 |
hemy | +0.257 |
ndra | +0.252 |
ongs | +0.237 |
dh | +0.235 |
Neg logit contributions | |
osate | -0.362 |
� | -0.276 |
ongyang | -0.272 |
insula | -0.271 |
Fug | -0.270 |
Token | the |
Token ID | 262 |
Feature activation | -6.19e-01 |
Pos logit contributions | |
Carbuncle | +0.366 |
hemy | +0.350 |
ndra | +0.345 |
ongs | +0.326 |
bars | +0.320 |
Neg logit contributions | |
osate | -0.403 |
� | -0.299 |
ongyang | -0.295 |
insula | -0.292 |
Fug | -0.292 |
Token | oving |
Token ID | 5165 |
Feature activation | +7.16e-02 |
Pos logit contributions | |
Carbuncle | +0.139 |
hemy | +0.131 |
ndra | +0.127 |
ongs | +0.122 |
dh | +0.121 |
Neg logit contributions | |
osate | -0.192 |
� | -0.145 |
ongyang | -0.145 |
insula | -0.143 |
withd | -0.142 |
Token | Mont |
Token ID | 5575 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
osate | +0.073 |
� | +0.055 |
ongyang | +0.055 |
insula | +0.054 |
withd | +0.054 |
Neg logit contributions | |
Carbuncle | -0.053 |
hemy | -0.050 |
ndra | -0.048 |
ongs | -0.046 |
dh | -0.046 |
Token | pel |
Token ID | 30242 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
osate | +0.236 |
ongyang | +0.180 |
� | +0.180 |
insula | +0.177 |
satisf | +0.176 |
Neg logit contributions | |
Carbuncle | -0.158 |
hemy | -0.147 |
ndra | -0.143 |
ongs | -0.136 |
dh | -0.135 |
Token | ier |
Token ID | 959 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
Carbuncle | +0.254 |
hemy | +0.241 |
ndra | +0.233 |
ongs | +0.224 |
dh | +0.223 |
Neg logit contributions | |
osate | -0.260 |
ongyang | -0.189 |
� | -0.187 |
insula | -0.186 |
satisf | -0.183 |
Token | Bever |
Token ID | 22185 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
Carbuncle | +0.168 |
hemy | +0.158 |
ndra | +0.154 |
ongs | +0.146 |
bars | +0.145 |
Neg logit contributions | |
osate | -0.255 |
ongyang | -0.195 |
� | -0.195 |
insula | -0.193 |
withd | -0.191 |
Token | age |
Token ID | 496 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
Carbuncle | +0.202 |
hemy | +0.182 |
ndra | +0.173 |
ongs | +0.158 |
dh | +0.156 |
Neg logit contributions | |
osate | -0.633 |
� | -0.515 |
ongyang | -0.514 |
insula | -0.510 |
withd | -0.507 |
Token | would |
Token ID | 561 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
Carbuncle | +1.477 |
hemy | +1.371 |
ndra | +1.344 |
bars | +1.296 |
ongs | +1.280 |
Neg logit contributions | |
osate | -2.372 |
ongyang | -1.839 |
� | -1.834 |
insula | -1.807 |
withd | -1.796 |
Token | remove |
Token ID | 4781 |
Feature activation | +7.60e-02 |
Pos logit contributions | |
osate | +0.192 |
� | +0.140 |
ongyang | +0.140 |
insula | +0.138 |
withd | +0.137 |
Neg logit contributions | |
Carbuncle | -0.167 |
hemy | -0.158 |
ndra | -0.154 |
ongs | -0.148 |
bars | -0.147 |
Token | those |
Token ID | 883 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
osate | +0.077 |
� | +0.059 |
ongyang | +0.059 |
insula | +0.058 |
withd | +0.057 |
Neg logit contributions | |
Carbuncle | -0.056 |
hemy | -0.053 |
ndra | -0.051 |
ongs | -0.049 |
dh | -0.049 |
Token | yearly |
Token ID | 24169 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
osate | +0.428 |
� | +0.333 |
ongyang | +0.332 |
insula | +0.328 |
withd | +0.326 |
Neg logit contributions | |
Carbuncle | -0.249 |
hemy | -0.233 |
ndra | -0.225 |
ongs | -0.213 |
dh | -0.211 |
Token | taxes |
Token ID | 5704 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
Carbuncle | +0.123 |
hemy | +0.115 |
ndra | +0.112 |
ongs | +0.106 |
bars | +0.105 |
Neg logit contributions | |
osate | -0.194 |
� | -0.149 |
ongyang | -0.149 |
insula | -0.147 |
withd | -0.146 |
Token | Taliban |
Token ID | 15471 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
osate | +0.001 |
� | +0.001 |
ongyang | +0.001 |
insula | +0.001 |
withd | +0.001 |
Neg logit contributions | |
Carbuncle | -0.001 |
hemy | -0.001 |
ndra | -0.001 |
ongs | -0.001 |
bars | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
Carbuncle | +0.161 |
hemy | +0.150 |
ndra | +0.146 |
ongs | +0.140 |
bars | +0.139 |
Neg logit contributions | |
osate | -0.245 |
� | -0.187 |
ongyang | -0.187 |
insula | -0.184 |
withd | -0.182 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +7.46e-01 |
Pos logit contributions | |
Carbuncle | +0.106 |
hemy | +0.101 |
ndra | +0.099 |
ongs | +0.095 |
dh | +0.095 |
Neg logit contributions | |
osate | -0.111 |
� | -0.081 |
ongyang | -0.081 |
withd | -0.080 |
insula | -0.080 |
Token | Looking |
Token ID | 15784 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
osate | +0.731 |
ongyang | +0.542 |
� | +0.541 |
withd | +0.538 |
insula | +0.536 |
Neg logit contributions | |
Carbuncle | -0.577 |
hemy | -0.548 |
ndra | -0.537 |
dh | -0.514 |
ongs | -0.513 |
Token | for |
Token ID | 329 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
osate | +0.240 |
� | +0.178 |
ongyang | +0.178 |
insula | +0.176 |
withd | +0.174 |
Neg logit contributions | |
Carbuncle | -0.198 |
hemy | -0.187 |
ndra | -0.183 |
ongs | -0.176 |
bars | -0.174 |
Token | news |
Token ID | 1705 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
osate | +0.197 |
� | +0.153 |
ongyang | +0.152 |
insula | +0.151 |
withd | +0.149 |
Neg logit contributions | |
Carbuncle | -0.120 |
hemy | -0.112 |
ndra | -0.109 |
ongs | -0.104 |
dh | -0.103 |
Token | you |
Token ID | 345 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Carbuncle | +1.520 |
hemy | +1.422 |
ndra | +1.381 |
ongs | +1.313 |
dh | +1.304 |
Neg logit contributions | |
osate | -2.290 |
� | -1.752 |
ongyang | -1.748 |
insula | -1.723 |
Fug | -1.712 |
Token | can |
Token ID | 460 |
Feature activation | +4.12e-01 |
Pos logit contributions | |
Carbuncle | +0.087 |
hemy | +0.082 |
ndra | +0.080 |
ongs | +0.077 |
dh | +0.075 |
Neg logit contributions | |
osate | -0.097 |
ongyang | -0.072 |
� | -0.071 |
Fug | -0.071 |
satisf | -0.071 |
Token | trust |
Token ID | 3774 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
osate | +0.314 |
ongyang | +0.219 |
satisf | +0.217 |
Fug | +0.217 |
� | +0.216 |
Neg logit contributions | |
Carbuncle | -0.398 |
hemy | -0.381 |
ndra | -0.366 |
ongs | -0.361 |
dh | -0.349 |
Token | ? |
Token ID | 30 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
Carbuncle | +0.100 |
hemy | +0.094 |
ndra | +0.092 |
ongs | +0.089 |
bars | +0.087 |
Neg logit contributions | |
osate | -0.108 |
� | -0.079 |
ongyang | -0.079 |
Fug | -0.078 |
insula | -0.078 |
Token |
|
Token ID | 198 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
osate | +0.132 |
� | +0.095 |
ongyang | +0.094 |
Fug | +0.093 |
insula | +0.092 |
Neg logit contributions | |
Carbuncle | -0.139 |
hemy | -0.132 |
ndra | -0.128 |
ongs | -0.124 |
bars | -0.123 |
Token |
|
Token ID | 198 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
osate | +0.589 |
� | +0.424 |
Fug | +0.411 |
ongyang | +0.411 |
insula | +0.406 |
Neg logit contributions | |
Carbuncle | -0.646 |
hemy | -0.616 |
ndra | -0.594 |
ongs | -0.578 |
bars | -0.571 |
Token | Subscribe |
Token ID | 27125 |
Feature activation | +7.52e-01 |
Pos logit contributions | |
osate | +0.458 |
� | +0.292 |
ongyang | +0.283 |
insula | +0.277 |
Fug | +0.276 |
Neg logit contributions | |
Carbuncle | -0.775 |
hemy | -0.743 |
ndra | -0.726 |
ongs | -0.705 |
bars | -0.699 |
Token | to |
Token ID | 284 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
osate | +0.728 |
� | +0.548 |
ongyang | +0.542 |
insula | +0.539 |
Fug | +0.538 |
Neg logit contributions | |
Carbuncle | -0.583 |
hemy | -0.554 |
ndra | -0.538 |
ongs | -0.517 |
dh | -0.507 |
Token | our |
Token ID | 674 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
osate | +0.021 |
� | +0.015 |
ongyang | +0.015 |
Fug | +0.015 |
insula | +0.015 |
Neg logit contributions | |
Carbuncle | -0.023 |
hemy | -0.022 |
ndra | -0.021 |
ongs | -0.020 |
dh | -0.020 |
Token | free |
Token ID | 1479 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
osate | +0.128 |
� | +0.095 |
ongyang | +0.095 |
Fug | +0.094 |
satisf | +0.093 |
Neg logit contributions | |
Carbuncle | -0.113 |
hemy | -0.108 |
ndra | -0.105 |
ongs | -0.101 |
dh | -0.099 |
Token | newsletters |
Token ID | 16983 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
Carbuncle | +0.359 |
hemy | +0.335 |
ndra | +0.323 |
ongs | +0.309 |
bars | +0.308 |
Neg logit contributions | |
osate | -0.637 |
� | -0.495 |
ongyang | -0.494 |
insula | -0.490 |
withd | -0.490 |
Token | . |
Token ID | 13 |
Feature activation | +5.91e-01 |
Pos logit contributions | |
Carbuncle | +1.355 |
hemy | +1.266 |
ndra | +1.225 |
ongs | +1.158 |
dh | +1.150 |
Neg logit contributions | |
osate | -2.442 |
� | -1.906 |
ongyang | -1.901 |
withd | -1.880 |
insula | -1.880 |
Token |
|
Token ID | 198 |
Feature activation | +9.95e-01 |
Pos logit contributions | |
osate | +0.519 |
� | +0.373 |
ongyang | +0.372 |
insula | +0.366 |
Fug | +0.365 |
Neg logit contributions | |
Carbuncle | -0.515 |
hemy | -0.493 |
ndra | -0.480 |
ongs | -0.462 |
dh | -0.457 |
Token |
|
Token ID | 198 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
osate | +0.838 |
� | +0.605 |
ongyang | +0.591 |
Fug | +0.590 |
satisf | +0.583 |
Neg logit contributions | |
Carbuncle | -0.896 |
hemy | -0.857 |
ndra | -0.827 |
ongs | -0.801 |
bars | -0.793 |
Token | Update |
Token ID | 10260 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
osate | +0.972 |
ongyang | +0.721 |
� | +0.719 |
insula | +0.711 |
withd | +0.711 |
Neg logit contributions | |
Carbuncle | -0.787 |
hemy | -0.747 |
ndra | -0.731 |
ongs | -0.698 |
dh | -0.697 |
Token | , |
Token ID | 11 |
Feature activation | +3.90e-01 |
Pos logit contributions | |
osate | +0.437 |
� | +0.327 |
ongyang | +0.326 |
insula | +0.323 |
withd | +0.321 |
Neg logit contributions | |
Carbuncle | -0.343 |
hemy | -0.325 |
ndra | -0.316 |
ongs | -0.302 |
bars | -0.302 |
Token | first |
Token ID | 717 |
Feature activation | -3.87e-01 |
Pos logit contributions | |
osate | +0.570 |
Fug | +0.430 |
satisf | +0.426 |
ongyang | +0.425 |
� | +0.425 |
Neg logit contributions | |
Carbuncle | -0.444 |
hemy | -0.427 |
ndra | -0.402 |
ongs | -0.392 |
dh | -0.385 |
Token | to |
Token ID | 284 |
Feature activation | +5.26e-02 |
Pos logit contributions | |
Carbuncle | +0.296 |
hemy | +0.281 |
ndra | +0.270 |
ongs | +0.260 |
dh | +0.256 |
Neg logit contributions | |
osate | -0.381 |
� | -0.287 |
ongyang | -0.285 |
insula | -0.282 |
Fug | -0.282 |
Token | hear |
Token ID | 3285 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
osate | +0.042 |
ongyang | +0.030 |
� | +0.030 |
insula | +0.029 |
satisf | +0.029 |
Neg logit contributions | |
Carbuncle | -0.050 |
hemy | -0.047 |
ndra | -0.046 |
ongs | -0.045 |
dh | -0.044 |
Token | about |
Token ID | 546 |
Feature activation | -8.33e-01 |
Pos logit contributions | |
Carbuncle | +0.314 |
hemy | +0.296 |
ndra | +0.286 |
ongs | +0.274 |
bars | +0.271 |
Neg logit contributions | |
osate | -0.396 |
� | -0.298 |
ongyang | -0.295 |
satisf | -0.293 |
Fug | -0.293 |
Token | Nation |
Token ID | 8741 |
Feature activation | +3.92e-02 |
Pos logit contributions | |
Carbuncle | +0.712 |
hemy | +0.676 |
ndra | +0.659 |
ongs | +0.635 |
dh | +0.630 |
Neg logit contributions | |
osate | -0.750 |
� | -0.544 |
ongyang | -0.542 |
insula | -0.533 |
Fug | -0.530 |
Token | Travels |
Token ID | 48899 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
osate | +0.044 |
� | +0.035 |
ongyang | +0.035 |
Fug | +0.035 |
satisf | +0.035 |
Neg logit contributions | |
Carbuncle | -0.024 |
hemy | -0.023 |
ndra | -0.022 |
ongs | -0.020 |
dh | -0.020 |
Token | destinations |
Token ID | 23982 |
Feature activation | -9.85e-01 |
Pos logit contributions | |
Carbuncle | +1.417 |
hemy | +1.315 |
ndra | +1.273 |
bars | +1.220 |
ongs | +1.218 |
Neg logit contributions | |
osate | -2.379 |
ongyang | -1.833 |
� | -1.826 |
withd | -1.802 |
insula | -1.802 |
Token | , |
Token ID | 11 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
Carbuncle | +0.783 |
hemy | +0.741 |
ndra | +0.721 |
ongs | +0.692 |
dh | +0.685 |
Neg logit contributions | |
osate | -0.945 |
� | -0.703 |
ongyang | -0.699 |
insula | -0.690 |
Fug | -0.684 |
Token | and |
Token ID | 290 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
osate | +0.178 |
� | +0.130 |
ongyang | +0.128 |
satisf | +0.127 |
Fug | +0.127 |
Neg logit contributions | |
Carbuncle | -0.171 |
hemy | -0.163 |
ndra | -0.159 |
ongs | -0.152 |
dh | -0.151 |
Token | explore |
Token ID | 7301 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
osate | +0.028 |
� | +0.021 |
ongyang | +0.021 |
insula | +0.021 |
satisf | +0.021 |
Neg logit contributions | |
Carbuncle | -0.021 |
hemy | -0.020 |
ndra | -0.019 |
ongs | -0.018 |
dh | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Carbuncle | +0.227 |
hemy | +0.215 |
ndra | +0.209 |
ongs | +0.201 |
dh | +0.199 |
Neg logit contributions | |
osate | -0.279 |
� | -0.208 |
ongyang | -0.207 |
insula | -0.204 |
satisf | -0.202 |
Token | ] |
Token ID | 60 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
osate | +0.074 |
� | +0.051 |
ongyang | +0.051 |
insula | +0.050 |
withd | +0.049 |
Neg logit contributions | |
Carbuncle | -0.087 |
hemy | -0.082 |
ndra | -0.081 |
ongs | -0.078 |
bars | -0.078 |
Token | go |
Token ID | 467 |
Feature activation | +1.87e-02 |
Pos logit contributions | |
osate | +0.151 |
� | +0.106 |
ongyang | +0.106 |
insula | +0.104 |
withd | +0.103 |
Neg logit contributions | |
Carbuncle | -0.166 |
hemy | -0.158 |
ndra | -0.155 |
ongs | -0.149 |
dh | -0.148 |
Token | into |
Token ID | 656 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
osate | +0.019 |
� | +0.014 |
ongyang | +0.014 |
insula | +0.014 |
withd | +0.013 |
Neg logit contributions | |
Carbuncle | -0.014 |
hemy | -0.013 |
ndra | -0.013 |
ongs | -0.013 |
bars | -0.013 |
Token | [ |
Token ID | 685 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
osate | +0.246 |
� | +0.187 |
ongyang | +0.186 |
insula | +0.184 |
withd | +0.182 |
Neg logit contributions | |
Carbuncle | -0.175 |
hemy | -0.165 |
ndra | -0.160 |
ongs | -0.153 |
dh | -0.152 |
Token | Storm |
Token ID | 32173 |
Feature activation | -7.19e-01 |
Pos logit contributions | |
Carbuncle | +0.143 |
hemy | +0.136 |
ndra | +0.133 |
dh | +0.127 |
ongs | +0.127 |
Neg logit contributions | |
osate | -0.195 |
ongyang | -0.145 |
� | -0.145 |
withd | -0.143 |
insula | -0.142 |
Token | tro |
Token ID | 23528 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Carbuncle | +0.173 |
hemy | +0.144 |
ndra | +0.129 |
ongs | +0.108 |
dh | +0.106 |
Neg logit contributions | |
osate | -1.087 |
� | -0.910 |
ongyang | -0.909 |
insula | -0.902 |
withd | -0.899 |
Token | opers |
Token ID | 20618 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Carbuncle | +1.510 |
hemy | +1.438 |
ndra | +1.406 |
ongs | +1.355 |
dh | +1.334 |
Neg logit contributions | |
osate | -2.168 |
� | -1.653 |
ongyang | -1.636 |
insula | -1.633 |
withd | -1.633 |
Token | '] |
Token ID | 20520 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Carbuncle | +1.184 |
hemy | +1.129 |
ndra | +1.108 |
bars | +1.075 |
ongs | +1.075 |
Neg logit contributions | |
osate | -1.145 |
� | -0.811 |
ongyang | -0.805 |
insula | -0.793 |
withd | -0.787 |
Token | past |
Token ID | 1613 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
Carbuncle | +0.073 |
hemy | +0.069 |
ndra | +0.067 |
ongs | +0.063 |
dh | +0.063 |
Neg logit contributions | |
osate | -0.113 |
� | -0.087 |
ongyang | -0.087 |
insula | -0.086 |
withd | -0.085 |
Token | s |
Token ID | 82 |
Feature activation | -9.30e-01 |
Pos logit contributions | |
Carbuncle | +0.137 |
hemy | +0.129 |
ndra | +0.125 |
ongs | +0.120 |
bars | +0.120 |
Neg logit contributions | |
osate | -0.190 |
� | -0.144 |
ongyang | -0.143 |
insula | -0.141 |
withd | -0.140 |
Token | or |
Token ID | 393 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
Carbuncle | +0.700 |
hemy | +0.659 |
ndra | +0.640 |
ongs | +0.621 |
bars | +0.619 |
Neg logit contributions | |
osate | -0.937 |
ongyang | -0.705 |
� | -0.703 |
insula | -0.691 |
withd | -0.678 |
Token | assistant |
Token ID | 8796 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
Carbuncle | +0.184 |
hemy | +0.173 |
ndra | +0.169 |
ongs | +0.162 |
dh | +0.160 |
Neg logit contributions | |
osate | -0.234 |
� | -0.175 |
ongyang | -0.175 |
insula | -0.172 |
withd | -0.171 |
Token | coach |
Token ID | 3985 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
Carbuncle | +0.223 |
hemy | +0.209 |
ndra | +0.205 |
bars | +0.198 |
ongs | +0.198 |
Neg logit contributions | |
osate | -0.250 |
ongyang | -0.183 |
� | -0.183 |
insula | -0.180 |
withd | -0.177 |
Token | with |
Token ID | 351 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
osate | +0.080 |
� | +0.060 |
ongyang | +0.060 |
insula | +0.059 |
withd | +0.058 |
Neg logit contributions | |
Carbuncle | -0.061 |
hemy | -0.057 |
ndra | -0.056 |
ongs | -0.054 |
bars | -0.053 |
Token | the |
Token ID | 262 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
Carbuncle | +0.103 |
hemy | +0.096 |
ndra | +0.094 |
ongs | +0.090 |
bars | +0.089 |
Neg logit contributions | |
osate | -0.142 |
ongyang | -0.107 |
� | -0.107 |
insula | -0.106 |
withd | -0.105 |
Token | Columbus |
Token ID | 14939 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
osate | +0.032 |
� | +0.024 |
ongyang | +0.024 |
insula | +0.023 |
withd | +0.023 |
Neg logit contributions | |
Carbuncle | -0.023 |
hemy | -0.022 |
ndra | -0.022 |
ongs | -0.021 |
dh | -0.020 |
Token | Crew |
Token ID | 17652 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
Carbuncle | +0.762 |
hemy | +0.701 |
ndra | +0.673 |
ongs | +0.634 |
dh | +0.625 |
Neg logit contributions | |
osate | -1.710 |
� | -1.361 |
ongyang | -1.359 |
insula | -1.345 |
withd | -1.338 |
Token | . |
Token ID | 13 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
Carbuncle | +1.348 |
hemy | +1.247 |
ndra | +1.209 |
ongs | +1.157 |
dh | +1.150 |
Neg logit contributions | |
osate | -2.353 |
� | -1.823 |
ongyang | -1.821 |
insula | -1.807 |
withd | -1.787 |
Token | " |
Token ID | 366 |
Feature activation | -5.36e-01 |
Pos logit contributions | |
Carbuncle | +0.208 |
hemy | +0.193 |
ndra | +0.187 |
ongs | +0.178 |
dh | +0.176 |
Neg logit contributions | |
osate | -0.386 |
� | -0.303 |
ongyang | -0.302 |
withd | -0.300 |
insula | -0.299 |
Token | I |
Token ID | 40 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
Carbuncle | +0.389 |
hemy | +0.366 |
ndra | +0.358 |
dh | +0.343 |
ongs | +0.342 |
Neg logit contributions | |
osate | -0.552 |
ongyang | -0.419 |
� | -0.415 |
insula | -0.412 |
withd | -0.412 |
Token | just |
Token ID | 655 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
Carbuncle | +0.227 |
hemy | +0.215 |
ndra | +0.211 |
ongs | +0.203 |
dh | +0.202 |
Neg logit contributions | |
osate | -0.228 |
� | -0.164 |
ongyang | -0.163 |
insula | -0.161 |
withd | -0.159 |
Token | kept |
Token ID | 4030 |
Feature activation | +1.29e-01 |
Pos logit contributions | |
osate | +0.286 |
� | +0.209 |
ongyang | +0.208 |
insula | +0.205 |
withd | +0.203 |
Neg logit contributions | |
Carbuncle | -0.261 |
hemy | -0.248 |
ndra | -0.242 |
ongs | -0.233 |
dh | -0.231 |
Token | and |
Token ID | 290 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
Carbuncle | +0.481 |
hemy | +0.454 |
ndra | +0.437 |
ongs | +0.427 |
bars | +0.426 |
Neg logit contributions | |
osate | -0.618 |
ongyang | -0.461 |
� | -0.458 |
insula | -0.454 |
withd | -0.449 |
Token | original |
Token ID | 2656 |
Feature activation | +1.22e-03 |
Pos logit contributions | |
Carbuncle | +0.053 |
hemy | +0.050 |
ndra | +0.048 |
ongs | +0.046 |
dh | +0.046 |
Neg logit contributions | |
osate | -0.081 |
� | -0.062 |
ongyang | -0.062 |
insula | -0.061 |
withd | -0.061 |
Token | sound |
Token ID | 2128 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
osate | +0.001 |
� | +0.001 |
ongyang | +0.001 |
insula | +0.001 |
withd | +0.001 |
Neg logit contributions | |
Carbuncle | -0.001 |
hemy | -0.001 |
ndra | -0.001 |
ongs | -0.001 |
dh | -0.001 |
Token | rec |
Token ID | 664 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
osate | +0.032 |
� | +0.024 |
ongyang | +0.024 |
insula | +0.024 |
withd | +0.024 |
Neg logit contributions | |
Carbuncle | -0.022 |
hemy | -0.021 |
ndra | -0.020 |
ongs | -0.019 |
bars | -0.019 |
Token | od |
Token ID | 375 |
Feature activation | -6.84e-01 |
Pos logit contributions | |
osate | +0.446 |
� | +0.339 |
ongyang | +0.337 |
insula | +0.333 |
withd | +0.331 |
Neg logit contributions | |
Carbuncle | -0.326 |
hemy | -0.308 |
ndra | -0.299 |
ongs | -0.288 |
dh | -0.285 |
Token | ording |
Token ID | 1284 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
Carbuncle | +0.457 |
hemy | +0.428 |
ndra | +0.407 |
ongs | +0.401 |
dh | +0.396 |
Neg logit contributions | |
osate | -0.750 |
� | -0.578 |
ongyang | -0.569 |
insula | -0.564 |
withd | -0.563 |
Token | instead |
Token ID | 2427 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
Carbuncle | +1.542 |
hemy | +1.436 |
ndra | +1.396 |
bars | +1.365 |
ongs | +1.363 |
Neg logit contributions | |
osate | -2.139 |
ongyang | -1.607 |
� | -1.595 |
insula | -1.590 |
withd | -1.561 |
Token | of |
Token ID | 286 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
Carbuncle | +0.216 |
hemy | +0.202 |
ndra | +0.196 |
ongs | +0.189 |
bars | +0.187 |
Neg logit contributions | |
osate | -0.355 |
ongyang | -0.275 |
� | -0.273 |
insula | -0.272 |
withd | -0.269 |
Token | the |
Token ID | 262 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
Carbuncle | +0.203 |
hemy | +0.190 |
ndra | +0.184 |
ongs | +0.178 |
bars | +0.177 |
Neg logit contributions | |
osate | -0.289 |
ongyang | -0.219 |
� | -0.219 |
insula | -0.217 |
withd | -0.214 |
Token | narration |
Token ID | 45127 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
Carbuncle | +0.023 |
hemy | +0.021 |
ndra | +0.021 |
ongs | +0.020 |
dh | +0.020 |
Neg logit contributions | |
osate | -0.034 |
� | -0.026 |
ongyang | -0.026 |
insula | -0.026 |
withd | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
osate | +0.240 |
� | +0.181 |
ongyang | +0.181 |
insula | +0.178 |
withd | +0.176 |
Neg logit contributions | |
Carbuncle | -0.181 |
hemy | -0.170 |
ndra | -0.165 |
ongs | -0.159 |
bars | -0.158 |
Token | Sanders |
Token ID | 5831 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
Carbuncle | +0.232 |
hemy | +0.219 |
ndra | +0.213 |
ongs | +0.205 |
bars | +0.205 |
Neg logit contributions | |
osate | -0.253 |
ongyang | -0.185 |
� | -0.185 |
insula | -0.181 |
withd | -0.181 |
Token | : |
Token ID | 25 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
Carbuncle | +0.804 |
hemy | +0.763 |
ndra | +0.745 |
ongs | +0.717 |
dh | +0.711 |
Neg logit contributions | |
osate | -0.851 |
� | -0.620 |
ongyang | -0.615 |
insula | -0.607 |
withd | -0.603 |
Token | ' |
Token ID | 705 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
osate | +0.339 |
ongyang | +0.262 |
� | +0.262 |
Fug | +0.259 |
insula | +0.257 |
Neg logit contributions | |
Carbuncle | -0.208 |
hemy | -0.196 |
ndra | -0.187 |
ongs | -0.180 |
dh | -0.176 |
Token | Damn |
Token ID | 43343 |
Feature activation | +9.13e-02 |
Pos logit contributions | |
Carbuncle | +0.735 |
hemy | +0.704 |
ndra | +0.701 |
dh | +0.664 |
bars | +0.656 |
Neg logit contributions | |
osate | -1.135 |
ongyang | -0.867 |
� | -0.860 |
insula | -0.853 |
withd | -0.849 |
Token | right |
Token ID | 826 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
osate | +0.089 |
� | +0.066 |
ongyang | +0.066 |
insula | +0.065 |
Fug | +0.065 |
Neg logit contributions | |
Carbuncle | -0.071 |
hemy | -0.067 |
ndra | -0.065 |
ongs | -0.063 |
dh | -0.063 |
Token | ' |
Token ID | 6 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
Carbuncle | +0.085 |
hemy | +0.080 |
ndra | +0.078 |
ongs | +0.074 |
bars | +0.074 |
Neg logit contributions | |
osate | -0.120 |
� | -0.092 |
ongyang | -0.092 |
insula | -0.090 |
withd | -0.090 |
Token | I |
Token ID | 314 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
Carbuncle | +1.441 |
hemy | +1.349 |
ndra | +1.294 |
bars | +1.292 |
dh | +1.232 |
Neg logit contributions | |
osate | -2.180 |
� | -1.687 |
ongyang | -1.672 |
insula | -1.639 |
satisf | -1.636 |
Token | 'll |
Token ID | 1183 |
Feature activation | +2.82e-01 |
Pos logit contributions | |
Carbuncle | +0.176 |
hemy | +0.168 |
ndra | +0.164 |
ongs | +0.157 |
dh | +0.157 |
Neg logit contributions | |
osate | -0.181 |
� | -0.131 |
ongyang | -0.131 |
insula | -0.129 |
withd | -0.127 |
Token | make |
Token ID | 787 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
osate | +0.230 |
� | +0.164 |
satisf | +0.159 |
withd | +0.159 |
ongyang | +0.158 |
Neg logit contributions | |
Carbuncle | -0.265 |
hemy | -0.249 |
ndra | -0.245 |
ongs | -0.236 |
dh | -0.234 |
Token | the |
Token ID | 262 |
Feature activation | +1.49e-01 |
Pos logit contributions | |
Carbuncle | +0.221 |
hemy | +0.204 |
ndra | +0.199 |
ongs | +0.197 |
dh | +0.193 |
Neg logit contributions | |
osate | -0.295 |
� | -0.225 |
Fug | -0.223 |
insula | -0.221 |
ongyang | -0.219 |
Token | large |
Token ID | 1588 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
osate | +0.153 |
ongyang | +0.116 |
� | +0.116 |
insula | +0.114 |
satisf | +0.113 |
Neg logit contributions | |
Carbuncle | -0.109 |
hemy | -0.102 |
ndra | -0.099 |
ongs | -0.095 |
dh | -0.093 |
Token | about |
Token ID | 546 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
osate | +0.426 |
� | +0.323 |
ongyang | +0.322 |
insula | +0.318 |
withd | +0.315 |
Neg logit contributions | |
Carbuncle | -0.303 |
hemy | -0.285 |
ndra | -0.277 |
ongs | -0.265 |
dh | -0.262 |
Token | the |
Token ID | 262 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
Carbuncle | +0.337 |
hemy | +0.316 |
ndra | +0.308 |
ongs | +0.295 |
dh | +0.294 |
Neg logit contributions | |
osate | -0.441 |
ongyang | -0.331 |
� | -0.331 |
insula | -0.326 |
withd | -0.322 |
Token | proliferation |
Token ID | 25068 |
Feature activation | +2.94e-01 |
Pos logit contributions | |
Carbuncle | +0.171 |
hemy | +0.161 |
ndra | +0.157 |
ongs | +0.149 |
dh | +0.148 |
Neg logit contributions | |
osate | -0.247 |
� | -0.188 |
ongyang | -0.188 |
insula | -0.186 |
withd | -0.184 |
Token | of |
Token ID | 286 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
osate | +0.318 |
ongyang | +0.246 |
� | +0.246 |
insula | +0.242 |
withd | +0.240 |
Neg logit contributions | |
Carbuncle | -0.198 |
hemy | -0.184 |
ndra | -0.179 |
ongs | -0.171 |
dh | -0.170 |
Token | illegal |
Token ID | 5293 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
Carbuncle | +0.327 |
hemy | +0.306 |
ndra | +0.298 |
ongs | +0.285 |
bars | +0.284 |
Neg logit contributions | |
osate | -0.459 |
� | -0.348 |
ongyang | -0.348 |
insula | -0.343 |
withd | -0.339 |
Token | bowling |
Token ID | 33564 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
osate | +0.326 |
� | +0.247 |
ongyang | +0.247 |
insula | +0.244 |
withd | +0.242 |
Neg logit contributions | |
Carbuncle | -0.234 |
hemy | -0.220 |
ndra | -0.214 |
ongs | -0.204 |
dh | -0.203 |
Token | actions |
Token ID | 4028 |
Feature activation | -6.26e-01 |
Pos logit contributions | |
Carbuncle | +1.539 |
hemy | +1.450 |
ndra | +1.413 |
bars | +1.364 |
ongs | +1.358 |
Neg logit contributions | |
osate | -2.120 |
ongyang | -1.601 |
� | -1.591 |
insula | -1.577 |
withd | -1.541 |
Token | , |
Token ID | 11 |
Feature activation | -4.25e-01 |
Pos logit contributions | |
Carbuncle | +0.464 |
hemy | +0.439 |
ndra | +0.426 |
bars | +0.408 |
ongs | +0.408 |
Neg logit contributions | |
osate | -0.637 |
ongyang | -0.481 |
� | -0.479 |
insula | -0.472 |
withd | -0.465 |
Token | D |
Token ID | 360 |
Feature activation | +8.12e-02 |
Pos logit contributions | |
Carbuncle | +0.306 |
hemy | +0.287 |
ndra | +0.279 |
ongs | +0.267 |
dh | +0.265 |
Neg logit contributions | |
osate | -0.440 |
ongyang | -0.336 |
� | -0.335 |
insula | -0.331 |
withd | -0.327 |
Token | rav |
Token ID | 4108 |
Feature activation | +3.29e-02 |
Pos logit contributions | |
osate | +0.064 |
ongyang | +0.045 |
� | +0.044 |
insula | +0.044 |
satisf | +0.043 |
Neg logit contributions | |
Carbuncle | -0.079 |
hemy | -0.074 |
ndra | -0.072 |
bars | -0.070 |
ongs | -0.070 |
Token | id |
Token ID | 312 |
Feature activation | +5.97e-01 |
Pos logit contributions | |
osate | +0.028 |
ongyang | +0.020 |
� | +0.020 |
insula | +0.020 |
satisf | +0.020 |
Neg logit contributions | |
Carbuncle | -0.029 |
hemy | -0.028 |
ndra | -0.026 |
bars | -0.026 |
ongs | -0.026 |
Token | whore |
Token ID | 40107 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
Carbuncle | +0.136 |
hemy | +0.128 |
ndra | +0.125 |
ongs | +0.119 |
bars | +0.118 |
Neg logit contributions | |
osate | -0.182 |
� | -0.137 |
ongyang | -0.137 |
insula | -0.135 |
withd | -0.134 |
Token | house |
Token ID | 4803 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
Carbuncle | +0.015 |
hemy | +0.015 |
ndra | +0.014 |
ongs | +0.014 |
bars | +0.014 |
Neg logit contributions | |
osate | -0.018 |
ongyang | -0.013 |
� | -0.013 |
insula | -0.013 |
withd | -0.013 |
Token | … |
Token ID | 1399 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
osate | +0.339 |
ongyang | +0.256 |
� | +0.256 |
insula | +0.252 |
withd | +0.250 |
Neg logit contributions | |
Carbuncle | -0.250 |
hemy | -0.234 |
ndra | -0.228 |
ongs | -0.219 |
bars | -0.218 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
osate | +0.396 |
� | +0.295 |
ongyang | +0.295 |
insula | +0.290 |
withd | +0.287 |
Neg logit contributions | |
Carbuncle | -0.317 |
hemy | -0.299 |
ndra | -0.291 |
ongs | -0.279 |
dh | -0.278 |
Token | Steven |
Token ID | 28292 |
Feature activation | -8.22e-01 |
Pos logit contributions | |
osate | +0.560 |
ongyang | +0.415 |
� | +0.415 |
withd | +0.412 |
insula | +0.411 |
Neg logit contributions | |
Carbuncle | -0.442 |
hemy | -0.421 |
ndra | -0.412 |
dh | -0.395 |
ongs | -0.394 |
Token | Gerrard |
Token ID | 49314 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
Carbuncle | +0.586 |
hemy | +0.545 |
ndra | +0.531 |
ongs | +0.509 |
dh | +0.505 |
Neg logit contributions | |
osate | -0.859 |
ongyang | -0.658 |
� | -0.657 |
insula | -0.646 |
withd | -0.645 |
Token | scored |
Token ID | 7781 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
Carbuncle | +1.616 |
hemy | +1.508 |
ndra | +1.472 |
bars | +1.423 |
ongs | +1.423 |
Neg logit contributions | |
osate | -2.037 |
insula | -1.519 |
ongyang | -1.518 |
� | -1.515 |
withd | -1.470 |
Token | his |
Token ID | 465 |
Feature activation | -8.31e-02 |
Pos logit contributions | |
Carbuncle | +0.372 |
hemy | +0.349 |
ndra | +0.340 |
ongs | +0.327 |
bars | +0.326 |
Neg logit contributions | |
osate | -0.494 |
� | -0.370 |
ongyang | -0.369 |
insula | -0.366 |
withd | -0.360 |
Token | 100 |
Token ID | 1802 |
Feature activation | -7.37e-01 |
Pos logit contributions | |
Carbuncle | +0.058 |
hemy | +0.054 |
ndra | +0.053 |
ongs | +0.050 |
bars | +0.050 |
Neg logit contributions | |
osate | -0.088 |
ongyang | -0.068 |
� | -0.068 |
insula | -0.067 |
withd | -0.066 |
Token | th |
Token ID | 400 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
Carbuncle | +0.398 |
hemy | +0.367 |
ndra | +0.353 |
ongs | +0.330 |
dh | +0.327 |
Neg logit contributions | |
osate | -0.895 |
� | -0.713 |
ongyang | -0.712 |
insula | -0.704 |
withd | -0.700 |
Token | Premier |
Token ID | 9952 |
Feature activation | -7.11e-01 |
Pos logit contributions | |
Carbuncle | +0.506 |
hemy | +0.471 |
ndra | +0.456 |
ongs | +0.431 |
dh | +0.427 |
Neg logit contributions | |
osate | -0.913 |
� | -0.713 |
ongyang | -0.711 |
insula | -0.703 |
withd | -0.699 |
Token |
|
Token ID | 198 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
osate | +0.108 |
� | +0.080 |
ongyang | +0.080 |
insula | +0.078 |
withd | +0.078 |
Neg logit contributions | |
Carbuncle | -0.089 |
hemy | -0.084 |
ndra | -0.082 |
ongs | -0.078 |
bars | -0.078 |
Token |
|
Token ID | 198 |
Feature activation | -4.09e-01 |
Pos logit contributions | |
Carbuncle | +0.309 |
hemy | +0.294 |
ndra | +0.286 |
ongs | +0.275 |
bars | +0.272 |
Neg logit contributions | |
osate | -0.307 |
� | -0.222 |
ongyang | -0.220 |
insula | -0.216 |
satisf | -0.216 |
Token | search |
Token ID | 12947 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
Carbuncle | +0.296 |
hemy | +0.280 |
ndra | +0.273 |
dh | +0.261 |
ongs | +0.260 |
Neg logit contributions | |
osate | -0.421 |
� | -0.318 |
ongyang | -0.318 |
withd | -0.314 |
insula | -0.312 |
Token | Space |
Token ID | 14106 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
Carbuncle | +0.619 |
hemy | +0.589 |
ndra | +0.577 |
ongs | +0.561 |
bars | +0.560 |
Neg logit contributions | |
osate | -0.530 |
� | -0.365 |
ongyang | -0.364 |
insula | -0.356 |
withd | -0.354 |
Token | = |
Token ID | 796 |
Feature activation | -3.11e-01 |
Pos logit contributions | |
osate | +0.384 |
� | +0.291 |
ongyang | +0.291 |
insula | +0.287 |
withd | +0.284 |
Neg logit contributions | |
Carbuncle | -0.274 |
hemy | -0.257 |
ndra | -0.250 |
ongs | -0.239 |
dh | -0.237 |
Token | Select |
Token ID | 9683 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
Carbuncle | +0.220 |
hemy | +0.206 |
ndra | +0.200 |
ongs | +0.191 |
bars | +0.190 |
Neg logit contributions | |
osate | -0.326 |
� | -0.249 |
ongyang | -0.248 |
insula | -0.245 |
withd | -0.243 |
Token | [ |
Token ID | 58 |
Feature activation | +1.59e-03 |
Pos logit contributions | |
Carbuncle | +1.539 |
hemy | +1.437 |
ndra | +1.398 |
bars | +1.341 |
ongs | +1.336 |
Neg logit contributions | |
osate | -2.101 |
� | -1.589 |
ongyang | -1.585 |
insula | -1.558 |
withd | -1.556 |
Token | # |
Token ID | 2 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
osate | +0.002 |
ongyang | +0.001 |
� | +0.001 |
insula | +0.001 |
withd | +0.001 |
Neg logit contributions | |
Carbuncle | -0.001 |
hemy | -0.001 |
ndra | -0.001 |
dh | -0.001 |
ongs | -0.001 |
Token | == |
Token ID | 6624 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Carbuncle | +0.393 |
hemy | +0.371 |
ndra | +0.361 |
dh | +0.344 |
ongs | +0.343 |
Neg logit contributions | |
osate | -0.586 |
ongyang | -0.447 |
� | -0.446 |
withd | -0.438 |
insula | -0.436 |
Token | " |
Token ID | 366 |
Feature activation | -8.12e-01 |
Pos logit contributions | |
Carbuncle | +0.214 |
hemy | +0.201 |
ndra | +0.196 |
ongs | +0.187 |
bars | +0.186 |
Neg logit contributions | |
osate | -0.301 |
ongyang | -0.228 |
� | -0.228 |
insula | -0.223 |
withd | -0.222 |
Token | S |
Token ID | 50 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
Carbuncle | +0.597 |
hemy | +0.564 |
ndra | +0.549 |
dh | +0.526 |
ongs | +0.524 |
Neg logit contributions | |
osate | -0.827 |
ongyang | -0.623 |
� | -0.623 |
withd | -0.611 |
insula | -0.609 |
Token | liquid |
Token ID | 8122 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
Carbuncle | +0.279 |
hemy | +0.261 |
ndra | +0.253 |
ongs | +0.241 |
dh | +0.238 |
Neg logit contributions | |
osate | -0.461 |
� | -0.356 |
ongyang | -0.356 |
insula | -0.352 |
withd | -0.349 |
Token | amber |
Token ID | 36505 |
Feature activation | +4.05e-01 |
Pos logit contributions | |
osate | +0.351 |
� | +0.265 |
ongyang | +0.265 |
insula | +0.262 |
withd | +0.260 |
Neg logit contributions | |
Carbuncle | -0.258 |
hemy | -0.243 |
ndra | -0.236 |
ongs | -0.226 |
bars | -0.224 |
Token | and |
Token ID | 290 |
Feature activation | -9.37e-02 |
Pos logit contributions | |
osate | +0.429 |
ongyang | +0.329 |
� | +0.329 |
insula | +0.325 |
withd | +0.323 |
Neg logit contributions | |
Carbuncle | -0.282 |
hemy | -0.264 |
ndra | -0.257 |
ongs | -0.245 |
bars | -0.243 |
Token | f |
Token ID | 277 |
Feature activation | -3.52e-02 |
Pos logit contributions | |
Carbuncle | +0.072 |
hemy | +0.067 |
ndra | +0.066 |
ongs | +0.063 |
bars | +0.063 |
Neg logit contributions | |
osate | -0.093 |
� | -0.070 |
ongyang | -0.070 |
insula | -0.069 |
withd | -0.068 |
Token | icus |
Token ID | 24552 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
Carbuncle | +0.039 |
hemy | +0.037 |
ndra | +0.037 |
ongs | +0.036 |
dh | +0.036 |
Neg logit contributions | |
osate | -0.023 |
� | -0.014 |
ongyang | -0.014 |
withd | -0.014 |
Fug | -0.014 |
Token | trees |
Token ID | 7150 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
osate | +0.144 |
ongyang | +0.113 |
� | +0.112 |
insula | +0.111 |
withd | +0.111 |
Neg logit contributions | |
Carbuncle | -0.078 |
hemy | -0.072 |
ndra | -0.070 |
ongs | -0.066 |
bars | -0.066 |
Token | . |
Token ID | 13 |
Feature activation | -3.71e-01 |
Pos logit contributions | |
Carbuncle | +1.467 |
hemy | +1.380 |
ndra | +1.351 |
ongs | +1.300 |
bars | +1.290 |
Neg logit contributions | |
osate | -2.157 |
ongyang | -1.637 |
� | -1.624 |
insula | -1.609 |
Fug | -1.593 |
Token | They |
Token ID | 1119 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
Carbuncle | +0.268 |
hemy | +0.253 |
ndra | +0.246 |
ongs | +0.234 |
dh | +0.232 |
Neg logit contributions | |
osate | -0.383 |
� | -0.291 |
ongyang | -0.290 |
insula | -0.287 |
withd | -0.285 |
Token | are |
Token ID | 389 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
Carbuncle | +0.246 |
hemy | +0.230 |
ndra | +0.227 |
ongs | +0.216 |
bars | +0.216 |
Neg logit contributions | |
osate | -0.312 |
ongyang | -0.233 |
� | -0.232 |
insula | -0.230 |
withd | -0.227 |
Token | now |
Token ID | 783 |
Feature activation | -1.74e-01 |
Pos logit contributions | |
Carbuncle | +0.253 |
hemy | +0.238 |
ndra | +0.232 |
ongs | +0.222 |
bars | +0.221 |
Neg logit contributions | |
osate | -0.327 |
ongyang | -0.245 |
� | -0.244 |
insula | -0.241 |
withd | -0.239 |
Token | the |
Token ID | 262 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
Carbuncle | +0.131 |
hemy | +0.123 |
ndra | +0.120 |
ongs | +0.114 |
bars | +0.114 |
Neg logit contributions | |
osate | -0.175 |
ongyang | -0.132 |
� | -0.132 |
insula | -0.130 |
withd | -0.129 |
Token | thr |
Token ID | 5636 |
Feature activation | -8.73e-01 |
Pos logit contributions | |
Carbuncle | +0.137 |
hemy | +0.128 |
ndra | +0.125 |
ongs | +0.120 |
bars | +0.119 |
Neg logit contributions | |
osate | -0.191 |
� | -0.144 |
ongyang | -0.144 |
insula | -0.143 |
withd | -0.141 |
Token | ice |
Token ID | 501 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
Carbuncle | +0.655 |
hemy | +0.619 |
ndra | +0.602 |
ongs | +0.578 |
dh | +0.571 |
Neg logit contributions | |
osate | -0.878 |
� | -0.663 |
ongyang | -0.659 |
insula | -0.651 |
withd | -0.647 |
Token | - |
Token ID | 12 |
Feature activation | -7.35e-02 |
Pos logit contributions | |
Carbuncle | +0.377 |
hemy | +0.353 |
ndra | +0.346 |
ongs | +0.330 |
dh | +0.328 |
Neg logit contributions | |
osate | -0.515 |
ongyang | -0.388 |
� | -0.388 |
insula | -0.383 |
withd | -0.380 |
Token | cooked |
Token ID | 46591 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
Carbuncle | +0.042 |
hemy | +0.039 |
ndra | +0.037 |
dh | +0.035 |
ongs | +0.035 |
Neg logit contributions | |
osate | -0.087 |
ongyang | -0.069 |
� | -0.069 |
insula | -0.068 |
withd | -0.068 |
Token | bacon |
Token ID | 21385 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
Carbuncle | +0.081 |
hemy | +0.076 |
ndra | +0.074 |
ongs | +0.071 |
bars | +0.070 |
Neg logit contributions | |
osate | -0.117 |
� | -0.089 |
ongyang | -0.089 |
insula | -0.088 |
withd | -0.087 |
Token | tossed |
Token ID | 22591 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
osate | +0.346 |
� | +0.264 |
ongyang | +0.264 |
insula | +0.261 |
withd | +0.259 |
Neg logit contributions | |
Carbuncle | -0.229 |
hemy | -0.215 |
ndra | -0.208 |
ongs | -0.199 |
bars | -0.197 |
Token | with |
Token ID | 351 |
Feature activation | -6.01e-01 |
Pos logit contributions | |
Carbuncle | +1.561 |
hemy | +1.460 |
ndra | +1.426 |
bars | +1.386 |
ongs | +1.384 |
Neg logit contributions | |
osate | -2.019 |
� | -1.515 |
ongyang | -1.506 |
insula | -1.488 |
Fug | -1.459 |
Token | d |
Token ID | 288 |
Feature activation | -7.48e-01 |
Pos logit contributions | |
Carbuncle | +0.444 |
hemy | +0.415 |
ndra | +0.404 |
ongs | +0.387 |
bars | +0.386 |
Neg logit contributions | |
osate | -0.613 |
� | -0.463 |
ongyang | -0.462 |
insula | -0.458 |
withd | -0.452 |
Token | uk |
Token ID | 2724 |
Feature activation | -9.02e-02 |
Pos logit contributions | |
Carbuncle | +0.629 |
hemy | +0.602 |
ndra | +0.584 |
ongs | +0.567 |
dh | +0.561 |
Neg logit contributions | |
osate | -0.682 |
� | -0.498 |
ongyang | -0.491 |
insula | -0.488 |
Fug | -0.484 |
Token | ( |
Token ID | 357 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
Carbuncle | +0.053 |
hemy | +0.049 |
ndra | +0.047 |
ongs | +0.044 |
dh | +0.044 |
Neg logit contributions | |
osate | -0.105 |
ongyang | -0.083 |
� | -0.083 |
insula | -0.082 |
Fug | -0.082 |
Token | K |
Token ID | 42 |
Feature activation | -2.54e-01 |
Pos logit contributions | |
Carbuncle | +0.311 |
hemy | +0.293 |
ndra | +0.285 |
dh | +0.274 |
ongs | +0.271 |
Neg logit contributions | |
osate | -0.457 |
ongyang | -0.346 |
� | -0.345 |
withd | -0.341 |
insula | -0.341 |
Token | no |
Token ID | 645 |
Feature activation | +1.87e-03 |
Pos logit contributions | |
Carbuncle | +0.524 |
hemy | +0.493 |
ndra | +0.479 |
bars | +0.457 |
ongs | +0.456 |
Neg logit contributions | |
osate | -0.787 |
ongyang | -0.600 |
� | -0.598 |
insula | -0.593 |
withd | -0.585 |
Token | one |
Token ID | 530 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
osate | +0.002 |
� | +0.002 |
ongyang | +0.002 |
insula | +0.002 |
withd | +0.002 |
Neg logit contributions | |
Carbuncle | -0.001 |
hemy | -0.001 |
ndra | -0.001 |
ongs | -0.001 |
dh | -0.001 |
Token | who |
Token ID | 508 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
osate | +0.517 |
� | +0.382 |
ongyang | +0.382 |
insula | +0.378 |
withd | +0.373 |
Neg logit contributions | |
Carbuncle | -0.425 |
hemy | -0.402 |
ndra | -0.393 |
ongs | -0.376 |
bars | -0.374 |
Token | needs |
Token ID | 2476 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
osate | +0.111 |
ongyang | +0.082 |
� | +0.082 |
insula | +0.082 |
withd | +0.080 |
Neg logit contributions | |
Carbuncle | -0.089 |
hemy | -0.084 |
ndra | -0.082 |
ongs | -0.079 |
bars | -0.078 |
Token | a |
Token ID | 257 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
osate | +0.050 |
� | +0.039 |
ongyang | +0.039 |
insula | +0.039 |
withd | +0.038 |
Neg logit contributions | |
Carbuncle | -0.027 |
hemy | -0.025 |
ndra | -0.025 |
ongs | -0.023 |
dh | -0.023 |
Token | bed |
Token ID | 3996 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
osate | +0.142 |
ongyang | +0.111 |
� | +0.110 |
insula | +0.109 |
withd | +0.108 |
Neg logit contributions | |
Carbuncle | -0.075 |
hemy | -0.070 |
ndra | -0.068 |
bars | -0.064 |
ongs | -0.064 |
Token | can |
Token ID | 460 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
osate | +1.161 |
ongyang | +0.863 |
� | +0.860 |
insula | +0.849 |
withd | +0.843 |
Neg logit contributions | |
Carbuncle | -0.938 |
hemy | -0.889 |
ndra | -0.871 |
ongs | -0.834 |
dh | -0.829 |
Token | be |
Token ID | 307 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
osate | +0.546 |
� | +0.392 |
ongyang | +0.391 |
insula | +0.385 |
withd | +0.380 |
Neg logit contributions | |
Carbuncle | -0.542 |
hemy | -0.515 |
ndra | -0.504 |
ongs | -0.485 |
dh | -0.482 |
Token | refused |
Token ID | 6520 |
Feature activation | +5.78e-02 |
Pos logit contributions | |
osate | +0.175 |
� | +0.131 |
ongyang | +0.131 |
insula | +0.130 |
withd | +0.128 |
Neg logit contributions | |
Carbuncle | -0.129 |
hemy | -0.122 |
ndra | -0.119 |
ongs | -0.113 |
dh | -0.112 |
Token | one |
Token ID | 530 |
Feature activation | +5.50e-02 |
Pos logit contributions | |
osate | +0.064 |
ongyang | +0.049 |
� | +0.049 |
insula | +0.049 |
withd | +0.048 |
Neg logit contributions | |
Carbuncle | -0.038 |
hemy | -0.035 |
ndra | -0.034 |
ongs | -0.032 |
bars | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
osate | +0.061 |
ongyang | +0.047 |
� | +0.047 |
insula | +0.046 |
withd | +0.046 |
Neg logit contributions | |
Carbuncle | -0.036 |
hemy | -0.033 |
ndra | -0.032 |
bars | -0.031 |
ongs | -0.031 |
Token | to |
Token ID | 284 |
Feature activation | -4.71e-03 |
Pos logit contributions | |
osate | +0.031 |
� | +0.023 |
ongyang | +0.023 |
insula | +0.023 |
withd | +0.023 |
Neg logit contributions | |
Carbuncle | -0.023 |
hemy | -0.021 |
ndra | -0.021 |
ongs | -0.020 |
bars | -0.020 |
Token | offer |
Token ID | 2897 |
Feature activation | -4.26e-02 |
Pos logit contributions | |
Carbuncle | +0.004 |
hemy | +0.004 |
ndra | +0.004 |
ongs | +0.003 |
dh | +0.003 |
Neg logit contributions | |
osate | -0.004 |
� | -0.003 |
ongyang | -0.003 |
satisf | -0.003 |
withd | -0.003 |
Token | amendments |
Token ID | 17835 |
Feature activation | +2.07e-02 |
Pos logit contributions | |
Carbuncle | +0.032 |
hemy | +0.030 |
ndra | +0.029 |
ongs | +0.028 |
dh | +0.028 |
Neg logit contributions | |
osate | -0.043 |
� | -0.032 |
ongyang | -0.032 |
insula | -0.032 |
withd | -0.032 |
Token | when |
Token ID | 618 |
Feature activation | +6.00e-03 |
Pos logit contributions | |
osate | +0.021 |
� | +0.016 |
ongyang | +0.016 |
insula | +0.016 |
withd | +0.016 |
Neg logit contributions | |
Carbuncle | -0.015 |
hemy | -0.014 |
ndra | -0.014 |
ongs | -0.013 |
bars | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
osate | +0.006 |
ongyang | +0.004 |
� | +0.004 |
insula | +0.004 |
withd | +0.004 |
Neg logit contributions | |
Carbuncle | -0.005 |
hemy | -0.004 |
ndra | -0.004 |
bars | -0.004 |
ongs | -0.004 |
Token | bill |
Token ID | 2855 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
osate | +0.265 |
� | +0.203 |
ongyang | +0.202 |
insula | +0.200 |
withd | +0.199 |
Neg logit contributions | |
Carbuncle | -0.179 |
hemy | -0.168 |
ndra | -0.163 |
ongs | -0.155 |
dh | -0.154 |
Token | reached |
Token ID | 4251 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
osate | +1.090 |
� | +0.810 |
ongyang | +0.808 |
insula | +0.796 |
withd | +0.791 |
Neg logit contributions | |
Carbuncle | -0.902 |
hemy | -0.854 |
ndra | -0.832 |
ongs | -0.797 |
dh | -0.791 |
Token | the |
Token ID | 262 |
Feature activation | +7.18e-02 |
Pos logit contributions | |
osate | +0.333 |
� | +0.249 |
ongyang | +0.248 |
insula | +0.245 |
satisf | +0.244 |
Neg logit contributions | |
Carbuncle | -0.269 |
hemy | -0.256 |
ndra | -0.250 |
ongs | -0.239 |
dh | -0.236 |
Token | Senate |
Token ID | 3845 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
osate | +0.074 |
� | +0.056 |
ongyang | +0.056 |
insula | +0.055 |
withd | +0.055 |
Neg logit contributions | |
Carbuncle | -0.052 |
hemy | -0.049 |
ndra | -0.048 |
ongs | -0.045 |
dh | -0.045 |
Token | floor |
Token ID | 4314 |
Feature activation | -8.34e-02 |
Pos logit contributions | |
osate | +0.574 |
� | +0.437 |
ongyang | +0.435 |
insula | +0.431 |
withd | +0.427 |
Neg logit contributions | |
Carbuncle | -0.403 |
hemy | -0.380 |
ndra | -0.369 |
ongs | -0.352 |
dh | -0.349 |
Token | . |
Token ID | 13 |
Feature activation | +9.83e-02 |
Pos logit contributions | |
Carbuncle | +0.055 |
hemy | +0.052 |
ndra | +0.050 |
ongs | +0.048 |
bars | +0.047 |
Neg logit contributions | |
osate | -0.091 |
� | -0.070 |
ongyang | -0.070 |
insula | -0.069 |
withd | -0.069 |
Token | < |
Token ID | 27 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
osate | +1.110 |
ongyang | +0.841 |
� | +0.840 |
insula | +0.829 |
withd | +0.822 |
Neg logit contributions | |
Carbuncle | -0.765 |
hemy | -0.725 |
ndra | -0.704 |
ongs | -0.675 |
dh | -0.673 |
Token | 570 |
Token ID | 39254 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
osate | +1.467 |
ongyang | +1.125 |
� | +1.120 |
insula | +1.109 |
withd | +1.101 |
Neg logit contributions | |
Carbuncle | -0.912 |
hemy | -0.863 |
ndra | -0.839 |
dh | -0.799 |
ongs | -0.795 |
Token | : |
Token ID | 25 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
osate | +1.096 |
ongyang | +0.809 |
� | +0.805 |
insula | +0.796 |
withd | +0.785 |
Neg logit contributions | |
Carbuncle | -0.920 |
hemy | -0.877 |
ndra | -0.857 |
dh | -0.823 |
ongs | -0.819 |
Token | set |
Token ID | 900 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
osate | +1.171 |
ongyang | +0.887 |
� | +0.885 |
insula | +0.872 |
withd | +0.864 |
Neg logit contributions | |
Carbuncle | -0.814 |
hemy | -0.768 |
ndra | -0.746 |
ongs | -0.711 |
dh | -0.709 |
Token | sw |
Token ID | 1509 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
osate | +0.264 |
ongyang | +0.201 |
� | +0.201 |
insula | +0.198 |
withd | +0.196 |
Neg logit contributions | |
Carbuncle | -0.178 |
hemy | -0.167 |
ndra | -0.162 |
bars | -0.155 |
ongs | -0.155 |
Token | = |
Token ID | 28 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
osate | +1.220 |
� | +0.939 |
ongyang | +0.938 |
insula | +0.926 |
withd | +0.917 |
Neg logit contributions | |
Carbuncle | -0.770 |
hemy | -0.724 |
ndra | -0.702 |
ongs | -0.668 |
dh | -0.663 |
Token | 4 |
Token ID | 19 |
Feature activation | +9.12e-03 |
Pos logit contributions | |
osate | +1.437 |
� | +1.107 |
ongyang | +1.106 |
insula | +1.092 |
withd | +1.086 |
Neg logit contributions | |
Carbuncle | -0.889 |
hemy | -0.833 |
ndra | -0.808 |
ongs | -0.768 |
dh | -0.763 |
Token | : |
Token ID | 25 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
osate | +0.009 |
ongyang | +0.007 |
� | +0.007 |
insula | +0.007 |
withd | +0.006 |
Neg logit contributions | |
Carbuncle | -0.007 |
hemy | -0.007 |
ndra | -0.007 |
bars | -0.006 |
dh | -0.006 |
Token | */ |
Token ID | 9466 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
osate | +1.146 |
� | +0.866 |
ongyang | +0.865 |
insula | +0.851 |
withd | +0.844 |
Neg logit contributions | |
Carbuncle | -0.822 |
hemy | -0.777 |
ndra | -0.756 |
ongs | -0.722 |
bars | -0.718 |
Token | There |
Token ID | 1318 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
osate | +0.601 |
� | +0.467 |
ongyang | +0.467 |
insula | +0.461 |
withd | +0.457 |
Neg logit contributions | |
Carbuncle | -0.342 |
hemy | -0.318 |
ndra | -0.309 |
ongs | -0.292 |
bars | -0.290 |
Token | can |
Token ID | 460 |
Feature activation | +8.50e-01 |
Pos logit contributions | |
osate | +0.489 |
� | +0.371 |
ongyang | +0.371 |
insula | +0.367 |
withd | +0.364 |
Neg logit contributions | |
Carbuncle | -0.346 |
hemy | -0.327 |
ndra | -0.318 |
ongs | -0.304 |
bars | -0.302 |
Token | politically |
Token ID | 11889 |
Feature activation | +3.63e-03 |
Pos logit contributions | |
osate | +0.033 |
ongyang | +0.025 |
� | +0.025 |
insula | +0.024 |
withd | +0.024 |
Neg logit contributions | |
Carbuncle | -0.022 |
hemy | -0.021 |
ndra | -0.020 |
bars | -0.020 |
ongs | -0.019 |
Token | correct |
Token ID | 3376 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
osate | +0.004 |
ongyang | +0.003 |
� | +0.003 |
insula | +0.003 |
withd | +0.003 |
Neg logit contributions | |
Carbuncle | -0.003 |
hemy | -0.003 |
ndra | -0.003 |
bars | -0.003 |
ongs | -0.003 |
Token | number |
Token ID | 1271 |
Feature activation | +7.09e-01 |
Pos logit contributions | |
Carbuncle | +0.117 |
hemy | +0.110 |
ndra | +0.107 |
bars | +0.103 |
ongs | +0.103 |
Neg logit contributions | |
osate | -0.163 |
ongyang | -0.124 |
� | -0.123 |
insula | -0.122 |
withd | -0.121 |
Token | - |
Token ID | 12 |
Feature activation | +4.64e-01 |
Pos logit contributions | |
osate | +0.738 |
ongyang | +0.563 |
� | +0.559 |
insula | +0.557 |
withd | +0.549 |
Neg logit contributions | |
Carbuncle | -0.507 |
hemy | -0.479 |
ndra | -0.461 |
bars | -0.444 |
ongs | -0.443 |
Token | cr |
Token ID | 6098 |
Feature activation | +8.95e-01 |
Pos logit contributions | |
osate | +0.461 |
ongyang | +0.345 |
� | +0.344 |
insula | +0.340 |
withd | +0.338 |
Neg logit contributions | |
Carbuncle | -0.355 |
hemy | -0.338 |
ndra | -0.327 |
dh | -0.314 |
ongs | -0.313 |
Token | unch |
Token ID | 3316 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
osate | +0.817 |
� | +0.596 |
ongyang | +0.594 |
insula | +0.585 |
withd | +0.580 |
Neg logit contributions | |
Carbuncle | -0.754 |
hemy | -0.716 |
ndra | -0.698 |
ongs | -0.672 |
dh | -0.667 |
Token | ing |
Token ID | 278 |
Feature activation | -3.34e-02 |
Pos logit contributions | |
osate | +1.250 |
� | +0.952 |
ongyang | +0.952 |
insula | +0.942 |
withd | +0.936 |
Neg logit contributions | |
Carbuncle | -0.866 |
hemy | -0.824 |
ndra | -0.787 |
ongs | -0.761 |
bars | -0.756 |
Token | . |
Token ID | 13 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
Carbuncle | +0.024 |
hemy | +0.022 |
ndra | +0.021 |
ongs | +0.021 |
bars | +0.021 |
Neg logit contributions | |
osate | -0.035 |
ongyang | -0.027 |
� | -0.027 |
insula | -0.026 |
withd | -0.026 |
Token |
|
Token ID | 198 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
osate | +0.121 |
ongyang | +0.091 |
� | +0.091 |
insula | +0.089 |
withd | +0.089 |
Neg logit contributions | |
Carbuncle | -0.096 |
hemy | -0.090 |
ndra | -0.088 |
ongs | -0.084 |
dh | -0.084 |
Token |
|
Token ID | 198 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
osate | +0.133 |
� | +0.096 |
ongyang | +0.094 |
Fug | +0.093 |
satisf | +0.093 |
Neg logit contributions | |
Carbuncle | -0.139 |
hemy | -0.133 |
ndra | -0.128 |
ongs | -0.124 |
bars | -0.123 |
Token | Out |
Token ID | 7975 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
osate | +0.111 |
ongyang | +0.082 |
� | +0.082 |
withd | +0.081 |
insula | +0.081 |
Neg logit contributions | |
Carbuncle | -0.088 |
hemy | -0.084 |
ndra | -0.082 |
dh | -0.078 |
ongs | -0.078 |
Token | -, |
Token ID | 20995 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
osate | +0.608 |
ongyang | +0.436 |
� | +0.435 |
insula | +0.429 |
withd | +0.424 |
Neg logit contributions | |
Carbuncle | -0.601 |
hemy | -0.571 |
ndra | -0.558 |
ongs | -0.539 |
bars | -0.535 |
Token | five |
Token ID | 1936 |
Feature activation | +6.44e-01 |
Pos logit contributions | |
osate | +1.191 |
� | +0.878 |
ongyang | +0.875 |
insula | +0.863 |
withd | +0.856 |
Neg logit contributions | |
Carbuncle | -1.032 |
hemy | -0.978 |
ndra | -0.953 |
ongs | -0.915 |
dh | -0.908 |
Token | -, |
Token ID | 20995 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
osate | +0.550 |
ongyang | +0.389 |
� | +0.388 |
insula | +0.382 |
withd | +0.378 |
Neg logit contributions | |
Carbuncle | -0.582 |
hemy | -0.555 |
ndra | -0.542 |
ongs | -0.524 |
bars | -0.520 |
Token | and |
Token ID | 290 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
osate | +1.163 |
� | +0.851 |
ongyang | +0.849 |
insula | +0.837 |
withd | +0.830 |
Neg logit contributions | |
Carbuncle | -1.063 |
hemy | -1.010 |
ndra | -0.985 |
ongs | -0.944 |
dh | -0.940 |
Token | ten |
Token ID | 3478 |
Feature activation | +7.07e-01 |
Pos logit contributions | |
osate | +1.119 |
� | +0.821 |
ongyang | +0.819 |
insula | +0.807 |
withd | +0.800 |
Neg logit contributions | |
Carbuncle | -1.002 |
hemy | -0.950 |
ndra | -0.927 |
ongs | -0.890 |
dh | -0.884 |
Token | - |
Token ID | 12 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
osate | +0.724 |
� | +0.550 |
ongyang | +0.549 |
insula | +0.541 |
withd | +0.537 |
Neg logit contributions | |
Carbuncle | -0.516 |
hemy | -0.486 |
ndra | -0.472 |
ongs | -0.451 |
dh | -0.447 |
Token | cent |
Token ID | 1087 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
osate | +1.198 |
� | +0.877 |
ongyang | +0.870 |
insula | +0.858 |
withd | +0.853 |
Neg logit contributions | |
Carbuncle | -1.129 |
hemy | -1.071 |
ndra | -1.044 |
ongs | -1.000 |
dh | -0.996 |
Token | pieces |
Token ID | 5207 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
osate | +1.439 |
� | +1.169 |
ongyang | +1.165 |
insula | +1.153 |
withd | +1.148 |
Neg logit contributions | |
Carbuncle | -0.496 |
hemy | -0.452 |
ndra | -0.430 |
ongs | -0.392 |
dh | -0.390 |
Token | of |
Token ID | 286 |
Feature activation | +8.20e-01 |
Pos logit contributions | |
osate | +0.027 |
ongyang | +0.021 |
� | +0.021 |
insula | +0.020 |
withd | +0.020 |
Neg logit contributions | |
Carbuncle | -0.019 |
hemy | -0.018 |
ndra | -0.017 |
ongs | -0.016 |
bars | -0.016 |
Token | an |
Token ID | 281 |
Feature activation | +7.63e-01 |
Pos logit contributions | |
osate | +0.832 |
� | +0.626 |
ongyang | +0.625 |
insula | +0.619 |
withd | +0.611 |
Neg logit contributions | |
Carbuncle | -0.612 |
hemy | -0.574 |
ndra | -0.559 |
ongs | -0.536 |
bars | -0.535 |
Token | alloy |
Token ID | 36186 |
Feature activation | +7.88e-01 |
Pos logit contributions | |
osate | +0.750 |
� | +0.561 |
ongyang | +0.560 |
insula | +0.552 |
withd | +0.548 |
Neg logit contributions | |
Carbuncle | -0.590 |
hemy | -0.557 |
ndra | -0.542 |
ongs | -0.520 |
dh | -0.515 |
Token | feet |
Token ID | 3625 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
Carbuncle | +0.181 |
hemy | +0.169 |
ndra | +0.165 |
ongs | +0.157 |
bars | +0.155 |
Neg logit contributions | |
osate | -0.299 |
� | -0.230 |
ongyang | -0.230 |
insula | -0.228 |
withd | -0.227 |
Token | : |
Token ID | 25 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
Carbuncle | +0.338 |
hemy | +0.319 |
ndra | +0.308 |
ongs | +0.297 |
bars | +0.297 |
Neg logit contributions | |
osate | -0.508 |
ongyang | -0.387 |
� | -0.383 |
insula | -0.381 |
withd | -0.375 |
Token | according |
Token ID | 1864 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
osate | +0.425 |
� | +0.321 |
ongyang | +0.319 |
insula | +0.316 |
withd | +0.313 |
Neg logit contributions | |
Carbuncle | -0.315 |
hemy | -0.297 |
ndra | -0.289 |
ongs | -0.276 |
bars | -0.274 |
Token | to |
Token ID | 284 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
osate | +0.271 |
� | +0.205 |
ongyang | +0.203 |
Fug | +0.201 |
satisf | +0.200 |
Neg logit contributions | |
Carbuncle | -0.220 |
hemy | -0.208 |
ndra | -0.200 |
ongs | -0.193 |
dh | -0.190 |
Token | figures |
Token ID | 5538 |
Feature activation | +4.55e-01 |
Pos logit contributions | |
Carbuncle | +0.087 |
hemy | +0.082 |
ndra | +0.079 |
ongs | +0.076 |
bars | +0.075 |
Neg logit contributions | |
osate | -0.131 |
� | -0.100 |
ongyang | -0.100 |
insula | -0.099 |
withd | -0.098 |
Token | released |
Token ID | 2716 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
osate | +0.451 |
� | +0.338 |
ongyang | +0.337 |
insula | +0.333 |
withd | +0.330 |
Neg logit contributions | |
Carbuncle | -0.349 |
hemy | -0.329 |
ndra | -0.321 |
ongs | -0.307 |
dh | -0.305 |
Token | in |
Token ID | 287 |
Feature activation | -2.61e-02 |
Pos logit contributions | |
osate | +0.341 |
� | +0.255 |
ongyang | +0.254 |
insula | +0.252 |
withd | +0.250 |
Neg logit contributions | |
Carbuncle | -0.260 |
hemy | -0.245 |
ndra | -0.239 |
ongs | -0.228 |
bars | -0.227 |
Token | 2014 |
Token ID | 1946 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
Carbuncle | +0.017 |
hemy | +0.016 |
ndra | +0.015 |
ongs | +0.014 |
dh | +0.014 |
Neg logit contributions | |
osate | -0.029 |
� | -0.022 |
ongyang | -0.022 |
insula | -0.022 |
Fug | -0.022 |
Token | by |
Token ID | 416 |
Feature activation | -7.26e-02 |
Pos logit contributions | |
osate | +0.185 |
� | +0.139 |
ongyang | +0.138 |
insula | +0.137 |
withd | +0.136 |
Neg logit contributions | |
Carbuncle | -0.141 |
hemy | -0.134 |
ndra | -0.130 |
ongs | -0.125 |
bars | -0.125 |
Token | the |
Token ID | 262 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
Carbuncle | +0.054 |
hemy | +0.051 |
ndra | +0.050 |
ongs | +0.048 |
bars | +0.048 |
Neg logit contributions | |
osate | -0.073 |
� | -0.055 |
ongyang | -0.054 |
insula | -0.054 |
withd | -0.054 |
Token | US |
Token ID | 1294 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
Carbuncle | +0.024 |
hemy | +0.023 |
ndra | +0.022 |
ongs | +0.021 |
bars | +0.021 |
Neg logit contributions | |
osate | -0.032 |
� | -0.024 |
ongyang | -0.024 |
insula | -0.023 |
withd | -0.023 |
Token | is |
Token ID | 318 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
Carbuncle | +0.083 |
hemy | +0.078 |
ndra | +0.076 |
ongs | +0.073 |
bars | +0.072 |
Neg logit contributions | |
osate | -0.113 |
� | -0.085 |
ongyang | -0.085 |
insula | -0.084 |
withd | -0.083 |
Token | a |
Token ID | 257 |
Feature activation | -3.48e-01 |
Pos logit contributions | |
Carbuncle | +0.307 |
hemy | +0.288 |
ndra | +0.281 |
bars | +0.268 |
ongs | +0.268 |
Neg logit contributions | |
osate | -0.402 |
� | -0.300 |
ongyang | -0.300 |
insula | -0.297 |
withd | -0.293 |
Token | firm |
Token ID | 4081 |
Feature activation | +7.70e-01 |
Pos logit contributions | |
Carbuncle | +0.261 |
hemy | +0.245 |
ndra | +0.238 |
ongs | +0.227 |
dh | +0.227 |
Neg logit contributions | |
osate | -0.352 |
� | -0.264 |
ongyang | -0.264 |
insula | -0.261 |
withd | -0.258 |
Token | and |
Token ID | 290 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
osate | +0.754 |
� | +0.560 |
ongyang | +0.558 |
insula | +0.553 |
withd | +0.548 |
Neg logit contributions | |
Carbuncle | -0.601 |
hemy | -0.567 |
ndra | -0.554 |
ongs | -0.529 |
bars | -0.528 |
Token | explicit |
Token ID | 7952 |
Feature activation | -4.16e-02 |
Pos logit contributions | |
osate | +0.249 |
ongyang | +0.186 |
� | +0.185 |
insula | +0.185 |
withd | +0.181 |
Neg logit contributions | |
Carbuncle | -0.185 |
hemy | -0.173 |
ndra | -0.169 |
bars | -0.162 |
dh | -0.161 |
Token | reminder |
Token ID | 15438 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
Carbuncle | +0.032 |
hemy | +0.030 |
ndra | +0.029 |
bars | +0.028 |
ongs | +0.028 |
Neg logit contributions | |
osate | -0.041 |
ongyang | -0.031 |
� | -0.031 |
insula | -0.030 |
withd | -0.030 |
Token | of |
Token ID | 286 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
osate | +0.240 |
� | +0.185 |
insula | +0.183 |
ongyang | +0.183 |
withd | +0.181 |
Neg logit contributions | |
Carbuncle | -0.156 |
hemy | -0.147 |
ndra | -0.144 |
bars | -0.138 |
ongs | -0.137 |
Token | the |
Token ID | 262 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
Carbuncle | +0.154 |
hemy | +0.145 |
ndra | +0.141 |
ongs | +0.135 |
bars | +0.135 |
Neg logit contributions | |
osate | -0.203 |
� | -0.153 |
ongyang | -0.153 |
insula | -0.151 |
withd | -0.149 |
Token | ideal |
Token ID | 7306 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
Carbuncle | +0.153 |
hemy | +0.143 |
ndra | +0.139 |
ongs | +0.133 |
bars | +0.133 |
Neg logit contributions | |
osate | -0.216 |
� | -0.164 |
ongyang | -0.164 |
insula | -0.162 |
withd | -0.160 |
Token | of |
Token ID | 286 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
Carbuncle | +0.430 |
hemy | +0.404 |
ndra | +0.394 |
bars | +0.379 |
ongs | +0.376 |
Neg logit contributions | |
osate | -0.618 |
ongyang | -0.471 |
� | -0.470 |
insula | -0.463 |
withd | -0.460 |
Token | justice |
Token ID | 5316 |
Feature activation | +8.81e-02 |
Pos logit contributions | |
Carbuncle | +0.188 |
hemy | +0.176 |
ndra | +0.171 |
bars | +0.164 |
ongs | +0.163 |
Neg logit contributions | |
osate | -0.278 |
� | -0.212 |
ongyang | -0.212 |
insula | -0.209 |
withd | -0.207 |
Token | at |
Token ID | 379 |
Feature activation | +8.97e-02 |
Pos logit contributions | |
osate | +0.318 |
� | +0.239 |
ongyang | +0.239 |
insula | +0.235 |
Fug | +0.232 |
Neg logit contributions | |
Carbuncle | -0.235 |
hemy | -0.220 |
ndra | -0.213 |
ongs | -0.206 |
bars | -0.205 |
Token | school |
Token ID | 1524 |
Feature activation | +6.43e-01 |
Pos logit contributions | |
osate | +0.088 |
� | +0.066 |
ongyang | +0.066 |
insula | +0.065 |
withd | +0.064 |
Neg logit contributions | |
Carbuncle | -0.070 |
hemy | -0.065 |
ndra | -0.064 |
ongs | -0.061 |
bars | -0.061 |
Token | in |
Token ID | 287 |
Feature activation | -5.37e-02 |
Pos logit contributions | |
osate | +0.689 |
ongyang | +0.528 |
� | +0.527 |
insula | +0.521 |
withd | +0.516 |
Neg logit contributions | |
Carbuncle | -0.442 |
hemy | -0.413 |
ndra | -0.403 |
ongs | -0.384 |
dh | -0.381 |
Token | the |
Token ID | 262 |
Feature activation | +8.17e-02 |
Pos logit contributions | |
Carbuncle | +0.039 |
hemy | +0.036 |
ndra | +0.035 |
ongs | +0.034 |
dh | +0.033 |
Neg logit contributions | |
osate | -0.056 |
� | -0.042 |
ongyang | -0.042 |
insula | -0.042 |
withd | -0.041 |
Token | mainly |
Token ID | 8384 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
osate | +0.084 |
� | +0.064 |
ongyang | +0.064 |
insula | +0.063 |
withd | +0.063 |
Neg logit contributions | |
Carbuncle | -0.059 |
hemy | -0.056 |
ndra | -0.054 |
ongs | -0.052 |
dh | -0.051 |
Token | Catholic |
Token ID | 7835 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
osate | +0.124 |
� | +0.093 |
ongyang | +0.093 |
insula | +0.092 |
withd | +0.091 |
Neg logit contributions | |
Carbuncle | -0.093 |
hemy | -0.087 |
ndra | -0.085 |
ongs | -0.081 |
bars | -0.081 |
Token | but |
Token ID | 475 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
osate | +0.312 |
� | +0.239 |
ongyang | +0.238 |
insula | +0.235 |
withd | +0.233 |
Neg logit contributions | |
Carbuncle | -0.211 |
hemy | -0.198 |
ndra | -0.192 |
ongs | -0.184 |
bars | -0.184 |
Token | largely |
Token ID | 5688 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
Carbuncle | +0.336 |
hemy | +0.319 |
ndra | +0.309 |
ongs | +0.299 |
dh | +0.297 |
Neg logit contributions | |
osate | -0.393 |
� | -0.289 |
ongyang | -0.289 |
insula | -0.284 |
withd | -0.279 |
Token | tolerant |
Token ID | 33435 |
Feature activation | -4.78e-01 |
Pos logit contributions | |
osate | +0.338 |
ongyang | +0.251 |
� | +0.251 |
insula | +0.247 |
withd | +0.243 |
Neg logit contributions | |
Carbuncle | -0.276 |
hemy | -0.261 |
ndra | -0.253 |
ongs | -0.243 |
bars | -0.242 |
Token | Philippines |
Token ID | 13316 |
Feature activation | -8.45e-01 |
Pos logit contributions | |
Carbuncle | +0.344 |
hemy | +0.322 |
ndra | +0.313 |
ongs | +0.299 |
bars | +0.297 |
Neg logit contributions | |
osate | -0.497 |
� | -0.378 |
ongyang | -0.377 |
insula | -0.373 |
withd | -0.370 |
Token | . |
Token ID | 13 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
Carbuncle | +0.534 |
hemy | +0.495 |
ndra | +0.479 |
ongs | +0.460 |
dh | +0.456 |
Neg logit contributions | |
osate | -0.950 |
� | -0.739 |
ongyang | -0.738 |
insula | -0.728 |
Fug | -0.724 |
Token | each |
Token ID | 1123 |
Feature activation | -9.55e-02 |
Pos logit contributions | |
osate | +0.137 |
� | +0.106 |
ongyang | +0.105 |
insula | +0.103 |
withd | +0.103 |
Neg logit contributions | |
Carbuncle | -0.092 |
hemy | -0.087 |
ndra | -0.084 |
bars | -0.080 |
ongs | -0.080 |
Token | category |
Token ID | 6536 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
Carbuncle | +0.071 |
hemy | +0.066 |
ndra | +0.064 |
ongs | +0.062 |
bars | +0.062 |
Neg logit contributions | |
osate | -0.097 |
� | -0.073 |
ongyang | -0.073 |
insula | -0.072 |
withd | -0.072 |
Token | are |
Token ID | 389 |
Feature activation | -3.71e-02 |
Pos logit contributions | |
osate | +1.042 |
� | +0.770 |
ongyang | +0.767 |
insula | +0.756 |
withd | +0.749 |
Neg logit contributions | |
Carbuncle | -0.871 |
hemy | -0.821 |
ndra | -0.804 |
ongs | -0.776 |
bars | -0.769 |
Token | marked |
Token ID | 7498 |
Feature activation | -9.64e-02 |
Pos logit contributions | |
Carbuncle | +0.030 |
hemy | +0.029 |
ndra | +0.028 |
ongs | +0.027 |
bars | +0.027 |
Neg logit contributions | |
osate | -0.035 |
ongyang | -0.026 |
� | -0.026 |
insula | -0.025 |
withd | -0.025 |
Token | with |
Token ID | 351 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
Carbuncle | +0.076 |
hemy | +0.072 |
ndra | +0.070 |
ongs | +0.067 |
bars | +0.067 |
Neg logit contributions | |
osate | -0.094 |
� | -0.070 |
ongyang | -0.069 |
insula | -0.068 |
withd | -0.067 |
Token | a |
Token ID | 257 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
osate | +0.189 |
� | +0.146 |
ongyang | +0.146 |
insula | +0.144 |
withd | +0.143 |
Neg logit contributions | |
Carbuncle | -0.115 |
hemy | -0.107 |
ndra | -0.104 |
ongs | -0.099 |
dh | -0.098 |
Token | star |
Token ID | 3491 |
Feature activation | +8.48e-02 |
Pos logit contributions | |
Carbuncle | +0.019 |
hemy | +0.018 |
ndra | +0.017 |
ongs | +0.017 |
bars | +0.017 |
Neg logit contributions | |
osate | -0.029 |
� | -0.022 |
ongyang | -0.022 |
insula | -0.022 |
withd | -0.021 |
Token | ( |
Token ID | 357 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
osate | +0.087 |
ongyang | +0.066 |
� | +0.066 |
insula | +0.065 |
withd | +0.065 |
Neg logit contributions | |
Carbuncle | -0.062 |
hemy | -0.058 |
ndra | -0.056 |
ongs | -0.054 |
bars | -0.054 |
Token | ). |
Token ID | 6739 |
Feature activation | +6.93e-02 |
Pos logit contributions | |
Carbuncle | +0.098 |
hemy | +0.092 |
ndra | +0.090 |
ongs | +0.085 |
dh | +0.085 |
Neg logit contributions | |
osate | -0.145 |
ongyang | -0.110 |
� | -0.110 |
insula | -0.109 |
withd | -0.108 |
Token |
|
Token ID | 198 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
osate | +0.067 |
� | +0.050 |
ongyang | +0.050 |
insula | +0.049 |
withd | +0.049 |
Neg logit contributions | |
Carbuncle | -0.055 |
hemy | -0.052 |
ndra | -0.051 |
ongs | -0.049 |
dh | -0.048 |
Token |
|
Token ID | 198 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
osate | +0.169 |
� | +0.122 |
ongyang | +0.120 |
Fug | +0.119 |
satisf | +0.118 |
Neg logit contributions | |
Carbuncle | -0.175 |
hemy | -0.167 |
ndra | -0.162 |
ongs | -0.157 |
bars | -0.155 |
Token | than |
Token ID | 621 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
osate | +0.367 |
� | +0.277 |
ongyang | +0.276 |
insula | +0.272 |
withd | +0.270 |
Neg logit contributions | |
Carbuncle | -0.276 |
hemy | -0.261 |
ndra | -0.254 |
ongs | -0.243 |
dh | -0.241 |
Token | the |
Token ID | 262 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
Carbuncle | +0.102 |
hemy | +0.096 |
ndra | +0.093 |
ongs | +0.089 |
dh | +0.088 |
Neg logit contributions | |
osate | -0.141 |
� | -0.107 |
ongyang | -0.106 |
insula | -0.105 |
withd | -0.104 |
Token | last |
Token ID | 938 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
osate | +0.177 |
� | +0.135 |
ongyang | +0.134 |
insula | +0.133 |
withd | +0.132 |
Neg logit contributions | |
Carbuncle | -0.121 |
hemy | -0.114 |
ndra | -0.111 |
ongs | -0.106 |
dh | -0.105 |
Token | home |
Token ID | 1363 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
osate | +0.295 |
� | +0.224 |
ongyang | +0.223 |
insula | +0.220 |
Fug | +0.219 |
Neg logit contributions | |
Carbuncle | -0.212 |
hemy | -0.202 |
ndra | -0.194 |
ongs | -0.186 |
dh | -0.185 |
Token | of |
Token ID | 286 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
osate | +0.583 |
� | +0.443 |
ongyang | +0.441 |
insula | +0.437 |
withd | +0.433 |
Neg logit contributions | |
Carbuncle | -0.414 |
hemy | -0.390 |
ndra | -0.377 |
ongs | -0.361 |
dh | -0.358 |
Token | the |
Token ID | 262 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
osate | +0.150 |
� | +0.114 |
ongyang | +0.114 |
insula | +0.112 |
withd | +0.111 |
Neg logit contributions | |
Carbuncle | -0.108 |
hemy | -0.102 |
ndra | -0.099 |
ongs | -0.094 |
dh | -0.094 |
Token | Jersey |
Token ID | 8221 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
osate | +0.306 |
� | +0.232 |
ongyang | +0.232 |
insula | +0.229 |
withd | +0.227 |
Neg logit contributions | |
Carbuncle | -0.215 |
hemy | -0.202 |
ndra | -0.196 |
ongs | -0.187 |
dh | -0.186 |
Token | City |
Token ID | 2254 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
Carbuncle | +0.467 |
hemy | +0.428 |
ndra | +0.416 |
ongs | +0.391 |
bars | +0.388 |
Neg logit contributions | |
osate | -0.924 |
� | -0.733 |
ongyang | -0.730 |
withd | -0.721 |
insula | -0.720 |
Token | Museum |
Token ID | 9594 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
Carbuncle | +0.678 |
hemy | +0.628 |
ndra | +0.615 |
ongs | +0.585 |
bars | +0.581 |
Neg logit contributions | |
osate | -1.062 |
� | -0.818 |
ongyang | -0.816 |
insula | -0.805 |
withd | -0.800 |
Token | at |
Token ID | 379 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
Carbuncle | +0.135 |
hemy | +0.127 |
ndra | +0.124 |
ongs | +0.118 |
bars | +0.117 |
Neg logit contributions | |
osate | -0.195 |
� | -0.148 |
ongyang | -0.148 |
insula | -0.146 |
withd | -0.145 |
Token | Montgomery |
Token ID | 21532 |
Feature activation | +8.96e-01 |
Pos logit contributions | |
Carbuncle | +0.160 |
hemy | +0.150 |
ndra | +0.147 |
ongs | +0.141 |
bars | +0.140 |
Neg logit contributions | |
osate | -0.198 |
� | -0.148 |
ongyang | -0.147 |
insula | -0.145 |
withd | -0.144 |
Token | to |
Token ID | 284 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
Carbuncle | +0.002 |
hemy | +0.002 |
ndra | +0.002 |
bars | +0.002 |
ongs | +0.002 |
Neg logit contributions | |
osate | -0.003 |
� | -0.003 |
ongyang | -0.003 |
insula | -0.003 |
withd | -0.003 |
Token | media |
Token ID | 2056 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
osate | +0.144 |
� | +0.109 |
ongyang | +0.109 |
insula | +0.108 |
withd | +0.107 |
Neg logit contributions | |
Carbuncle | -0.101 |
hemy | -0.095 |
ndra | -0.092 |
ongs | -0.088 |
dh | -0.087 |
Token | . |
Token ID | 13 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
osate | +0.067 |
ongyang | +0.052 |
� | +0.052 |
insula | +0.051 |
withd | +0.051 |
Neg logit contributions | |
Carbuncle | -0.040 |
hemy | -0.038 |
ndra | -0.036 |
ongs | -0.035 |
bars | -0.035 |
Token | During |
Token ID | 5856 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
Carbuncle | +0.142 |
hemy | +0.134 |
ndra | +0.131 |
ongs | +0.125 |
dh | +0.125 |
Neg logit contributions | |
osate | -0.172 |
ongyang | -0.128 |
� | -0.128 |
insula | -0.126 |
withd | -0.125 |
Token | these |
Token ID | 777 |
Feature activation | -4.48e-02 |
Pos logit contributions | |
Carbuncle | +0.200 |
hemy | +0.189 |
ndra | +0.183 |
ongs | +0.175 |
bars | +0.174 |
Neg logit contributions | |
osate | -0.270 |
� | -0.203 |
ongyang | -0.203 |
insula | -0.200 |
withd | -0.199 |
Token | crimes |
Token ID | 6741 |
Feature activation | -3.45e-01 |
Pos logit contributions | |
Carbuncle | +0.022 |
hemy | +0.020 |
ndra | +0.019 |
ongs | +0.017 |
dh | +0.017 |
Neg logit contributions | |
osate | -0.057 |
� | -0.046 |
ongyang | -0.046 |
insula | -0.045 |
satisf | -0.045 |
Token | , |
Token ID | 11 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
Carbuncle | +0.260 |
hemy | +0.245 |
ndra | +0.240 |
bars | +0.229 |
ongs | +0.229 |
Neg logit contributions | |
osate | -0.346 |
ongyang | -0.260 |
� | -0.259 |
insula | -0.255 |
withd | -0.254 |
Token | suspects |
Token ID | 11826 |
Feature activation | -9.00e-01 |
Pos logit contributions | |
Carbuncle | +0.384 |
hemy | +0.360 |
ndra | +0.350 |
ongs | +0.333 |
dh | +0.330 |
Neg logit contributions | |
osate | -0.577 |
� | -0.441 |
ongyang | -0.440 |
insula | -0.435 |
withd | -0.431 |
Token | will |
Token ID | 481 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
Carbuncle | +0.706 |
hemy | +0.663 |
ndra | +0.648 |
ongs | +0.622 |
bars | +0.619 |
Neg logit contributions | |
osate | -0.881 |
� | -0.654 |
ongyang | -0.654 |
insula | -0.644 |
withd | -0.636 |
Token | " |
Token ID | 366 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
Carbuncle | +0.217 |
hemy | +0.206 |
ndra | +0.200 |
ongs | +0.192 |
dh | +0.191 |
Neg logit contributions | |
osate | -0.259 |
� | -0.192 |
ongyang | -0.191 |
insula | -0.189 |
withd | -0.187 |
Token | literally |
Token ID | 43819 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
Carbuncle | +0.470 |
hemy | +0.445 |
ndra | +0.434 |
dh | +0.418 |
ongs | +0.414 |
Neg logit contributions | |
osate | -0.614 |
ongyang | -0.459 |
� | -0.457 |
withd | -0.449 |
insula | -0.448 |
Token | to |
Token ID | 284 |
Feature activation | +9.93e-02 |
Pos logit contributions | |
osate | +0.237 |
ongyang | +0.179 |
� | +0.178 |
withd | +0.174 |
insula | +0.174 |
Neg logit contributions | |
Carbuncle | -0.166 |
hemy | -0.157 |
ndra | -0.154 |
ongs | -0.148 |
bars | -0.148 |
Token | analyze |
Token ID | 16602 |
Feature activation | +5.24e-02 |
Pos logit contributions | |
osate | +0.096 |
ongyang | +0.071 |
� | +0.071 |
insula | +0.070 |
withd | +0.069 |
Neg logit contributions | |
Carbuncle | -0.079 |
hemy | -0.075 |
ndra | -0.073 |
ongs | -0.070 |
bars | -0.070 |
Token | and |
Token ID | 290 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
osate | +0.053 |
� | +0.040 |
ongyang | +0.039 |
insula | +0.039 |
withd | +0.038 |
Neg logit contributions | |
Carbuncle | -0.040 |
hemy | -0.037 |
ndra | -0.036 |
bars | -0.035 |
ongs | -0.035 |
Token | synthes |
Token ID | 24983 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
Carbuncle | +0.021 |
hemy | +0.020 |
ndra | +0.019 |
ongs | +0.019 |
dh | +0.019 |
Neg logit contributions | |
osate | -0.024 |
� | -0.017 |
ongyang | -0.017 |
insula | -0.017 |
withd | -0.017 |
Token | ize |
Token ID | 1096 |
Feature activation | -4.56e-01 |
Pos logit contributions | |
osate | +0.909 |
� | +0.696 |
ongyang | +0.691 |
insula | +0.688 |
satisf | +0.686 |
Neg logit contributions | |
Carbuncle | -0.603 |
hemy | -0.567 |
ndra | -0.544 |
ongs | -0.519 |
bars | -0.515 |
Token | information |
Token ID | 1321 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
Carbuncle | +0.333 |
hemy | +0.312 |
ndra | +0.304 |
ongs | +0.291 |
bars | +0.290 |
Neg logit contributions | |
osate | -0.469 |
� | -0.356 |
ongyang | -0.356 |
insula | -0.350 |
withd | -0.346 |
Token | and |
Token ID | 290 |
Feature activation | -6.76e-02 |
Pos logit contributions | |
Carbuncle | +0.204 |
hemy | +0.191 |
ndra | +0.187 |
ongs | +0.180 |
bars | +0.178 |
Neg logit contributions | |
osate | -0.276 |
ongyang | -0.208 |
� | -0.207 |
insula | -0.204 |
withd | -0.202 |
Token | to |
Token ID | 284 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
Carbuncle | +0.051 |
hemy | +0.048 |
ndra | +0.047 |
ongs | +0.045 |
bars | +0.045 |
Neg logit contributions | |
osate | -0.068 |
� | -0.051 |
ongyang | -0.051 |
insula | -0.050 |
withd | -0.049 |
Token | generate |
Token ID | 7716 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
Carbuncle | +0.055 |
hemy | +0.052 |
ndra | +0.050 |
ongs | +0.049 |
dh | +0.048 |
Neg logit contributions | |
osate | -0.062 |
� | -0.045 |
ongyang | -0.045 |
insula | -0.045 |
withd | -0.044 |
Token | empathy |
Token ID | 21452 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
Carbuncle | +0.074 |
hemy | +0.070 |
ndra | +0.068 |
ongs | +0.065 |
bars | +0.065 |
Neg logit contributions | |
osate | -0.102 |
ongyang | -0.077 |
� | -0.077 |
insula | -0.076 |
withd | -0.075 |
Token | by |
Token ID | 416 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
Carbuncle | +0.085 |
hemy | +0.080 |
ndra | +0.077 |
ongs | +0.075 |
bars | +0.075 |
Neg logit contributions | |
osate | -0.121 |
ongyang | -0.092 |
� | -0.091 |
insula | -0.090 |
withd | -0.089 |
Token | completely |
Token ID | 3190 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
Carbuncle | +0.279 |
hemy | +0.266 |
ndra | +0.258 |
dh | +0.247 |
ongs | +0.246 |
Neg logit contributions | |
osate | -0.354 |
� | -0.264 |
ongyang | -0.263 |
insula | -0.259 |
withd | -0.257 |
Token | true |
Token ID | 2081 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
Carbuncle | +0.269 |
hemy | +0.255 |
ndra | +0.247 |
ongs | +0.237 |
dh | +0.236 |
Neg logit contributions | |
osate | -0.347 |
� | -0.260 |
ongyang | -0.259 |
insula | -0.255 |
withd | -0.253 |
Token | . |
Token ID | 13 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
Carbuncle | +0.102 |
hemy | +0.096 |
ndra | +0.093 |
ongs | +0.089 |
dh | +0.089 |
Neg logit contributions | |
osate | -0.166 |
ongyang | -0.128 |
� | -0.128 |
insula | -0.126 |
withd | -0.125 |
Token |
|
Token ID | 198 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
Carbuncle | +0.263 |
hemy | +0.247 |
ndra | +0.239 |
ongs | +0.228 |
dh | +0.226 |
Neg logit contributions | |
osate | -0.403 |
ongyang | -0.308 |
� | -0.308 |
insula | -0.304 |
withd | -0.302 |
Token |
|
Token ID | 198 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
Carbuncle | +0.189 |
hemy | +0.180 |
ndra | +0.175 |
ongs | +0.168 |
bars | +0.167 |
Neg logit contributions | |
osate | -0.190 |
� | -0.139 |
ongyang | -0.137 |
insula | -0.135 |
Fug | -0.134 |
Token | As |
Token ID | 1722 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
Carbuncle | +0.188 |
hemy | +0.179 |
ndra | +0.174 |
ongs | +0.167 |
dh | +0.167 |
Neg logit contributions | |
osate | -0.243 |
ongyang | -0.181 |
� | -0.180 |
withd | -0.179 |
insula | -0.179 |
Token | someone |
Token ID | 2130 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
Carbuncle | +0.275 |
hemy | +0.260 |
ndra | +0.252 |
ongs | +0.242 |
dh | +0.239 |
Neg logit contributions | |
osate | -0.386 |
� | -0.293 |
ongyang | -0.292 |
insula | -0.288 |
withd | -0.286 |
Token | who |
Token ID | 508 |
Feature activation | -5.98e-02 |
Pos logit contributions | |
Carbuncle | +0.172 |
hemy | +0.163 |
ndra | +0.157 |
ongs | +0.152 |
dh | +0.151 |
Neg logit contributions | |
osate | -0.246 |
� | -0.186 |
ongyang | -0.185 |
insula | -0.183 |
Fug | -0.180 |
Token | is |
Token ID | 318 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
Carbuncle | +0.045 |
hemy | +0.042 |
ndra | +0.041 |
ongs | +0.039 |
bars | +0.039 |
Neg logit contributions | |
osate | -0.060 |
ongyang | -0.045 |
� | -0.045 |
insula | -0.045 |
Fug | -0.044 |
Token | half |
Token ID | 2063 |
Feature activation | -3.78e-01 |
Pos logit contributions | |
Carbuncle | +0.336 |
hemy | +0.320 |
ndra | +0.308 |
dh | +0.297 |
bars | +0.295 |
Neg logit contributions | |
osate | -0.468 |
ongyang | -0.353 |
� | -0.351 |
insula | -0.347 |
withd | -0.341 |
Token | - |
Token ID | 12 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
Carbuncle | +0.279 |
hemy | +0.262 |
ndra | +0.255 |
dh | +0.246 |
bars | +0.245 |
Neg logit contributions | |
osate | -0.387 |
ongyang | -0.293 |
� | -0.292 |
withd | -0.284 |
insula | -0.284 |
Token | , |
Token ID | 837 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
Carbuncle | +0.207 |
hemy | +0.198 |
ndra | +0.191 |
ongs | +0.185 |
bars | +0.182 |
Neg logit contributions | |
osate | -0.215 |
� | -0.158 |
Fug | -0.154 |
ongyang | -0.154 |
satisf | -0.153 |
Token | 0 |
Token ID | 657 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
Carbuncle | +0.371 |
hemy | +0.355 |
ndra | +0.344 |
ongs | +0.332 |
dh | +0.327 |
Neg logit contributions | |
osate | -0.398 |
� | -0.293 |
ongyang | -0.289 |
Fug | -0.287 |
satisf | -0.286 |
Token | . |
Token ID | 13 |
Feature activation | +4.06e-03 |
Pos logit contributions | |
Carbuncle | +0.146 |
hemy | +0.138 |
ndra | +0.131 |
ongs | +0.125 |
bars | +0.123 |
Neg logit contributions | |
osate | -0.220 |
� | -0.171 |
Fug | -0.169 |
ongyang | -0.168 |
satisf | -0.167 |
Token | 5 |
Token ID | 20 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
osate | +0.004 |
� | +0.003 |
Fug | +0.003 |
satisf | +0.003 |
ongyang | +0.003 |
Neg logit contributions | |
Carbuncle | -0.003 |
hemy | -0.003 |
ndra | -0.003 |
ongs | -0.003 |
bars | -0.003 |
Token | ) |
Token ID | 1267 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
Carbuncle | +0.211 |
hemy | +0.199 |
ndra | +0.193 |
ongs | +0.186 |
bars | +0.182 |
Neg logit contributions | |
osate | -0.267 |
� | -0.199 |
ongyang | -0.199 |
insula | -0.197 |
Fug | -0.196 |
Token | ) |
Token ID | 1267 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
Carbuncle | +0.250 |
hemy | +0.237 |
ndra | +0.229 |
ongs | +0.221 |
bars | +0.217 |
Neg logit contributions | |
osate | -0.324 |
� | -0.244 |
ongyang | -0.242 |
insula | -0.241 |
Fug | -0.240 |
Token | = |
Token ID | 796 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Carbuncle | +0.223 |
hemy | +0.211 |
ndra | +0.202 |
ongs | +0.192 |
bars | +0.190 |
Neg logit contributions | |
osate | -0.340 |
� | -0.264 |
Fug | -0.260 |
ongyang | -0.260 |
insula | -0.258 |
Token | 0 |
Token ID | 657 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
Carbuncle | +0.248 |
hemy | +0.236 |
ndra | +0.229 |
ongs | +0.220 |
dh | +0.218 |
Neg logit contributions | |
osate | -0.265 |
� | -0.194 |
ongyang | -0.193 |
satisf | -0.191 |
insula | -0.190 |
Token | . |
Token ID | 13 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
Carbuncle | +0.206 |
hemy | +0.195 |
ndra | +0.185 |
ongs | +0.178 |
bars | +0.174 |
Neg logit contributions | |
osate | -0.313 |
� | -0.243 |
Fug | -0.241 |
ongyang | -0.239 |
satisf | -0.238 |
Token | 1 |
Token ID | 16 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
osate | +0.037 |
� | +0.028 |
Fug | +0.028 |
ongyang | +0.028 |
satisf | +0.028 |
Neg logit contributions | |
Carbuncle | -0.024 |
hemy | -0.023 |
ndra | -0.022 |
ongs | -0.020 |
bars | -0.020 |
Token | // |
Token ID | 3373 |
Feature activation | +1.93e-03 |
Pos logit contributions | |
Carbuncle | +0.316 |
hemy | +0.299 |
ndra | +0.288 |
ongs | +0.278 |
dh | +0.272 |
Neg logit contributions | |
osate | -0.448 |
� | -0.342 |
ongyang | -0.339 |
Fug | -0.337 |
insula | -0.335 |
Token | one |
Token ID | 505 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
osate | +0.639 |
� | +0.499 |
ongyang | +0.494 |
insula | +0.490 |
withd | +0.489 |
Neg logit contributions | |
Carbuncle | -0.388 |
hemy | -0.364 |
ndra | -0.351 |
ongs | -0.337 |
dh | -0.330 |
Token | video |
Token ID | 2008 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
osate | +0.154 |
� | +0.117 |
ongyang | +0.116 |
insula | +0.115 |
withd | +0.114 |
Neg logit contributions | |
Carbuncle | -0.114 |
hemy | -0.107 |
ndra | -0.105 |
ongs | -0.100 |
bars | -0.100 |
Token | captures |
Token ID | 23007 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
osate | +0.311 |
� | +0.234 |
ongyang | +0.233 |
insula | +0.231 |
withd | +0.228 |
Neg logit contributions | |
Carbuncle | -0.239 |
hemy | -0.224 |
ndra | -0.219 |
ongs | -0.210 |
bars | -0.210 |
Token | killer |
Token ID | 11868 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
osate | +0.493 |
� | +0.374 |
ongyang | +0.373 |
insula | +0.368 |
withd | +0.365 |
Neg logit contributions | |
Carbuncle | -0.356 |
hemy | -0.335 |
ndra | -0.326 |
ongs | -0.311 |
dh | -0.309 |
Token | whales |
Token ID | 24635 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
osate | +0.680 |
� | +0.508 |
ongyang | +0.506 |
insula | +0.499 |
withd | +0.495 |
Neg logit contributions | |
Carbuncle | -0.542 |
hemy | -0.514 |
ndra | -0.499 |
ongs | -0.478 |
dh | -0.475 |
Token | eating |
Token ID | 6600 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
osate | +0.747 |
� | +0.560 |
ongyang | +0.558 |
insula | +0.551 |
withd | +0.547 |
Neg logit contributions | |
Carbuncle | -0.580 |
hemy | -0.548 |
ndra | -0.533 |
ongs | -0.511 |
dh | -0.506 |
Token | a |
Token ID | 257 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
Carbuncle | +0.186 |
hemy | +0.174 |
ndra | +0.170 |
ongs | +0.162 |
dh | +0.161 |
Neg logit contributions | |
osate | -0.266 |
� | -0.203 |
ongyang | -0.202 |
insula | -0.200 |
withd | -0.198 |
Token | shark |
Token ID | 21027 |
Feature activation | -4.96e-01 |
Pos logit contributions | |
Carbuncle | +0.301 |
hemy | +0.283 |
ndra | +0.276 |
ongs | +0.264 |
dh | +0.262 |
Neg logit contributions | |
osate | -0.403 |
� | -0.305 |
ongyang | -0.303 |
insula | -0.299 |
withd | -0.297 |
Token | alive |
Token ID | 6776 |
Feature activation | +7.18e-01 |
Pos logit contributions | |
Carbuncle | +0.400 |
hemy | +0.378 |
ndra | +0.368 |
ongs | +0.354 |
bars | +0.353 |
Neg logit contributions | |
osate | -0.473 |
� | -0.350 |
ongyang | -0.349 |
insula | -0.343 |
withd | -0.341 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +7.78e-01 |
Pos logit contributions | |
osate | +0.627 |
� | +0.449 |
ongyang | +0.448 |
insula | +0.441 |
withd | +0.436 |
Neg logit contributions | |
Carbuncle | -0.634 |
hemy | -0.601 |
ndra | -0.590 |
ongs | -0.571 |
bars | -0.566 |
Token | KE |
Token ID | 7336 |
Feature activation | +4.35e-01 |
Pos logit contributions | |
osate | +0.762 |
ongyang | +0.565 |
� | +0.564 |
withd | +0.560 |
insula | +0.558 |
Neg logit contributions | |
Carbuncle | -0.602 |
hemy | -0.572 |
ndra | -0.560 |
dh | -0.536 |
ongs | -0.535 |
Token | - |
Token ID | 12 |
Feature activation | +3.84e-01 |
Pos logit contributions | |
osate | +0.306 |
� | +0.229 |
ongyang | +0.229 |
insula | +0.226 |
withd | +0.225 |
Neg logit contributions | |
Carbuncle | -0.237 |
hemy | -0.224 |
ndra | -0.218 |
ongs | -0.208 |
dh | -0.207 |
Token | 150 |
Token ID | 8628 |
Feature activation | -7.66e-01 |
Pos logit contributions | |
osate | +0.401 |
ongyang | +0.308 |
� | +0.303 |
insula | +0.303 |
withd | +0.301 |
Neg logit contributions | |
Carbuncle | -0.270 |
hemy | -0.252 |
ndra | -0.249 |
bars | -0.238 |
ongs | -0.236 |
Token | Eco |
Token ID | 38719 |
Feature activation | -6.33e-01 |
Pos logit contributions | |
Carbuncle | +0.574 |
hemy | +0.532 |
ndra | +0.522 |
bars | +0.501 |
ongs | +0.495 |
Neg logit contributions | |
osate | -0.777 |
ongyang | -0.588 |
� | -0.580 |
insula | -0.579 |
withd | -0.567 |
Token | Boost |
Token ID | 45686 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
Carbuncle | +0.499 |
hemy | +0.467 |
ndra | +0.457 |
bars | +0.440 |
dh | +0.438 |
Neg logit contributions | |
osate | -0.612 |
ongyang | -0.460 |
insula | -0.457 |
� | -0.449 |
withd | -0.444 |
Token | Tort |
Token ID | 28467 |
Feature activation | -8.83e-01 |
Pos logit contributions | |
Carbuncle | +0.161 |
hemy | +0.150 |
ndra | +0.147 |
bars | +0.142 |
ongs | +0.140 |
Neg logit contributions | |
osate | -0.204 |
ongyang | -0.152 |
insula | -0.151 |
� | -0.151 |
withd | -0.147 |
Token | ure |
Token ID | 495 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
Carbuncle | +0.516 |
hemy | +0.480 |
ndra | +0.464 |
ongs | +0.444 |
bars | +0.433 |
Neg logit contributions | |
osate | -1.030 |
� | -0.820 |
ongyang | -0.807 |
withd | -0.800 |
insula | -0.798 |
Token | Test |
Token ID | 6208 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
Carbuncle | +1.349 |
hemy | +1.259 |
ndra | +1.239 |
bars | +1.199 |
ongs | +1.174 |
Neg logit contributions | |
osate | -1.835 |
ongyang | -1.383 |
� | -1.380 |
insula | -1.376 |
withd | -1.348 |
Token | truck |
Token ID | 7779 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
osate | +0.629 |
ongyang | +0.474 |
� | +0.472 |
insula | +0.468 |
withd | +0.461 |
Neg logit contributions | |
Carbuncle | -0.474 |
hemy | -0.445 |
ndra | -0.440 |
bars | -0.418 |
ongs | -0.416 |
Token | in |
Token ID | 287 |
Feature activation | -6.35e-02 |
Pos logit contributions | |
osate | +0.186 |
ongyang | +0.140 |
� | +0.140 |
insula | +0.138 |
withd | +0.136 |
Neg logit contributions | |
Carbuncle | -0.142 |
hemy | -0.133 |
ndra | -0.130 |
bars | -0.124 |
ongs | -0.124 |
Token | the |
Token ID | 262 |
Feature activation | +3.65e-02 |
Pos logit contributions | |
Carbuncle | +0.041 |
hemy | +0.038 |
ndra | +0.037 |
bars | +0.035 |
ongs | +0.035 |
Neg logit contributions | |
osate | -0.070 |
� | -0.055 |
ongyang | -0.055 |
insula | -0.054 |
withd | -0.054 |
Token | 2010 |
Token ID | 3050 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
osate | +0.037 |
� | +0.028 |
ongyang | +0.028 |
insula | +0.028 |
withd | +0.027 |
Neg logit contributions | |
Carbuncle | -0.027 |
hemy | -0.025 |
ndra | -0.025 |
ongs | -0.024 |
bars | -0.024 |
Token | 's |
Token ID | 338 |
Feature activation | -2.51e-01 |
Pos logit contributions | |
Carbuncle | +0.392 |
hemy | +0.365 |
ndra | +0.359 |
bars | +0.345 |
ongs | +0.343 |
Neg logit contributions | |
osate | -0.586 |
ongyang | -0.444 |
� | -0.444 |
insula | -0.442 |
withd | -0.434 |
Token | a |
Token ID | 257 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
Carbuncle | +0.184 |
hemy | +0.173 |
ndra | +0.169 |
bars | +0.162 |
ongs | +0.160 |
Neg logit contributions | |
osate | -0.259 |
ongyang | -0.195 |
� | -0.195 |
insula | -0.193 |
withd | -0.190 |
Token | different |
Token ID | 1180 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
Carbuncle | +0.341 |
hemy | +0.321 |
ndra | +0.312 |
ongs | +0.298 |
bars | +0.297 |
Neg logit contributions | |
osate | -0.481 |
� | -0.364 |
ongyang | -0.363 |
insula | -0.358 |
withd | -0.355 |
Token | path |
Token ID | 3108 |
Feature activation | -7.27e-02 |
Pos logit contributions | |
Carbuncle | +0.443 |
hemy | +0.412 |
ndra | +0.404 |
ongs | +0.386 |
bars | +0.385 |
Neg logit contributions | |
osate | -0.604 |
� | -0.454 |
ongyang | -0.453 |
insula | -0.447 |
withd | -0.444 |
Token | ," |
Token ID | 553 |
Feature activation | -2.18e-01 |
Pos logit contributions | |
Carbuncle | +0.053 |
hemy | +0.050 |
ndra | +0.049 |
ongs | +0.047 |
bars | +0.047 |
Neg logit contributions | |
osate | -0.074 |
� | -0.056 |
ongyang | -0.056 |
insula | -0.055 |
withd | -0.055 |
Token | says |
Token ID | 1139 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Carbuncle | +0.166 |
hemy | +0.155 |
ndra | +0.152 |
ongs | +0.146 |
bars | +0.145 |
Neg logit contributions | |
osate | -0.218 |
ongyang | -0.164 |
� | -0.164 |
insula | -0.161 |
withd | -0.159 |
Token | Boy |
Token ID | 6387 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
Carbuncle | +1.169 |
hemy | +1.080 |
ndra | +1.071 |
ongs | +1.025 |
bars | +1.023 |
Neg logit contributions | |
osate | -1.517 |
ongyang | -1.142 |
� | -1.137 |
insula | -1.121 |
satisf | -1.100 |
Token | ega |
Token ID | 26470 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Carbuncle | +0.424 |
hemy | +0.397 |
ndra | +0.387 |
ongs | +0.369 |
dh | +0.366 |
Neg logit contributions | |
osate | -0.675 |
� | -0.522 |
ongyang | -0.520 |
insula | -0.514 |
withd | -0.511 |
Token | the |
Token ID | 262 |
Feature activation | -8.39e-01 |
Pos logit contributions | |
Carbuncle | +0.807 |
hemy | +0.753 |
ndra | +0.731 |
ongs | +0.703 |
bars | +0.694 |
Neg logit contributions | |
osate | -1.377 |
� | -1.069 |
ongyang | -1.067 |
insula | -1.055 |
withd | -1.041 |
Token | day |
Token ID | 1110 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
Carbuncle | +0.593 |
hemy | +0.550 |
ndra | +0.542 |
bars | +0.518 |
ongs | +0.518 |
Neg logit contributions | |
osate | -0.884 |
� | -0.673 |
ongyang | -0.669 |
insula | -0.664 |
withd | -0.656 |
Token | after |
Token ID | 706 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
Carbuncle | +0.413 |
hemy | +0.385 |
ndra | +0.377 |
ongs | +0.358 |
bars | +0.355 |
Neg logit contributions | |
osate | -0.635 |
� | -0.489 |
ongyang | -0.488 |
insula | -0.481 |
withd | -0.478 |
Token | region |
Token ID | 3814 |
Feature activation | +6.75e-01 |
Pos logit contributions | |
osate | +0.084 |
� | +0.063 |
ongyang | +0.063 |
insula | +0.062 |
withd | +0.061 |
Neg logit contributions | |
Carbuncle | -0.066 |
hemy | -0.062 |
ndra | -0.060 |
ongs | -0.058 |
bars | -0.058 |
Token | of |
Token ID | 286 |
Feature activation | +9.86e-02 |
Pos logit contributions | |
osate | +0.725 |
ongyang | +0.557 |
� | +0.555 |
insula | +0.548 |
Fug | +0.544 |
Neg logit contributions | |
Carbuncle | -0.460 |
hemy | -0.431 |
ndra | -0.418 |
ongs | -0.400 |
bars | -0.397 |
Token | China |
Token ID | 2807 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
osate | +0.093 |
� | +0.069 |
ongyang | +0.068 |
insula | +0.067 |
withd | +0.067 |
Neg logit contributions | |
Carbuncle | -0.080 |
hemy | -0.075 |
ndra | -0.074 |
ongs | -0.071 |
bars | -0.071 |
Token | in |
Token ID | 287 |
Feature activation | -8.80e-02 |
Pos logit contributions | |
Carbuncle | +0.235 |
hemy | +0.218 |
ndra | +0.214 |
ongs | +0.203 |
bars | +0.203 |
Neg logit contributions | |
osate | -0.362 |
� | -0.277 |
ongyang | -0.276 |
insula | -0.273 |
satisf | -0.271 |
Token | southern |
Token ID | 8372 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Carbuncle | +0.067 |
hemy | +0.063 |
ndra | +0.062 |
ongs | +0.059 |
bars | +0.059 |
Neg logit contributions | |
osate | -0.088 |
� | -0.066 |
ongyang | -0.065 |
insula | -0.065 |
withd | -0.064 |
Token | Guang |
Token ID | 36980 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
osate | +0.433 |
� | +0.337 |
ongyang | +0.335 |
insula | +0.332 |
withd | +0.330 |
Neg logit contributions | |
Carbuncle | -0.245 |
hemy | -0.228 |
ndra | -0.220 |
ongs | -0.210 |
bars | -0.208 |
Token | d |
Token ID | 67 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
Carbuncle | +1.028 |
hemy | +0.945 |
ndra | +0.909 |
ongs | +0.845 |
dh | +0.844 |
Neg logit contributions | |
osate | -2.497 |
� | -2.003 |
ongyang | -1.990 |
insula | -1.973 |
withd | -1.969 |
Token | ong |
Token ID | 506 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
Carbuncle | +0.277 |
hemy | +0.248 |
ndra | +0.241 |
bars | +0.224 |
dh | +0.224 |
Neg logit contributions | |
osate | -0.534 |
ongyang | -0.431 |
� | -0.421 |
insula | -0.419 |
satisf | -0.413 |
Token | province |
Token ID | 8473 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
Carbuncle | +0.196 |
hemy | +0.183 |
ndra | +0.177 |
ongs | +0.167 |
dh | +0.165 |
Neg logit contributions | |
osate | -0.383 |
� | -0.301 |
ongyang | -0.300 |
insula | -0.296 |
withd | -0.296 |
Token | , |
Token ID | 11 |
Feature activation | +7.81e-02 |
Pos logit contributions | |
Carbuncle | +0.204 |
hemy | +0.192 |
ndra | +0.188 |
ongs | +0.178 |
bars | +0.177 |
Neg logit contributions | |
osate | -0.303 |
� | -0.231 |
ongyang | -0.230 |
insula | -0.227 |
Fug | -0.225 |
Token | nest |
Token ID | 16343 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
osate | +0.081 |
� | +0.062 |
ongyang | +0.062 |
insula | +0.061 |
withd | +0.060 |
Neg logit contributions | |
Carbuncle | -0.056 |
hemy | -0.053 |
ndra | -0.051 |
ongs | -0.049 |
bars | -0.048 |
Token | year |
Token ID | 614 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
osate | +0.018 |
� | +0.014 |
ongyang | +0.014 |
insula | +0.014 |
withd | +0.014 |
Neg logit contributions | |
Carbuncle | -0.012 |
hemy | -0.012 |
ndra | -0.011 |
ongs | -0.011 |
dh | -0.011 |
Token | later |
Token ID | 1568 |
Feature activation | -6.25e-02 |
Pos logit contributions | |
osate | +0.293 |
ongyang | +0.218 |
� | +0.217 |
insula | +0.214 |
withd | +0.211 |
Neg logit contributions | |
Carbuncle | -0.238 |
hemy | -0.223 |
ndra | -0.219 |
ongs | -0.210 |
bars | -0.209 |
Token | , |
Token ID | 11 |
Feature activation | -5.34e-02 |
Pos logit contributions | |
Carbuncle | +0.048 |
hemy | +0.045 |
ndra | +0.044 |
ongs | +0.042 |
bars | +0.042 |
Neg logit contributions | |
osate | -0.062 |
ongyang | -0.047 |
� | -0.047 |
insula | -0.046 |
withd | -0.046 |
Token | he |
Token ID | 339 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
Carbuncle | +0.041 |
hemy | +0.039 |
ndra | +0.038 |
ongs | +0.036 |
dh | +0.036 |
Neg logit contributions | |
osate | -0.053 |
� | -0.039 |
ongyang | -0.039 |
insula | -0.039 |
withd | -0.039 |
Token | joined |
Token ID | 5399 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
Carbuncle | +0.091 |
hemy | +0.085 |
ndra | +0.083 |
bars | +0.080 |
ongs | +0.080 |
Neg logit contributions | |
osate | -0.107 |
ongyang | -0.079 |
insula | -0.078 |
� | -0.078 |
withd | -0.076 |
Token | Columbus |
Token ID | 14939 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
osate | +0.278 |
� | +0.212 |
ongyang | +0.212 |
insula | +0.209 |
withd | +0.208 |
Neg logit contributions | |
Carbuncle | -0.189 |
hemy | -0.178 |
ndra | -0.172 |
ongs | -0.164 |
dh | -0.163 |
Token | as |
Token ID | 355 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
Carbuncle | +0.967 |
hemy | +0.894 |
ndra | +0.863 |
ongs | +0.816 |
bars | +0.806 |
Neg logit contributions | |
osate | -1.978 |
� | -1.558 |
ongyang | -1.556 |
insula | -1.543 |
withd | -1.529 |
Token | an |
Token ID | 281 |
Feature activation | -9.15e-02 |
Pos logit contributions | |
Carbuncle | +0.451 |
hemy | +0.420 |
ndra | +0.412 |
ongs | +0.394 |
bars | +0.393 |
Neg logit contributions | |
osate | -0.597 |
ongyang | -0.448 |
� | -0.447 |
insula | -0.442 |
withd | -0.435 |
Token | assistant |
Token ID | 8796 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
Carbuncle | +0.079 |
hemy | +0.075 |
ndra | +0.074 |
ongs | +0.071 |
dh | +0.071 |
Neg logit contributions | |
osate | -0.081 |
� | -0.059 |
ongyang | -0.059 |
insula | -0.058 |
withd | -0.057 |
Token | coach |
Token ID | 3985 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
Carbuncle | +0.190 |
hemy | +0.179 |
ndra | +0.176 |
ongs | +0.169 |
bars | +0.169 |
Neg logit contributions | |
osate | -0.214 |
ongyang | -0.157 |
� | -0.157 |
insula | -0.154 |
withd | -0.152 |
Token | . |
Token ID | 13 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
osate | +0.186 |
ongyang | +0.141 |
� | +0.141 |
insula | +0.139 |
withd | +0.137 |
Neg logit contributions | |
Carbuncle | -0.130 |
hemy | -0.122 |
ndra | -0.119 |
ongs | -0.114 |
dh | -0.113 |
Token | Gro |
Token ID | 42921 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
Carbuncle | +0.214 |
hemy | +0.202 |
ndra | +0.198 |
ongs | +0.190 |
dh | +0.190 |
Neg logit contributions | |
osate | -0.278 |
ongyang | -0.207 |
withd | -0.205 |
� | -0.205 |
insula | -0.204 |
Token | hl |
Token ID | 18519 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
Carbuncle | +0.159 |
hemy | +0.152 |
ndra | +0.148 |
ongs | +0.143 |
dh | +0.142 |
Neg logit contributions | |
osate | -0.149 |
� | -0.106 |
ongyang | -0.105 |
insula | -0.104 |
withd | -0.103 |
Token | stated |
Token ID | 5081 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
Carbuncle | +0.138 |
hemy | +0.130 |
ndra | +0.126 |
ongs | +0.122 |
bars | +0.121 |
Neg logit contributions | |
osate | -0.172 |
ongyang | -0.128 |
� | -0.127 |
insula | -0.126 |
withd | -0.124 |
Token | that |
Token ID | 326 |
Feature activation | -6.29e-02 |
Pos logit contributions | |
Carbuncle | +0.176 |
hemy | +0.166 |
ndra | +0.161 |
ongs | +0.156 |
bars | +0.155 |
Neg logit contributions | |
osate | -0.235 |
ongyang | -0.176 |
� | -0.175 |
insula | -0.174 |
withd | -0.171 |
Token | Cob |
Token ID | 14828 |
Feature activation | -7.78e-01 |
Pos logit contributions | |
Carbuncle | +0.048 |
hemy | +0.045 |
ndra | +0.044 |
ongs | +0.042 |
bars | +0.042 |
Neg logit contributions | |
osate | -0.063 |
ongyang | -0.047 |
� | -0.047 |
insula | -0.047 |
withd | -0.046 |
Token | ain |
Token ID | 391 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
Carbuncle | +0.585 |
hemy | +0.549 |
ndra | +0.532 |
ongs | +0.507 |
dh | +0.504 |
Neg logit contributions | |
osate | -0.782 |
ongyang | -0.590 |
� | -0.587 |
insula | -0.580 |
satisf | -0.576 |
Token | believed |
Token ID | 4762 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
Carbuncle | +1.155 |
hemy | +1.079 |
ndra | +1.057 |
ongs | +1.019 |
bars | +1.018 |
Neg logit contributions | |
osate | -1.536 |
ongyang | -1.149 |
� | -1.142 |
insula | -1.139 |
withd | -1.113 |
Token | that |
Token ID | 326 |
Feature activation | +2.46e-02 |
Pos logit contributions | |
osate | +0.031 |
� | +0.023 |
ongyang | +0.023 |
insula | +0.023 |
withd | +0.023 |
Neg logit contributions | |
Carbuncle | -0.023 |
hemy | -0.022 |
ndra | -0.021 |
ongs | -0.020 |
bars | -0.020 |
Token | music |
Token ID | 2647 |
Feature activation | -8.10e-01 |
Pos logit contributions | |
osate | +0.025 |
ongyang | +0.019 |
� | +0.019 |
insula | +0.019 |
withd | +0.019 |
Neg logit contributions | |
Carbuncle | -0.018 |
hemy | -0.017 |
ndra | -0.016 |
ongs | -0.016 |
bars | -0.016 |
Token | comes |
Token ID | 2058 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
Carbuncle | +0.611 |
hemy | +0.581 |
ndra | +0.561 |
bars | +0.544 |
ongs | +0.544 |
Neg logit contributions | |
osate | -0.814 |
ongyang | -0.608 |
� | -0.607 |
insula | -0.600 |
withd | -0.591 |
Token | first |
Token ID | 717 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
osate | +0.040 |
� | +0.030 |
ongyang | +0.030 |
insula | +0.030 |
withd | +0.029 |
Neg logit contributions | |
Carbuncle | -0.028 |
hemy | -0.026 |
ndra | -0.026 |
ongs | -0.025 |
dh | -0.024 |