Token | Korean |
Token ID | 6983 |
Feature activation | +9.03e-01 |
Pos logit contributions | |
plin | +0.098 |
Draft | +0.098 |
Blooming | +0.096 |
€ | +0.096 |
Por | +0.092 |
Neg logit contributions | |
nem | -0.110 |
unseen | -0.110 |
uth | -0.101 |
arah | -0.099 |
humiliated | -0.096 |
Token | side |
Token ID | 1735 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
plin | +0.736 |
Draft | +0.735 |
Blooming | +0.726 |
€ | +0.725 |
Por | +0.697 |
Neg logit contributions | |
nem | -0.642 |
unseen | -0.640 |
uth | -0.586 |
arah | -0.564 |
humiliated | -0.552 |
Token | , |
Token ID | 11 |
Feature activation | +3.60e-01 |
Pos logit contributions | |
nem | +0.144 |
unseen | +0.143 |
uth | +0.132 |
arah | +0.127 |
humiliated | +0.124 |
Neg logit contributions | |
plin | -0.161 |
Draft | -0.161 |
Blooming | -0.159 |
€ | -0.158 |
Por | -0.153 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
plin | +0.276 |
Draft | +0.276 |
Blooming | +0.271 |
€ | +0.270 |
Por | +0.260 |
Neg logit contributions | |
nem | -0.274 |
unseen | -0.274 |
uth | -0.251 |
arah | -0.243 |
humiliated | -0.240 |
Token | only |
Token ID | 691 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
Draft | +0.332 |
plin | +0.332 |
Blooming | +0.325 |
€ | +0.324 |
Por | +0.311 |
Neg logit contributions | |
unseen | -0.387 |
nem | -0.386 |
uth | -0.356 |
arah | -0.344 |
humiliated | -0.343 |
Token | then |
Token ID | 788 |
Feature activation | +5.53e+00 |
Pos logit contributions | |
plin | +0.176 |
Draft | +0.176 |
Blooming | +0.172 |
€ | +0.171 |
Por | +0.164 |
Neg logit contributions | |
unseen | -0.219 |
nem | -0.219 |
uth | -0.202 |
arah | -0.196 |
humiliated | -0.195 |
Token | a |
Token ID | 257 |
Feature activation | +8.28e-01 |
Pos logit contributions | |
€ | +3.870 |
Draft | +3.865 |
Blooming | +3.851 |
plin | +3.844 |
Por | +3.728 |
Neg logit contributions | |
nem | -4.407 |
unseen | -4.347 |
uth | -4.061 |
arah | -4.029 |
emet | -3.895 |
Token | short |
Token ID | 1790 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
plin | +0.617 |
Draft | +0.617 |
Blooming | +0.607 |
€ | +0.604 |
Por | +0.582 |
Neg logit contributions | |
nem | -0.646 |
unseen | -0.645 |
uth | -0.592 |
arah | -0.571 |
humiliated | -0.566 |
Token | announcement |
Token ID | 8009 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
plin | +1.226 |
Draft | +1.224 |
Blooming | +1.211 |
€ | +1.207 |
Por | +1.165 |
Neg logit contributions | |
nem | -1.098 |
unseen | -1.095 |
uth | -1.002 |
arah | -0.969 |
humiliated | -0.946 |
Token | would |
Token ID | 561 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
unseen | +0.594 |
nem | +0.594 |
uth | +0.545 |
arah | +0.526 |
humiliated | +0.521 |
Neg logit contributions | |
plin | -0.551 |
Draft | -0.548 |
Blooming | -0.541 |
€ | -0.534 |
Por | -0.516 |
Token | be |
Token ID | 307 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
plin | +0.699 |
Draft | +0.698 |
Blooming | +0.690 |
€ | +0.684 |
Por | +0.657 |
Neg logit contributions | |
nem | -0.882 |
unseen | -0.879 |
uth | -0.821 |
arah | -0.795 |
humiliated | -0.779 |
Token | tweak |
Token ID | 25393 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
plin | +2.234 |
Draft | +2.229 |
Blooming | +2.206 |
€ | +2.204 |
Por | +2.116 |
Neg logit contributions | |
nem | -2.480 |
unseen | -2.473 |
uth | -2.297 |
arah | -2.234 |
humiliated | -2.179 |
Token | certain |
Token ID | 1728 |
Feature activation | -6.19e-02 |
Pos logit contributions | |
Draft | +0.983 |
plin | +0.982 |
Blooming | +0.970 |
€ | +0.967 |
Por | +0.928 |
Neg logit contributions | |
nem | -1.054 |
unseen | -1.051 |
uth | -0.970 |
arah | -0.941 |
humiliated | -0.919 |
Token | settings |
Token ID | 6460 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
unseen | +0.047 |
nem | +0.047 |
uth | +0.043 |
arah | +0.042 |
humiliated | +0.041 |
Neg logit contributions | |
Draft | -0.047 |
plin | -0.047 |
Blooming | -0.047 |
€ | -0.046 |
Por | -0.044 |
Token | with |
Token ID | 351 |
Feature activation | +4.78e-01 |
Pos logit contributions | |
Draft | +0.242 |
plin | +0.241 |
Blooming | +0.238 |
€ | +0.236 |
Por | +0.228 |
Neg logit contributions | |
unseen | -0.225 |
nem | -0.225 |
uth | -0.206 |
arah | -0.198 |
humiliated | -0.193 |
Token | not |
Token ID | 407 |
Feature activation | +4.57e-01 |
Pos logit contributions | |
Draft | +0.346 |
plin | +0.344 |
Blooming | +0.339 |
€ | +0.337 |
Por | +0.323 |
Neg logit contributions | |
nem | -0.385 |
unseen | -0.385 |
uth | -0.354 |
arah | -0.342 |
humiliated | -0.335 |
Token | epad |
Token ID | 47852 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
plin | +0.394 |
Draft | +0.393 |
Blooming | +0.390 |
€ | +0.389 |
Por | +0.376 |
Neg logit contributions | |
nem | -0.302 |
unseen | -0.301 |
uth | -0.274 |
arah | -0.264 |
humiliated | -0.257 |
Token | to |
Token ID | 284 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
plin | +3.508 |
Draft | +3.501 |
€ | +3.464 |
Blooming | +3.435 |
Por | +3.308 |
Neg logit contributions | |
unseen | -4.175 |
nem | -4.175 |
uth | -3.886 |
arah | -3.790 |
humiliated | -3.704 |
Token | your |
Token ID | 534 |
Feature activation | +7.59e-01 |
Pos logit contributions | |
plin | +1.558 |
Draft | +1.558 |
Blooming | +1.539 |
€ | +1.536 |
Por | +1.477 |
Neg logit contributions | |
nem | -1.578 |
unseen | -1.573 |
uth | -1.449 |
arah | -1.404 |
humiliated | -1.371 |
Token | undead |
Token ID | 26805 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
plin | +0.439 |
Draft | +0.438 |
Blooming | +0.432 |
€ | +0.431 |
Por | +0.409 |
Neg logit contributions | |
nem | -0.715 |
unseen | -0.714 |
uth | -0.669 |
arah | -0.653 |
humiliated | -0.640 |
Token | heart |
Token ID | 2612 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
Draft | +0.087 |
plin | +0.087 |
Blooming | +0.086 |
€ | +0.086 |
Por | +0.082 |
Neg logit contributions | |
nem | -0.075 |
unseen | -0.074 |
uth | -0.067 |
arah | -0.065 |
humiliated | -0.063 |
Token | 's |
Token ID | 338 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
plin | +1.078 |
Draft | +1.078 |
€ | +1.071 |
Blooming | +1.068 |
Por | +1.030 |
Neg logit contributions | |
nem | -1.007 |
unseen | -1.006 |
uth | -0.923 |
arah | -0.899 |
humiliated | -0.873 |
Token | opposition |
Token ID | 5471 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
plin | +2.106 |
Draft | +2.105 |
Blooming | +2.097 |
€ | +2.096 |
Por | +2.043 |
Neg logit contributions | |
nem | -1.735 |
unseen | -1.727 |
uth | -1.587 |
arah | -1.554 |
humiliated | -1.485 |
Token | protesters |
Token ID | 9584 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
nem | +1.407 |
unseen | +1.394 |
uth | +1.271 |
arah | +1.201 |
humiliated | +1.189 |
Neg logit contributions | |
Draft | -1.884 |
plin | -1.882 |
Blooming | -1.853 |
€ | -1.845 |
Por | -1.763 |
Token | and |
Token ID | 290 |
Feature activation | -6.54e-02 |
Pos logit contributions | |
unseen | +1.136 |
nem | +1.133 |
uth | +1.030 |
arah | +0.984 |
humiliated | +0.973 |
Neg logit contributions | |
plin | -1.472 |
Draft | -1.471 |
Blooming | -1.449 |
€ | -1.445 |
Por | -1.391 |
Token | government |
Token ID | 1230 |
Feature activation | -8.39e-01 |
Pos logit contributions | |
nem | +0.044 |
unseen | +0.044 |
uth | +0.040 |
arah | +0.038 |
humiliated | +0.038 |
Neg logit contributions | |
plin | -0.056 |
Draft | -0.056 |
Blooming | -0.055 |
€ | -0.055 |
Por | -0.053 |
Token | forces |
Token ID | 3386 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
nem | +0.510 |
unseen | +0.507 |
uth | +0.456 |
arah | +0.435 |
humiliated | +0.426 |
Neg logit contributions | |
plin | -0.771 |
Draft | -0.771 |
Blooming | -0.762 |
€ | -0.760 |
Por | -0.733 |
Token | left |
Token ID | 1364 |
Feature activation | +5.07e+00 |
Pos logit contributions | |
unseen | +0.163 |
nem | +0.162 |
uth | +0.147 |
arah | +0.140 |
humiliated | +0.139 |
Neg logit contributions | |
Draft | -0.217 |
plin | -0.217 |
Blooming | -0.214 |
€ | -0.213 |
Por | -0.206 |
Token | more |
Token ID | 517 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
€ | +3.768 |
Blooming | +3.719 |
Por | +3.639 |
plin | +3.635 |
Draft | +3.622 |
Neg logit contributions | |
nem | -3.821 |
unseen | -3.776 |
arah | -3.599 |
uth | -3.542 |
emet | -3.399 |
Token | than |
Token ID | 621 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
nem | +0.169 |
unseen | +0.168 |
uth | +0.154 |
arah | +0.148 |
humiliated | +0.145 |
Neg logit contributions | |
plin | -0.199 |
Draft | -0.199 |
Blooming | -0.197 |
€ | -0.196 |
Por | -0.189 |
Token | 40 |
Token ID | 2319 |
Feature activation | +9.84e-01 |
Pos logit contributions | |
unseen | +0.572 |
nem | +0.571 |
uth | +0.527 |
arah | +0.506 |
humiliated | +0.504 |
Neg logit contributions | |
plin | -0.468 |
Draft | -0.466 |
Blooming | -0.455 |
€ | -0.443 |
Por | -0.430 |
Token | people |
Token ID | 661 |
Feature activation | -6.76e-01 |
Pos logit contributions | |
Draft | +0.910 |
plin | +0.910 |
Blooming | +0.903 |
€ | +0.901 |
Por | +0.874 |
Neg logit contributions | |
nem | -0.585 |
unseen | -0.583 |
uth | -0.524 |
arah | -0.506 |
humiliated | -0.487 |
Token | dead |
Token ID | 2636 |
Feature activation | -7.78e-01 |
Pos logit contributions | |
unseen | +0.384 |
nem | +0.382 |
uth | +0.342 |
humiliated | +0.322 |
arah | +0.321 |
Neg logit contributions | |
plin | -0.651 |
Draft | -0.649 |
Blooming | -0.642 |
€ | -0.636 |
Por | -0.616 |
Token | p |
Token ID | 79 |
Feature activation | +3.97e-01 |
Pos logit contributions | |
nem | +0.298 |
unseen | +0.297 |
uth | +0.276 |
arah | +0.267 |
humiliated | +0.259 |
Neg logit contributions | |
Draft | -0.279 |
plin | -0.279 |
€ | -0.275 |
Blooming | -0.275 |
Por | -0.262 |
Token | appa |
Token ID | 20975 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
plin | +0.301 |
Draft | +0.301 |
Blooming | +0.298 |
€ | +0.297 |
Por | +0.286 |
Neg logit contributions | |
nem | -0.303 |
unseen | -0.302 |
uth | -0.279 |
arah | -0.271 |
humiliated | -0.263 |
Token | 's |
Token ID | 338 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
nem | +0.126 |
unseen | +0.126 |
uth | +0.116 |
arah | +0.112 |
humiliated | +0.109 |
Neg logit contributions | |
Draft | -0.138 |
plin | -0.137 |
Blooming | -0.136 |
€ | -0.136 |
Por | -0.130 |
Token | boat |
Token ID | 8848 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
plin | +0.094 |
Draft | +0.094 |
Blooming | +0.092 |
€ | +0.092 |
Por | +0.088 |
Neg logit contributions | |
nem | -0.108 |
unseen | -0.108 |
uth | -0.099 |
arah | -0.097 |
humiliated | -0.094 |
Token | , |
Token ID | 11 |
Feature activation | +5.96e-01 |
Pos logit contributions | |
plin | +1.115 |
Draft | +1.114 |
Blooming | +1.102 |
€ | +1.099 |
Por | +1.057 |
Neg logit contributions | |
nem | -1.135 |
unseen | -1.132 |
uth | -1.044 |
arah | -1.013 |
humiliated | -0.988 |
Token | etc |
Token ID | 3503 |
Feature activation | +4.89e+00 |
Pos logit contributions | |
Draft | +0.450 |
plin | +0.450 |
Blooming | +0.444 |
€ | +0.443 |
Por | +0.425 |
Neg logit contributions | |
nem | -0.458 |
unseen | -0.457 |
uth | -0.420 |
arah | -0.407 |
humiliated | -0.397 |
Token | . |
Token ID | 13 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
plin | +3.254 |
Draft | +3.241 |
€ | +3.236 |
Blooming | +3.219 |
Por | +3.090 |
Neg logit contributions | |
nem | -4.113 |
unseen | -4.100 |
uth | -3.810 |
arah | -3.716 |
humiliated | -3.647 |
Token | Visitors |
Token ID | 44535 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
unseen | +0.213 |
nem | +0.213 |
uth | +0.196 |
arah | +0.189 |
humiliated | +0.187 |
Neg logit contributions | |
plin | -0.183 |
Draft | -0.182 |
Blooming | -0.178 |
€ | -0.177 |
Por | -0.169 |
Token | may |
Token ID | 743 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
Draft | +0.341 |
plin | +0.341 |
Blooming | +0.334 |
€ | +0.330 |
Por | +0.319 |
Neg logit contributions | |
unseen | -0.392 |
nem | -0.392 |
uth | -0.360 |
arah | -0.350 |
humiliated | -0.345 |
Token | also |
Token ID | 635 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
unseen | +0.132 |
nem | +0.132 |
uth | +0.120 |
arah | +0.115 |
humiliated | +0.113 |
Neg logit contributions | |
Draft | -0.139 |
plin | -0.137 |
Blooming | -0.135 |
€ | -0.133 |
Por | -0.130 |
Token | meet |
Token ID | 1826 |
Feature activation | +7.61e-01 |
Pos logit contributions | |
Draft | +0.481 |
plin | +0.476 |
Blooming | +0.469 |
€ | +0.465 |
Por | +0.450 |
Neg logit contributions | |
unseen | -0.516 |
nem | -0.516 |
uth | -0.473 |
arah | -0.457 |
humiliated | -0.449 |
Token | Fasc |
Token ID | 41467 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
nem | +0.520 |
unseen | +0.520 |
uth | +0.476 |
arah | +0.464 |
humiliated | +0.455 |
Neg logit contributions | |
plin | -0.450 |
Draft | -0.448 |
Blooming | -0.440 |
€ | -0.436 |
Por | -0.421 |
Token | is |
Token ID | 318 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
nem | +0.338 |
unseen | +0.337 |
uth | +0.312 |
arah | +0.301 |
humiliated | +0.294 |
Neg logit contributions | |
plin | -0.334 |
Draft | -0.334 |
Blooming | -0.331 |
€ | -0.329 |
Por | -0.316 |
Token | m |
Token ID | 76 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
nem | +0.435 |
unseen | +0.435 |
uth | +0.400 |
arah | +0.387 |
humiliated | +0.381 |
Neg logit contributions | |
plin | -0.410 |
Draft | -0.409 |
Blooming | -0.400 |
€ | -0.396 |
Por | -0.385 |
Token | of |
Token ID | 286 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
Draft | +0.138 |
plin | +0.137 |
Blooming | +0.136 |
€ | +0.135 |
Por | +0.130 |
Neg logit contributions | |
nem | -0.138 |
unseen | -0.137 |
uth | -0.127 |
arah | -0.123 |
humiliated | -0.120 |
Token | th |
Token ID | 294 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
plin | +0.229 |
Draft | +0.228 |
Blooming | +0.225 |
€ | +0.222 |
Por | +0.214 |
Neg logit contributions | |
nem | -0.262 |
unseen | -0.261 |
uth | -0.242 |
arah | -0.234 |
humiliated | -0.229 |
Token | e |
Token ID | 304 |
Feature activation | +4.86e+00 |
Pos logit contributions | |
plin | +1.134 |
Draft | +1.133 |
Blooming | +1.121 |
€ | +1.117 |
Por | +1.078 |
Neg logit contributions | |
nem | -1.013 |
unseen | -1.010 |
uth | -0.928 |
arah | -0.897 |
humiliated | -0.872 |
Token | Potato |
Token ID | 43876 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
plin | +3.784 |
€ | +3.775 |
Draft | +3.770 |
Blooming | +3.762 |
Por | +3.627 |
Neg logit contributions | |
unseen | -3.491 |
nem | -3.491 |
uth | -3.202 |
arah | -3.148 |
humiliated | -3.044 |
Token |
|
Token ID | 198 |
Feature activation | -7.34e-01 |
Pos logit contributions | |
nem | +0.387 |
unseen | +0.384 |
uth | +0.357 |
arah | +0.345 |
humiliated | +0.337 |
Neg logit contributions | |
plin | -0.346 |
Draft | -0.344 |
Blooming | -0.341 |
€ | -0.339 |
Por | -0.323 |
Token |
|
Token ID | 198 |
Feature activation | -5.73e-01 |
Pos logit contributions | |
nem | +0.522 |
unseen | +0.520 |
uth | +0.477 |
arah | +0.461 |
humiliated | +0.448 |
Neg logit contributions | |
plin | -0.593 |
Draft | -0.587 |
Blooming | -0.585 |
€ | -0.582 |
Por | -0.562 |
Token | 1 |
Token ID | 16 |
Feature activation | -8.47e-02 |
Pos logit contributions | |
nem | +0.428 |
unseen | +0.427 |
uth | +0.397 |
arah | +0.384 |
humiliated | +0.371 |
Neg logit contributions | |
plin | -0.442 |
Blooming | -0.437 |
Draft | -0.435 |
€ | -0.433 |
Por | -0.420 |
Token |
|
Token ID | 198 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
nem | +0.067 |
unseen | +0.066 |
uth | +0.061 |
arah | +0.060 |
humiliated | +0.058 |
Neg logit contributions | |
plin | -0.062 |
Draft | -0.062 |
Blooming | -0.061 |
€ | -0.061 |
Por | -0.059 |
Token | address |
Token ID | 2209 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
nem | +0.116 |
unseen | +0.116 |
uth | +0.107 |
arah | +0.103 |
humiliated | +0.100 |
Neg logit contributions | |
plin | -0.124 |
Draft | -0.124 |
Blooming | -0.122 |
€ | -0.122 |
Por | -0.118 |
Token | . |
Token ID | 13 |
Feature activation | +8.07e-01 |
Pos logit contributions | |
nem | +0.388 |
unseen | +0.385 |
uth | +0.359 |
arah | +0.342 |
trusted | +0.333 |
Neg logit contributions | |
plin | -0.409 |
Draft | -0.406 |
Blooming | -0.399 |
€ | -0.397 |
Por | -0.381 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
plin | +0.416 |
Draft | +0.415 |
Blooming | +0.405 |
€ | +0.404 |
Por | +0.380 |
Neg logit contributions | |
nem | -0.812 |
unseen | -0.809 |
uth | -0.764 |
arah | -0.743 |
humiliated | -0.731 |
Token | re |
Token ID | 302 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
plin | +0.961 |
Draft | +0.955 |
Blooming | +0.954 |
€ | +0.951 |
Por | +0.916 |
Neg logit contributions | |
unseen | -1.081 |
nem | -1.079 |
uth | -0.992 |
arah | -0.977 |
humiliated | -0.950 |
Token | - |
Token ID | 12 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
plin | +0.992 |
Draft | +0.991 |
Blooming | +0.982 |
€ | +0.980 |
Por | +0.947 |
Neg logit contributions | |
nem | -0.778 |
unseen | -0.775 |
uth | -0.705 |
arah | -0.682 |
humiliated | -0.663 |
Token | enter |
Token ID | 9255 |
Feature activation | +4.80e+00 |
Pos logit contributions | |
plin | +1.662 |
Draft | +1.660 |
Blooming | +1.644 |
€ | +1.642 |
Por | +1.591 |
Neg logit contributions | |
nem | -1.073 |
unseen | -1.067 |
uth | -0.949 |
arah | -0.923 |
humiliated | -0.901 |
Token | . |
Token ID | 13 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
Draft | +3.183 |
plin | +3.176 |
Blooming | +3.165 |
€ | +3.164 |
Por | +3.014 |
Neg logit contributions | |
nem | -4.099 |
unseen | -4.061 |
uth | -3.743 |
arah | -3.702 |
humiliated | -3.667 |
Token | You |
Token ID | 921 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
Draft | +0.213 |
plin | +0.213 |
Blooming | +0.207 |
€ | +0.207 |
Por | +0.197 |
Neg logit contributions | |
nem | -0.270 |
unseen | -0.270 |
uth | -0.253 |
arah | -0.243 |
humiliated | -0.238 |
Token | must |
Token ID | 1276 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
nem | +0.354 |
unseen | +0.353 |
uth | +0.327 |
arah | +0.314 |
humiliated | +0.307 |
Neg logit contributions | |
Draft | -0.370 |
plin | -0.368 |
Blooming | -0.361 |
€ | -0.361 |
Por | -0.348 |
Token | select |
Token ID | 2922 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
nem | +0.372 |
unseen | +0.371 |
uth | +0.347 |
arah | +0.334 |
trusted | +0.326 |
Neg logit contributions | |
Draft | -0.339 |
plin | -0.337 |
€ | -0.329 |
Blooming | -0.327 |
Por | -0.315 |
Token | a |
Token ID | 257 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
plin | +0.909 |
Draft | +0.905 |
Blooming | +0.891 |
€ | +0.887 |
Por | +0.850 |
Neg logit contributions | |
nem | -1.038 |
unseen | -1.035 |
uth | -0.963 |
arah | -0.934 |
humiliated | -0.904 |
Token | address |
Token ID | 2209 |
Feature activation | -7.34e-01 |
Pos logit contributions | |
plin | +0.095 |
Draft | +0.095 |
Blooming | +0.093 |
€ | +0.093 |
Por | +0.090 |
Neg logit contributions | |
nem | -0.089 |
unseen | -0.088 |
uth | -0.082 |
arah | -0.078 |
humiliated | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
nem | +0.542 |
unseen | +0.537 |
uth | +0.503 |
arah | +0.476 |
trusted | +0.465 |
Neg logit contributions | |
plin | -0.575 |
Draft | -0.572 |
Blooming | -0.560 |
€ | -0.558 |
Por | -0.535 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
plin | +0.403 |
Draft | +0.402 |
Blooming | +0.391 |
€ | +0.391 |
Por | +0.368 |
Neg logit contributions | |
nem | -0.771 |
unseen | -0.767 |
uth | -0.726 |
arah | -0.703 |
humiliated | -0.693 |
Token | re |
Token ID | 302 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
plin | +0.873 |
Draft | +0.868 |
Blooming | +0.865 |
€ | +0.862 |
Por | +0.830 |
Neg logit contributions | |
nem | -0.960 |
unseen | -0.959 |
uth | -0.882 |
arah | -0.866 |
humiliated | -0.842 |
Token | - |
Token ID | 12 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
plin | +0.931 |
Draft | +0.930 |
Blooming | +0.921 |
€ | +0.919 |
Por | +0.888 |
Neg logit contributions | |
nem | -0.723 |
unseen | -0.720 |
uth | -0.656 |
arah | -0.633 |
humiliated | -0.615 |
Token | enter |
Token ID | 9255 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
plin | +1.589 |
Draft | +1.587 |
Blooming | +1.572 |
€ | +1.570 |
Por | +1.521 |
Neg logit contributions | |
nem | -1.003 |
unseen | -0.998 |
uth | -0.889 |
arah | -0.862 |
humiliated | -0.839 |
Token | . |
Token ID | 13 |
Feature activation | +3.46e-01 |
Pos logit contributions | |
Draft | +3.150 |
plin | +3.143 |
Blooming | +3.133 |
€ | +3.126 |
Por | +2.984 |
Neg logit contributions | |
nem | -3.992 |
unseen | -3.954 |
uth | -3.652 |
arah | -3.608 |
humiliated | -3.563 |
Token | You |
Token ID | 921 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
Draft | +0.230 |
plin | +0.230 |
Blooming | +0.224 |
€ | +0.224 |
Por | +0.213 |
Neg logit contributions | |
nem | -0.294 |
unseen | -0.293 |
uth | -0.275 |
arah | -0.264 |
humiliated | -0.258 |
Token | must |
Token ID | 1276 |
Feature activation | -5.13e-01 |
Pos logit contributions | |
nem | +0.539 |
unseen | +0.538 |
uth | +0.498 |
arah | +0.479 |
humiliated | +0.467 |
Neg logit contributions | |
Draft | -0.568 |
plin | -0.563 |
Blooming | -0.553 |
€ | -0.552 |
Por | -0.533 |
Token | select |
Token ID | 2922 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
unseen | +0.406 |
nem | +0.406 |
uth | +0.379 |
arah | +0.365 |
trusted | +0.356 |
Neg logit contributions | |
Draft | -0.375 |
plin | -0.372 |
€ | -0.363 |
Blooming | -0.361 |
Por | -0.348 |
Token | a |
Token ID | 257 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
plin | +0.879 |
Draft | +0.875 |
Blooming | +0.861 |
€ | +0.857 |
Por | +0.821 |
Neg logit contributions | |
nem | -0.998 |
unseen | -0.996 |
uth | -0.926 |
arah | -0.897 |
humiliated | -0.868 |
Token | increase |
Token ID | 2620 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
nem | +0.234 |
unseen | +0.233 |
uth | +0.214 |
arah | +0.208 |
humiliated | +0.202 |
Neg logit contributions | |
Draft | -0.233 |
plin | -0.233 |
Blooming | -0.230 |
€ | -0.230 |
Por | -0.221 |
Token | of |
Token ID | 286 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
Draft | +0.160 |
plin | +0.160 |
Blooming | +0.158 |
€ | +0.158 |
Por | +0.152 |
Neg logit contributions | |
nem | -0.155 |
unseen | -0.155 |
uth | -0.142 |
arah | -0.138 |
humiliated | -0.134 |
Token | algae |
Token ID | 33773 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
nem | +0.151 |
unseen | +0.149 |
uth | +0.136 |
arah | +0.131 |
humiliated | +0.128 |
Neg logit contributions | |
Draft | -0.148 |
plin | -0.147 |
Blooming | -0.146 |
€ | -0.144 |
Por | -0.138 |
Token | within |
Token ID | 1626 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
nem | +1.669 |
unseen | +1.630 |
uth | +1.516 |
arah | +1.455 |
humiliated | +1.428 |
Neg logit contributions | |
Draft | -1.369 |
plin | -1.359 |
€ | -1.332 |
Blooming | -1.330 |
Por | -1.253 |
Token | a |
Token ID | 257 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
nem | +0.227 |
unseen | +0.225 |
uth | +0.205 |
arah | +0.197 |
humiliated | +0.193 |
Neg logit contributions | |
Draft | -0.261 |
plin | -0.260 |
Blooming | -0.257 |
€ | -0.256 |
Por | -0.246 |
Token | body |
Token ID | 1767 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
Draft | +0.740 |
plin | +0.740 |
Blooming | +0.730 |
€ | +0.728 |
Por | +0.698 |
Neg logit contributions | |
nem | -0.807 |
unseen | -0.803 |
uth | -0.742 |
arah | -0.720 |
humiliated | -0.704 |
Token | of |
Token ID | 286 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
plin | +3.397 |
€ | +3.386 |
Blooming | +3.363 |
Draft | +3.338 |
Por | +3.266 |
Neg logit contributions | |
nem | -3.552 |
unseen | -3.544 |
uth | -3.305 |
arah | -3.263 |
humiliated | -3.145 |
Token | water |
Token ID | 1660 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
plin | +0.953 |
Draft | +0.952 |
Blooming | +0.941 |
€ | +0.939 |
Por | +0.902 |
Neg logit contributions | |
nem | -1.014 |
unseen | -1.011 |
uth | -0.933 |
arah | -0.906 |
humiliated | -0.885 |
Token | , |
Token ID | 11 |
Feature activation | +6.59e-01 |
Pos logit contributions | |
nem | +0.013 |
unseen | +0.013 |
uth | +0.012 |
arah | +0.011 |
humiliated | +0.011 |
Neg logit contributions | |
Draft | -0.013 |
plin | -0.013 |
Blooming | -0.012 |
€ | -0.012 |
Por | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
Draft | +0.515 |
plin | +0.514 |
Blooming | +0.508 |
€ | +0.507 |
Por | +0.487 |
Neg logit contributions | |
nem | -0.490 |
unseen | -0.489 |
uth | -0.448 |
arah | -0.433 |
humiliated | -0.422 |
Token | spread |
Token ID | 4104 |
Feature activation | +2.44e-01 |
Pos logit contributions | |
Draft | +0.792 |
plin | +0.790 |
Blooming | +0.782 |
€ | +0.778 |
Por | +0.748 |
Neg logit contributions | |
nem | -0.840 |
unseen | -0.836 |
uth | -0.770 |
arah | -0.745 |
humiliated | -0.728 |
Token | address |
Token ID | 2209 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
plin | +0.105 |
Draft | +0.105 |
Blooming | +0.104 |
€ | +0.103 |
Por | +0.099 |
Neg logit contributions | |
nem | -0.097 |
unseen | -0.097 |
uth | -0.089 |
arah | -0.086 |
humiliated | -0.083 |
Token | . |
Token ID | 13 |
Feature activation | +6.74e-01 |
Pos logit contributions | |
nem | +0.314 |
unseen | +0.312 |
uth | +0.291 |
arah | +0.276 |
trusted | +0.270 |
Neg logit contributions | |
plin | -0.330 |
Draft | -0.329 |
Blooming | -0.323 |
€ | -0.322 |
Por | -0.308 |
Token | Please |
Token ID | 4222 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
plin | +0.354 |
Draft | +0.353 |
Blooming | +0.343 |
€ | +0.343 |
Por | +0.322 |
Neg logit contributions | |
nem | -0.672 |
unseen | -0.669 |
uth | -0.632 |
arah | -0.612 |
humiliated | -0.603 |
Token | re |
Token ID | 302 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
plin | +0.949 |
Draft | +0.944 |
Blooming | +0.941 |
€ | +0.939 |
Por | +0.904 |
Neg logit contributions | |
unseen | -1.051 |
nem | -1.050 |
uth | -0.966 |
arah | -0.951 |
humiliated | -0.923 |
Token | - |
Token ID | 12 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
plin | +0.912 |
Draft | +0.911 |
Blooming | +0.902 |
€ | +0.900 |
Por | +0.870 |
Neg logit contributions | |
nem | -0.707 |
unseen | -0.705 |
uth | -0.642 |
arah | -0.620 |
humiliated | -0.602 |
Token | enter |
Token ID | 9255 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
plin | +1.711 |
Draft | +1.709 |
Blooming | +1.692 |
€ | +1.691 |
Por | +1.638 |
Neg logit contributions | |
nem | -1.094 |
unseen | -1.087 |
uth | -0.968 |
arah | -0.941 |
humiliated | -0.917 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Draft | +3.096 |
plin | +3.088 |
Blooming | +3.074 |
€ | +3.072 |
Por | +2.928 |
Neg logit contributions | |
nem | -3.911 |
unseen | -3.873 |
uth | -3.578 |
arah | -3.534 |
humiliated | -3.491 |
Token | You |
Token ID | 921 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
plin | +0.124 |
Draft | +0.123 |
€ | +0.120 |
Blooming | +0.120 |
Por | +0.114 |
Neg logit contributions | |
nem | -0.154 |
unseen | -0.154 |
uth | -0.144 |
arah | -0.138 |
humiliated | -0.135 |
Token | must |
Token ID | 1276 |
Feature activation | -2.73e-01 |
Pos logit contributions | |
nem | +0.454 |
unseen | +0.454 |
uth | +0.419 |
arah | +0.403 |
humiliated | +0.393 |
Neg logit contributions | |
Draft | -0.481 |
plin | -0.477 |
Blooming | -0.469 |
€ | -0.468 |
Por | -0.452 |
Token | select |
Token ID | 2922 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
nem | +0.217 |
unseen | +0.217 |
uth | +0.203 |
arah | +0.195 |
trusted | +0.190 |
Neg logit contributions | |
Draft | -0.198 |
plin | -0.197 |
€ | -0.193 |
Blooming | -0.192 |
Por | -0.185 |
Token | a |
Token ID | 257 |
Feature activation | +1.90e+00 |
Pos logit contributions | |
plin | +0.963 |
Draft | +0.959 |
Blooming | +0.943 |
€ | +0.939 |
Por | +0.900 |
Neg logit contributions | |
nem | -1.097 |
unseen | -1.094 |
uth | -1.017 |
arah | -0.986 |
humiliated | -0.955 |
Token | , |
Token ID | 11 |
Feature activation | -2.63e-02 |
Pos logit contributions | |
Draft | +0.277 |
plin | +0.277 |
Blooming | +0.274 |
€ | +0.271 |
Por | +0.262 |
Neg logit contributions | |
nem | -0.248 |
unseen | -0.247 |
uth | -0.225 |
arah | -0.217 |
humiliated | -0.213 |
Token | renegoti |
Token ID | 48312 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
unseen | +0.020 |
nem | +0.020 |
uth | +0.018 |
arah | +0.017 |
humiliated | +0.017 |
Neg logit contributions | |
plin | -0.021 |
Draft | -0.021 |
Blooming | -0.020 |
€ | -0.020 |
Por | -0.019 |
Token | ated |
Token ID | 515 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
plin | +1.043 |
Draft | +1.042 |
€ | +1.031 |
Blooming | +1.031 |
Por | +0.990 |
Neg logit contributions | |
nem | -0.909 |
unseen | -0.905 |
uth | -0.822 |
arah | -0.800 |
humiliated | -0.778 |
Token | or |
Token ID | 393 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
plin | +1.060 |
Draft | +1.059 |
Blooming | +1.048 |
€ | +1.047 |
Por | +1.008 |
Neg logit contributions | |
nem | -0.981 |
unseen | -0.978 |
uth | -0.898 |
arah | -0.871 |
humiliated | -0.848 |
Token | rem |
Token ID | 816 |
Feature activation | +2.11e+00 |
Pos logit contributions | |
plin | +1.023 |
Draft | +1.021 |
Blooming | +1.010 |
€ | +1.005 |
Por | +0.967 |
Neg logit contributions | |
nem | -1.091 |
unseen | -1.089 |
uth | -1.004 |
arah | -0.973 |
humiliated | -0.955 |
Token | ade |
Token ID | 671 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
plin | +1.750 |
Draft | +1.744 |
€ | +1.732 |
Blooming | +1.723 |
Por | +1.660 |
Neg logit contributions | |
nem | -1.468 |
unseen | -1.461 |
uth | -1.320 |
arah | -1.281 |
humiliated | -1.257 |
Token | . |
Token ID | 13 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
€ | +3.383 |
plin | +3.359 |
Draft | +3.337 |
Blooming | +3.310 |
Por | +3.217 |
Neg logit contributions | |
nem | -3.527 |
unseen | -3.486 |
uth | -3.274 |
arah | -3.229 |
emet | -3.111 |
Token | How |
Token ID | 1374 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
plin | +0.243 |
Draft | +0.237 |
Blooming | +0.233 |
€ | +0.231 |
Por | +0.222 |
Neg logit contributions | |
nem | -0.259 |
unseen | -0.256 |
uth | -0.238 |
arah | -0.228 |
humiliated | -0.224 |
Token | this |
Token ID | 428 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
unseen | +0.515 |
nem | +0.515 |
uth | +0.471 |
arah | +0.452 |
humiliated | +0.448 |
Neg logit contributions | |
plin | -0.510 |
Draft | -0.508 |
Blooming | -0.500 |
€ | -0.496 |
Por | -0.477 |
Token | is |
Token ID | 318 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
plin | +1.355 |
Draft | +1.349 |
Blooming | +1.333 |
€ | +1.324 |
Por | +1.275 |
Neg logit contributions | |
nem | -1.439 |
unseen | -1.438 |
uth | -1.320 |
arah | -1.277 |
humiliated | -1.257 |
Token | done |
Token ID | 1760 |
Feature activation | +7.69e-01 |
Pos logit contributions | |
plin | +0.904 |
Draft | +0.901 |
Blooming | +0.892 |
€ | +0.886 |
Por | +0.858 |
Neg logit contributions | |
nem | -0.715 |
unseen | -0.715 |
uth | -0.649 |
arah | -0.624 |
humiliated | -0.611 |
Token | completely |
Token ID | 3190 |
Feature activation | -9.30e-01 |
Pos logit contributions | |
plin | +0.547 |
Draft | +0.546 |
Blooming | +0.540 |
€ | +0.539 |
Por | +0.519 |
Neg logit contributions | |
nem | -0.498 |
unseen | -0.497 |
uth | -0.455 |
arah | -0.440 |
humiliated | -0.430 |
Token | criminal |
Token ID | 4301 |
Feature activation | +8.14e-01 |
Pos logit contributions | |
unseen | +0.693 |
nem | +0.690 |
uth | +0.629 |
arah | +0.606 |
humiliated | +0.599 |
Neg logit contributions | |
plin | -0.730 |
Draft | -0.729 |
Blooming | -0.720 |
€ | -0.716 |
Por | -0.691 |
Token | . |
Token ID | 13 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
plin | +0.610 |
Draft | +0.609 |
Blooming | +0.603 |
€ | +0.601 |
Por | +0.578 |
Neg logit contributions | |
nem | -0.629 |
unseen | -0.627 |
uth | -0.579 |
arah | -0.562 |
humiliated | -0.548 |
Token | And |
Token ID | 843 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
plin | +0.155 |
Draft | +0.152 |
Blooming | +0.150 |
€ | +0.150 |
Por | +0.142 |
Neg logit contributions | |
nem | -0.190 |
unseen | -0.188 |
uth | -0.175 |
arah | -0.169 |
humiliated | -0.166 |
Token | even |
Token ID | 772 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
nem | +0.404 |
unseen | +0.403 |
uth | +0.367 |
arah | +0.352 |
humiliated | +0.351 |
Neg logit contributions | |
Draft | -0.408 |
plin | -0.408 |
Blooming | -0.402 |
€ | -0.399 |
Por | -0.383 |
Token | then |
Token ID | 788 |
Feature activation | +4.57e+00 |
Pos logit contributions | |
Draft | +0.452 |
plin | +0.451 |
Blooming | +0.445 |
€ | +0.444 |
Por | +0.425 |
Neg logit contributions | |
nem | -0.477 |
unseen | -0.476 |
uth | -0.436 |
arah | -0.422 |
humiliated | -0.417 |
Token | , |
Token ID | 11 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
plin | +3.192 |
Draft | +3.183 |
€ | +3.158 |
Blooming | +3.146 |
Por | +3.029 |
Neg logit contributions | |
nem | -3.697 |
unseen | -3.676 |
uth | -3.423 |
arah | -3.370 |
humiliated | -3.247 |
Token | it |
Token ID | 340 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
unseen | +0.368 |
nem | +0.368 |
uth | +0.335 |
arah | +0.320 |
humiliated | +0.320 |
Neg logit contributions | |
Draft | -0.374 |
plin | -0.373 |
Blooming | -0.369 |
€ | -0.366 |
Por | -0.352 |
Token | is |
Token ID | 318 |
Feature activation | -4.10e-02 |
Pos logit contributions | |
nem | +0.313 |
unseen | +0.312 |
uth | +0.286 |
arah | +0.274 |
humiliated | +0.272 |
Neg logit contributions | |
Draft | -0.329 |
plin | -0.327 |
Blooming | -0.323 |
€ | -0.320 |
Por | -0.309 |
Token | hard |
Token ID | 1327 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
unseen | +0.032 |
nem | +0.032 |
uth | +0.029 |
arah | +0.028 |
humiliated | +0.028 |
Neg logit contributions | |
Draft | -0.031 |
plin | -0.030 |
Blooming | -0.030 |
€ | -0.030 |
Por | -0.029 |
Token | to |
Token ID | 284 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
plin | +0.116 |
Draft | +0.116 |
Blooming | +0.115 |
€ | +0.115 |
Por | +0.111 |
Neg logit contributions | |
nem | -0.107 |
unseen | -0.106 |
uth | -0.098 |
arah | -0.095 |
humiliated | -0.092 |
Token | better |
Token ID | 1365 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
unseen | +0.645 |
nem | +0.645 |
uth | +0.591 |
arah | +0.569 |
humiliated | +0.560 |
Neg logit contributions | |
Draft | -0.652 |
plin | -0.646 |
Blooming | -0.641 |
€ | -0.637 |
Por | -0.614 |
Token | . |
Token ID | 13 |
Feature activation | -4.76e-02 |
Pos logit contributions | |
nem | +0.283 |
unseen | +0.283 |
uth | +0.260 |
arah | +0.250 |
humiliated | +0.245 |
Neg logit contributions | |
Draft | -0.282 |
plin | -0.281 |
Blooming | -0.278 |
€ | -0.276 |
Por | -0.266 |
Token |
|
Token ID | 198 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
nem | +0.037 |
unseen | +0.036 |
uth | +0.034 |
arah | +0.032 |
humiliated | +0.032 |
Neg logit contributions | |
plin | -0.036 |
Draft | -0.036 |
Blooming | -0.035 |
€ | -0.035 |
Por | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
nem | +0.273 |
unseen | +0.272 |
uth | +0.250 |
arah | +0.239 |
humiliated | +0.230 |
Neg logit contributions | |
plin | -0.347 |
Draft | -0.342 |
Blooming | -0.340 |
€ | -0.337 |
Por | -0.326 |
Token | Why |
Token ID | 5195 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
nem | +0.141 |
unseen | +0.140 |
uth | +0.131 |
arah | +0.127 |
humiliated | +0.123 |
Neg logit contributions | |
plin | -0.135 |
Blooming | -0.134 |
€ | -0.133 |
Draft | -0.132 |
Por | -0.128 |
Token | then |
Token ID | 788 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
Draft | +0.252 |
plin | +0.252 |
Blooming | +0.247 |
€ | +0.246 |
Por | +0.236 |
Neg logit contributions | |
nem | -0.285 |
unseen | -0.285 |
uth | -0.263 |
arah | -0.255 |
humiliated | -0.250 |
Token | , |
Token ID | 11 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
plin | +3.329 |
Draft | +3.299 |
€ | +3.290 |
Blooming | +3.281 |
Por | +3.162 |
Neg logit contributions | |
nem | -3.511 |
unseen | -3.485 |
uth | -3.244 |
arah | -3.153 |
humiliated | -3.065 |
Token | are |
Token ID | 389 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
Draft | +0.639 |
plin | +0.638 |
Blooming | +0.630 |
€ | +0.628 |
Por | +0.605 |
Neg logit contributions | |
nem | -0.617 |
unseen | -0.615 |
uth | -0.565 |
arah | -0.547 |
humiliated | -0.535 |
Token | some |
Token ID | 617 |
Feature activation | -8.71e-01 |
Pos logit contributions | |
nem | +0.950 |
unseen | +0.944 |
uth | +0.872 |
arah | +0.837 |
humiliated | +0.820 |
Neg logit contributions | |
Draft | -0.920 |
plin | -0.917 |
Blooming | -0.907 |
€ | -0.903 |
Por | -0.868 |
Token | people |
Token ID | 661 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
nem | +0.678 |
unseen | +0.676 |
uth | +0.621 |
arah | +0.594 |
humiliated | +0.587 |
Neg logit contributions | |
Draft | -0.655 |
plin | -0.651 |
Blooming | -0.642 |
€ | -0.636 |
Por | -0.615 |
Token | testing |
Token ID | 4856 |
Feature activation | +6.15e-02 |
Pos logit contributions | |
Draft | +0.166 |
plin | +0.166 |
Blooming | +0.164 |
€ | +0.163 |
Por | +0.157 |
Neg logit contributions | |
nem | -0.159 |
unseen | -0.159 |
uth | -0.145 |
arah | -0.141 |
humiliated | -0.138 |
Token |
|
Token ID | 198 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
nem | +1.034 |
unseen | +1.032 |
uth | +0.946 |
arah | +0.904 |
humiliated | +0.881 |
Neg logit contributions | |
Draft | -1.206 |
plin | -1.203 |
Blooming | -1.191 |
€ | -1.182 |
Por | -1.143 |
Token |
|
Token ID | 198 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
nem | +0.895 |
unseen | +0.894 |
uth | +0.820 |
arah | +0.777 |
trusted | +0.744 |
Neg logit contributions | |
plin | -1.193 |
Draft | -1.175 |
Blooming | -1.167 |
€ | -1.150 |
Por | -1.121 |
Token | pub |
Token ID | 12984 |
Feature activation | -6.50e-01 |
Pos logit contributions | |
nem | +1.082 |
unseen | +1.078 |
uth | +1.005 |
arah | +0.974 |
humiliated | +0.933 |
Neg logit contributions | |
plin | -1.101 |
Blooming | -1.098 |
Draft | -1.092 |
€ | -1.084 |
Por | -1.049 |
Token | struct |
Token ID | 2878 |
Feature activation | -8.10e-01 |
Pos logit contributions | |
nem | +0.590 |
unseen | +0.589 |
uth | +0.550 |
arah | +0.535 |
humiliated | +0.524 |
Neg logit contributions | |
plin | -0.400 |
Draft | -0.399 |
Blooming | -0.394 |
€ | -0.392 |
Por | -0.372 |
Token | Guard |
Token ID | 4932 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
nem | +0.677 |
unseen | +0.673 |
uth | +0.624 |
arah | +0.605 |
humiliated | +0.591 |
Neg logit contributions | |
Draft | -0.562 |
plin | -0.561 |
€ | -0.551 |
Blooming | -0.549 |
Por | -0.522 |
Token | { |
Token ID | 1391 |
Feature activation | +4.50e+00 |
Pos logit contributions | |
plin | +0.128 |
Draft | +0.128 |
Blooming | +0.126 |
€ | +0.126 |
Por | +0.121 |
Neg logit contributions | |
nem | -0.126 |
unseen | -0.126 |
uth | -0.116 |
arah | -0.113 |
humiliated | -0.110 |
Token | ... |
Token ID | 2644 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
€ | +3.175 |
Draft | +3.159 |
plin | +3.153 |
Blooming | +3.148 |
Por | +3.066 |
Neg logit contributions | |
nem | -3.547 |
unseen | -3.529 |
uth | -3.317 |
arah | -3.231 |
humiliated | -3.160 |
Token | } |
Token ID | 1782 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
plin | +0.678 |
Draft | +0.676 |
Blooming | +0.668 |
€ | +0.665 |
Por | +0.637 |
Neg logit contributions | |
nem | -0.833 |
unseen | -0.831 |
uth | -0.771 |
arah | -0.749 |
humiliated | -0.733 |
Token | pub |
Token ID | 2240 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
nem | +0.848 |
unseen | +0.845 |
uth | +0.774 |
arah | +0.746 |
humiliated | +0.727 |
Neg logit contributions | |
plin | -0.888 |
Draft | -0.882 |
Blooming | -0.876 |
€ | -0.868 |
Por | -0.834 |
Token | fn |
Token ID | 24714 |
Feature activation | -5.49e-01 |
Pos logit contributions | |
nem | +0.229 |
unseen | +0.229 |
uth | +0.213 |
arah | +0.208 |
humiliated | +0.204 |
Neg logit contributions | |
plin | -0.161 |
Draft | -0.160 |
Blooming | -0.158 |
€ | -0.158 |
Por | -0.151 |
Token | pin |
Token ID | 6757 |
Feature activation | -5.96e-01 |
Pos logit contributions | |
nem | +0.397 |
unseen | +0.396 |
uth | +0.361 |
arah | +0.348 |
humiliated | +0.341 |
Neg logit contributions | |
Draft | -0.443 |
plin | -0.443 |
Blooming | -0.436 |
€ | -0.435 |
Por | -0.418 |
Token | applies |
Token ID | 8991 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
plin | +0.923 |
Draft | +0.922 |
Blooming | +0.912 |
€ | +0.910 |
Por | +0.876 |
Neg logit contributions | |
nem | -0.904 |
unseen | -0.902 |
uth | -0.830 |
arah | -0.805 |
humiliated | -0.785 |
Token | to |
Token ID | 284 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
plin | +0.258 |
Draft | +0.258 |
Blooming | +0.254 |
€ | +0.252 |
Por | +0.244 |
Neg logit contributions | |
unseen | -0.234 |
nem | -0.234 |
uth | -0.214 |
arah | -0.206 |
humiliated | -0.202 |
Token | not |
Token ID | 407 |
Feature activation | +4.82e-01 |
Pos logit contributions | |
plin | +0.151 |
Draft | +0.151 |
Blooming | +0.149 |
€ | +0.148 |
Por | +0.143 |
Neg logit contributions | |
nem | -0.139 |
unseen | -0.139 |
uth | -0.127 |
arah | -0.123 |
humiliated | -0.120 |
Token | only |
Token ID | 691 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
plin | +0.353 |
Draft | +0.352 |
Blooming | +0.348 |
€ | +0.347 |
Por | +0.333 |
Neg logit contributions | |
nem | -0.381 |
unseen | -0.381 |
uth | -0.352 |
arah | -0.341 |
humiliated | -0.334 |
Token | sex |
Token ID | 1714 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
plin | +0.091 |
Draft | +0.091 |
Blooming | +0.089 |
€ | +0.089 |
Por | +0.086 |
Neg logit contributions | |
nem | -0.085 |
unseen | -0.085 |
uth | -0.078 |
arah | -0.076 |
humiliated | -0.074 |
Token | but |
Token ID | 475 |
Feature activation | +4.49e+00 |
Pos logit contributions | |
nem | +0.010 |
unseen | +0.010 |
uth | +0.009 |
arah | +0.009 |
humiliated | +0.008 |
Neg logit contributions | |
Draft | -0.009 |
plin | -0.009 |
Blooming | -0.009 |
€ | -0.009 |
Por | -0.009 |
Token | also |
Token ID | 635 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
€ | +3.319 |
Blooming | +3.303 |
plin | +3.292 |
Draft | +3.287 |
Por | +3.175 |
Neg logit contributions | |
unseen | -3.425 |
nem | -3.425 |
uth | -3.171 |
arah | -3.091 |
emet | -3.009 |
Token | race |
Token ID | 3234 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
plin | +1.136 |
Draft | +1.135 |
Blooming | +1.124 |
€ | +1.123 |
Por | +1.080 |
Neg logit contributions | |
nem | -1.116 |
unseen | -1.113 |
uth | -1.025 |
arah | -0.996 |
humiliated | -0.969 |
Token | . |
Token ID | 13 |
Feature activation | +8.84e-01 |
Pos logit contributions | |
unseen | +0.913 |
nem | +0.911 |
uth | +0.838 |
arah | +0.807 |
humiliated | +0.789 |
Neg logit contributions | |
plin | -0.965 |
Draft | -0.963 |
Blooming | -0.952 |
€ | -0.947 |
Por | -0.911 |
Token | � |
Token ID | 447 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
plin | +0.681 |
Draft | +0.674 |
€ | +0.665 |
Blooming | +0.665 |
Por | +0.636 |
Neg logit contributions | |
nem | -0.669 |
unseen | -0.665 |
uth | -0.617 |
arah | -0.596 |
humiliated | -0.580 |
Token | � |
Token ID | 251 |
Feature activation | -5.55e-01 |
Pos logit contributions | |
plin | +0.507 |
Draft | +0.506 |
€ | +0.501 |
Blooming | +0.501 |
Por | +0.484 |
Neg logit contributions | |
nem | -0.386 |
unseen | -0.385 |
uth | -0.351 |
arah | -0.339 |
humiliated | -0.328 |
Token | hes |
Token ID | 956 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
Draft | +0.308 |
plin | +0.307 |
Blooming | +0.304 |
€ | +0.303 |
Por | +0.292 |
Neg logit contributions | |
nem | -0.306 |
unseen | -0.305 |
uth | -0.282 |
arah | -0.274 |
humiliated | -0.265 |
Token |
|
Token ID | 198 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
plin | +0.222 |
Draft | +0.222 |
Blooming | +0.220 |
€ | +0.219 |
Por | +0.211 |
Neg logit contributions | |
nem | -0.208 |
unseen | -0.208 |
uth | -0.191 |
arah | -0.185 |
humiliated | -0.180 |
Token |
|
Token ID | 198 |
Feature activation | -3.06e-01 |
Pos logit contributions | |
nem | +0.399 |
unseen | +0.398 |
uth | +0.365 |
arah | +0.349 |
humiliated | +0.335 |
Neg logit contributions | |
plin | -0.509 |
Draft | -0.504 |
Blooming | -0.499 |
€ | -0.495 |
Por | -0.480 |
Token | If |
Token ID | 1532 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
nem | +0.224 |
unseen | +0.223 |
uth | +0.208 |
arah | +0.201 |
humiliated | +0.193 |
Neg logit contributions | |
plin | -0.241 |
Blooming | -0.240 |
€ | -0.238 |
Draft | -0.238 |
Por | -0.230 |
Token | you |
Token ID | 345 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
plin | +0.215 |
Draft | +0.215 |
Blooming | +0.212 |
€ | +0.211 |
Por | +0.203 |
Neg logit contributions | |
nem | -0.228 |
unseen | -0.228 |
uth | -0.210 |
arah | -0.204 |
humiliated | -0.199 |
Token | liked |
Token ID | 8288 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
Draft | +0.382 |
plin | +0.382 |
Blooming | +0.377 |
€ | +0.376 |
Por | +0.362 |
Neg logit contributions | |
nem | -0.367 |
unseen | -0.366 |
uth | -0.336 |
arah | -0.325 |
humiliated | -0.319 |
Token | that |
Token ID | 326 |
Feature activation | +8.17e-01 |
Pos logit contributions | |
plin | +3.322 |
Blooming | +3.317 |
Draft | +3.312 |
€ | +3.296 |
Por | +3.188 |
Neg logit contributions | |
nem | -3.415 |
unseen | -3.398 |
uth | -3.153 |
arah | -3.070 |
humiliated | -2.987 |
Token | you |
Token ID | 345 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
Draft | +0.591 |
plin | +0.589 |
Blooming | +0.581 |
€ | +0.578 |
Por | +0.555 |
Neg logit contributions | |
unseen | -0.655 |
nem | -0.655 |
uth | -0.603 |
arah | -0.587 |
humiliated | -0.574 |
Token | might |
Token ID | 1244 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Draft | +0.189 |
plin | +0.188 |
Blooming | +0.186 |
€ | +0.184 |
Por | +0.177 |
Neg logit contributions | |
nem | -0.231 |
unseen | -0.230 |
uth | -0.214 |
arah | -0.208 |
humiliated | -0.204 |
Token | like |
Token ID | 588 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
Draft | +0.766 |
plin | +0.764 |
Blooming | +0.756 |
€ | +0.752 |
Por | +0.724 |
Neg logit contributions | |
nem | -0.801 |
unseen | -0.798 |
uth | -0.738 |
arah | -0.714 |
humiliated | -0.697 |
Token | these |
Token ID | 777 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
Draft | +1.910 |
plin | +1.908 |
Blooming | +1.896 |
€ | +1.891 |
Por | +1.822 |
Neg logit contributions | |
nem | -1.900 |
unseen | -1.892 |
uth | -1.747 |
arah | -1.698 |
humiliated | -1.657 |
Token | memories |
Token ID | 9846 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
unseen | +0.325 |
nem | +0.324 |
uth | +0.297 |
arah | +0.289 |
humiliated | +0.282 |
Neg logit contributions | |
plin | -0.318 |
Draft | -0.317 |
Blooming | -0.312 |
€ | -0.312 |
Por | -0.299 |
Token | , |
Token ID | 11 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
plin | +0.806 |
Draft | +0.805 |
Blooming | +0.796 |
€ | +0.794 |
Por | +0.763 |
Neg logit contributions | |
nem | -0.833 |
unseen | -0.832 |
uth | -0.767 |
arah | -0.745 |
humiliated | -0.726 |
Token | old |
Token ID | 1468 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
unseen | +0.119 |
nem | +0.119 |
uth | +0.109 |
arah | +0.106 |
humiliated | +0.104 |
Neg logit contributions | |
plin | -0.117 |
Draft | -0.117 |
Blooming | -0.115 |
€ | -0.115 |
Por | -0.110 |
Token | photos |
Token ID | 5205 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
nem | +0.960 |
unseen | +0.956 |
uth | +0.877 |
arah | +0.851 |
humiliated | +0.833 |
Neg logit contributions | |
Draft | -0.917 |
plin | -0.914 |
€ | -0.899 |
Blooming | -0.897 |
Por | -0.859 |
Token | , |
Token ID | 11 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
Draft | +0.173 |
plin | +0.173 |
Blooming | +0.171 |
€ | +0.170 |
Por | +0.164 |
Neg logit contributions | |
unseen | -0.177 |
nem | -0.177 |
uth | -0.163 |
arah | -0.159 |
humiliated | -0.155 |
Token | etc |
Token ID | 3503 |
Feature activation | +4.43e+00 |
Pos logit contributions | |
plin | +0.013 |
Draft | +0.013 |
Blooming | +0.012 |
€ | +0.012 |
Por | +0.012 |
Neg logit contributions | |
unseen | -0.013 |
nem | -0.013 |
uth | -0.012 |
arah | -0.012 |
humiliated | -0.011 |
Token | .? |
Token ID | 40791 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
plin | +3.049 |
Draft | +3.045 |
€ | +3.009 |
Blooming | +3.004 |
Por | +2.879 |
Neg logit contributions | |
nem | -3.628 |
unseen | -3.597 |
uth | -3.346 |
arah | -3.252 |
humiliated | -3.188 |
Token | Want |
Token ID | 16168 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
nem | +0.235 |
unseen | +0.234 |
uth | +0.220 |
arah | +0.214 |
humiliated | +0.209 |
Neg logit contributions | |
plin | -0.156 |
Draft | -0.156 |
Blooming | -0.154 |
€ | -0.153 |
Por | -0.145 |
Token | to |
Token ID | 284 |
Feature activation | -9.58e-01 |
Pos logit contributions | |
plin | +0.634 |
Draft | +0.634 |
Blooming | +0.626 |
€ | +0.625 |
Por | +0.601 |
Neg logit contributions | |
nem | -0.593 |
unseen | -0.592 |
uth | -0.544 |
arah | -0.527 |
humiliated | -0.512 |
Token | write |
Token ID | 3551 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
nem | +0.730 |
unseen | +0.728 |
uth | +0.668 |
arah | +0.647 |
humiliated | +0.632 |
Neg logit contributions | |
Draft | -0.730 |
plin | -0.727 |
Blooming | -0.718 |
€ | -0.717 |
Por | -0.689 |
Token | a |
Token ID | 257 |
Feature activation | -7.30e-01 |
Pos logit contributions | |
Draft | +0.260 |
plin | +0.260 |
€ | +0.256 |
Blooming | +0.256 |
Por | +0.245 |
Neg logit contributions | |
nem | -0.266 |
unseen | -0.266 |
uth | -0.245 |
arah | -0.237 |
humiliated | -0.231 |
Token | chester |
Token ID | 35983 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Draft | +0.065 |
plin | +0.065 |
€ | +0.064 |
Blooming | +0.064 |
Por | +0.061 |
Neg logit contributions | |
nem | -0.059 |
unseen | -0.058 |
uth | -0.054 |
arah | -0.052 |
humiliated | -0.050 |
Token | 1 |
Token ID | 352 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
nem | +1.173 |
unseen | +1.161 |
uth | +1.097 |
arah | +1.052 |
humiliated | +1.031 |
Neg logit contributions | |
plin | -0.952 |
Draft | -0.947 |
€ | -0.924 |
Blooming | -0.923 |
Por | -0.879 |
Token | hour |
Token ID | 1711 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
plin | +0.914 |
Draft | +0.911 |
Blooming | +0.903 |
€ | +0.901 |
Por | +0.872 |
Neg logit contributions | |
nem | -0.644 |
unseen | -0.642 |
uth | -0.581 |
arah | -0.559 |
humiliated | -0.541 |
Token | ago |
Token ID | 2084 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
plin | +0.013 |
Draft | +0.013 |
Blooming | +0.013 |
€ | +0.013 |
Por | +0.012 |
Neg logit contributions | |
nem | -0.010 |
unseen | -0.010 |
uth | -0.009 |
arah | -0.009 |
humiliated | -0.009 |
Token | Pretty |
Token ID | 20090 |
Feature activation | -3.12e-01 |
Pos logit contributions | |
plin | +0.912 |
Draft | +0.908 |
Blooming | +0.892 |
€ | +0.890 |
Por | +0.846 |
Neg logit contributions | |
nem | -1.222 |
unseen | -1.218 |
uth | -1.134 |
arah | -1.103 |
humiliated | -1.083 |
Token | simple |
Token ID | 2829 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
nem | +0.241 |
unseen | +0.241 |
uth | +0.222 |
arah | +0.215 |
humiliated | +0.211 |
Neg logit contributions | |
Draft | -0.235 |
plin | -0.234 |
Blooming | -0.232 |
€ | -0.231 |
Por | -0.221 |
Token | Paul |
Token ID | 3362 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
plin | +3.155 |
€ | +3.147 |
Draft | +3.145 |
Blooming | +3.138 |
Por | +3.025 |
Neg logit contributions | |
nem | -3.443 |
unseen | -3.440 |
uth | -3.201 |
arah | -3.124 |
humiliated | -3.023 |
Token | : |
Token ID | 25 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
Draft | +1.072 |
plin | +1.070 |
Blooming | +1.059 |
€ | +1.054 |
Por | +1.005 |
Neg logit contributions | |
nem | -1.161 |
unseen | -1.154 |
uth | -1.071 |
arah | -1.034 |
humiliated | -1.013 |
Token |
|
Token ID | 198 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
plin | +1.245 |
Draft | +1.242 |
Blooming | +1.228 |
€ | +1.224 |
Por | +1.172 |
Neg logit contributions | |
nem | -1.467 |
unseen | -1.464 |
uth | -1.358 |
arah | -1.319 |
humiliated | -1.291 |
Token |
|
Token ID | 198 |
Feature activation | +9.87e-01 |
Pos logit contributions | |
plin | +0.981 |
Draft | +0.979 |
Blooming | +0.969 |
€ | +0.967 |
Por | +0.932 |
Neg logit contributions | |
nem | -0.855 |
unseen | -0.852 |
uth | -0.781 |
arah | -0.755 |
humiliated | -0.735 |
Token | These |
Token ID | 4711 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
plin | +0.769 |
Draft | +0.762 |
Blooming | +0.762 |
€ | +0.758 |
Por | +0.729 |
Neg logit contributions | |
nem | -0.733 |
unseen | -0.731 |
uth | -0.676 |
arah | -0.655 |
humiliated | -0.636 |
Token | representative |
Token ID | 8852 |
Feature activation | -8.27e-02 |
Pos logit contributions | |
nem | +0.222 |
unseen | +0.220 |
uth | +0.202 |
arah | +0.196 |
humiliated | +0.193 |
Neg logit contributions | |
plin | -0.213 |
Draft | -0.212 |
Blooming | -0.209 |
€ | -0.209 |
Por | -0.200 |
Token | of |
Token ID | 286 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
nem | +0.064 |
unseen | +0.064 |
uth | +0.059 |
arah | +0.057 |
humiliated | +0.056 |
Neg logit contributions | |
Draft | -0.062 |
plin | -0.062 |
Blooming | -0.061 |
€ | -0.061 |
Por | -0.058 |
Token | the |
Token ID | 262 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
plin | +0.136 |
Draft | +0.136 |
Blooming | +0.133 |
€ | +0.133 |
Por | +0.128 |
Neg logit contributions | |
unseen | -0.132 |
nem | -0.131 |
uth | -0.121 |
arah | -0.116 |
humiliated | -0.114 |
Token | Democratic |
Token ID | 4390 |
Feature activation | -9.14e-01 |
Pos logit contributions | |
plin | +0.109 |
Draft | +0.108 |
Blooming | +0.106 |
€ | +0.106 |
Por | +0.102 |
Neg logit contributions | |
unseen | -0.106 |
nem | -0.106 |
uth | -0.097 |
arah | -0.094 |
humiliated | -0.092 |
Token | Party |
Token ID | 3615 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
nem | +0.741 |
unseen | +0.740 |
uth | +0.689 |
arah | +0.660 |
humiliated | +0.649 |
Neg logit contributions | |
plin | -0.659 |
Draft | -0.653 |
€ | -0.641 |
Blooming | -0.641 |
Por | -0.611 |
Token | but |
Token ID | 475 |
Feature activation | +4.39e+00 |
Pos logit contributions | |
nem | +0.242 |
unseen | +0.241 |
uth | +0.224 |
arah | +0.216 |
humiliated | +0.212 |
Neg logit contributions | |
plin | -0.235 |
Draft | -0.235 |
Blooming | -0.231 |
€ | -0.231 |
Por | -0.220 |
Token | as |
Token ID | 355 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
Blooming | +3.239 |
€ | +3.233 |
plin | +3.222 |
Draft | +3.206 |
Por | +3.113 |
Neg logit contributions | |
nem | -3.332 |
unseen | -3.328 |
uth | -3.078 |
arah | -3.004 |
humiliated | -2.922 |
Token | an |
Token ID | 281 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
Draft | +0.341 |
plin | +0.341 |
€ | +0.335 |
Blooming | +0.334 |
Por | +0.320 |
Neg logit contributions | |
nem | -0.379 |
unseen | -0.378 |
uth | -0.350 |
arah | -0.338 |
humiliated | -0.331 |
Token | up |
Token ID | 510 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
unseen | +0.115 |
nem | +0.115 |
uth | +0.104 |
arah | +0.100 |
humiliated | +0.098 |
Neg logit contributions | |
plin | -0.136 |
Draft | -0.135 |
€ | -0.133 |
Blooming | -0.133 |
Por | -0.128 |
Token | holder |
Token ID | 13829 |
Feature activation | +6.62e-01 |
Pos logit contributions | |
nem | +0.171 |
unseen | +0.171 |
uth | +0.154 |
arah | +0.148 |
humiliated | +0.143 |
Neg logit contributions | |
plin | -0.264 |
Draft | -0.264 |
Blooming | -0.261 |
€ | -0.261 |
Por | -0.252 |
Token | of |
Token ID | 286 |
Feature activation | +7.26e-01 |
Pos logit contributions | |
plin | +0.490 |
Draft | +0.489 |
Blooming | +0.483 |
€ | +0.481 |
Por | +0.461 |
Neg logit contributions | |
nem | -0.521 |
unseen | -0.519 |
uth | -0.479 |
arah | -0.465 |
humiliated | -0.453 |
Token | l |
Token ID | 75 |
Feature activation | -8.95e-02 |
Pos logit contributions | |
nem | +0.677 |
unseen | +0.670 |
uth | +0.625 |
arah | +0.603 |
humiliated | +0.576 |
Neg logit contributions | |
Draft | -0.812 |
plin | -0.811 |
Blooming | -0.802 |
€ | -0.800 |
Por | -0.773 |
Token | ange |
Token ID | 858 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
nem | +0.044 |
unseen | +0.043 |
uth | +0.039 |
arah | +0.036 |
humiliated | +0.034 |
Neg logit contributions | |
Draft | -0.093 |
plin | -0.092 |
Blooming | -0.092 |
€ | -0.091 |
Por | -0.089 |
Token | , |
Token ID | 11 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
plin | +0.710 |
Draft | +0.710 |
Blooming | +0.697 |
€ | +0.696 |
Por | +0.667 |
Neg logit contributions | |
unseen | -0.727 |
nem | -0.724 |
uth | -0.666 |
arah | -0.642 |
humiliated | -0.628 |
Token | the |
Token ID | 262 |
Feature activation | +4.55e-01 |
Pos logit contributions | |
Draft | +0.188 |
plin | +0.188 |
Blooming | +0.185 |
€ | +0.184 |
Por | +0.177 |
Neg logit contributions | |
unseen | -0.187 |
nem | -0.187 |
uth | -0.171 |
arah | -0.164 |
humiliated | -0.162 |
Token | j |
Token ID | 474 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
Draft | +0.326 |
plin | +0.326 |
Blooming | +0.319 |
€ | +0.319 |
Por | +0.305 |
Neg logit contributions | |
nem | -0.370 |
unseen | -0.370 |
uth | -0.339 |
arah | -0.328 |
humiliated | -0.323 |
Token | umble |
Token ID | 10344 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
nem | +0.085 |
unseen | +0.085 |
uth | +0.077 |
arah | +0.074 |
humiliated | +0.072 |
Neg logit contributions | |
Draft | -0.122 |
plin | -0.122 |
Blooming | -0.121 |
€ | -0.121 |
Por | -0.117 |
Token | of |
Token ID | 286 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
plin | +3.069 |
Draft | +3.058 |
Blooming | +3.036 |
€ | +3.025 |
Por | +2.909 |
Neg logit contributions | |
nem | -3.569 |
unseen | -3.548 |
uth | -3.306 |
arah | -3.227 |
humiliated | -3.143 |
Token | floating |
Token ID | 12462 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
Draft | +0.697 |
plin | +0.697 |
Blooming | +0.685 |
€ | +0.683 |
Por | +0.653 |
Neg logit contributions | |
nem | -0.847 |
unseen | -0.846 |
uth | -0.779 |
arah | -0.757 |
humiliated | -0.744 |
Token | ice |
Token ID | 4771 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
nem | +0.365 |
unseen | +0.364 |
uth | +0.334 |
arah | +0.323 |
humiliated | +0.320 |
Neg logit contributions | |
Draft | -0.280 |
plin | -0.279 |
Blooming | -0.272 |
€ | -0.271 |
Por | -0.258 |
Token | downstream |
Token ID | 33218 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
nem | +0.312 |
unseen | +0.312 |
uth | +0.285 |
arah | +0.275 |
humiliated | +0.271 |
Neg logit contributions | |
Draft | -0.299 |
plin | -0.299 |
Blooming | -0.294 |
€ | -0.293 |
Por | -0.282 |
Token | from |
Token ID | 422 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
plin | +0.200 |
Draft | +0.200 |
Blooming | +0.195 |
€ | +0.195 |
Por | +0.188 |
Neg logit contributions | |
unseen | -0.198 |
nem | -0.196 |
uth | -0.178 |
arah | -0.172 |
humiliated | -0.171 |
Token | a |
Token ID | 257 |
Feature activation | +6.68e-02 |
Pos logit contributions | |
Draft | +0.304 |
plin | +0.304 |
Blooming | +0.299 |
€ | +0.298 |
Por | +0.286 |
Neg logit contributions | |
nem | -0.328 |
unseen | -0.327 |
uth | -0.301 |
arah | -0.291 |
humiliated | -0.286 |
Token | financial |
Token ID | 3176 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
plin | +0.053 |
Draft | +0.053 |
Blooming | +0.052 |
€ | +0.052 |
Por | +0.050 |
Neg logit contributions | |
nem | -0.049 |
unseen | -0.049 |
uth | -0.045 |
arah | -0.043 |
humiliated | -0.042 |
Token | institution |
Token ID | 9901 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
plin | +0.515 |
Draft | +0.514 |
Blooming | +0.508 |
€ | +0.507 |
Por | +0.491 |
Neg logit contributions | |
nem | -0.357 |
unseen | -0.356 |
uth | -0.321 |
arah | -0.308 |
humiliated | -0.300 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
plin | +0.367 |
Draft | +0.366 |
Blooming | +0.360 |
€ | +0.359 |
Por | +0.345 |
Neg logit contributions | |
unseen | -0.382 |
nem | -0.382 |
uth | -0.351 |
arah | -0.339 |
humiliated | -0.334 |
Token | Even |
Token ID | 3412 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
nem | +0.134 |
unseen | +0.132 |
uth | +0.124 |
arah | +0.120 |
humiliated | +0.117 |
Neg logit contributions | |
plin | -0.100 |
Draft | -0.099 |
Blooming | -0.096 |
€ | -0.096 |
Por | -0.091 |
Token | then |
Token ID | 788 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
Draft | +0.151 |
plin | +0.151 |
Blooming | +0.148 |
€ | +0.148 |
Por | +0.142 |
Neg logit contributions | |
nem | -0.169 |
unseen | -0.168 |
uth | -0.155 |
arah | -0.150 |
humiliated | -0.148 |
Token | we |
Token ID | 356 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
plin | +2.927 |
€ | +2.925 |
Blooming | +2.917 |
Draft | +2.911 |
Por | +2.792 |
Neg logit contributions | |
unseen | -3.658 |
nem | -3.657 |
uth | -3.413 |
arah | -3.358 |
humiliated | -3.241 |
Token | were |
Token ID | 547 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
plin | +0.244 |
Draft | +0.244 |
Blooming | +0.241 |
€ | +0.240 |
Por | +0.232 |
Neg logit contributions | |
nem | -0.193 |
unseen | -0.192 |
uth | -0.175 |
arah | -0.168 |
humiliated | -0.165 |
Token | storing |
Token ID | 23069 |
Feature activation | +8.35e-01 |
Pos logit contributions | |
nem | +0.186 |
unseen | +0.185 |
uth | +0.170 |
arah | +0.165 |
humiliated | +0.163 |
Neg logit contributions | |
plin | -0.177 |
Draft | -0.176 |
Blooming | -0.173 |
€ | -0.172 |
Por | -0.166 |
Token | tens |
Token ID | 11192 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
plin | +0.640 |
Draft | +0.639 |
Blooming | +0.630 |
€ | +0.627 |
Por | +0.605 |
Neg logit contributions | |
nem | -0.633 |
unseen | -0.632 |
uth | -0.581 |
arah | -0.562 |
humiliated | -0.550 |
Token | of |
Token ID | 286 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
nem | +0.544 |
unseen | +0.542 |
uth | +0.502 |
arah | +0.488 |
humiliated | +0.478 |
Neg logit contributions | |
plin | -0.474 |
Draft | -0.474 |
Blooming | -0.468 |
€ | -0.468 |
Por | -0.449 |
Token | faithful |
Token ID | 17074 |
Feature activation | -4.22e-01 |
Pos logit contributions | |
plin | +0.687 |
Draft | +0.687 |
Blooming | +0.676 |
€ | +0.675 |
Por | +0.649 |
Neg logit contributions | |
nem | -0.687 |
unseen | -0.685 |
uth | -0.629 |
arah | -0.610 |
humiliated | -0.596 |
Token | to |
Token ID | 284 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
nem | +0.301 |
unseen | +0.299 |
uth | +0.274 |
arah | +0.265 |
humiliated | +0.258 |
Neg logit contributions | |
Draft | -0.343 |
plin | -0.342 |
Blooming | -0.338 |
€ | -0.337 |
Por | -0.325 |
Token | the |
Token ID | 262 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
Draft | +0.793 |
plin | +0.791 |
€ | +0.781 |
Blooming | +0.780 |
Por | +0.744 |
Neg logit contributions | |
nem | -0.836 |
unseen | -0.833 |
uth | -0.767 |
arah | -0.741 |
humiliated | -0.724 |
Token | text |
Token ID | 2420 |
Feature activation | +7.22e-01 |
Pos logit contributions | |
nem | +0.009 |
unseen | +0.009 |
uth | +0.008 |
arah | +0.008 |
humiliated | +0.007 |
Neg logit contributions | |
Draft | -0.008 |
plin | -0.008 |
Blooming | -0.008 |
€ | -0.008 |
Por | -0.007 |
Token | ? |
Token ID | 30 |
Feature activation | +5.96e-02 |
Pos logit contributions | |
Draft | +0.555 |
plin | +0.555 |
Blooming | +0.548 |
€ | +0.547 |
Por | +0.526 |
Neg logit contributions | |
nem | -0.544 |
unseen | -0.543 |
uth | -0.499 |
arah | -0.484 |
humiliated | -0.472 |
Token | Does |
Token ID | 8314 |
Feature activation | -4.93e+00 |
Pos logit contributions | |
plin | +0.047 |
Draft | +0.046 |
Blooming | +0.046 |
€ | +0.046 |
Por | +0.044 |
Neg logit contributions | |
nem | -0.044 |
unseen | -0.044 |
uth | -0.040 |
arah | -0.039 |
humiliated | -0.038 |
Token | it |
Token ID | 340 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
nem | +3.947 |
unseen | +3.893 |
uth | +3.566 |
arah | +3.389 |
trusted | +3.339 |
Neg logit contributions | |
Draft | -3.498 |
plin | -3.447 |
€ | -3.402 |
Blooming | -3.331 |
Por | -3.088 |
Token | diver |
Token ID | 12312 |
Feature activation | +6.11e-01 |
Pos logit contributions | |
nem | +0.570 |
unseen | +0.568 |
uth | +0.519 |
arah | +0.501 |
humiliated | +0.489 |
Neg logit contributions | |
Draft | -0.619 |
plin | -0.617 |
Blooming | -0.611 |
€ | -0.607 |
Por | -0.585 |
Token | ge |
Token ID | 469 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
Draft | +0.405 |
plin | +0.404 |
Blooming | +0.399 |
€ | +0.397 |
Por | +0.380 |
Neg logit contributions | |
nem | -0.525 |
unseen | -0.523 |
uth | -0.488 |
arah | -0.474 |
humiliated | -0.464 |
Token | at |
Token ID | 379 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
nem | +0.169 |
unseen | +0.169 |
uth | +0.153 |
arah | +0.148 |
humiliated | +0.146 |
Neg logit contributions | |
Draft | -0.185 |
plin | -0.185 |
Blooming | -0.183 |
€ | -0.181 |
Por | -0.174 |
Token | all |
Token ID | 477 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Draft | +0.277 |
plin | +0.276 |
Blooming | +0.273 |
€ | +0.271 |
Por | +0.261 |
Neg logit contributions | |
nem | -0.287 |
unseen | -0.287 |
uth | -0.262 |
arah | -0.255 |
humiliated | -0.249 |
Token | That |
Token ID | 1320 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
nem | +1.009 |
unseen | +0.999 |
uth | +0.931 |
arah | +0.895 |
humiliated | +0.892 |
Neg logit contributions | |
plin | -0.715 |
Draft | -0.709 |
Blooming | -0.688 |
€ | -0.677 |
Por | -0.649 |
Token | 's |
Token ID | 338 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
Draft | +0.778 |
plin | +0.777 |
Blooming | +0.766 |
€ | +0.758 |
Por | +0.735 |
Neg logit contributions | |
nem | -0.701 |
unseen | -0.697 |
uth | -0.636 |
arah | -0.613 |
humiliated | -0.605 |
Token | prohibited |
Token ID | 12244 |
Feature activation | +4.86e-01 |
Pos logit contributions | |
Draft | +0.774 |
plin | +0.772 |
Blooming | +0.758 |
€ | +0.748 |
Por | +0.723 |
Neg logit contributions | |
nem | -0.870 |
unseen | -0.867 |
uth | -0.798 |
arah | -0.773 |
humiliated | -0.763 |
Token | , |
Token ID | 11 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
Draft | +0.374 |
plin | +0.373 |
Blooming | +0.368 |
€ | +0.365 |
Por | +0.353 |
Neg logit contributions | |
nem | -0.368 |
unseen | -0.367 |
uth | -0.337 |
arah | -0.326 |
humiliated | -0.319 |
Token | as |
Token ID | 355 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
Draft | +0.126 |
plin | +0.126 |
Blooming | +0.124 |
€ | +0.123 |
Por | +0.119 |
Neg logit contributions | |
nem | -0.117 |
unseen | -0.117 |
uth | -0.107 |
arah | -0.103 |
humiliated | -0.101 |
Token | are |
Token ID | 389 |
Feature activation | -4.84e+00 |
Pos logit contributions | |
Draft | +0.085 |
plin | +0.084 |
Blooming | +0.083 |
€ | +0.082 |
Por | +0.079 |
Neg logit contributions | |
unseen | -0.088 |
nem | -0.088 |
uth | -0.080 |
arah | -0.076 |
humiliated | -0.076 |
Token | portable |
Token ID | 17726 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
nem | +3.666 |
unseen | +3.616 |
uth | +3.233 |
trusted | +3.189 |
humiliated | +3.135 |
Neg logit contributions | |
Draft | -3.711 |
plin | -3.665 |
Blooming | -3.547 |
€ | -3.474 |
Por | -3.424 |
Token | Wi |
Token ID | 11759 |
Feature activation | -5.65e-01 |
Pos logit contributions | |
nem | +0.194 |
unseen | +0.193 |
uth | +0.175 |
arah | +0.168 |
humiliated | +0.166 |
Neg logit contributions | |
Draft | -0.226 |
plin | -0.226 |
Blooming | -0.221 |
€ | -0.220 |
Por | -0.213 |
Token | - |
Token ID | 12 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
nem | +0.361 |
unseen | +0.357 |
uth | +0.328 |
arah | +0.313 |
humiliated | +0.303 |
Neg logit contributions | |
Draft | -0.497 |
plin | -0.497 |
Blooming | -0.496 |
€ | -0.491 |
Por | -0.477 |
Token | Fi |
Token ID | 10547 |
Feature activation | +9.32e-02 |
Pos logit contributions | |
nem | +1.159 |
unseen | +1.153 |
uth | +1.086 |
arah | +1.035 |
humiliated | +1.020 |
Neg logit contributions | |
plin | -0.981 |
Blooming | -0.973 |
Draft | -0.962 |
€ | -0.951 |
Por | -0.923 |
Token | hots |
Token ID | 33915 |
Feature activation | -7.21e-01 |
Pos logit contributions | |
plin | +0.082 |
Draft | +0.082 |
Blooming | +0.081 |
€ | +0.081 |
Por | +0.078 |
Neg logit contributions | |
nem | -0.060 |
unseen | -0.060 |
uth | -0.054 |
arah | -0.052 |
humiliated | -0.051 |
Token | reach |
Token ID | 3151 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
nem | +0.496 |
unseen | +0.491 |
uth | +0.450 |
arah | +0.433 |
humiliated | +0.425 |
Neg logit contributions | |
Draft | -0.530 |
plin | -0.525 |
€ | -0.516 |
Blooming | -0.516 |
Por | -0.499 |
Token | sexual |
Token ID | 3206 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
nem | +0.784 |
unseen | +0.776 |
uth | +0.710 |
arah | +0.679 |
humiliated | +0.671 |
Neg logit contributions | |
Draft | -0.802 |
plin | -0.802 |
Blooming | -0.785 |
€ | -0.780 |
Por | -0.754 |
Token | maturity |
Token ID | 24841 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
nem | +0.980 |
unseen | +0.963 |
uth | +0.900 |
arah | +0.867 |
humiliated | +0.844 |
Neg logit contributions | |
plin | -0.857 |
Draft | -0.857 |
Blooming | -0.839 |
€ | -0.836 |
Por | -0.800 |
Token | . |
Token ID | 13 |
Feature activation | -7.54e-01 |
Pos logit contributions | |
nem | +0.160 |
unseen | +0.160 |
uth | +0.147 |
arah | +0.142 |
humiliated | +0.139 |
Neg logit contributions | |
plin | -0.157 |
Draft | -0.157 |
Blooming | -0.155 |
€ | -0.154 |
Por | -0.148 |
Token | On |
Token ID | 1550 |
Feature activation | -4.95e-02 |
Pos logit contributions | |
nem | +0.624 |
unseen | +0.611 |
uth | +0.576 |
arah | +0.550 |
humiliated | +0.537 |
Neg logit contributions | |
plin | -0.532 |
Draft | -0.523 |
€ | -0.510 |
Blooming | -0.505 |
Por | -0.479 |
Token | top |
Token ID | 1353 |
Feature activation | -4.82e+00 |
Pos logit contributions | |
nem | +0.040 |
unseen | +0.039 |
uth | +0.036 |
arah | +0.035 |
humiliated | +0.034 |
Neg logit contributions | |
Draft | -0.036 |
plin | -0.036 |
€ | -0.035 |
Blooming | -0.035 |
Por | -0.034 |
Token | of |
Token ID | 286 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
unseen | +3.427 |
nem | +3.412 |
uth | +3.076 |
arah | +2.905 |
trusted | +2.862 |
Neg logit contributions | |
plin | -3.943 |
Draft | -3.838 |
Blooming | -3.792 |
€ | -3.699 |
Por | -3.556 |
Token | all |
Token ID | 477 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
plin | +0.953 |
Draft | +0.951 |
Blooming | +0.939 |
€ | +0.937 |
Por | +0.900 |
Neg logit contributions | |
nem | -0.989 |
unseen | -0.986 |
uth | -0.908 |
arah | -0.880 |
humiliated | -0.861 |
Token | this |
Token ID | 428 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
plin | +0.164 |
Draft | +0.164 |
Blooming | +0.162 |
€ | +0.162 |
Por | +0.156 |
Neg logit contributions | |
nem | -0.173 |
unseen | -0.172 |
uth | -0.159 |
arah | -0.155 |
humiliated | -0.151 |
Token | , |
Token ID | 11 |
Feature activation | +9.34e-02 |
Pos logit contributions | |
plin | +1.071 |
Draft | +1.069 |
Blooming | +1.059 |
€ | +1.058 |
Por | +1.014 |
Neg logit contributions | |
nem | -1.272 |
unseen | -1.268 |
uth | -1.182 |
arah | -1.153 |
humiliated | -1.121 |
Token | a |
Token ID | 257 |
Feature activation | -8.72e-02 |
Pos logit contributions | |
Draft | +0.075 |
plin | +0.074 |
Blooming | +0.073 |
€ | +0.073 |
Por | +0.070 |
Neg logit contributions | |
nem | -0.069 |
unseen | -0.068 |
uth | -0.062 |
arah | -0.060 |
humiliated | -0.059 |
Token | chased |
Token ID | 26172 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
nem | +0.549 |
unseen | +0.548 |
uth | +0.497 |
arah | +0.477 |
humiliated | +0.475 |
Neg logit contributions | |
plin | -0.668 |
Draft | -0.667 |
Blooming | -0.661 |
€ | -0.656 |
Por | -0.634 |
Token | by |
Token ID | 416 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
nem | +0.143 |
unseen | +0.143 |
uth | +0.130 |
arah | +0.125 |
humiliated | +0.122 |
Neg logit contributions | |
plin | -0.184 |
Draft | -0.184 |
Blooming | -0.182 |
€ | -0.181 |
Por | -0.175 |
Token | Satan |
Token ID | 14918 |
Feature activation | +7.39e-02 |
Pos logit contributions | |
plin | +0.291 |
Draft | +0.291 |
Blooming | +0.288 |
€ | +0.287 |
Por | +0.277 |
Neg logit contributions | |
nem | -0.272 |
unseen | -0.271 |
uth | -0.249 |
arah | -0.242 |
humiliated | -0.235 |
Token | . |
Token ID | 13 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
plin | +0.060 |
Draft | +0.060 |
Blooming | +0.060 |
€ | +0.059 |
Por | +0.057 |
Neg logit contributions | |
nem | -0.052 |
unseen | -0.052 |
uth | -0.048 |
arah | -0.046 |
humiliated | -0.045 |
Token | On |
Token ID | 1550 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
nem | +0.014 |
unseen | +0.014 |
uth | +0.013 |
arah | +0.013 |
humiliated | +0.013 |
Neg logit contributions | |
plin | -0.011 |
Draft | -0.011 |
Blooming | -0.011 |
€ | -0.011 |
Por | -0.010 |
Token | top |
Token ID | 1353 |
Feature activation | -4.81e+00 |
Pos logit contributions | |
nem | +0.272 |
unseen | +0.272 |
uth | +0.250 |
arah | +0.243 |
humiliated | +0.237 |
Neg logit contributions | |
plin | -0.272 |
Draft | -0.272 |
Blooming | -0.269 |
€ | -0.268 |
Por | -0.258 |
Token | of |
Token ID | 286 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
unseen | +3.475 |
nem | +3.415 |
uth | +3.094 |
arah | +2.997 |
humiliated | +2.911 |
Neg logit contributions | |
plin | -3.865 |
Draft | -3.792 |
Blooming | -3.734 |
€ | -3.641 |
Por | -3.492 |
Token | that |
Token ID | 326 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
plin | +1.250 |
Draft | +1.250 |
Blooming | +1.232 |
€ | +1.228 |
Por | +1.181 |
Neg logit contributions | |
nem | -1.315 |
unseen | -1.313 |
uth | -1.207 |
arah | -1.173 |
humiliated | -1.150 |
Token | , |
Token ID | 11 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
plin | +1.496 |
Draft | +1.485 |
€ | +1.485 |
Blooming | +1.483 |
Por | +1.418 |
Neg logit contributions | |
nem | -1.847 |
unseen | -1.834 |
uth | -1.720 |
arah | -1.675 |
humiliated | -1.619 |
Token | I |
Token ID | 314 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
plin | +0.237 |
Draft | +0.237 |
Blooming | +0.234 |
€ | +0.234 |
Por | +0.225 |
Neg logit contributions | |
nem | -0.243 |
unseen | -0.242 |
uth | -0.223 |
arah | -0.217 |
humiliated | -0.212 |
Token | got |
Token ID | 1392 |
Feature activation | -1.80e-02 |
Pos logit contributions | |
nem | +0.197 |
unseen | +0.197 |
uth | +0.180 |
arah | +0.173 |
humiliated | +0.170 |
Neg logit contributions | |
Draft | -0.239 |
plin | -0.239 |
Blooming | -0.236 |
€ | -0.235 |
Por | -0.227 |
Token | B |
Token ID | 33 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
Draft | +0.198 |
plin | +0.198 |
Blooming | +0.195 |
€ | +0.195 |
Por | +0.188 |
Neg logit contributions | |
nem | -0.193 |
unseen | -0.192 |
uth | -0.177 |
arah | -0.172 |
humiliated | -0.167 |
Token | +, |
Token ID | 28200 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
nem | +0.289 |
unseen | +0.288 |
uth | +0.265 |
arah | +0.257 |
humiliated | +0.251 |
Neg logit contributions | |
Draft | -0.296 |
plin | -0.296 |
Blooming | -0.293 |
€ | -0.292 |
Por | -0.281 |
Token | � |
Token ID | 447 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
plin | +0.173 |
Draft | +0.173 |
Blooming | +0.171 |
€ | +0.171 |
Por | +0.164 |
Neg logit contributions | |
nem | -0.171 |
unseen | -0.171 |
uth | -0.157 |
arah | -0.152 |
humiliated | -0.149 |
Token | � |
Token ID | 251 |
Feature activation | -7.47e-01 |
Pos logit contributions | |
unseen | +0.242 |
nem | +0.242 |
uth | +0.225 |
arah | +0.219 |
humiliated | +0.213 |
Neg logit contributions | |
plin | -0.214 |
Draft | -0.214 |
Blooming | -0.212 |
€ | -0.212 |
Por | -0.203 |
Token | as |
Token ID | 355 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
nem | +0.557 |
unseen | +0.557 |
uth | +0.512 |
arah | +0.495 |
humiliated | +0.483 |
Neg logit contributions | |
plin | -0.580 |
Draft | -0.578 |
Blooming | -0.574 |
€ | -0.571 |
Por | -0.549 |
Token | did |
Token ID | 750 |
Feature activation | -4.74e+00 |
Pos logit contributions | |
unseen | +0.437 |
nem | +0.436 |
uth | +0.402 |
arah | +0.388 |
humiliated | +0.380 |
Neg logit contributions | |
Draft | -0.417 |
plin | -0.415 |
Blooming | -0.411 |
€ | -0.409 |
Por | -0.391 |
Token | our |
Token ID | 674 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
unseen | +3.922 |
nem | +3.917 |
uth | +3.620 |
arah | +3.491 |
trusted | +3.430 |
Neg logit contributions | |
Draft | -3.219 |
plin | -3.207 |
€ | -3.132 |
Blooming | -3.099 |
Por | -2.943 |
Token | readers |
Token ID | 7183 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
nem | +0.915 |
unseen | +0.912 |
uth | +0.840 |
arah | +0.815 |
humiliated | +0.795 |
Neg logit contributions | |
plin | -0.895 |
Draft | -0.894 |
Blooming | -0.880 |
€ | -0.880 |
Por | -0.844 |
Token | in |
Token ID | 287 |
Feature activation | -9.93e-03 |
Pos logit contributions | |
nem | +1.202 |
unseen | +1.197 |
uth | +1.113 |
arah | +1.085 |
humiliated | +1.055 |
Neg logit contributions | |
plin | -1.025 |
Draft | -1.021 |
Blooming | -1.008 |
€ | -1.006 |
Por | -0.962 |
Token | a |
Token ID | 257 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
nem | +0.008 |
unseen | +0.008 |
uth | +0.007 |
arah | +0.007 |
humiliated | +0.007 |
Neg logit contributions | |
plin | -0.008 |
Draft | -0.008 |
€ | -0.007 |
Blooming | -0.007 |
Por | -0.007 |
Token | premiere |
Token ID | 19245 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
plin | +0.167 |
Draft | +0.167 |
Blooming | +0.165 |
€ | +0.165 |
Por | +0.158 |
Neg logit contributions | |
nem | -0.185 |
unseen | -0.184 |
uth | -0.171 |
arah | -0.166 |
humiliated | -0.162 |
Token | was |
Token ID | 373 |
Feature activation | -9.57e-01 |
Pos logit contributions | |
nem | +0.837 |
unseen | +0.831 |
uth | +0.765 |
arah | +0.737 |
humiliated | +0.727 |
Neg logit contributions | |
Draft | -0.897 |
plin | -0.894 |
Blooming | -0.881 |
€ | -0.880 |
Por | -0.847 |
Token | unexpectedly |
Token ID | 25884 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
nem | +0.694 |
unseen | +0.691 |
uth | +0.627 |
arah | +0.606 |
humiliated | +0.603 |
Neg logit contributions | |
Draft | -0.774 |
plin | -0.773 |
Blooming | -0.757 |
€ | -0.754 |
Por | -0.727 |
Token | successful |
Token ID | 4388 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
plin | +0.173 |
Draft | +0.173 |
Blooming | +0.171 |
€ | +0.171 |
Por | +0.165 |
Neg logit contributions | |
nem | -0.130 |
unseen | -0.130 |
uth | -0.118 |
arah | -0.114 |
humiliated | -0.110 |
Token | ( |
Token ID | 357 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
Draft | +0.151 |
plin | +0.151 |
Blooming | +0.148 |
€ | +0.148 |
Por | +0.142 |
Neg logit contributions | |
nem | -0.141 |
unseen | -0.140 |
uth | -0.128 |
arah | -0.124 |
humiliated | -0.122 |
Token | as |
Token ID | 292 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
plin | +0.511 |
Draft | +0.509 |
Blooming | +0.505 |
€ | +0.504 |
Por | +0.485 |
Neg logit contributions | |
nem | -0.449 |
unseen | -0.448 |
uth | -0.411 |
arah | -0.398 |
humiliated | -0.387 |
Token | compared |
Token ID | 3688 |
Feature activation | -4.74e+00 |
Pos logit contributions | |
nem | +0.738 |
unseen | +0.737 |
uth | +0.673 |
arah | +0.646 |
humiliated | +0.640 |
Neg logit contributions | |
Draft | -0.774 |
plin | -0.768 |
Blooming | -0.756 |
€ | -0.754 |
Por | -0.722 |
Token | to |
Token ID | 284 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
nem | +3.174 |
unseen | +3.172 |
uth | +2.846 |
humiliated | +2.726 |
arah | +2.719 |
Neg logit contributions | |
Draft | -3.985 |
plin | -3.978 |
Blooming | -3.894 |
€ | -3.860 |
Por | -3.729 |
Token | Mitt |
Token ID | 16627 |
Feature activation | -4.51e-01 |
Pos logit contributions | |
nem | +1.123 |
unseen | +1.121 |
uth | +1.014 |
arah | +0.982 |
humiliated | +0.974 |
Neg logit contributions | |
Draft | -1.096 |
plin | -1.090 |
Blooming | -1.064 |
€ | -1.059 |
Por | -1.010 |
Token | Romney |
Token ID | 8431 |
Feature activation | -8.45e-01 |
Pos logit contributions | |
nem | +0.332 |
unseen | +0.331 |
uth | +0.304 |
arah | +0.294 |
humiliated | +0.285 |
Neg logit contributions | |
Draft | -0.359 |
plin | -0.356 |
Blooming | -0.349 |
€ | -0.349 |
Por | -0.332 |
Token | ) |
Token ID | 8 |
Feature activation | -8.67e-02 |
Pos logit contributions | |
nem | +0.608 |
unseen | +0.604 |
uth | +0.554 |
arah | +0.533 |
humiliated | +0.524 |
Neg logit contributions | |
Draft | -0.683 |
plin | -0.680 |
Blooming | -0.671 |
€ | -0.664 |
Por | -0.645 |
Token | in |
Token ID | 287 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
nem | +0.063 |
unseen | +0.062 |
uth | +0.057 |
arah | +0.055 |
humiliated | +0.054 |
Neg logit contributions | |
Draft | -0.070 |
plin | -0.070 |
Blooming | -0.069 |
€ | -0.069 |
Por | -0.066 |
Token | certainly |
Token ID | 3729 |
Feature activation | +4.55e-01 |
Pos logit contributions | |
nem | +0.437 |
unseen | +0.432 |
uth | +0.397 |
arah | +0.381 |
humiliated | +0.377 |
Neg logit contributions | |
Draft | -0.487 |
plin | -0.486 |
Blooming | -0.479 |
€ | -0.476 |
Por | -0.460 |
Token | did |
Token ID | 750 |
Feature activation | -3.92e-02 |
Pos logit contributions | |
plin | +0.379 |
Draft | +0.378 |
Blooming | +0.374 |
€ | +0.373 |
Por | +0.360 |
Neg logit contributions | |
nem | -0.315 |
unseen | -0.313 |
uth | -0.286 |
arah | -0.276 |
humiliated | -0.270 |
Token | not |
Token ID | 407 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
nem | +0.030 |
unseen | +0.030 |
uth | +0.027 |
arah | +0.026 |
humiliated | +0.026 |
Neg logit contributions | |
Draft | -0.030 |
plin | -0.030 |
Blooming | -0.030 |
€ | -0.030 |
Por | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | +1.22e+00 |
Pos logit contributions | |
Draft | +0.207 |
plin | +0.207 |
Blooming | +0.204 |
€ | +0.203 |
Por | +0.197 |
Neg logit contributions | |
nem | -0.178 |
unseen | -0.177 |
uth | -0.162 |
arah | -0.156 |
humiliated | -0.152 |
Token | nor |
Token ID | 4249 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
plin | +0.978 |
Draft | +0.976 |
Blooming | +0.967 |
€ | +0.965 |
Por | +0.930 |
Neg logit contributions | |
nem | -0.880 |
unseen | -0.877 |
uth | -0.804 |
arah | -0.779 |
humiliated | -0.758 |
Token | did |
Token ID | 750 |
Feature activation | -4.65e+00 |
Pos logit contributions | |
nem | +1.045 |
unseen | +1.045 |
uth | +0.950 |
arah | +0.921 |
humiliated | +0.901 |
Neg logit contributions | |
Draft | -1.258 |
plin | -1.249 |
Blooming | -1.232 |
€ | -1.227 |
Por | -1.184 |
Token | I |
Token ID | 314 |
Feature activation | -7.15e-02 |
Pos logit contributions | |
nem | +3.434 |
unseen | +3.417 |
uth | +3.113 |
arah | +3.016 |
humiliated | +2.998 |
Neg logit contributions | |
Draft | -3.654 |
plin | -3.605 |
€ | -3.473 |
Blooming | -3.447 |
Por | -3.289 |
Token | intend |
Token ID | 14765 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
nem | +0.050 |
unseen | +0.049 |
uth | +0.045 |
arah | +0.044 |
humiliated | +0.042 |
Neg logit contributions | |
Draft | -0.059 |
plin | -0.059 |
Blooming | -0.059 |
€ | -0.059 |
Por | -0.057 |
Token | to |
Token ID | 284 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
nem | +1.122 |
unseen | +1.117 |
uth | +1.021 |
arah | +0.991 |
humiliated | +0.962 |
Neg logit contributions | |
Draft | -1.313 |
plin | -1.305 |
Blooming | -1.287 |
€ | -1.281 |
Por | -1.236 |
Token | , |
Token ID | 11 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
nem | +1.361 |
unseen | +1.347 |
uth | +1.244 |
arah | +1.197 |
humiliated | +1.178 |
Neg logit contributions | |
Draft | -1.381 |
plin | -1.380 |
Blooming | -1.361 |
€ | -1.345 |
Por | -1.300 |
Token | call |
Token ID | 869 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
plin | +1.306 |
Draft | +1.303 |
Blooming | +1.294 |
€ | +1.294 |
Por | +1.248 |
Neg logit contributions | |
nem | -1.043 |
unseen | -1.042 |
uth | -0.951 |
arah | -0.921 |
humiliated | -0.891 |
Token | left |
Token ID | 9464 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
plin | +0.142 |
Draft | +0.141 |
Blooming | +0.141 |
€ | +0.140 |
Por | +0.135 |
Neg logit contributions | |
nem | -0.145 |
unseen | -0.145 |
uth | -0.134 |
arah | -0.130 |
humiliated | -0.127 |
Token | - |
Token ID | 12 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
plin | +1.260 |
€ | +1.254 |
Draft | +1.251 |
Blooming | +1.239 |
Por | +1.207 |
Neg logit contributions | |
nem | -0.965 |
unseen | -0.953 |
uth | -0.876 |
arah | -0.852 |
emet | -0.821 |
Token | right |
Token ID | 3506 |
Feature activation | +4.67e-01 |
Pos logit contributions | |
nem | +0.383 |
unseen | +0.382 |
uth | +0.349 |
arah | +0.337 |
humiliated | +0.328 |
Neg logit contributions | |
plin | -0.466 |
Draft | -0.465 |
Blooming | -0.461 |
€ | -0.460 |
Por | -0.444 |
Token | ) |
Token ID | 8 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
plin | +0.399 |
Draft | +0.398 |
€ | +0.396 |
Blooming | +0.394 |
Por | +0.381 |
Neg logit contributions | |
nem | -0.310 |
unseen | -0.309 |
uth | -0.282 |
arah | -0.274 |
humiliated | -0.264 |
Token | Gary |
Token ID | 10936 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
nem | +0.792 |
unseen | +0.789 |
uth | +0.726 |
arah | +0.701 |
humiliated | +0.689 |
Neg logit contributions | |
Draft | -0.778 |
plin | -0.777 |
Blooming | -0.763 |
€ | -0.760 |
Por | -0.731 |
Token | Neville |
Token ID | 35840 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
nem | +0.131 |
unseen | +0.131 |
uth | +0.122 |
arah | +0.117 |
humiliated | +0.115 |
Neg logit contributions | |
Draft | -0.124 |
plin | -0.124 |
Blooming | -0.122 |
€ | -0.122 |
Por | -0.117 |
Token | , |
Token ID | 11 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
nem | +3.408 |
unseen | +3.400 |
uth | +3.132 |
arah | +2.981 |
humiliated | +2.969 |
Neg logit contributions | |
Draft | -3.548 |
plin | -3.513 |
Blooming | -3.473 |
€ | -3.416 |
Por | -3.313 |
Token | Ben |
Token ID | 3932 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
nem | +0.460 |
unseen | +0.458 |
uth | +0.421 |
arah | +0.407 |
humiliated | +0.399 |
Neg logit contributions | |
Draft | -0.478 |
plin | -0.478 |
Blooming | -0.472 |
€ | -0.470 |
Por | -0.452 |
Token | Thorn |
Token ID | 31422 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
nem | +0.914 |
unseen | +0.906 |
uth | +0.860 |
arah | +0.833 |
humiliated | +0.808 |
Neg logit contributions | |
Draft | -0.671 |
plin | -0.665 |
€ | -0.657 |
Blooming | -0.655 |
Por | -0.615 |
Token | ley |
Token ID | 1636 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
plin | +0.010 |
Draft | +0.010 |
Blooming | +0.010 |
€ | +0.010 |
Por | +0.009 |
Neg logit contributions | |
nem | -0.010 |
unseen | -0.010 |
uth | -0.009 |
arah | -0.009 |
humiliated | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
nem | +0.326 |
unseen | +0.326 |
uth | +0.301 |
arah | +0.293 |
humiliated | +0.286 |
Neg logit contributions | |
plin | -0.308 |
Draft | -0.307 |
Blooming | -0.304 |
€ | -0.304 |
Por | -0.292 |
Token | reversed |
Token ID | 17687 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
nem | +0.873 |
unseen | +0.871 |
uth | +0.783 |
humiliated | +0.760 |
arah | +0.751 |
Neg logit contributions | |
Draft | -0.990 |
plin | -0.984 |
€ | -0.962 |
Blooming | -0.961 |
Por | -0.916 |
Token | a |
Token ID | 257 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
unseen | +0.138 |
nem | +0.138 |
uth | +0.126 |
arah | +0.121 |
humiliated | +0.120 |
Neg logit contributions | |
plin | -0.139 |
Draft | -0.139 |
Blooming | -0.136 |
€ | -0.136 |
Por | -0.129 |
Token | measure |
Token ID | 3953 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
plin | +0.307 |
Draft | +0.306 |
Blooming | +0.300 |
€ | +0.299 |
Por | +0.288 |
Neg logit contributions | |
nem | -0.328 |
unseen | -0.327 |
uth | -0.299 |
arah | -0.291 |
humiliated | -0.286 |
Token | put |
Token ID | 1234 |
Feature activation | -8.31e-01 |
Pos logit contributions | |
unseen | +0.572 |
nem | +0.572 |
uth | +0.518 |
arah | +0.503 |
humiliated | +0.495 |
Neg logit contributions | |
plin | -0.618 |
Draft | -0.616 |
Blooming | -0.607 |
€ | -0.605 |
Por | -0.578 |
Token | in |
Token ID | 287 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
nem | +0.536 |
unseen | +0.535 |
uth | +0.484 |
arah | +0.466 |
humiliated | +0.453 |
Neg logit contributions | |
plin | -0.730 |
Draft | -0.730 |
Blooming | -0.722 |
€ | -0.719 |
Por | -0.696 |
Token | place |
Token ID | 1295 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
unseen | +1.392 |
nem | +1.378 |
uth | +1.220 |
arah | +1.167 |
humiliated | +1.149 |
Neg logit contributions | |
Draft | -2.092 |
plin | -2.074 |
Blooming | -2.029 |
€ | -2.026 |
Por | -1.956 |
Token | after |
Token ID | 706 |
Feature activation | -9.96e-01 |
Pos logit contributions | |
unseen | +2.961 |
nem | +2.929 |
uth | +2.576 |
arah | +2.494 |
humiliated | +2.463 |
Neg logit contributions | |
Draft | -4.025 |
plin | -3.975 |
Blooming | -3.873 |
€ | -3.831 |
Por | -3.692 |
Token | the |
Token ID | 262 |
Feature activation | -5.70e-01 |
Pos logit contributions | |
nem | +0.783 |
unseen | +0.781 |
uth | +0.714 |
arah | +0.690 |
humiliated | +0.681 |
Neg logit contributions | |
plin | -0.744 |
Draft | -0.742 |
€ | -0.725 |
Blooming | -0.719 |
Por | -0.688 |
Token | terrorist |
Token ID | 7417 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
nem | +0.487 |
unseen | +0.486 |
uth | +0.448 |
arah | +0.435 |
humiliated | +0.427 |
Neg logit contributions | |
plin | -0.387 |
Draft | -0.384 |
€ | -0.375 |
Blooming | -0.373 |
Por | -0.357 |
Token | attacks |
Token ID | 3434 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
nem | +0.944 |
unseen | +0.937 |
uth | +0.867 |
arah | +0.832 |
humiliated | +0.821 |
Neg logit contributions | |
plin | -0.908 |
Draft | -0.903 |
€ | -0.882 |
Blooming | -0.878 |
Por | -0.845 |
Token | of |
Token ID | 286 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
unseen | +0.776 |
nem | +0.776 |
uth | +0.713 |
arah | +0.688 |
humiliated | +0.675 |
Neg logit contributions | |
plin | -0.789 |
Draft | -0.786 |
€ | -0.771 |
Blooming | -0.769 |
Por | -0.739 |
Token |
|
Token ID | 198 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
nem | +0.291 |
unseen | +0.291 |
uth | +0.266 |
arah | +0.257 |
humiliated | +0.252 |
Neg logit contributions | |
plin | -0.309 |
Draft | -0.309 |
Blooming | -0.304 |
€ | -0.303 |
Por | -0.292 |
Token |
|
Token ID | 198 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
Draft | +2.161 |
€ | +2.146 |
plin | +2.143 |
Blooming | +2.139 |
Por | +2.063 |
Neg logit contributions | |
nem | -2.051 |
unseen | -2.041 |
uth | -1.875 |
arah | -1.835 |
humiliated | -1.794 |
Token | this |
Token ID | 5661 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
Draft | +1.608 |
plin | +1.606 |
Blooming | +1.586 |
€ | +1.582 |
Por | +1.525 |
Neg logit contributions | |
nem | -1.489 |
unseen | -1.482 |
uth | -1.360 |
arah | -1.320 |
humiliated | -1.288 |
Token | brave |
Token ID | 14802 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
Draft | +0.149 |
plin | +0.149 |
Blooming | +0.146 |
€ | +0.146 |
Por | +0.140 |
Neg logit contributions | |
unseen | -0.154 |
nem | -0.154 |
uth | -0.140 |
arah | -0.136 |
humiliated | -0.134 |
Token | o |
Token ID | 267 |
Feature activation | -5.46e-01 |
Pos logit contributions | |
plin | +0.369 |
Draft | +0.369 |
Blooming | +0.363 |
€ | +0.363 |
Por | +0.349 |
Neg logit contributions | |
nem | -0.341 |
unseen | -0.340 |
uth | -0.311 |
arah | -0.301 |
humiliated | -0.294 |
Token | ' |
Token ID | 6 |
Feature activation | -4.54e+00 |
Pos logit contributions | |
unseen | +0.350 |
nem | +0.350 |
uth | +0.320 |
arah | +0.309 |
humiliated | +0.295 |
Neg logit contributions | |
Draft | -0.481 |
plin | -0.478 |
Blooming | -0.474 |
€ | -0.474 |
Por | -0.459 |
Token | er |
Token ID | 263 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
nem | +2.517 |
unseen | +2.506 |
uth | +2.273 |
arah | +2.147 |
emet | +2.030 |
Neg logit contributions | |
Draft | -4.354 |
plin | -4.316 |
€ | -4.279 |
Blooming | -4.264 |
Por | -4.105 |
Token | h |
Token ID | 71 |
Feature activation | -6.99e-01 |
Pos logit contributions | |
unseen | +0.774 |
nem | +0.770 |
uth | +0.709 |
arah | +0.686 |
humiliated | +0.665 |
Neg logit contributions | |
Draft | -0.822 |
plin | -0.819 |
€ | -0.807 |
Blooming | -0.805 |
Por | -0.776 |
Token | anging |
Token ID | 4924 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
unseen | +0.500 |
nem | +0.500 |
uth | +0.465 |
arah | +0.443 |
humiliated | +0.425 |
Neg logit contributions | |
Draft | -0.569 |
plin | -0.563 |
€ | -0.555 |
Blooming | -0.554 |
Por | -0.536 |
Token | firm |
Token ID | 4081 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
unseen | +0.754 |
nem | +0.753 |
uth | +0.685 |
arah | +0.659 |
humiliated | +0.650 |
Neg logit contributions | |
plin | -0.763 |
Draft | -0.761 |
€ | -0.745 |
Blooming | -0.743 |
Por | -0.711 |
Token | ament |
Token ID | 3263 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
plin | +0.283 |
Draft | +0.283 |
Blooming | +0.278 |
€ | +0.278 |
Por | +0.267 |
Neg logit contributions | |
nem | -0.295 |
unseen | -0.295 |
uth | -0.272 |
arah | -0.263 |
humiliated | -0.256 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
Draft | +0.398 |
plin | +0.396 |
Blooming | +0.392 |
€ | +0.391 |
Por | +0.376 |
Neg logit contributions | |
unseen | -0.418 |
nem | -0.418 |
uth | -0.385 |
arah | -0.373 |
humiliated | -0.365 |
Token | They |
Token ID | 1119 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
plin | +0.135 |
Draft | +0.134 |
Blooming | +0.132 |
€ | +0.132 |
Por | +0.127 |
Neg logit contributions | |
nem | -0.137 |
unseen | -0.136 |
uth | -0.126 |
arah | -0.121 |
humiliated | -0.118 |
Token | seek |
Token ID | 5380 |
Feature activation | -8.53e-01 |
Pos logit contributions | |
nem | +0.842 |
unseen | +0.839 |
uth | +0.770 |
arah | +0.744 |
humiliated | +0.737 |
Neg logit contributions | |
Draft | -0.848 |
plin | -0.846 |
Blooming | -0.835 |
€ | -0.828 |
Por | -0.798 |
Token | – |
Token ID | 1906 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
nem | +0.626 |
unseen | +0.625 |
uth | +0.572 |
arah | +0.551 |
humiliated | +0.541 |
Neg logit contributions | |
Draft | -0.677 |
plin | -0.675 |
Blooming | -0.666 |
€ | -0.662 |
Por | -0.639 |
Token | as |
Token ID | 292 |
Feature activation | -6.71e-01 |
Pos logit contributions | |
plin | +0.535 |
Draft | +0.534 |
Blooming | +0.529 |
€ | +0.528 |
Por | +0.510 |
Neg logit contributions | |
nem | -0.456 |
unseen | -0.454 |
uth | -0.416 |
arah | -0.402 |
humiliated | -0.391 |
Token | did |
Token ID | 750 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
unseen | +0.494 |
nem | +0.493 |
uth | +0.450 |
arah | +0.434 |
humiliated | +0.426 |
Neg logit contributions | |
Draft | -0.533 |
plin | -0.530 |
Blooming | -0.523 |
€ | -0.520 |
Por | -0.500 |
Token | those |
Token ID | 883 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
unseen | +3.641 |
nem | +3.639 |
uth | +3.318 |
humiliated | +3.206 |
arah | +3.200 |
Neg logit contributions | |
Draft | -3.291 |
plin | -3.244 |
Blooming | -3.131 |
€ | -3.101 |
Por | -2.946 |
Token | who |
Token ID | 508 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
plin | +0.210 |
Draft | +0.210 |
Blooming | +0.207 |
€ | +0.207 |
Por | +0.199 |
Neg logit contributions | |
nem | -0.221 |
unseen | -0.221 |
uth | -0.204 |
arah | -0.198 |
humiliated | -0.193 |
Token | held |
Token ID | 2714 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
nem | +0.849 |
unseen | +0.845 |
uth | +0.764 |
arah | +0.734 |
humiliated | +0.729 |
Neg logit contributions | |
Draft | -1.126 |
plin | -1.123 |
Blooming | -1.108 |
€ | -1.103 |
Por | -1.063 |
Token | the |
Token ID | 262 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
Draft | +0.157 |
plin | +0.157 |
Blooming | +0.155 |
€ | +0.155 |
Por | +0.149 |
Neg logit contributions | |
nem | -0.150 |
unseen | -0.150 |
uth | -0.137 |
arah | -0.133 |
humiliated | -0.130 |
Token | reins |
Token ID | 35627 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Draft | +0.017 |
plin | +0.017 |
Blooming | +0.016 |
€ | +0.016 |
Por | +0.015 |
Neg logit contributions | |
nem | -0.018 |
unseen | -0.018 |
uth | -0.017 |
arah | -0.017 |
humiliated | -0.016 |
Token | of |
Token ID | 286 |
Feature activation | -8.66e-01 |
Pos logit contributions | |
unseen | +0.604 |
nem | +0.601 |
uth | +0.557 |
arah | +0.537 |
humiliated | +0.526 |
Neg logit contributions | |
plin | -0.597 |
Draft | -0.595 |
Blooming | -0.587 |
€ | -0.584 |
Por | -0.561 |
Token | the |
Token ID | 262 |
Feature activation | -6.37e-01 |
Pos logit contributions | |
unseen | +0.663 |
nem | +0.658 |
uth | +0.612 |
arah | +0.590 |
humiliated | +0.576 |
Neg logit contributions | |
Draft | -0.655 |
plin | -0.653 |
Blooming | -0.641 |
€ | -0.641 |
Por | -0.610 |
Token | winners |
Token ID | 14591 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
unseen | +0.484 |
nem | +0.482 |
uth | +0.441 |
arah | +0.425 |
humiliated | +0.421 |
Neg logit contributions | |
plin | -0.489 |
Draft | -0.488 |
Blooming | -0.479 |
€ | -0.478 |
Por | -0.460 |
Token | , |
Token ID | 11 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
plin | +0.968 |
Draft | +0.967 |
Blooming | +0.956 |
€ | +0.955 |
Por | +0.918 |
Neg logit contributions | |
nem | -0.994 |
unseen | -0.989 |
uth | -0.914 |
arah | -0.887 |
humiliated | -0.865 |
Token | as |
Token ID | 355 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
unseen | +0.681 |
nem | +0.679 |
uth | +0.619 |
arah | +0.594 |
humiliated | +0.586 |
Neg logit contributions | |
Draft | -0.867 |
plin | -0.867 |
Blooming | -0.853 |
€ | -0.849 |
Por | -0.823 |
Token | per |
Token ID | 583 |
Feature activation | -4.51e+00 |
Pos logit contributions | |
unseen | +0.860 |
nem | +0.853 |
uth | +0.790 |
arah | +0.764 |
humiliated | +0.746 |
Neg logit contributions | |
Draft | -0.823 |
plin | -0.815 |
Blooming | -0.813 |
€ | -0.806 |
Por | -0.773 |
Token | company |
Token ID | 1664 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
unseen | +3.289 |
nem | +3.223 |
uth | +2.982 |
arah | +2.886 |
trusted | +2.815 |
Neg logit contributions | |
Draft | -3.491 |
plin | -3.476 |
Blooming | -3.409 |
€ | -3.398 |
Por | -3.227 |
Token | procedure |
Token ID | 8771 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
unseen | +1.053 |
nem | +1.053 |
uth | +0.958 |
arah | +0.923 |
humiliated | +0.904 |
Neg logit contributions | |
Draft | -1.177 |
plin | -1.169 |
Blooming | -1.154 |
€ | -1.148 |
Por | -1.110 |
Token | , |
Token ID | 11 |
Feature activation | -7.76e-02 |
Pos logit contributions | |
unseen | +1.184 |
nem | +1.180 |
uth | +1.090 |
arah | +1.049 |
humiliated | +1.036 |
Neg logit contributions | |
Draft | -1.132 |
plin | -1.130 |
Blooming | -1.111 |
€ | -1.103 |
Por | -1.063 |
Token | realized |
Token ID | 6939 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
unseen | +0.054 |
nem | +0.054 |
uth | +0.049 |
arah | +0.048 |
humiliated | +0.047 |
Neg logit contributions | |
plin | -0.064 |
Draft | -0.064 |
Blooming | -0.063 |
€ | -0.063 |
Por | -0.061 |
Token | instantly |
Token ID | 11101 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
unseen | +1.100 |
nem | +1.084 |
uth | +0.996 |
arah | +0.964 |
humiliated | +0.952 |
Neg logit contributions | |
Draft | -1.135 |
plin | -1.125 |
Blooming | -1.104 |
€ | -1.103 |
Por | -1.055 |
Token | I |
Token ID | 314 |
Feature activation | -6.06e-01 |
Pos logit contributions | |
Draft | +0.501 |
plin | +0.499 |
Blooming | +0.492 |
€ | +0.491 |
Por | +0.474 |
Neg logit contributions | |
nem | -0.402 |
unseen | -0.401 |
uth | -0.364 |
arah | -0.352 |
humiliated | -0.346 |
Token | was |
Token ID | 373 |
Feature activation | -8.43e-02 |
Pos logit contributions | |
nem | +0.461 |
unseen | +0.460 |
uth | +0.424 |
arah | +0.411 |
humiliated | +0.401 |
Neg logit contributions | |
plin | -0.462 |
Draft | -0.462 |
Blooming | -0.457 |
€ | -0.455 |
Por | -0.438 |
Token | excited |
Token ID | 6568 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
nem | +0.063 |
unseen | +0.063 |
uth | +0.057 |
arah | +0.055 |
humiliated | +0.055 |
Neg logit contributions | |
plin | -0.066 |
Draft | -0.066 |
Blooming | -0.065 |
€ | -0.064 |
Por | -0.062 |
Token | . |
Token ID | 13 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
plin | +1.729 |
Draft | +1.725 |
€ | +1.720 |
Blooming | +1.717 |
Por | +1.651 |
Neg logit contributions | |
nem | -1.719 |
unseen | -1.708 |
uth | -1.586 |
arah | -1.537 |
humiliated | -1.490 |
Token | So |
Token ID | 1406 |
Feature activation | -9.23e-01 |
Pos logit contributions | |
plin | +0.772 |
Draft | +0.767 |
Blooming | +0.756 |
€ | +0.754 |
Por | +0.721 |
Neg logit contributions | |
nem | -0.952 |
unseen | -0.948 |
uth | -0.881 |
arah | -0.857 |
humiliated | -0.839 |
Token | was |
Token ID | 373 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
unseen | +0.711 |
nem | +0.709 |
uth | +0.651 |
arah | +0.635 |
humiliated | +0.624 |
Neg logit contributions | |
Draft | -0.696 |
plin | -0.693 |
Blooming | -0.683 |
€ | -0.681 |
Por | -0.653 |
Token | every |
Token ID | 790 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
nem | +3.257 |
unseen | +3.240 |
uth | +2.944 |
arah | +2.845 |
humiliated | +2.821 |
Neg logit contributions | |
Draft | -3.492 |
plin | -3.451 |
Blooming | -3.321 |
€ | -3.319 |
Por | -3.164 |
Token | other |
Token ID | 584 |
Feature activation | -6.43e-01 |
Pos logit contributions | |
plin | +0.140 |
Draft | +0.140 |
Blooming | +0.139 |
€ | +0.138 |
Por | +0.134 |
Neg logit contributions | |
nem | -0.117 |
unseen | -0.117 |
uth | -0.106 |
arah | -0.103 |
humiliated | -0.100 |
Token | girl |
Token ID | 2576 |
Feature activation | +5.49e-01 |
Pos logit contributions | |
nem | +0.449 |
unseen | +0.448 |
uth | +0.406 |
arah | +0.392 |
humiliated | +0.384 |
Neg logit contributions | |
plin | -0.534 |
Draft | -0.533 |
€ | -0.522 |
Blooming | -0.521 |
Por | -0.503 |
Token | . |
Token ID | 13 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
plin | +0.412 |
Draft | +0.412 |
Blooming | +0.407 |
€ | +0.406 |
Por | +0.390 |
Neg logit contributions | |
nem | -0.424 |
unseen | -0.423 |
uth | -0.389 |
arah | -0.378 |
humiliated | -0.369 |
Token |
|
Token ID | 198 |
Feature activation | +8.72e-02 |
Pos logit contributions | |
plin | +0.405 |
Draft | +0.401 |
Blooming | +0.394 |
€ | +0.394 |
Por | +0.376 |
Neg logit contributions | |
nem | -0.494 |
unseen | -0.492 |
uth | -0.457 |
arah | -0.445 |
humiliated | -0.435 |
Token | her |
Token ID | 607 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
plin | +0.412 |
Draft | +0.411 |
Blooming | +0.407 |
€ | +0.406 |
Por | +0.391 |
Neg logit contributions | |
nem | -0.396 |
unseen | -0.395 |
uth | -0.363 |
arah | -0.352 |
humiliated | -0.343 |
Token | tightly |
Token ID | 17707 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
plin | +1.331 |
Draft | +1.328 |
Blooming | +1.321 |
€ | +1.320 |
Por | +1.272 |
Neg logit contributions | |
nem | -1.164 |
unseen | -1.159 |
uth | -1.068 |
arah | -1.034 |
humiliated | -1.001 |
Token | . |
Token ID | 13 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
unseen | +0.167 |
nem | +0.167 |
uth | +0.153 |
arah | +0.149 |
humiliated | +0.146 |
Neg logit contributions | |
plin | -0.159 |
Draft | -0.158 |
Blooming | -0.156 |
€ | -0.156 |
Por | -0.149 |
Token | She |
Token ID | 1375 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
plin | +0.212 |
Draft | +0.211 |
Blooming | +0.208 |
€ | +0.208 |
Por | +0.199 |
Neg logit contributions | |
nem | -0.230 |
unseen | -0.230 |
uth | -0.212 |
arah | -0.206 |
humiliated | -0.201 |
Token | gr |
Token ID | 1036 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
Draft | +0.235 |
plin | +0.235 |
Blooming | +0.231 |
€ | +0.230 |
Por | +0.221 |
Neg logit contributions | |
unseen | -0.244 |
nem | -0.244 |
uth | -0.224 |
arah | -0.216 |
humiliated | -0.213 |
Token | ins |
Token ID | 1040 |
Feature activation | -4.42e+00 |
Pos logit contributions | |
nem | +0.269 |
unseen | +0.268 |
uth | +0.246 |
arah | +0.238 |
humiliated | +0.232 |
Neg logit contributions | |
plin | -0.305 |
Draft | -0.304 |
Blooming | -0.301 |
€ | -0.301 |
Por | -0.290 |
Token | at |
Token ID | 379 |
Feature activation | -5.52e-01 |
Pos logit contributions | |
unseen | +3.104 |
nem | +3.088 |
uth | +2.744 |
humiliated | +2.697 |
arah | +2.620 |
Neg logit contributions | |
plin | -3.695 |
Draft | -3.681 |
Blooming | -3.626 |
€ | -3.528 |
Por | -3.453 |
Token | me |
Token ID | 502 |
Feature activation | +3.99e-01 |
Pos logit contributions | |
unseen | +0.422 |
nem | +0.420 |
uth | +0.383 |
arah | +0.374 |
humiliated | +0.366 |
Neg logit contributions | |
Draft | -0.424 |
plin | -0.423 |
Blooming | -0.415 |
€ | -0.414 |
Por | -0.398 |
Token | . |
Token ID | 13 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
plin | +0.303 |
Draft | +0.302 |
Blooming | +0.299 |
€ | +0.299 |
Por | +0.287 |
Neg logit contributions | |
nem | -0.304 |
unseen | -0.302 |
uth | -0.280 |
arah | -0.271 |
humiliated | -0.264 |
Token | God |
Token ID | 1793 |
Feature activation | -3.61e-01 |
Pos logit contributions | |
plin | +0.360 |
Draft | +0.360 |
Blooming | +0.355 |
€ | +0.355 |
Por | +0.340 |
Neg logit contributions | |
nem | -0.390 |
unseen | -0.389 |
uth | -0.359 |
arah | -0.349 |
humiliated | -0.341 |
Token | , |
Token ID | 11 |
Feature activation | -7.60e-01 |
Pos logit contributions | |
nem | +0.289 |
unseen | +0.289 |
uth | +0.268 |
arah | +0.260 |
humiliated | +0.254 |
Neg logit contributions | |
Draft | -0.260 |
plin | -0.259 |
Blooming | -0.257 |
€ | -0.255 |
Por | -0.245 |
Token | in |
Token ID | 287 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
nem | +0.538 |
unseen | +0.536 |
uth | +0.483 |
arah | +0.469 |
humiliated | +0.461 |
Neg logit contributions | |
Draft | -0.585 |
plin | -0.581 |
Blooming | -0.574 |
€ | -0.569 |
Por | -0.546 |
Token | his |
Token ID | 465 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
nem | +0.228 |
unseen | +0.228 |
uth | +0.209 |
arah | +0.203 |
humiliated | +0.196 |
Neg logit contributions | |
Draft | -0.231 |
plin | -0.228 |
€ | -0.226 |
Blooming | -0.225 |
Por | -0.214 |
Token | stories |
Token ID | 3923 |
Feature activation | +9.86e-01 |
Pos logit contributions | |
Draft | +0.412 |
plin | +0.411 |
Blooming | +0.405 |
€ | +0.404 |
Por | +0.386 |
Neg logit contributions | |
nem | -0.434 |
unseen | -0.432 |
uth | -0.397 |
arah | -0.386 |
humiliated | -0.377 |
Token | , |
Token ID | 11 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Draft | +0.728 |
plin | +0.727 |
Blooming | +0.720 |
€ | +0.717 |
Por | +0.686 |
Neg logit contributions | |
nem | -0.776 |
unseen | -0.776 |
uth | -0.714 |
arah | -0.695 |
humiliated | -0.675 |
Token | nor |
Token ID | 4249 |
Feature activation | -6.45e-01 |
Pos logit contributions | |
Draft | +0.882 |
plin | +0.880 |
Blooming | +0.870 |
€ | +0.867 |
Por | +0.833 |
Neg logit contributions | |
nem | -0.884 |
unseen | -0.882 |
uth | -0.809 |
arah | -0.786 |
humiliated | -0.768 |
Token | does |
Token ID | 857 |
Feature activation | -4.42e+00 |
Pos logit contributions | |
nem | +0.454 |
unseen | +0.452 |
uth | +0.413 |
arah | +0.400 |
humiliated | +0.390 |
Neg logit contributions | |
Draft | -0.531 |
plin | -0.529 |
Blooming | -0.524 |
€ | -0.522 |
Por | -0.502 |
Token | he |
Token ID | 339 |
Feature activation | -7.72e-02 |
Pos logit contributions | |
nem | +3.476 |
unseen | +3.463 |
uth | +3.182 |
arah | +3.079 |
humiliated | +3.015 |
Neg logit contributions | |
Draft | -3.268 |
plin | -3.158 |
Blooming | -3.142 |
€ | -3.124 |
Por | -2.865 |
Token | sugar |
Token ID | 7543 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
nem | +0.054 |
unseen | +0.054 |
uth | +0.049 |
arah | +0.047 |
humiliated | +0.046 |
Neg logit contributions | |
Draft | -0.064 |
plin | -0.064 |
Blooming | -0.063 |
€ | -0.063 |
Por | -0.061 |
Token | coat |
Token ID | 31434 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
plin | +0.219 |
Draft | +0.219 |
Blooming | +0.216 |
€ | +0.216 |
Por | +0.207 |
Neg logit contributions | |
nem | -0.261 |
unseen | -0.260 |
uth | -0.241 |
arah | -0.235 |
humiliated | -0.230 |
Token | the |
Token ID | 262 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
Draft | +0.302 |
plin | +0.300 |
Blooming | +0.297 |
€ | +0.296 |
Por | +0.282 |
Neg logit contributions | |
nem | -0.351 |
unseen | -0.351 |
uth | -0.324 |
arah | -0.315 |
humiliated | -0.308 |
Token | realities |
Token ID | 22072 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
nem | +0.116 |
unseen | +0.115 |
uth | +0.105 |
arah | +0.101 |
humiliated | +0.099 |
Neg logit contributions | |
Draft | -0.128 |
plin | -0.128 |
Blooming | -0.126 |
€ | -0.125 |
Por | -0.121 |
Token | covering |
Token ID | 9505 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
plin | +0.940 |
Draft | +0.939 |
Blooming | +0.929 |
€ | +0.927 |
Por | +0.891 |
Neg logit contributions | |
nem | -0.976 |
unseen | -0.973 |
uth | -0.899 |
arah | -0.872 |
humiliated | -0.851 |
Token | the |
Token ID | 262 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
plin | +0.526 |
Draft | +0.525 |
Blooming | +0.519 |
€ | +0.518 |
Por | +0.498 |
Neg logit contributions | |
nem | -0.539 |
unseen | -0.538 |
uth | -0.496 |
arah | -0.481 |
humiliated | -0.470 |
Token | situation |
Token ID | 3074 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
unseen | +0.736 |
nem | +0.734 |
uth | +0.667 |
arah | +0.646 |
humiliated | +0.633 |
Neg logit contributions | |
plin | -0.823 |
Draft | -0.823 |
€ | -0.807 |
Blooming | -0.804 |
Por | -0.774 |
Token | , |
Token ID | 11 |
Feature activation | -9.68e-02 |
Pos logit contributions | |
unseen | +0.225 |
nem | +0.225 |
uth | +0.206 |
arah | +0.199 |
humiliated | +0.195 |
Neg logit contributions | |
plin | -0.230 |
Draft | -0.230 |
Blooming | -0.226 |
€ | -0.226 |
Por | -0.217 |
Token | as |
Token ID | 355 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
unseen | +0.073 |
nem | +0.073 |
uth | +0.067 |
arah | +0.064 |
humiliated | +0.063 |
Neg logit contributions | |
plin | -0.075 |
Draft | -0.075 |
€ | -0.074 |
Blooming | -0.073 |
Por | -0.071 |
Token | will |
Token ID | 481 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
unseen | +0.106 |
nem | +0.105 |
uth | +0.097 |
arah | +0.093 |
humiliated | +0.092 |
Neg logit contributions | |
Draft | -0.099 |
plin | -0.098 |
€ | -0.097 |
Blooming | -0.097 |
Por | -0.092 |
Token | Night |
Token ID | 5265 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
unseen | +3.471 |
nem | +3.431 |
uth | +3.143 |
arah | +3.049 |
trusted | +3.009 |
Neg logit contributions | |
Draft | -3.244 |
plin | -3.234 |
€ | -3.109 |
Blooming | -3.072 |
Por | -2.935 |
Token | line |
Token ID | 1370 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
nem | +0.209 |
unseen | +0.208 |
uth | +0.177 |
arah | +0.167 |
humiliated | +0.158 |
Neg logit contributions | |
plin | -0.588 |
Draft | -0.586 |
Blooming | -0.584 |
€ | -0.582 |
Por | -0.568 |
Token | . |
Token ID | 13 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
nem | +1.117 |
unseen | +1.108 |
uth | +1.009 |
arah | +0.971 |
humiliated | +0.955 |
Neg logit contributions | |
plin | -1.175 |
Draft | -1.166 |
€ | -1.149 |
Blooming | -1.139 |
Por | -1.098 |
Token | Stephan |
Token ID | 20800 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
plin | +0.208 |
Draft | +0.207 |
€ | +0.204 |
Blooming | +0.204 |
Por | +0.195 |
Neg logit contributions | |
nem | -0.205 |
unseen | -0.204 |
uth | -0.189 |
arah | -0.182 |
humiliated | -0.177 |
Token | opol |
Token ID | 39704 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
Draft | +0.490 |
plin | +0.480 |
Blooming | +0.477 |
€ | +0.475 |
Por | +0.446 |
Neg logit contributions | |
nem | -1.077 |
unseen | -1.076 |
uth | -1.025 |
arah | -0.995 |
humiliated | -0.973 |
Token | time |
Token ID | 640 |
Feature activation | -8.54e-01 |
Pos logit contributions | |
unseen | +0.981 |
nem | +0.981 |
uth | +0.899 |
arah | +0.862 |
humiliated | +0.852 |
Neg logit contributions | |
plin | -0.907 |
Draft | -0.907 |
€ | -0.883 |
Blooming | -0.882 |
Por | -0.847 |
Token | still |
Token ID | 991 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
unseen | +0.643 |
nem | +0.642 |
uth | +0.582 |
arah | +0.561 |
humiliated | +0.555 |
Neg logit contributions | |
Draft | -0.664 |
plin | -0.662 |
Blooming | -0.651 |
€ | -0.645 |
Por | -0.624 |
Token | truly |
Token ID | 4988 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
unseen | +0.008 |
nem | +0.008 |
uth | +0.007 |
arah | +0.007 |
humiliated | +0.007 |
Neg logit contributions | |
Draft | -0.008 |
plin | -0.008 |
Blooming | -0.008 |
€ | -0.008 |
Por | -0.008 |
Token | significant |
Token ID | 2383 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
unseen | +0.783 |
nem | +0.781 |
uth | +0.711 |
arah | +0.682 |
humiliated | +0.677 |
Neg logit contributions | |
plin | -0.789 |
Draft | -0.788 |
Blooming | -0.772 |
€ | -0.768 |
Por | -0.740 |
Token | ? |
Token ID | 30 |
Feature activation | -8.98e-01 |
Pos logit contributions | |
nem | +0.192 |
unseen | +0.192 |
uth | +0.175 |
arah | +0.168 |
humiliated | +0.165 |
Neg logit contributions | |
Draft | -0.219 |
plin | -0.219 |
Blooming | -0.216 |
€ | -0.215 |
Por | -0.207 |
Token | Does |
Token ID | 8314 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
nem | +0.763 |
unseen | +0.756 |
uth | +0.709 |
arah | +0.678 |
humiliated | +0.664 |
Neg logit contributions | |
plin | -0.611 |
Draft | -0.602 |
€ | -0.585 |
Blooming | -0.584 |
Por | -0.556 |
Token | this |
Token ID | 428 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
nem | +3.332 |
unseen | +3.326 |
uth | +3.002 |
trusted | +2.859 |
humiliated | +2.850 |
Neg logit contributions | |
Draft | -3.368 |
plin | -3.347 |
€ | -3.206 |
Blooming | -3.195 |
Por | -3.072 |
Token | render |
Token ID | 8543 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
plin | +0.440 |
Draft | +0.440 |
Blooming | +0.434 |
€ | +0.432 |
Por | +0.417 |
Neg logit contributions | |
nem | -0.362 |
unseen | -0.362 |
uth | -0.329 |
arah | -0.317 |
humiliated | -0.309 |
Token | time |
Token ID | 640 |
Feature activation | -5.20e-01 |
Pos logit contributions | |
nem | +1.004 |
unseen | +1.001 |
uth | +0.907 |
arah | +0.866 |
humiliated | +0.855 |
Neg logit contributions | |
Draft | -1.113 |
plin | -1.110 |
Blooming | -1.085 |
€ | -1.084 |
Por | -1.038 |
Token | as |
Token ID | 355 |
Feature activation | -3.35e-03 |
Pos logit contributions | |
unseen | +0.395 |
nem | +0.394 |
uth | +0.359 |
arah | +0.344 |
humiliated | +0.340 |
Neg logit contributions | |
Draft | -0.402 |
plin | -0.402 |
Blooming | -0.395 |
€ | -0.391 |
Por | -0.378 |
Token | something |
Token ID | 1223 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
unseen | +0.003 |
nem | +0.003 |
uth | +0.002 |
arah | +0.002 |
humiliated | +0.002 |
Neg logit contributions | |
Draft | -0.002 |
plin | -0.002 |
Blooming | -0.002 |
€ | -0.002 |
Por | -0.002 |
Token | all |
Token ID | 477 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
unseen | +0.061 |
nem | +0.061 |
uth | +0.057 |
arah | +0.055 |
humiliated | +0.053 |
Neg logit contributions | |
plin | -0.059 |
Draft | -0.059 |
Blooming | -0.058 |
€ | -0.058 |
Por | -0.056 |
Token | - |
Token ID | 12 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
nem | +1.437 |
unseen | +1.434 |
uth | +1.300 |
arah | +1.249 |
humiliated | +1.212 |
Neg logit contributions | |
plin | -1.923 |
Draft | -1.915 |
Blooming | -1.896 |
€ | -1.891 |
Por | -1.823 |
Token | new |
Token ID | 3605 |
Feature activation | +6.36e-01 |
Pos logit contributions | |
Draft | +0.267 |
plin | +0.266 |
Blooming | +0.263 |
€ | +0.263 |
Por | +0.254 |
Neg logit contributions | |
nem | -0.228 |
unseen | -0.227 |
uth | -0.208 |
arah | -0.201 |
humiliated | -0.196 |
Token | four |
Token ID | 1440 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
plin | +0.475 |
Draft | +0.474 |
Blooming | +0.466 |
€ | +0.465 |
Por | +0.447 |
Neg logit contributions | |
nem | -0.497 |
unseen | -0.495 |
uth | -0.456 |
arah | -0.442 |
humiliated | -0.432 |
Token | - |
Token ID | 12 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
nem | +0.419 |
unseen | +0.418 |
uth | +0.378 |
arah | +0.363 |
humiliated | +0.352 |
Neg logit contributions | |
Draft | -0.569 |
plin | -0.569 |
Blooming | -0.563 |
€ | -0.559 |
Por | -0.539 |
Token | wheel |
Token ID | 22001 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
nem | +0.878 |
unseen | +0.874 |
uth | +0.806 |
arah | +0.776 |
humiliated | +0.753 |
Neg logit contributions | |
plin | -0.961 |
Draft | -0.956 |
Blooming | -0.953 |
€ | -0.948 |
Por | -0.909 |
Token | - |
Token ID | 12 |
Feature activation | -6.95e-02 |
Pos logit contributions | |
unseen | +3.421 |
nem | +3.409 |
uth | +3.112 |
arah | +3.030 |
humiliated | +2.943 |
Neg logit contributions | |
plin | -3.266 |
Draft | -3.223 |
Blooming | -3.164 |
€ | -3.146 |
Por | -3.001 |
Token | drive |
Token ID | 19472 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
nem | +0.076 |
unseen | +0.076 |
uth | +0.072 |
arah | +0.070 |
humiliated | +0.069 |
Neg logit contributions | |
Draft | -0.030 |
plin | -0.030 |
€ | -0.029 |
Blooming | -0.029 |
Por | -0.027 |
Token | , |
Token ID | 11 |
Feature activation | -5.42e-01 |
Pos logit contributions | |
nem | +1.972 |
unseen | +1.969 |
uth | +1.798 |
arah | +1.714 |
humiliated | +1.690 |
Neg logit contributions | |
plin | -2.135 |
Draft | -2.112 |
Blooming | -2.067 |
€ | -2.050 |
Por | -1.987 |
Token | torque |
Token ID | 26415 |
Feature activation | -2.82e+00 |
Pos logit contributions | |
nem | +0.402 |
unseen | +0.401 |
uth | +0.368 |
arah | +0.355 |
humiliated | +0.348 |
Neg logit contributions | |
plin | -0.424 |
Draft | -0.423 |
Blooming | -0.417 |
€ | -0.415 |
Por | -0.400 |
Token | - |
Token ID | 12 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
nem | +1.881 |
unseen | +1.880 |
uth | +1.709 |
arah | +1.616 |
humiliated | +1.602 |
Neg logit contributions | |
plin | -2.429 |
Draft | -2.411 |
Blooming | -2.385 |
€ | -2.362 |
Por | -2.292 |
Token | had |
Token ID | 550 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
plin | +0.516 |
Draft | +0.515 |
Blooming | +0.509 |
€ | +0.508 |
Por | +0.489 |
Neg logit contributions | |
nem | -0.463 |
unseen | -0.462 |
uth | -0.423 |
arah | -0.410 |
humiliated | -0.400 |
Token | to |
Token ID | 284 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
nem | +0.411 |
unseen | +0.410 |
uth | +0.374 |
arah | +0.361 |
humiliated | +0.355 |
Neg logit contributions | |
plin | -0.475 |
Draft | -0.475 |
Blooming | -0.466 |
€ | -0.465 |
Por | -0.448 |
Token | sign |
Token ID | 1051 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
nem | +0.858 |
unseen | +0.856 |
uth | +0.784 |
arah | +0.759 |
humiliated | +0.754 |
Neg logit contributions | |
Draft | -0.798 |
plin | -0.793 |
Blooming | -0.780 |
€ | -0.772 |
Por | -0.745 |
Token | up |
Token ID | 510 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
plin | +0.115 |
Draft | +0.114 |
Blooming | +0.113 |
€ | +0.112 |
Por | +0.108 |
Neg logit contributions | |
nem | -0.124 |
unseen | -0.124 |
uth | -0.114 |
arah | -0.110 |
humiliated | -0.108 |
Token | in |
Token ID | 287 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
plin | +0.804 |
Draft | +0.803 |
€ | +0.799 |
Blooming | +0.798 |
Por | +0.769 |
Neg logit contributions | |
nem | -0.715 |
unseen | -0.712 |
uth | -0.657 |
arah | -0.637 |
humiliated | -0.616 |
Token | advance |
Token ID | 5963 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
Draft | +0.111 |
plin | +0.111 |
Blooming | +0.110 |
€ | +0.110 |
Por | +0.106 |
Neg logit contributions | |
nem | -0.070 |
unseen | -0.070 |
uth | -0.062 |
arah | -0.060 |
humiliated | -0.058 |
Token | to |
Token ID | 284 |
Feature activation | +2.37e-01 |
Pos logit contributions | |
unseen | +3.071 |
nem | +3.023 |
uth | +2.761 |
arah | +2.637 |
humiliated | +2.597 |
Neg logit contributions | |
Draft | -3.604 |
plin | -3.601 |
Blooming | -3.531 |
€ | -3.461 |
Por | -3.368 |
Token | use |
Token ID | 779 |
Feature activation | -7.12e-01 |
Pos logit contributions | |
Draft | +0.186 |
plin | +0.186 |
Blooming | +0.184 |
€ | +0.183 |
Por | +0.177 |
Neg logit contributions | |
nem | -0.175 |
unseen | -0.175 |
uth | -0.160 |
arah | -0.155 |
humiliated | -0.151 |
Token | the |
Token ID | 262 |
Feature activation | +8.72e-02 |
Pos logit contributions | |
unseen | +0.538 |
nem | +0.538 |
uth | +0.494 |
arah | +0.475 |
humiliated | +0.467 |
Neg logit contributions | |
plin | -0.548 |
Draft | -0.547 |
Blooming | -0.537 |
€ | -0.537 |
Por | -0.515 |
Token | provided |
Token ID | 2810 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
plin | +0.063 |
Draft | +0.063 |
€ | +0.062 |
Blooming | +0.062 |
Por | +0.059 |
Neg logit contributions | |
nem | -0.070 |
unseen | -0.070 |
uth | -0.064 |
arah | -0.062 |
humiliated | -0.061 |
Token | stage |
Token ID | 3800 |
Feature activation | +7.53e-01 |
Pos logit contributions | |
nem | +1.176 |
unseen | +1.172 |
uth | +1.071 |
arah | +1.034 |
humiliated | +1.026 |
Neg logit contributions | |
plin | -1.097 |
Draft | -1.088 |
Blooming | -1.062 |
€ | -1.060 |
Por | -1.019 |
Token | had |
Token ID | 550 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
unseen | +0.173 |
nem | +0.173 |
uth | +0.156 |
arah | +0.150 |
humiliated | +0.149 |
Neg logit contributions | |
Draft | -0.218 |
plin | -0.217 |
Blooming | -0.214 |
€ | -0.213 |
Por | -0.206 |
Token | an |
Token ID | 281 |
Feature activation | +7.41e-02 |
Pos logit contributions | |
unseen | +0.730 |
nem | +0.729 |
uth | +0.662 |
arah | +0.636 |
humiliated | +0.632 |
Neg logit contributions | |
Draft | -0.846 |
plin | -0.844 |
Blooming | -0.830 |
€ | -0.822 |
Por | -0.794 |
Token | aura |
Token ID | 22491 |
Feature activation | +8.31e-01 |
Pos logit contributions | |
plin | +0.059 |
Draft | +0.059 |
Blooming | +0.058 |
€ | +0.058 |
Por | +0.056 |
Neg logit contributions | |
unseen | -0.054 |
nem | -0.054 |
uth | -0.049 |
arah | -0.048 |
humiliated | -0.047 |
Token | , |
Token ID | 11 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
Draft | +0.604 |
plin | +0.603 |
Blooming | +0.595 |
€ | +0.593 |
Por | +0.570 |
Neg logit contributions | |
nem | -0.663 |
unseen | -0.662 |
uth | -0.610 |
arah | -0.592 |
humiliated | -0.580 |
Token | as |
Token ID | 355 |
Feature activation | +5.87e-01 |
Pos logit contributions | |
Draft | +0.170 |
plin | +0.169 |
Blooming | +0.167 |
€ | +0.166 |
Por | +0.159 |
Neg logit contributions | |
unseen | -0.186 |
nem | -0.185 |
uth | -0.170 |
arah | -0.165 |
humiliated | -0.163 |
Token | did |
Token ID | 750 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
Draft | +0.439 |
plin | +0.439 |
Blooming | +0.434 |
€ | +0.432 |
Por | +0.415 |
Neg logit contributions | |
nem | -0.455 |
unseen | -0.455 |
uth | -0.418 |
arah | -0.406 |
humiliated | -0.397 |
Token | his |
Token ID | 465 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
nem | +3.274 |
unseen | +3.261 |
uth | +2.958 |
humiliated | +2.845 |
trusted | +2.809 |
Neg logit contributions | |
Draft | -3.420 |
plin | -3.364 |
Blooming | -3.254 |
€ | -3.222 |
Por | -3.094 |
Token | assistant |
Token ID | 8796 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
plin | +0.148 |
Draft | +0.148 |
Blooming | +0.147 |
€ | +0.146 |
Por | +0.142 |
Neg logit contributions | |
nem | -0.111 |
unseen | -0.110 |
uth | -0.100 |
arah | -0.096 |
humiliated | -0.094 |
Token | , |
Token ID | 11 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
Draft | +0.286 |
plin | +0.285 |
Blooming | +0.281 |
€ | +0.280 |
Por | +0.269 |
Neg logit contributions | |
nem | -0.291 |
unseen | -0.290 |
uth | -0.267 |
arah | -0.258 |
humiliated | -0.253 |
Token | Archie |
Token ID | 43459 |
Feature activation | -4.80e-02 |
Pos logit contributions | |
plin | +0.535 |
Draft | +0.534 |
Blooming | +0.529 |
€ | +0.527 |
Por | +0.507 |
Neg logit contributions | |
nem | -0.515 |
unseen | -0.513 |
uth | -0.472 |
arah | -0.458 |
humiliated | -0.446 |
Token | Knox |
Token ID | 27633 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
nem | +0.041 |
unseen | +0.040 |
uth | +0.038 |
arah | +0.036 |
humiliated | +0.036 |
Neg logit contributions | |
Draft | -0.032 |
plin | -0.032 |
Blooming | -0.032 |
€ | -0.032 |
Por | -0.030 |
Token | three |
Token ID | 1115 |
Feature activation | -4.15e-01 |
Pos logit contributions | |
Draft | +0.286 |
plin | +0.285 |
Blooming | +0.280 |
€ | +0.280 |
Por | +0.269 |
Neg logit contributions | |
nem | -0.307 |
unseen | -0.306 |
uth | -0.282 |
arah | -0.274 |
humiliated | -0.267 |
Token | less |
Token ID | 1342 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
nem | +0.271 |
unseen | +0.270 |
uth | +0.243 |
arah | +0.235 |
humiliated | +0.228 |
Neg logit contributions | |
plin | -0.363 |
Draft | -0.363 |
€ | -0.357 |
Blooming | -0.357 |
Por | -0.345 |
Token | - |
Token ID | 12 |
Feature activation | +4.64e-01 |
Pos logit contributions | |
nem | +0.023 |
unseen | +0.023 |
uth | +0.021 |
arah | +0.020 |
humiliated | +0.020 |
Neg logit contributions | |
Draft | -0.028 |
plin | -0.028 |
Blooming | -0.027 |
€ | -0.027 |
Por | -0.026 |
Token | than |
Token ID | 14813 |
Feature activation | -6.84e-01 |
Pos logit contributions | |
plin | +0.369 |
Draft | +0.369 |
Blooming | +0.365 |
€ | +0.364 |
Por | +0.351 |
Neg logit contributions | |
nem | -0.336 |
unseen | -0.335 |
uth | -0.308 |
arah | -0.298 |
humiliated | -0.290 |
Token | - |
Token ID | 12 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
nem | +0.453 |
unseen | +0.451 |
uth | +0.410 |
arah | +0.396 |
humiliated | +0.384 |
Neg logit contributions | |
plin | -0.589 |
Draft | -0.589 |
Blooming | -0.582 |
€ | -0.581 |
Por | -0.562 |
Token | opt |
Token ID | 8738 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
nem | +0.172 |
unseen | +0.172 |
uth | +0.157 |
arah | +0.152 |
humiliated | +0.147 |
Neg logit contributions | |
plin | -0.213 |
Draft | -0.212 |
Blooming | -0.210 |
€ | -0.210 |
Por | -0.203 |
Token | imal |
Token ID | 4402 |
Feature activation | +8.66e-01 |
Pos logit contributions | |
plin | +2.365 |
€ | +2.320 |
Draft | +2.312 |
Blooming | +2.311 |
Por | +2.231 |
Neg logit contributions | |
unseen | -2.167 |
nem | -2.161 |
uth | -1.966 |
arah | -1.908 |
humiliated | -1.884 |
Token | v |
Token ID | 410 |
Feature activation | +6.64e-01 |
Pos logit contributions | |
plin | +0.695 |
Draft | +0.695 |
Blooming | +0.684 |
€ | +0.684 |
Por | +0.658 |
Neg logit contributions | |
nem | -0.627 |
unseen | -0.624 |
uth | -0.572 |
arah | -0.553 |
humiliated | -0.538 |
Token | int |
Token ID | 600 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
plin | +0.513 |
Draft | +0.511 |
Blooming | +0.506 |
€ | +0.505 |
Por | +0.486 |
Neg logit contributions | |
nem | -0.498 |
unseen | -0.497 |
uth | -0.456 |
arah | -0.443 |
humiliated | -0.433 |
Token | ages |
Token ID | 1095 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
nem | +0.642 |
unseen | +0.639 |
uth | +0.563 |
arah | +0.537 |
humiliated | +0.516 |
Neg logit contributions | |
plin | -1.291 |
Draft | -1.290 |
Blooming | -1.280 |
€ | -1.278 |
Por | -1.241 |
Token | . |
Token ID | 13 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
plin | +0.840 |
Draft | +0.839 |
Blooming | +0.828 |
€ | +0.826 |
Por | +0.796 |
Neg logit contributions | |
nem | -0.794 |
unseen | -0.792 |
uth | -0.726 |
arah | -0.703 |
humiliated | -0.687 |
Token | att |
Token ID | 1078 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
Draft | +0.143 |
plin | +0.140 |
Blooming | +0.140 |
€ | +0.138 |
Por | +0.135 |
Neg logit contributions | |
unseen | -0.113 |
nem | -0.113 |
uth | -0.104 |
arah | -0.100 |
emet | -0.097 |
Token | transmitter |
Token ID | 35099 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
nem | +1.131 |
unseen | +1.117 |
uth | +1.017 |
arah | +0.981 |
humiliated | +0.957 |
Neg logit contributions | |
Draft | -1.246 |
plin | -1.237 |
Blooming | -1.218 |
€ | -1.208 |
Por | -1.166 |
Token | would |
Token ID | 561 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
nem | +0.313 |
unseen | +0.312 |
uth | +0.285 |
arah | +0.274 |
humiliated | +0.270 |
Neg logit contributions | |
Draft | -0.340 |
plin | -0.339 |
Blooming | -0.335 |
€ | -0.333 |
Por | -0.321 |
Token | start |
Token ID | 923 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
Draft | +0.471 |
plin | +0.469 |
Blooming | +0.461 |
€ | +0.460 |
Por | +0.443 |
Neg logit contributions | |
nem | -0.532 |
unseen | -0.531 |
uth | -0.491 |
arah | -0.475 |
humiliated | -0.465 |
Token | be |
Token ID | 307 |
Feature activation | +7.11e-01 |
Pos logit contributions | |
plin | +1.059 |
Draft | +1.058 |
Blooming | +1.046 |
€ | +1.044 |
Por | +1.006 |
Neg logit contributions | |
nem | -0.988 |
unseen | -0.985 |
uth | -0.904 |
arah | -0.876 |
humiliated | -0.854 |
Token | aming |
Token ID | 3723 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
plin | +0.579 |
Draft | +0.579 |
Blooming | +0.573 |
€ | +0.572 |
Por | +0.552 |
Neg logit contributions | |
nem | -0.503 |
unseen | -0.502 |
uth | -0.459 |
arah | -0.444 |
humiliated | -0.432 |
Token | images |
Token ID | 4263 |
Feature activation | +8.22e-01 |
Pos logit contributions | |
plin | +2.684 |
Draft | +2.667 |
€ | +2.665 |
Blooming | +2.653 |
Por | +2.562 |
Neg logit contributions | |
nem | -2.643 |
unseen | -2.631 |
uth | -2.438 |
arah | -2.385 |
humiliated | -2.313 |
Token | back |
Token ID | 736 |
Feature activation | +2.40e+00 |
Pos logit contributions | |
plin | +0.638 |
Draft | +0.637 |
Blooming | +0.630 |
€ | +0.627 |
Por | +0.604 |
Neg logit contributions | |
unseen | -0.615 |
nem | -0.614 |
uth | -0.564 |
arah | -0.546 |
humiliated | -0.533 |
Token | to |
Token ID | 284 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
plin | +1.878 |
Draft | +1.871 |
Blooming | +1.856 |
€ | +1.855 |
Por | +1.790 |
Neg logit contributions | |
nem | -1.760 |
unseen | -1.744 |
uth | -1.609 |
arah | -1.563 |
humiliated | -1.528 |
Token | Earth |
Token ID | 3668 |
Feature activation | -8.55e-01 |
Pos logit contributions | |
plin | +1.022 |
Draft | +1.020 |
Blooming | +1.009 |
€ | +1.006 |
Por | +0.964 |
Neg logit contributions | |
nem | -1.233 |
unseen | -1.230 |
uth | -1.143 |
arah | -1.112 |
humiliated | -1.087 |
Token | , |
Token ID | 11 |
Feature activation | +5.32e-01 |
Pos logit contributions | |
unseen | +0.646 |
nem | +0.643 |
uth | +0.590 |
arah | +0.570 |
humiliated | +0.556 |
Neg logit contributions | |
plin | -0.659 |
Draft | -0.658 |
Blooming | -0.650 |
€ | -0.648 |
Por | -0.625 |
Token | , |
Token ID | 11 |
Feature activation | +3.38e-02 |
Pos logit contributions | |
unseen | +0.417 |
nem | +0.415 |
uth | +0.381 |
arah | +0.369 |
humiliated | +0.361 |
Neg logit contributions | |
plin | -0.416 |
Draft | -0.416 |
Blooming | -0.410 |
€ | -0.407 |
Por | -0.392 |
Token | territory |
Token ID | 7674 |
Feature activation | -9.12e-02 |
Pos logit contributions | |
plin | +0.027 |
Draft | +0.027 |
Blooming | +0.027 |
€ | +0.027 |
Por | +0.026 |
Neg logit contributions | |
nem | -0.024 |
unseen | -0.024 |
uth | -0.022 |
arah | -0.021 |
humiliated | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | -9.70e-02 |
Pos logit contributions | |
unseen | +0.070 |
nem | +0.070 |
uth | +0.064 |
arah | +0.063 |
humiliated | +0.061 |
Neg logit contributions | |
plin | -0.069 |
Draft | -0.069 |
Blooming | -0.068 |
€ | -0.067 |
Por | -0.065 |
Token | . |
Token ID | 764 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
nem | +0.083 |
unseen | +0.082 |
uth | +0.076 |
arah | +0.074 |
humiliated | +0.072 |
Neg logit contributions | |
plin | -0.066 |
Draft | -0.064 |
€ | -0.063 |
Blooming | -0.063 |
Por | -0.060 |
Token | . |
Token ID | 764 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
plin | +1.114 |
Draft | +1.105 |
€ | +1.092 |
Blooming | +1.091 |
Por | +1.040 |
Neg logit contributions | |
nem | -1.354 |
unseen | -1.347 |
uth | -1.253 |
arah | -1.215 |
humiliated | -1.192 |
Token | . |
Token ID | 764 |
Feature activation | +3.05e+00 |
Pos logit contributions | |
plin | +1.577 |
Draft | +1.577 |
Blooming | +1.559 |
€ | +1.553 |
Por | +1.490 |
Neg logit contributions | |
nem | -1.925 |
unseen | -1.920 |
uth | -1.784 |
arah | -1.738 |
humiliated | -1.697 |
Token | And |
Token ID | 843 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
Draft | +1.993 |
plin | +1.986 |
Blooming | +1.971 |
€ | +1.963 |
Por | +1.883 |
Neg logit contributions | |
nem | -2.643 |
unseen | -2.641 |
uth | -2.456 |
arah | -2.400 |
humiliated | -2.343 |
Token | failed |
Token ID | 4054 |
Feature activation | +9.54e-01 |
Pos logit contributions | |
nem | +0.089 |
unseen | +0.089 |
uth | +0.081 |
arah | +0.078 |
humiliated | +0.078 |
Neg logit contributions | |
plin | -0.086 |
Draft | -0.086 |
Blooming | -0.084 |
€ | -0.084 |
Por | -0.080 |
Token | states |
Token ID | 2585 |
Feature activation | -4.00e-02 |
Pos logit contributions | |
plin | +0.632 |
Draft | +0.631 |
Blooming | +0.621 |
€ | +0.620 |
Por | +0.592 |
Neg logit contributions | |
nem | -0.824 |
unseen | -0.821 |
uth | -0.764 |
arah | -0.743 |
humiliated | -0.729 |
Token | , |
Token ID | 11 |
Feature activation | -4.91e-01 |
Pos logit contributions | |
nem | +0.031 |
unseen | +0.031 |
uth | +0.029 |
arah | +0.028 |
humiliated | +0.027 |
Neg logit contributions | |
plin | -0.030 |
Draft | -0.030 |
Blooming | -0.029 |
€ | -0.029 |
Por | -0.028 |
Token | conflict |
Token ID | 5358 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
nem | +0.378 |
unseen | +0.377 |
uth | +0.345 |
arah | +0.334 |
humiliated | +0.330 |
Neg logit contributions | |
plin | -0.373 |
Draft | -0.372 |
Blooming | -0.366 |
€ | -0.365 |
Por | -0.350 |
Token | activist |
Token ID | 11276 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
nem | +0.052 |
unseen | +0.051 |
uth | +0.047 |
arah | +0.045 |
humiliated | +0.044 |
Neg logit contributions | |
plin | -0.067 |
Draft | -0.067 |
Blooming | -0.066 |
€ | -0.066 |
Por | -0.063 |
Token | had |
Token ID | 550 |
Feature activation | +5.84e-02 |
Pos logit contributions | |
Draft | +0.131 |
plin | +0.130 |
€ | +0.128 |
Blooming | +0.128 |
Por | +0.123 |
Neg logit contributions | |
nem | -0.129 |
unseen | -0.128 |
uth | -0.118 |
arah | -0.114 |
humiliated | -0.113 |
Token | received |
Token ID | 2722 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
Draft | +0.047 |
plin | +0.047 |
Blooming | +0.047 |
€ | +0.046 |
Por | +0.045 |
Neg logit contributions | |
nem | -0.042 |
unseen | -0.042 |
uth | -0.038 |
arah | -0.037 |
humiliated | -0.036 |
Token | th |
Token ID | 294 |
Feature activation | +9.95e-01 |
Pos logit contributions | |
plin | +0.226 |
Draft | +0.225 |
Blooming | +0.220 |
€ | +0.219 |
Por | +0.212 |
Neg logit contributions | |
unseen | -0.227 |
nem | -0.227 |
uth | -0.208 |
arah | -0.201 |
humiliated | -0.198 |
Token | rea |
Token ID | 21468 |
Feature activation | -5.95e-01 |
Pos logit contributions | |
Draft | +0.623 |
plin | +0.623 |
Blooming | +0.613 |
€ | +0.610 |
Por | +0.583 |
Neg logit contributions | |
nem | -0.894 |
unseen | -0.892 |
uth | -0.835 |
arah | -0.813 |
humiliated | -0.795 |
Token | ... |
Token ID | 986 |
Feature activation | +3.11e+00 |
Pos logit contributions | |
nem | +0.542 |
unseen | +0.539 |
uth | +0.510 |
arah | +0.493 |
humiliated | +0.483 |
Neg logit contributions | |
Draft | -0.363 |
plin | -0.362 |
Blooming | -0.359 |
€ | -0.355 |
Por | -0.339 |
Token |
|
Token ID | 198 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
Draft | +2.411 |
plin | +2.405 |
Blooming | +2.401 |
€ | +2.389 |
Por | +2.299 |
Neg logit contributions | |
nem | -2.304 |
unseen | -2.301 |
uth | -2.123 |
arah | -2.049 |
humiliated | -1.997 |
Token |
|
Token ID | 198 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
nem | +0.100 |
unseen | +0.100 |
uth | +0.091 |
arah | +0.088 |
humiliated | +0.085 |
Neg logit contributions | |
plin | -0.123 |
Draft | -0.122 |
Blooming | -0.121 |
€ | -0.120 |
Por | -0.116 |
Token | From |
Token ID | 4863 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
plin | +0.290 |
Blooming | +0.286 |
Draft | +0.286 |
€ | +0.285 |
Por | +0.275 |
Neg logit contributions | |
nem | -0.274 |
unseen | -0.273 |
uth | -0.252 |
arah | -0.245 |
humiliated | -0.237 |
Token | : |
Token ID | 25 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
nem | +0.254 |
unseen | +0.253 |
uth | +0.234 |
arah | +0.227 |
humiliated | +0.222 |
Neg logit contributions | |
plin | -0.230 |
Draft | -0.229 |
€ | -0.225 |
Blooming | -0.224 |
Por | -0.214 |
Token | A |
Token ID | 317 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
plin | +0.985 |
Draft | +0.984 |
Blooming | +0.973 |
€ | +0.971 |
Por | +0.934 |
Neg logit contributions | |
nem | -1.004 |
unseen | -1.001 |
uth | -0.924 |
arah | -0.896 |
humiliated | -0.875 |
Token | |
Token ID | 3907 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
nem | +1.076 |
unseen | +1.069 |
uth | +0.984 |
arah | +0.946 |
humiliated | +0.923 |
Neg logit contributions | |
Draft | -1.170 |
plin | -1.163 |
Blooming | -1.151 |
€ | -1.148 |
Por | -1.100 |
Token | ment |
Token ID | 434 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
plin | +0.945 |
Draft | +0.940 |
Blooming | +0.932 |
€ | +0.930 |
Por | +0.901 |
Neg logit contributions | |
nem | -0.693 |
unseen | -0.693 |
uth | -0.626 |
arah | -0.604 |
humiliated | -0.589 |
Token | Carter |
Token ID | 10831 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
plin | +0.710 |
Draft | +0.709 |
Blooming | +0.702 |
€ | +0.701 |
Por | +0.674 |
Neg logit contributions | |
nem | -0.779 |
unseen | -0.776 |
uth | -0.720 |
arah | -0.700 |
humiliated | -0.682 |
Token | re |
Token ID | 302 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
plin | +0.165 |
Draft | +0.165 |
Blooming | +0.163 |
€ | +0.162 |
Por | +0.156 |
Neg logit contributions | |
nem | -0.143 |
unseen | -0.143 |
uth | -0.131 |
arah | -0.126 |
humiliated | -0.123 |
Token | |
Token ID | 3907 |
Feature activation | +2.58e+00 |
Pos logit contributions | |
plin | +1.131 |
Draft | +1.125 |
Blooming | +1.116 |
€ | +1.116 |
Por | +1.078 |
Neg logit contributions | |
nem | -1.095 |
unseen | -1.095 |
uth | -0.998 |
arah | -0.978 |
humiliated | -0.954 |
Token | ce |
Token ID | 344 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
plin | +2.195 |
Draft | +2.181 |
Blooming | +2.152 |
€ | +2.149 |
Por | +2.075 |
Neg logit contributions | |
unseen | -1.740 |
nem | -1.736 |
uth | -1.569 |
arah | -1.530 |
humiliated | -1.487 |
Token | ives |
Token ID | 1083 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
plin | +2.131 |
Draft | +2.099 |
€ | +2.078 |
Blooming | +2.048 |
Por | +1.975 |
Neg logit contributions | |
unseen | -2.931 |
nem | -2.924 |
uth | -2.677 |
arah | -2.645 |
humiliated | -2.608 |
Token | from |
Token ID | 422 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
plin | +0.863 |
Draft | +0.862 |
Blooming | +0.855 |
€ | +0.855 |
Por | +0.824 |
Neg logit contributions | |
nem | -0.818 |
unseen | -0.815 |
uth | -0.753 |
arah | -0.731 |
humiliated | -0.709 |
Token | his |
Token ID | 465 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
nem | +0.894 |
unseen | +0.890 |
uth | +0.815 |
arah | +0.787 |
humiliated | +0.775 |
Neg logit contributions | |
Draft | -0.872 |
plin | -0.872 |
Blooming | -0.854 |
€ | -0.853 |
Por | -0.816 |
Token | fel |
Token ID | 10756 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
nem | +0.408 |
unseen | +0.406 |
uth | +0.371 |
arah | +0.359 |
humiliated | +0.351 |
Neg logit contributions | |
plin | -0.449 |
Draft | -0.448 |
Blooming | -0.442 |
€ | -0.441 |
Por | -0.424 |
Token | |
Token ID | 3907 |
Feature activation | +3.45e-04 |
Pos logit contributions | |
nem | +1.072 |
unseen | +1.067 |
uth | +0.982 |
arah | +0.950 |
humiliated | +0.925 |
Neg logit contributions | |
plin | -1.151 |
Draft | -1.150 |
Blooming | -1.138 |
€ | -1.134 |
Por | -1.092 |
Token | put |
Token ID | 1234 |
Feature activation | +5.47e-01 |
Pos logit contributions | |
Draft | +0.382 |
plin | +0.382 |
Blooming | +0.377 |
€ | +0.374 |
Por | +0.359 |
Neg logit contributions | |
unseen | -0.434 |
nem | -0.434 |
uth | -0.398 |
arah | -0.387 |
humiliated | -0.380 |
Token | them |
Token ID | 606 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
Draft | +0.391 |
plin | +0.388 |
Blooming | +0.385 |
€ | +0.381 |
Por | +0.366 |
Neg logit contributions | |
nem | -0.446 |
unseen | -0.445 |
uth | -0.409 |
arah | -0.396 |
humiliated | -0.390 |
Token | in |
Token ID | 287 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
plin | +0.686 |
Draft | +0.685 |
Blooming | +0.678 |
€ | +0.677 |
Por | +0.652 |
Neg logit contributions | |
nem | -0.627 |
unseen | -0.625 |
uth | -0.574 |
arah | -0.556 |
humiliated | -0.542 |
Token | the |
Token ID | 262 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
unseen | +1.139 |
nem | +1.138 |
uth | +1.038 |
arah | +0.998 |
humiliated | +0.989 |
Neg logit contributions | |
plin | -1.111 |
Draft | -1.109 |
Blooming | -1.084 |
€ | -1.081 |
Por | -1.033 |
Token | freezer |
Token ID | 30967 |
Feature activation | +7.86e-02 |
Pos logit contributions | |
nem | +0.339 |
unseen | +0.337 |
uth | +0.307 |
arah | +0.297 |
humiliated | +0.294 |
Neg logit contributions | |
plin | -0.316 |
Draft | -0.315 |
Blooming | -0.307 |
€ | -0.306 |
Por | -0.291 |
Token | . |
Token ID | 13 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
plin | +0.061 |
Draft | +0.061 |
Blooming | +0.060 |
€ | +0.060 |
Por | +0.058 |
Neg logit contributions | |
unseen | -0.059 |
nem | -0.059 |
uth | -0.054 |
arah | -0.052 |
humiliated | -0.051 |
Token | If |
Token ID | 1002 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
plin | +0.240 |
Draft | +0.234 |
Blooming | +0.229 |
€ | +0.228 |
Por | +0.216 |
Neg logit contributions | |
nem | -0.326 |
unseen | -0.324 |
uth | -0.302 |
arah | -0.293 |
humiliated | -0.286 |
Token | he |
Token ID | 339 |
Feature activation | +8.73e-01 |
Pos logit contributions | |
unseen | +0.213 |
nem | +0.212 |
uth | +0.194 |
arah | +0.187 |
humiliated | +0.186 |
Neg logit contributions | |
Draft | -0.196 |
plin | -0.195 |
Blooming | -0.191 |
€ | -0.190 |
Por | -0.182 |
Token | later |
Token ID | 1568 |
Feature activation | +7.31e-01 |
Pos logit contributions | |
Draft | +0.682 |
plin | +0.682 |
Blooming | +0.672 |
€ | +0.667 |
Por | +0.643 |
Neg logit contributions | |
unseen | -0.652 |
nem | -0.652 |
uth | -0.595 |
arah | -0.575 |
humiliated | -0.567 |
Token | wants |
Token ID | 3382 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Draft | +0.557 |
plin | +0.557 |
Blooming | +0.548 |
€ | +0.544 |
Por | +0.524 |
Neg logit contributions | |
nem | -0.562 |
unseen | -0.561 |
uth | -0.514 |
arah | -0.496 |
humiliated | -0.490 |
Token | some |
Token ID | 617 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
Draft | +0.864 |
plin | +0.864 |
Blooming | +0.852 |
€ | +0.842 |
Por | +0.813 |
Neg logit contributions | |
nem | -0.813 |
unseen | -0.810 |
uth | -0.743 |
arah | -0.715 |
humiliated | -0.700 |
Token | patterns |
Token ID | 7572 |
Feature activation | -4.36e-01 |
Pos logit contributions | |
unseen | +1.506 |
nem | +1.498 |
uth | +1.350 |
arah | +1.295 |
humiliated | +1.285 |
Neg logit contributions | |
Draft | -1.593 |
plin | -1.592 |
Blooming | -1.546 |
€ | -1.542 |
Por | -1.489 |
Token | of |
Token ID | 286 |
Feature activation | +7.31e-03 |
Pos logit contributions | |
unseen | +0.334 |
nem | +0.332 |
uth | +0.305 |
arah | +0.294 |
humiliated | +0.288 |
Neg logit contributions | |
Draft | -0.334 |
plin | -0.333 |
Blooming | -0.327 |
€ | -0.327 |
Por | -0.314 |
Token | behavior |
Token ID | 4069 |
Feature activation | +5.47e-01 |
Pos logit contributions | |
plin | +0.006 |
Draft | +0.006 |
Blooming | +0.006 |
€ | +0.006 |
Por | +0.005 |
Neg logit contributions | |
unseen | -0.005 |
nem | -0.005 |
uth | -0.005 |
arah | -0.005 |
humiliated | -0.005 |
Token | ( |
Token ID | 357 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
Draft | +0.420 |
plin | +0.420 |
Blooming | +0.413 |
€ | +0.413 |
Por | +0.397 |
Neg logit contributions | |
unseen | -0.415 |
nem | -0.415 |
uth | -0.380 |
arah | -0.368 |
humiliated | -0.359 |
Token | i |
Token ID | 72 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
plin | +0.594 |
Draft | +0.591 |
Blooming | +0.587 |
€ | +0.586 |
Por | +0.564 |
Neg logit contributions | |
nem | -0.525 |
unseen | -0.523 |
uth | -0.481 |
arah | -0.464 |
humiliated | -0.450 |
Token | . |
Token ID | 13 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
nem | +0.483 |
unseen | +0.482 |
uth | +0.451 |
arah | +0.433 |
emet | +0.414 |
Neg logit contributions | |
plin | -0.498 |
Draft | -0.493 |
Blooming | -0.491 |
€ | -0.485 |
Por | -0.470 |
Token | e |
Token ID | 68 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
plin | +0.735 |
Draft | +0.729 |
Blooming | +0.726 |
€ | +0.719 |
Por | +0.697 |
Neg logit contributions | |
unseen | -0.520 |
nem | -0.520 |
uth | -0.474 |
arah | -0.452 |
humiliated | -0.433 |
Token | ., |
Token ID | 1539 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
plin | +0.422 |
Draft | +0.421 |
Blooming | +0.416 |
€ | +0.415 |
Por | +0.395 |
Neg logit contributions | |
nem | -0.629 |
unseen | -0.627 |
uth | -0.586 |
arah | -0.572 |
humiliated | -0.560 |
Token | after |
Token ID | 706 |
Feature activation | +3.90e-02 |
Pos logit contributions | |
Draft | +0.799 |
plin | +0.798 |
Blooming | +0.785 |
€ | +0.783 |
Por | +0.753 |
Neg logit contributions | |
nem | -0.803 |
unseen | -0.800 |
uth | -0.733 |
arah | -0.709 |
humiliated | -0.696 |
Token | " |
Token ID | 366 |
Feature activation | -9.80e-01 |
Pos logit contributions | |
plin | +0.029 |
Draft | +0.029 |
Blooming | +0.029 |
€ | +0.029 |
Por | +0.027 |
Neg logit contributions | |
nem | -0.030 |
unseen | -0.030 |
uth | -0.028 |
arah | -0.027 |
humiliated | -0.026 |
Token | d |
Token ID | 67 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
nem | +0.707 |
unseen | +0.704 |
uth | +0.648 |
arah | +0.628 |
humiliated | +0.607 |
Neg logit contributions | |
plin | -0.784 |
Blooming | -0.775 |
Draft | -0.773 |
€ | -0.773 |
Por | -0.745 |
Token | not |
Token ID | 407 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
unseen | +0.110 |
nem | +0.109 |
uth | +0.100 |
arah | +0.097 |
humiliated | +0.095 |
Neg logit contributions | |
Draft | -0.109 |
plin | -0.109 |
Blooming | -0.107 |
€ | -0.107 |
Por | -0.103 |
Token | ." |
Token ID | 526 |
Feature activation | -8.14e-02 |
Pos logit contributions | |
unseen | +1.616 |
nem | +1.599 |
uth | +1.472 |
arah | +1.421 |
humiliated | +1.399 |
Neg logit contributions | |
Draft | -1.531 |
plin | -1.528 |
Blooming | -1.502 |
€ | -1.497 |
Por | -1.438 |
Token |
|
Token ID | 198 |
Feature activation | -6.99e-01 |
Pos logit contributions | |
nem | +0.060 |
unseen | +0.059 |
uth | +0.054 |
arah | +0.052 |
humiliated | +0.050 |
Neg logit contributions | |
plin | -0.065 |
Draft | -0.064 |
€ | -0.063 |
Blooming | -0.063 |
Por | -0.060 |
Token |
|
Token ID | 198 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
nem | +0.461 |
unseen | +0.460 |
uth | +0.422 |
arah | +0.401 |
humiliated | +0.384 |
Neg logit contributions | |
plin | -0.604 |
Draft | -0.595 |
Blooming | -0.589 |
€ | -0.583 |
Por | -0.567 |
Token | H |
Token ID | 39 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
nem | +0.378 |
unseen | +0.376 |
uth | +0.350 |
arah | +0.337 |
emet | +0.326 |
Neg logit contributions | |
plin | -0.390 |
Blooming | -0.385 |
€ | -0.380 |
Draft | -0.377 |
Por | -0.366 |
Token | app |
Token ID | 1324 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
Draft | +0.051 |
plin | +0.051 |
Blooming | +0.050 |
€ | +0.050 |
Por | +0.048 |
Neg logit contributions | |
nem | -0.053 |
unseen | -0.052 |
uth | -0.049 |
arah | -0.047 |
emet | -0.046 |
Token | also |
Token ID | 635 |
Feature activation | -6.95e-02 |
Pos logit contributions | |
plin | +0.371 |
Draft | +0.370 |
Blooming | +0.365 |
€ | +0.364 |
Por | +0.348 |
Neg logit contributions | |
nem | -0.444 |
unseen | -0.442 |
uth | -0.411 |
arah | -0.399 |
humiliated | -0.390 |
Token | makes |
Token ID | 1838 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
nem | +0.048 |
unseen | +0.048 |
uth | +0.043 |
arah | +0.042 |
humiliated | +0.041 |
Neg logit contributions | |
plin | -0.059 |
Draft | -0.059 |
Blooming | -0.058 |
€ | -0.058 |
Por | -0.055 |
Token | a |
Token ID | 257 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
nem | +0.565 |
unseen | +0.561 |
uth | +0.510 |
arah | +0.493 |
humiliated | +0.483 |
Neg logit contributions | |
Draft | -0.529 |
plin | -0.525 |
Blooming | -0.511 |
€ | -0.509 |
Por | -0.486 |
Token | subtle |
Token ID | 11800 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
nem | +0.048 |
unseen | +0.048 |
uth | +0.043 |
arah | +0.042 |
humiliated | +0.041 |
Neg logit contributions | |
Draft | -0.056 |
plin | -0.056 |
Blooming | -0.055 |
€ | -0.054 |
Por | -0.053 |
Token | but |
Token ID | 475 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
Draft | +0.564 |
plin | +0.564 |
Blooming | +0.554 |
€ | +0.551 |
Por | +0.532 |
Neg logit contributions | |
nem | -0.525 |
unseen | -0.521 |
uth | -0.477 |
arah | -0.460 |
humiliated | -0.447 |
Token | is |
Token ID | 318 |
Feature activation | +5.39e-01 |
Pos logit contributions | |
Draft | +0.389 |
plin | +0.387 |
Blooming | +0.382 |
€ | +0.379 |
Por | +0.362 |
Neg logit contributions | |
unseen | -0.405 |
nem | -0.405 |
uth | -0.371 |
arah | -0.359 |
humiliated | -0.352 |
Token | a |
Token ID | 257 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
Draft | +0.392 |
plin | +0.390 |
Blooming | +0.383 |
€ | +0.382 |
Por | +0.364 |
Neg logit contributions | |
unseen | -0.434 |
nem | -0.433 |
uth | -0.399 |
arah | -0.385 |
humiliated | -0.379 |
Token | strange |
Token ID | 6283 |
Feature activation | +9.76e-01 |
Pos logit contributions | |
Draft | +0.473 |
plin | +0.472 |
Blooming | +0.466 |
€ | +0.463 |
Por | +0.445 |
Neg logit contributions | |
nem | -0.470 |
unseen | -0.468 |
uth | -0.429 |
arah | -0.415 |
humiliated | -0.409 |
Token | , |
Token ID | 11 |
Feature activation | -5.15e-02 |
Pos logit contributions | |
Draft | +0.732 |
plin | +0.730 |
Blooming | +0.720 |
€ | +0.714 |
Por | +0.687 |
Neg logit contributions | |
nem | -0.760 |
unseen | -0.759 |
uth | -0.698 |
arah | -0.675 |
humiliated | -0.661 |
Token | national |
Token ID | 2260 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
unseen | +0.039 |
nem | +0.039 |
uth | +0.036 |
arah | +0.035 |
humiliated | +0.034 |
Neg logit contributions | |
Draft | -0.040 |
plin | -0.039 |
Blooming | -0.039 |
€ | -0.038 |
Por | -0.037 |
Token | istic |
Token ID | 2569 |
Feature activation | +8.56e-01 |
Pos logit contributions | |
Draft | +0.334 |
plin | +0.334 |
Blooming | +0.329 |
€ | +0.327 |
Por | +0.314 |
Neg logit contributions | |
nem | -0.329 |
unseen | -0.326 |
uth | -0.300 |
arah | -0.290 |
humiliated | -0.285 |
Token | union |
Token ID | 6441 |
Feature activation | +4.20e-01 |
Pos logit contributions | |
plin | +0.652 |
Draft | +0.651 |
Blooming | +0.641 |
€ | +0.634 |
Por | +0.609 |
Neg logit contributions | |
nem | -0.660 |
unseen | -0.657 |
uth | -0.602 |
arah | -0.582 |
humiliated | -0.571 |
Token | ism |
Token ID | 1042 |
Feature activation | -5.42e-01 |
Pos logit contributions | |
plin | +0.323 |
Draft | +0.322 |
Blooming | +0.317 |
€ | +0.315 |
Por | +0.303 |
Neg logit contributions | |
nem | -0.320 |
unseen | -0.320 |
uth | -0.294 |
arah | -0.283 |
humiliated | -0.280 |
Token | that |
Token ID | 326 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
unseen | +0.415 |
nem | +0.413 |
uth | +0.377 |
arah | +0.362 |
humiliated | +0.360 |
Neg logit contributions | |
Draft | -0.417 |
plin | -0.416 |
Blooming | -0.409 |
€ | -0.405 |
Por | -0.389 |
Token | churn |
Token ID | 28488 |
Feature activation | +8.95e-01 |
Pos logit contributions | |
Draft | +0.323 |
plin | +0.322 |
Blooming | +0.318 |
€ | +0.316 |
Por | +0.303 |
Neg logit contributions | |
nem | -0.316 |
unseen | -0.314 |
uth | -0.289 |
arah | -0.278 |
humiliated | -0.274 |
Token | s |
Token ID | 82 |
Feature activation | +7.83e-01 |
Pos logit contributions | |
plin | +0.582 |
Draft | +0.581 |
€ | +0.575 |
Blooming | +0.574 |
Por | +0.549 |
Neg logit contributions | |
nem | -0.778 |
unseen | -0.775 |
uth | -0.722 |
arah | -0.706 |
humiliated | -0.690 |
Token | its |
Token ID | 663 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
plin | +0.660 |
Draft | +0.659 |
Blooming | +0.652 |
€ | +0.651 |
Por | +0.627 |
Neg logit contributions | |
nem | -0.619 |
unseen | -0.617 |
uth | -0.567 |
arah | -0.549 |
humiliated | -0.535 |
Token | life |
Token ID | 1204 |
Feature activation | -3.62e-01 |
Pos logit contributions | |
nem | +0.195 |
unseen | +0.194 |
uth | +0.176 |
arah | +0.168 |
humiliated | +0.166 |
Neg logit contributions | |
Draft | -0.235 |
plin | -0.234 |
Blooming | -0.230 |
€ | -0.228 |
Por | -0.222 |
Token | . |
Token ID | 13 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
nem | +0.270 |
unseen | +0.269 |
uth | +0.247 |
arah | +0.238 |
humiliated | +0.233 |
Neg logit contributions | |
plin | -0.283 |
Draft | -0.282 |
Blooming | -0.279 |
€ | -0.278 |
Por | -0.268 |
Token | The |
Token ID | 383 |
Feature activation | +4.23e-01 |
Pos logit contributions | |
plin | +0.185 |
Draft | +0.182 |
€ | +0.179 |
Blooming | +0.179 |
Por | +0.170 |
Neg logit contributions | |
nem | -0.258 |
unseen | -0.256 |
uth | -0.240 |
arah | -0.232 |
humiliated | -0.228 |
Token | NASA |
Token ID | 8884 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
plin | +0.318 |
Draft | +0.317 |
Blooming | +0.312 |
€ | +0.311 |
Por | +0.299 |
Neg logit contributions | |
nem | -0.328 |
unseen | -0.327 |
uth | -0.299 |
arah | -0.290 |
humiliated | -0.285 |
Token | investigation |
Token ID | 3645 |
Feature activation | +7.76e-01 |
Pos logit contributions | |
plin | +0.236 |
Draft | +0.235 |
€ | +0.232 |
Blooming | +0.232 |
Por | +0.223 |
Neg logit contributions | |
nem | -0.257 |
unseen | -0.255 |
uth | -0.236 |
arah | -0.229 |
humiliated | -0.224 |
Token | into |
Token ID | 656 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
plin | +0.638 |
Draft | +0.637 |
Blooming | +0.627 |
€ | +0.626 |
Por | +0.604 |
Neg logit contributions | |
nem | -0.548 |
unseen | -0.545 |
uth | -0.496 |
arah | -0.478 |
humiliated | -0.471 |
Token | the |
Token ID | 262 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
plin | +0.254 |
Draft | +0.253 |
Blooming | +0.251 |
€ | +0.250 |
Por | +0.241 |
Neg logit contributions | |
nem | -0.241 |
unseen | -0.241 |
uth | -0.221 |
arah | -0.214 |
humiliated | -0.209 |
Token | failure |
Token ID | 5287 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
unseen | +0.164 |
nem | +0.164 |
uth | +0.149 |
arah | +0.144 |
humiliated | +0.141 |
Neg logit contributions | |
plin | -0.187 |
Draft | -0.187 |
Blooming | -0.184 |
€ | -0.184 |
Por | -0.177 |
Token | of |
Token ID | 286 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
plin | +0.338 |
Draft | +0.338 |
Blooming | +0.333 |
€ | +0.332 |
Por | +0.320 |
Neg logit contributions | |
nem | -0.312 |
unseen | -0.311 |
uth | -0.284 |
arah | -0.275 |
humiliated | -0.271 |
Token | the |
Token ID | 262 |
Feature activation | -3.49e-01 |
Pos logit contributions | |
nem | +0.171 |
unseen | +0.171 |
uth | +0.156 |
arah | +0.151 |
humiliated | +0.147 |
Neg logit contributions | |
plin | -0.198 |
Draft | -0.198 |
Blooming | -0.195 |
€ | -0.195 |
Por | -0.187 |
Token | � |
Token ID | 447 |
Feature activation | -6.16e-01 |
Pos logit contributions | |
nem | +0.050 |
unseen | +0.050 |
uth | +0.045 |
arah | +0.044 |
humiliated | +0.043 |
Neg logit contributions | |
Draft | -0.056 |
plin | -0.056 |
Blooming | -0.056 |
€ | -0.055 |
Por | -0.053 |
Token | � |
Token ID | 251 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
nem | +0.430 |
unseen | +0.430 |
uth | +0.394 |
arah | +0.382 |
humiliated | +0.370 |
Neg logit contributions | |
plin | -0.505 |
Draft | -0.505 |
Blooming | -0.499 |
€ | -0.499 |
Por | -0.481 |
Token | Yun |
Token ID | 20757 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
nem | +0.232 |
unseen | +0.231 |
uth | +0.213 |
arah | +0.206 |
humiliated | +0.202 |
Neg logit contributions | |
Draft | -0.231 |
plin | -0.231 |
Blooming | -0.227 |
€ | -0.227 |
Por | -0.217 |
Token | told |
Token ID | 1297 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
nem | +0.299 |
unseen | +0.298 |
uth | +0.271 |
arah | +0.262 |
humiliated | +0.254 |
Neg logit contributions | |
Draft | -0.399 |
plin | -0.397 |
Blooming | -0.393 |
€ | -0.391 |
Por | -0.377 |
Token | Reuters |
Token ID | 8428 |
Feature activation | +9.77e-02 |
Pos logit contributions | |
nem | +0.095 |
unseen | +0.095 |
uth | +0.088 |
arah | +0.085 |
humiliated | +0.083 |
Neg logit contributions | |
Draft | -0.082 |
plin | -0.082 |
Blooming | -0.081 |
€ | -0.080 |
Por | -0.077 |
Token | during |
Token ID | 1141 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
Draft | +0.075 |
plin | +0.075 |
Blooming | +0.074 |
€ | +0.074 |
Por | +0.071 |
Neg logit contributions | |
unseen | -0.074 |
nem | -0.074 |
uth | -0.068 |
arah | -0.066 |
humiliated | -0.064 |
Token | a |
Token ID | 257 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
nem | +0.162 |
unseen | +0.161 |
uth | +0.149 |
arah | +0.144 |
humiliated | +0.141 |
Neg logit contributions | |
Draft | -0.152 |
plin | -0.152 |
Blooming | -0.148 |
€ | -0.148 |
Por | -0.141 |
Token | visit |
Token ID | 3187 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
nem | +0.207 |
unseen | +0.206 |
uth | +0.191 |
arah | +0.186 |
humiliated | +0.183 |
Neg logit contributions | |
plin | -0.162 |
Draft | -0.162 |
Blooming | -0.159 |
€ | -0.158 |
Por | -0.151 |
Token | to |
Token ID | 284 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
nem | +0.023 |
unseen | +0.023 |
uth | +0.021 |
arah | +0.020 |
humiliated | +0.020 |
Neg logit contributions | |
plin | -0.025 |
Draft | -0.025 |
Blooming | -0.025 |
€ | -0.025 |
Por | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | -9.67e-01 |
Pos logit contributions | |
nem | +0.204 |
unseen | +0.203 |
uth | +0.187 |
arah | +0.180 |
humiliated | +0.177 |
Neg logit contributions | |
Draft | -0.211 |
plin | -0.210 |
Blooming | -0.207 |
€ | -0.207 |
Por | -0.198 |
Token | village |
Token ID | 7404 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
nem | +0.664 |
unseen | +0.662 |
uth | +0.598 |
arah | +0.577 |
humiliated | +0.567 |
Neg logit contributions | |
Draft | -0.815 |
plin | -0.812 |
€ | -0.797 |
Blooming | -0.797 |
Por | -0.765 |
Token | not |
Token ID | 407 |
Feature activation | -9.77e-01 |
Pos logit contributions | |
nem | +0.685 |
unseen | +0.684 |
uth | +0.627 |
arah | +0.602 |
humiliated | +0.597 |
Neg logit contributions | |
plin | -0.714 |
Draft | -0.713 |
Blooming | -0.698 |
€ | -0.690 |
Por | -0.666 |
Token | received |
Token ID | 2722 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
unseen | +0.630 |
nem | +0.630 |
uth | +0.572 |
arah | +0.544 |
humiliated | +0.540 |
Neg logit contributions | |
Draft | -0.864 |
plin | -0.863 |
Blooming | -0.849 |
€ | -0.840 |
Por | -0.815 |
Token | that |
Token ID | 326 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
plin | +0.140 |
Draft | +0.139 |
Blooming | +0.137 |
€ | +0.136 |
Por | +0.131 |
Neg logit contributions | |
nem | -0.132 |
unseen | -0.131 |
uth | -0.120 |
arah | -0.116 |
humiliated | -0.114 |
Token | evidence |
Token ID | 2370 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
plin | +0.372 |
Draft | +0.371 |
Blooming | +0.365 |
€ | +0.360 |
Por | +0.349 |
Neg logit contributions | |
nem | -0.349 |
unseen | -0.348 |
uth | -0.318 |
arah | -0.306 |
humiliated | -0.302 |
Token | ," |
Token ID | 553 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
plin | +0.637 |
Draft | +0.637 |
Blooming | +0.630 |
€ | +0.627 |
Por | +0.604 |
Neg logit contributions | |
nem | -0.606 |
unseen | -0.605 |
uth | -0.556 |
arah | -0.538 |
humiliated | -0.526 |
Token | she |
Token ID | 673 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
nem | +0.150 |
unseen | +0.149 |
uth | +0.138 |
arah | +0.133 |
humiliated | +0.131 |
Neg logit contributions | |
Draft | -0.139 |
plin | -0.138 |
Blooming | -0.136 |
€ | -0.135 |
Por | -0.129 |
Token | added |
Token ID | 2087 |
Feature activation | -4.72e-02 |
Pos logit contributions | |
nem | +0.586 |
unseen | +0.585 |
uth | +0.526 |
arah | +0.504 |
humiliated | +0.495 |
Neg logit contributions | |
Draft | -0.855 |
plin | -0.852 |
Blooming | -0.842 |
€ | -0.838 |
Por | -0.810 |
Token | . |
Token ID | 13 |
Feature activation | -9.63e-01 |
Pos logit contributions | |
nem | +0.038 |
unseen | +0.038 |
uth | +0.035 |
arah | +0.034 |
humiliated | +0.033 |
Neg logit contributions | |
plin | -0.034 |
Draft | -0.034 |
Blooming | -0.034 |
€ | -0.034 |
Por | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
nem | +0.677 |
unseen | +0.671 |
uth | +0.619 |
arah | +0.595 |
humiliated | +0.579 |
Neg logit contributions | |
plin | -0.790 |
Draft | -0.788 |
Blooming | -0.778 |
€ | -0.776 |
Por | -0.747 |
Token |
|
Token ID | 198 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
plin | +0.106 |
Draft | +0.105 |
Blooming | +0.104 |
€ | +0.103 |
Por | +0.100 |
Neg logit contributions | |
nem | -0.088 |
unseen | -0.088 |
uth | -0.080 |
arah | -0.077 |
humiliated | -0.075 |
Token | " |
Token ID | 1 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
plin | +0.247 |
Blooming | +0.245 |
Draft | +0.242 |
€ | +0.242 |
Por | +0.233 |
Neg logit contributions | |
nem | -0.239 |
unseen | -0.238 |
uth | -0.222 |
arah | -0.214 |
humiliated | -0.208 |
Token | it |
Token ID | 340 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
nem | +0.270 |
unseen | +0.269 |
uth | +0.246 |
arah | +0.238 |
humiliated | +0.233 |
Neg logit contributions | |
plin | -0.271 |
Draft | -0.270 |
Blooming | -0.265 |
€ | -0.264 |
Por | -0.254 |
Token | is |
Token ID | 318 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
nem | +0.176 |
unseen | +0.175 |
uth | +0.161 |
arah | +0.155 |
humiliated | +0.153 |
Neg logit contributions | |
Draft | -0.150 |
plin | -0.150 |
Blooming | -0.146 |
€ | -0.145 |
Por | -0.140 |
Token | the |
Token ID | 262 |
Feature activation | -5.47e-03 |
Pos logit contributions | |
plin | +0.752 |
Draft | +0.750 |
Blooming | +0.740 |
€ | +0.733 |
Por | +0.708 |
Neg logit contributions | |
unseen | -0.789 |
nem | -0.789 |
uth | -0.726 |
arah | -0.701 |
humiliated | -0.687 |
Token | first |
Token ID | 717 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
unseen | +0.004 |
nem | +0.004 |
uth | +0.004 |
arah | +0.004 |
trusted | +0.004 |
Neg logit contributions | |
plin | -0.004 |
Draft | -0.004 |
Blooming | -0.004 |
€ | -0.004 |
Por | -0.004 |
Token | step |
Token ID | 2239 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
plin | +0.419 |
Draft | +0.416 |
Blooming | +0.410 |
€ | +0.407 |
Por | +0.393 |
Neg logit contributions | |
nem | -0.405 |
unseen | -0.404 |
uth | -0.371 |
arah | -0.355 |
humiliated | -0.349 |
Token | towards |
Token ID | 3371 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
unseen | +1.234 |
nem | +1.231 |
uth | +1.123 |
arah | +1.079 |
humiliated | +1.052 |
Neg logit contributions | |
Draft | -1.232 |
plin | -1.225 |
Blooming | -1.198 |
€ | -1.184 |
Por | -1.136 |
Token | Newcastle |
Token ID | 22410 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
nem | +0.181 |
unseen | +0.181 |
uth | +0.165 |
arah | +0.159 |
humiliated | +0.156 |
Neg logit contributions | |
Draft | -0.173 |
plin | -0.172 |
Blooming | -0.168 |
€ | -0.167 |
Por | -0.161 |
Token | United |
Token ID | 1578 |
Feature activation | -3.44e-02 |
Pos logit contributions | |
nem | +0.224 |
unseen | +0.224 |
uth | +0.207 |
arah | +0.201 |
humiliated | +0.196 |
Neg logit contributions | |
plin | -0.200 |
Draft | -0.200 |
Blooming | -0.197 |
€ | -0.197 |
Por | -0.189 |
Token | developing |
Token ID | 5922 |
Feature activation | -2.99e-01 |
Pos logit contributions | |
nem | +0.026 |
unseen | +0.026 |
uth | +0.024 |
arah | +0.023 |
humiliated | +0.023 |
Neg logit contributions | |
plin | -0.026 |
Draft | -0.026 |
Blooming | -0.026 |
€ | -0.025 |
Por | -0.025 |
Token | a |
Token ID | 257 |
Feature activation | +4.90e-01 |
Pos logit contributions | |
unseen | +0.233 |
nem | +0.233 |
uth | +0.214 |
arah | +0.206 |
humiliated | +0.202 |
Neg logit contributions | |
plin | -0.225 |
Draft | -0.224 |
Blooming | -0.221 |
€ | -0.220 |
Por | -0.211 |
Token | meaningful |
Token ID | 11570 |
Feature activation | -6.49e-01 |
Pos logit contributions | |
Draft | +0.356 |
plin | +0.356 |
Blooming | +0.350 |
€ | +0.348 |
Por | +0.333 |
Neg logit contributions | |
nem | -0.392 |
unseen | -0.392 |
uth | -0.360 |
arah | -0.349 |
humiliated | -0.342 |
Token | see |
Token ID | 766 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
Draft | +1.162 |
plin | +1.158 |
Blooming | +1.143 |
€ | +1.135 |
Por | +1.096 |
Neg logit contributions | |
nem | -1.238 |
unseen | -1.236 |
uth | -1.140 |
arah | -1.107 |
humiliated | -1.078 |
Token | , |
Token ID | 11 |
Feature activation | -8.44e-01 |
Pos logit contributions | |
unseen | +0.113 |
nem | +0.113 |
uth | +0.103 |
arah | +0.100 |
humiliated | +0.098 |
Neg logit contributions | |
Draft | -0.108 |
plin | -0.107 |
Blooming | -0.104 |
€ | -0.104 |
Por | -0.100 |
Token | � |
Token ID | 564 |
Feature activation | +9.37e-01 |
Pos logit contributions | |
unseen | +0.631 |
nem | +0.628 |
uth | +0.573 |
arah | +0.555 |
humiliated | +0.543 |
Neg logit contributions | |
Draft | -0.660 |
plin | -0.659 |
Blooming | -0.648 |
€ | -0.646 |
Por | -0.622 |
Token | � |
Token ID | 250 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
plin | +0.657 |
Draft | +0.657 |
Blooming | +0.649 |
€ | +0.648 |
Por | +0.620 |
Neg logit contributions | |
nem | -0.769 |
unseen | -0.768 |
uth | -0.712 |
arah | -0.693 |
humiliated | -0.676 |
Token | The |
Token ID | 464 |
Feature activation | -3.16e-01 |
Pos logit contributions | |
unseen | +0.182 |
nem | +0.181 |
uth | +0.167 |
arah | +0.161 |
humiliated | +0.156 |
Neg logit contributions | |
plin | -0.197 |
Draft | -0.196 |
Blooming | -0.195 |
€ | -0.194 |
Por | -0.187 |
Token | guard |
Token ID | 4860 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
nem | +0.272 |
unseen | +0.272 |
uth | +0.251 |
arah | +0.245 |
humiliated | +0.239 |
Neg logit contributions | |
Draft | -0.212 |
plin | -0.211 |
€ | -0.207 |
Blooming | -0.206 |
Por | -0.196 |
Token | tower |
Token ID | 10580 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Draft | +0.006 |
plin | +0.006 |
Blooming | +0.006 |
€ | +0.006 |
Por | +0.006 |
Neg logit contributions | |
nem | -0.006 |
unseen | -0.006 |
uth | -0.006 |
arah | -0.006 |
humiliated | -0.005 |
Token | is |
Token ID | 318 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
unseen | +0.800 |
nem | +0.798 |
uth | +0.727 |
arah | +0.707 |
humiliated | +0.693 |
Neg logit contributions | |
Draft | -0.800 |
plin | -0.796 |
Blooming | -0.787 |
€ | -0.777 |
Por | -0.750 |
Token | on |
Token ID | 319 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
Draft | +0.180 |
plin | +0.180 |
Blooming | +0.177 |
€ | +0.176 |
Por | +0.169 |
Neg logit contributions | |
unseen | -0.184 |
nem | -0.183 |
uth | -0.168 |
arah | -0.163 |
humiliated | -0.160 |
Token | fire |
Token ID | 2046 |
Feature activation | -7.88e-01 |
Pos logit contributions | |
unseen | +0.387 |
nem | +0.386 |
uth | +0.354 |
arah | +0.341 |
humiliated | +0.333 |
Neg logit contributions | |
Draft | -0.406 |
plin | -0.405 |
Blooming | -0.397 |
€ | -0.396 |
Por | -0.380 |
Token | . |
Token ID | 13 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
unseen | +0.607 |
nem | +0.602 |
uth | +0.552 |
arah | +0.537 |
humiliated | +0.524 |
Neg logit contributions | |
Draft | -0.598 |
plin | -0.596 |
Blooming | -0.590 |
€ | -0.583 |
Por | -0.564 |
Token | come |
Token ID | 1282 |
Feature activation | +9.03e-01 |
Pos logit contributions | |
Draft | +0.786 |
plin | +0.786 |
Blooming | +0.777 |
€ | +0.773 |
Por | +0.743 |
Neg logit contributions | |
nem | -0.827 |
unseen | -0.825 |
uth | -0.762 |
arah | -0.738 |
humiliated | -0.721 |
Token | from |
Token ID | 422 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
plin | +0.728 |
Draft | +0.728 |
Blooming | +0.720 |
€ | +0.719 |
Por | +0.693 |
Neg logit contributions | |
nem | -0.646 |
unseen | -0.644 |
uth | -0.590 |
arah | -0.571 |
humiliated | -0.556 |
Token | not |
Token ID | 407 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
nem | +0.137 |
unseen | +0.137 |
uth | +0.125 |
arah | +0.121 |
humiliated | +0.119 |
Neg logit contributions | |
plin | -0.136 |
Draft | -0.136 |
Blooming | -0.134 |
€ | -0.133 |
Por | -0.128 |
Token | having |
Token ID | 1719 |
Feature activation | -5.00e-02 |
Pos logit contributions | |
nem | +0.005 |
unseen | +0.005 |
uth | +0.004 |
arah | +0.004 |
humiliated | +0.004 |
Neg logit contributions | |
Draft | -0.005 |
plin | -0.005 |
Blooming | -0.005 |
€ | -0.005 |
Por | -0.004 |
Token | bases |
Token ID | 12536 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
nem | +0.038 |
unseen | +0.038 |
uth | +0.035 |
arah | +0.033 |
humiliated | +0.033 |
Neg logit contributions | |
plin | -0.039 |
Draft | -0.039 |
Blooming | -0.038 |
€ | -0.038 |
Por | -0.037 |
Token | all |
Token ID | 477 |
Feature activation | -6.35e-03 |
Pos logit contributions | |
Draft | +0.432 |
plin | +0.431 |
Blooming | +0.427 |
€ | +0.425 |
Por | +0.409 |
Neg logit contributions | |
unseen | -0.407 |
nem | -0.407 |
uth | -0.372 |
arah | -0.361 |
humiliated | -0.353 |
Token | over |
Token ID | 625 |
Feature activation | -6.96e-01 |
Pos logit contributions | |
nem | +0.005 |
unseen | +0.005 |
uth | +0.004 |
arah | +0.004 |
humiliated | +0.004 |
Neg logit contributions | |
plin | -0.005 |
Draft | -0.005 |
Blooming | -0.005 |
€ | -0.005 |
Por | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
nem | +0.524 |
unseen | +0.521 |
uth | +0.480 |
arah | +0.463 |
humiliated | +0.457 |
Neg logit contributions | |
Draft | -0.538 |
plin | -0.538 |
Blooming | -0.528 |
€ | -0.527 |
Por | -0.507 |
Token | world |
Token ID | 995 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
plin | +0.447 |
Draft | +0.446 |
Blooming | +0.441 |
€ | +0.440 |
Por | +0.425 |
Neg logit contributions | |
nem | -0.337 |
unseen | -0.336 |
uth | -0.305 |
arah | -0.294 |
humiliated | -0.286 |
Token | and |
Token ID | 290 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
plin | +1.115 |
Draft | +1.113 |
Blooming | +1.103 |
€ | +1.103 |
Por | +1.060 |
Neg logit contributions | |
nem | -1.121 |
unseen | -1.115 |
uth | -1.031 |
arah | -1.001 |
humiliated | -0.972 |
Token | a |
Token ID | 257 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
plin | +0.310 |
Draft | +0.310 |
Blooming | +0.305 |
€ | +0.304 |
Por | +0.292 |
Neg logit contributions | |
nem | -0.324 |
unseen | -0.323 |
uth | -0.297 |
arah | -0.288 |
humiliated | -0.283 |
Token | , |
Token ID | 11 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
Draft | +0.026 |
plin | +0.026 |
€ | +0.026 |
Blooming | +0.026 |
Por | +0.025 |
Neg logit contributions | |
nem | -0.028 |
unseen | -0.027 |
uth | -0.026 |
arah | -0.025 |
humiliated | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
plin | +0.097 |
Draft | +0.096 |
€ | +0.095 |
Blooming | +0.094 |
Por | +0.091 |
Neg logit contributions | |
nem | -0.083 |
unseen | -0.083 |
uth | -0.076 |
arah | -0.073 |
humiliated | -0.072 |
Token | Milan |
Token ID | 21574 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
nem | +0.316 |
unseen | +0.314 |
uth | +0.288 |
arah | +0.278 |
humiliated | +0.271 |
Neg logit contributions | |
Draft | -0.357 |
plin | -0.357 |
Blooming | -0.351 |
€ | -0.350 |
Por | -0.337 |
Token | Va |
Token ID | 17668 |
Feature activation | -9.66e-01 |
Pos logit contributions | |
nem | +1.033 |
unseen | +1.020 |
uth | +0.959 |
arah | +0.926 |
humiliated | +0.900 |
Neg logit contributions | |
Draft | -0.893 |
plin | -0.891 |
Blooming | -0.870 |
€ | -0.866 |
Por | -0.820 |
Token | ish |
Token ID | 680 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
nem | +0.661 |
unseen | +0.654 |
uth | +0.611 |
arah | +0.585 |
humiliated | +0.562 |
Neg logit contributions | |
Draft | -0.814 |
Blooming | -0.803 |
plin | -0.801 |
€ | -0.797 |
Por | -0.771 |
Token | nav |
Token ID | 28341 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
Draft | +0.165 |
plin | +0.165 |
Blooming | +0.163 |
€ | +0.163 |
Por | +0.157 |
Neg logit contributions | |
nem | -0.112 |
unseen | -0.111 |
uth | -0.102 |
arah | -0.097 |
humiliated | -0.093 |
Token | , |
Token ID | 11 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
nem | +1.876 |
unseen | +1.850 |
uth | +1.774 |
arah | +1.695 |
humiliated | +1.625 |
Neg logit contributions | |
Draft | -1.881 |
plin | -1.880 |
Blooming | -1.842 |
€ | -1.839 |
Por | -1.756 |
Token | a |
Token ID | 257 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
nem | +0.384 |
unseen | +0.381 |
uth | +0.350 |
arah | +0.336 |
humiliated | +0.333 |
Neg logit contributions | |
Draft | -0.381 |
plin | -0.378 |
€ | -0.370 |
Blooming | -0.370 |
Por | -0.356 |
Token | senior |
Token ID | 4664 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
nem | +0.332 |
unseen | +0.328 |
uth | +0.301 |
arah | +0.290 |
humiliated | +0.286 |
Neg logit contributions | |
Draft | -0.340 |
plin | -0.338 |
€ | -0.331 |
Blooming | -0.330 |
Por | -0.317 |
Token | associate |
Token ID | 11602 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
nem | +1.033 |
unseen | +1.025 |
uth | +0.922 |
arah | +0.886 |
humiliated | +0.870 |
Neg logit contributions | |
plin | -1.366 |
Draft | -1.365 |
€ | -1.339 |
Blooming | -1.338 |
Por | -1.292 |
Token | at |
Token ID | 379 |
Feature activation | -6.48e-01 |
Pos logit contributions | |
Draft | +0.455 |
plin | +0.454 |
€ | +0.448 |
Blooming | +0.448 |
Por | +0.432 |
Neg logit contributions | |
nem | -0.427 |
unseen | -0.425 |
uth | -0.390 |
arah | -0.377 |
humiliated | -0.368 |
Token | temperatures |
Token ID | 10101 |
Feature activation | -5.73e-01 |
Pos logit contributions | |
plin | +0.138 |
Draft | +0.138 |
Blooming | +0.135 |
€ | +0.135 |
Por | +0.130 |
Neg logit contributions | |
nem | -0.139 |
unseen | -0.138 |
uth | -0.126 |
arah | -0.122 |
humiliated | -0.120 |
Token | . |
Token ID | 13 |
Feature activation | -5.21e-02 |
Pos logit contributions | |
unseen | +0.432 |
nem | +0.430 |
uth | +0.394 |
arah | +0.380 |
humiliated | +0.372 |
Neg logit contributions | |
plin | -0.443 |
Draft | -0.443 |
Blooming | -0.438 |
€ | -0.433 |
Por | -0.419 |
Token | But |
Token ID | 887 |
Feature activation | -8.30e-01 |
Pos logit contributions | |
nem | +0.039 |
unseen | +0.039 |
uth | +0.036 |
arah | +0.035 |
humiliated | +0.034 |
Neg logit contributions | |
plin | -0.040 |
Draft | -0.040 |
Blooming | -0.039 |
€ | -0.039 |
Por | -0.038 |
Token | our |
Token ID | 674 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
nem | +0.634 |
unseen | +0.632 |
uth | +0.579 |
arah | +0.557 |
humiliated | +0.545 |
Neg logit contributions | |
Draft | -0.633 |
plin | -0.625 |
Blooming | -0.624 |
€ | -0.614 |
Por | -0.592 |
Token | favorite |
Token ID | 4004 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
nem | +0.380 |
unseen | +0.376 |
uth | +0.343 |
arah | +0.333 |
humiliated | +0.325 |
Neg logit contributions | |
Draft | -0.368 |
plin | -0.367 |
Blooming | -0.358 |
€ | -0.355 |
Por | -0.342 |
Token | feature |
Token ID | 3895 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
nem | +0.228 |
unseen | +0.227 |
uth | +0.206 |
arah | +0.200 |
humiliated | +0.197 |
Neg logit contributions | |
Draft | -0.223 |
plin | -0.223 |
Blooming | -0.218 |
€ | -0.217 |
Por | -0.209 |
Token | is |
Token ID | 318 |
Feature activation | -3.62e-01 |
Pos logit contributions | |
unseen | +2.066 |
nem | +2.044 |
uth | +1.856 |
arah | +1.787 |
humiliated | +1.759 |
Neg logit contributions | |
Draft | -2.076 |
plin | -2.066 |
Blooming | -2.037 |
€ | -1.998 |
Por | -1.934 |
Token | the |
Token ID | 262 |
Feature activation | +5.08e-01 |
Pos logit contributions | |
unseen | +0.272 |
nem | +0.272 |
uth | +0.250 |
arah | +0.241 |
humiliated | +0.236 |
Neg logit contributions | |
plin | -0.279 |
Draft | -0.279 |
Blooming | -0.275 |
€ | -0.273 |
Por | -0.262 |
Token | two |
Token ID | 734 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
plin | +0.388 |
Draft | +0.388 |
Blooming | +0.382 |
€ | +0.379 |
Por | +0.365 |
Neg logit contributions | |
nem | -0.388 |
unseen | -0.387 |
uth | -0.355 |
arah | -0.344 |
humiliated | -0.336 |
Token | rear |
Token ID | 8286 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
plin | +1.107 |
Draft | +1.106 |
Blooming | +1.093 |
€ | +1.089 |
Por | +1.048 |
Neg logit contributions | |
nem | -1.051 |
unseen | -1.048 |
uth | -0.962 |
arah | -0.932 |
humiliated | -0.909 |
Token | pockets |
Token ID | 16511 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
nem | +1.036 |
unseen | +1.033 |
uth | +0.936 |
arah | +0.903 |
humiliated | +0.891 |
Neg logit contributions | |
plin | -1.110 |
Draft | -1.107 |
Blooming | -1.094 |
€ | -1.079 |
Por | -1.039 |
Token | have |
Token ID | 423 |
Feature activation | -5.26e-01 |
Pos logit contributions | |
nem | +1.300 |
unseen | +1.296 |
uth | +1.189 |
arah | +1.142 |
humiliated | +1.131 |
Neg logit contributions | |
Draft | -1.369 |
plin | -1.365 |
€ | -1.338 |
Blooming | -1.336 |
Por | -1.288 |
Token | sought |
Token ID | 7194 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
nem | +0.355 |
unseen | +0.354 |
uth | +0.321 |
arah | +0.309 |
humiliated | +0.304 |
Neg logit contributions | |
Draft | -0.449 |
plin | -0.448 |
Blooming | -0.441 |
€ | -0.440 |
Por | -0.424 |
Token | to |
Token ID | 284 |
Feature activation | -7.97e-02 |
Pos logit contributions | |
plin | +0.110 |
Draft | +0.110 |
Blooming | +0.108 |
€ | +0.108 |
Por | +0.104 |
Neg logit contributions | |
nem | -0.098 |
unseen | -0.098 |
uth | -0.090 |
arah | -0.087 |
humiliated | -0.085 |
Token | turn |
Token ID | 1210 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
nem | +0.060 |
unseen | +0.060 |
uth | +0.055 |
arah | +0.053 |
humiliated | +0.052 |
Neg logit contributions | |
plin | -0.062 |
Draft | -0.062 |
Blooming | -0.061 |
€ | -0.061 |
Por | -0.058 |
Token | the |
Token ID | 262 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
unseen | +1.393 |
nem | +1.379 |
uth | +1.261 |
arah | +1.226 |
humiliated | +1.205 |
Neg logit contributions | |
plin | -1.423 |
Draft | -1.421 |
Blooming | -1.381 |
€ | -1.372 |
Por | -1.326 |
Token | tables |
Token ID | 8893 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
unseen | +0.111 |
nem | +0.111 |
uth | +0.101 |
arah | +0.098 |
humiliated | +0.096 |
Neg logit contributions | |
plin | -0.123 |
Draft | -0.122 |
Blooming | -0.120 |
€ | -0.119 |
Por | -0.116 |
Token | on |
Token ID | 319 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
unseen | +1.996 |
nem | +1.971 |
uth | +1.772 |
arah | +1.687 |
humiliated | +1.675 |
Neg logit contributions | |
plin | -2.747 |
Draft | -2.745 |
Blooming | -2.699 |
€ | -2.673 |
Por | -2.588 |
Token | Democrats |
Token ID | 4956 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
unseen | +1.019 |
nem | +1.014 |
uth | +0.922 |
arah | +0.896 |
humiliated | +0.884 |
Neg logit contributions | |
plin | -1.002 |
Draft | -1.000 |
Blooming | -0.977 |
€ | -0.972 |
Por | -0.936 |
Token | by |
Token ID | 416 |
Feature activation | +7.75e-02 |
Pos logit contributions | |
unseen | +0.794 |
nem | +0.792 |
uth | +0.718 |
arah | +0.691 |
humiliated | +0.683 |
Neg logit contributions | |
plin | -0.911 |
Draft | -0.909 |
Blooming | -0.893 |
€ | -0.888 |
Por | -0.857 |
Token | emphasizing |
Token ID | 36360 |
Feature activation | -7.23e-01 |
Pos logit contributions | |
plin | +0.062 |
Draft | +0.062 |
Blooming | +0.061 |
€ | +0.061 |
Por | +0.058 |
Neg logit contributions | |
nem | -0.057 |
unseen | -0.057 |
uth | -0.051 |
arah | -0.050 |
humiliated | -0.049 |
Token | future |
Token ID | 2003 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
unseen | +0.539 |
nem | +0.537 |
uth | +0.486 |
arah | +0.473 |
humiliated | +0.466 |
Neg logit contributions | |
plin | -0.569 |
Draft | -0.569 |
Blooming | -0.557 |
€ | -0.554 |
Por | -0.532 |
Token | how |
Token ID | 703 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
nem | +0.134 |
unseen | +0.133 |
uth | +0.122 |
arah | +0.117 |
humiliated | +0.115 |
Neg logit contributions | |
Draft | -0.156 |
plin | -0.155 |
Blooming | -0.153 |
€ | -0.153 |
Por | -0.147 |
Token | completely |
Token ID | 3190 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
plin | +0.509 |
Draft | +0.509 |
Blooming | +0.503 |
€ | +0.502 |
Por | +0.485 |
Neg logit contributions | |
nem | -0.434 |
unseen | -0.432 |
uth | -0.395 |
arah | -0.382 |
humiliated | -0.372 |
Token | or |
Token ID | 393 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
unseen | +0.929 |
nem | +0.926 |
uth | +0.825 |
humiliated | +0.800 |
arah | +0.792 |
Neg logit contributions | |
plin | -1.207 |
Draft | -1.206 |
Blooming | -1.183 |
€ | -1.175 |
Por | -1.137 |
Token | often |
Token ID | 1690 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
Draft | +0.398 |
plin | +0.395 |
Blooming | +0.390 |
€ | +0.388 |
Por | +0.374 |
Neg logit contributions | |
unseen | -0.422 |
nem | -0.422 |
uth | -0.387 |
arah | -0.375 |
humiliated | -0.370 |
Token | they |
Token ID | 484 |
Feature activation | -7.91e-01 |
Pos logit contributions | |
nem | +0.153 |
unseen | +0.153 |
uth | +0.137 |
humiliated | +0.131 |
arah | +0.131 |
Neg logit contributions | |
Draft | -0.202 |
plin | -0.202 |
Blooming | -0.199 |
€ | -0.197 |
Por | -0.191 |
Token | cross |
Token ID | 3272 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
nem | +0.591 |
unseen | +0.587 |
uth | +0.537 |
humiliated | +0.519 |
arah | +0.514 |
Neg logit contributions | |
plin | -0.623 |
Draft | -0.623 |
Blooming | -0.604 |
€ | -0.603 |
Por | -0.582 |
Token | - |
Token ID | 12 |
Feature activation | -8.25e-01 |
Pos logit contributions | |
unseen | +2.231 |
nem | +2.224 |
uth | +2.048 |
arah | +1.956 |
humiliated | +1.922 |
Neg logit contributions | |
Draft | -2.774 |
plin | -2.773 |
Blooming | -2.747 |
€ | -2.714 |
Por | -2.639 |
Token | dress |
Token ID | 49380 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
nem | +0.589 |
unseen | +0.587 |
uth | +0.542 |
arah | +0.525 |
humiliated | +0.510 |
Neg logit contributions | |
plin | -0.665 |
Draft | -0.663 |
Blooming | -0.659 |
€ | -0.655 |
Por | -0.634 |
Token | , |
Token ID | 11 |
Feature activation | -6.94e-01 |
Pos logit contributions | |
nem | +0.162 |
unseen | +0.162 |
uth | +0.150 |
arah | +0.145 |
humiliated | +0.142 |
Neg logit contributions | |
Draft | -0.157 |
plin | -0.157 |
Blooming | -0.155 |
€ | -0.154 |
Por | -0.148 |
Token | but |
Token ID | 475 |
Feature activation | -4.90e-01 |
Pos logit contributions | |
nem | +0.522 |
unseen | +0.522 |
uth | +0.478 |
arah | +0.459 |
humiliated | +0.454 |
Neg logit contributions | |
Draft | -0.541 |
plin | -0.538 |
Blooming | -0.528 |
€ | -0.526 |
Por | -0.508 |
Token | are |
Token ID | 389 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
unseen | +0.376 |
nem | +0.375 |
uth | +0.341 |
arah | +0.329 |
humiliated | +0.328 |
Neg logit contributions | |
Draft | -0.376 |
plin | -0.372 |
Blooming | -0.365 |
€ | -0.364 |
Por | -0.351 |
Token | and |
Token ID | 290 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
Draft | +0.146 |
plin | +0.146 |
Blooming | +0.144 |
€ | +0.143 |
Por | +0.138 |
Neg logit contributions | |
unseen | -0.138 |
nem | -0.138 |
uth | -0.126 |
arah | -0.122 |
humiliated | -0.119 |
Token | just |
Token ID | 655 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
nem | +0.154 |
unseen | +0.154 |
uth | +0.140 |
arah | +0.135 |
humiliated | +0.134 |
Neg logit contributions | |
plin | -0.171 |
Draft | -0.171 |
Blooming | -0.169 |
€ | -0.168 |
Por | -0.161 |
Token | hoping |
Token ID | 7725 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
plin | +0.617 |
Draft | +0.617 |
Blooming | +0.608 |
€ | +0.607 |
Por | +0.584 |
Neg logit contributions | |
nem | -0.562 |
unseen | -0.561 |
uth | -0.512 |
arah | -0.496 |
humiliated | -0.487 |
Token | I |
Token ID | 314 |
Feature activation | -5.36e-01 |
Pos logit contributions | |
nem | +0.088 |
unseen | +0.088 |
uth | +0.080 |
arah | +0.078 |
humiliated | +0.076 |
Neg logit contributions | |
plin | -0.087 |
Draft | -0.087 |
Blooming | -0.085 |
€ | -0.085 |
Por | -0.082 |
Token | can |
Token ID | 460 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
unseen | +0.433 |
nem | +0.433 |
uth | +0.397 |
arah | +0.384 |
humiliated | +0.381 |
Neg logit contributions | |
plin | -0.386 |
Draft | -0.385 |
€ | -0.377 |
Blooming | -0.377 |
Por | -0.363 |
Token | maintain |
Token ID | 5529 |
Feature activation | -3.15e+00 |
Pos logit contributions | |
plin | +0.177 |
Draft | +0.177 |
€ | +0.173 |
Blooming | +0.173 |
Por | +0.167 |
Neg logit contributions | |
unseen | -0.179 |
nem | -0.179 |
uth | -0.163 |
arah | -0.158 |
humiliated | -0.155 |
Token | a |
Token ID | 257 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
unseen | +2.264 |
nem | +2.253 |
uth | +1.982 |
trusted | +1.929 |
arah | +1.911 |
Neg logit contributions | |
plin | -2.555 |
Draft | -2.550 |
€ | -2.445 |
Blooming | -2.438 |
Por | -2.335 |
Token | spot |
Token ID | 4136 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
nem | +0.117 |
unseen | +0.117 |
uth | +0.106 |
arah | +0.103 |
humiliated | +0.101 |
Neg logit contributions | |
Draft | -0.125 |
plin | -0.124 |
Blooming | -0.122 |
€ | -0.122 |
Por | -0.117 |
Token | on |
Token ID | 319 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Draft | +0.348 |
plin | +0.348 |
Blooming | +0.345 |
€ | +0.342 |
Por | +0.329 |
Neg logit contributions | |
nem | -0.318 |
unseen | -0.318 |
uth | -0.288 |
arah | -0.280 |
humiliated | -0.274 |
Token | the |
Token ID | 262 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
nem | +0.369 |
unseen | +0.367 |
uth | +0.334 |
arah | +0.323 |
humiliated | +0.318 |
Neg logit contributions | |
plin | -0.387 |
Draft | -0.383 |
Blooming | -0.378 |
€ | -0.377 |
Por | -0.362 |
Token | roster |
Token ID | 9354 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
plin | +0.214 |
Draft | +0.213 |
Blooming | +0.210 |
€ | +0.209 |
Por | +0.202 |
Neg logit contributions | |
nem | -0.176 |
unseen | -0.176 |
uth | -0.158 |
arah | -0.153 |
humiliated | -0.151 |