Token | political |
Token ID | 1964 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
preferring | +6.168 |
inability | +5.872 |
wanting | +5.553 |
confines | +5.272 |
choosing | +5.249 |
Neg logit contributions | |
ogether | -4.818 |
adel | -4.615 |
ilde | -4.531 |
campaigner | -4.433 |
ér | -4.372 |
Token | favor |
Token ID | 2661 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
preferring | +1.028 |
inability | +0.959 |
wanting | +0.911 |
choosing | +0.860 |
confines | +0.858 |
Neg logit contributions | |
ogether | -0.912 |
adel | -0.867 |
campaigner | -0.853 |
ilde | -0.849 |
ér | -0.818 |
Token | or |
Token ID | 393 |
Feature activation | +8.34e-01 |
Pos logit contributions | |
preferring | +0.627 |
inability | +0.580 |
wanting | +0.558 |
choosing | +0.532 |
confines | +0.529 |
Neg logit contributions | |
ogether | -0.458 |
campaigner | -0.436 |
adel | -0.436 |
ilde | -0.424 |
journalist | -0.408 |
Token | two |
Token ID | 734 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
preferring | +0.806 |
inability | +0.749 |
wanting | +0.712 |
choosing | +0.673 |
confines | +0.669 |
Neg logit contributions | |
ogether | -0.685 |
adel | -0.652 |
campaigner | -0.649 |
ilde | -0.638 |
journalist | -0.613 |
Token | with |
Token ID | 351 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
preferring | +10.161 |
inability | +9.309 |
wanting | +9.088 |
choosing | +8.547 |
confines | +8.485 |
Neg logit contributions | |
ogether | -7.783 |
adel | -7.296 |
campaigner | -7.217 |
ilde | -7.040 |
alysed | -6.900 |
Token | regard |
Token ID | 2754 |
Feature activation | +5.05e+01 |
Pos logit contributions | |
preferring | +11.629 |
inability | +10.887 |
wanting | +10.426 |
choosing | +9.866 |
forgetting | +9.371 |
Neg logit contributions | |
ogether | -10.740 |
adel | -10.252 |
campaigner | -10.001 |
ér | -9.961 |
ilde | -9.930 |
Token | to |
Token ID | 284 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
to | +24.727 |
to | +22.245 |
wanting | +21.277 |
preferring | +21.131 |
inability | +20.085 |
Neg logit contributions | |
earthqu | -31.714 |
practition | -31.154 |
exting | -30.774 |
newcom | -28.853 |
pione | -28.767 |
Token | certain |
Token ID | 1728 |
Feature activation | +5.94e+00 |
Pos logit contributions | |
preferring | +15.010 |
inability | +13.889 |
wanting | +13.682 |
choosing | +13.088 |
forgetting | +12.417 |
Neg logit contributions | |
ogether | -10.792 |
ilde | -10.217 |
adel | -10.156 |
ér | -10.040 |
alysed | -9.780 |
Token | issues |
Token ID | 2428 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
preferring | +5.719 |
inability | +5.395 |
wanting | +5.125 |
choosing | +4.873 |
confines | +4.840 |
Neg logit contributions | |
ogether | -4.703 |
adel | -4.491 |
ilde | -4.394 |
campaigner | -4.372 |
ér | -4.224 |
Token | , |
Token ID | 11 |
Feature activation | -4.85e+00 |
Pos logit contributions | |
preferring | +10.011 |
inability | +8.913 |
wanting | +8.809 |
choosing | +8.379 |
confines | +7.983 |
Neg logit contributions | |
ogether | -8.889 |
adel | -8.304 |
campaigner | -8.226 |
ilde | -8.154 |
alysed | -7.903 |
Token | to |
Token ID | 284 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ogether | +3.557 |
campaigner | +3.434 |
adel | +3.409 |
ilde | +3.297 |
journalist | +3.296 |
Neg logit contributions | |
preferring | -4.883 |
inability | -4.571 |
wanting | -4.343 |
confines | -4.147 |
choosing | -4.111 |
Token | , |
Token ID | 11 |
Feature activation | -8.37e+00 |
Pos logit contributions | |
preferring | +7.738 |
inability | +7.121 |
wanting | +7.039 |
choosing | +6.586 |
forgetting | +6.387 |
Neg logit contributions | |
ogether | -6.655 |
adel | -6.313 |
ilde | -6.225 |
campaigner | -6.191 |
alysed | -5.859 |
Token | Doug |
Token ID | 15115 |
Feature activation | -3.50e+00 |
Pos logit contributions | |
ogether | +6.533 |
campaigner | +6.484 |
adel | +6.347 |
journalist | +6.335 |
ilde | +6.196 |
Neg logit contributions | |
preferring | -7.675 |
inability | -7.165 |
wanting | -6.670 |
confines | -6.479 |
choosing | -6.321 |
Token | went |
Token ID | 1816 |
Feature activation | +7.54e+00 |
Pos logit contributions | |
ogether | +2.810 |
campaigner | +2.714 |
adel | +2.714 |
ilde | +2.644 |
journalist | +2.576 |
Neg logit contributions | |
preferring | -3.385 |
inability | -3.134 |
wanting | -2.973 |
choosing | -2.823 |
confines | -2.810 |
Token | so |
Token ID | 523 |
Feature activation | +3.54e+00 |
Pos logit contributions | |
preferring | +7.533 |
inability | +7.051 |
wanting | +6.924 |
choosing | +6.457 |
forgetting | +6.330 |
Neg logit contributions | |
ogether | -5.483 |
adel | -5.152 |
campaigner | -5.123 |
ilde | -5.077 |
alysed | -4.910 |
Token | far |
Token ID | 1290 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
preferring | +3.749 |
inability | +3.511 |
wanting | +3.436 |
choosing | +3.215 |
forgetting | +3.185 |
Neg logit contributions | |
ogether | -2.484 |
adel | -2.366 |
campaigner | -2.316 |
ilde | -2.279 |
ér | -2.189 |
Token | as |
Token ID | 355 |
Feature activation | +4.90e+01 |
Pos logit contributions | |
preferring | +11.452 |
inability | +10.681 |
wanting | +10.445 |
choosing | +9.894 |
forgetting | +9.630 |
Neg logit contributions | |
ogether | -6.788 |
adel | -6.428 |
campaigner | -6.353 |
ilde | -6.262 |
emed | -5.962 |
Token | to |
Token ID | 284 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
preferring | +29.219 |
wanting | +28.099 |
to | +27.281 |
refusing | +26.525 |
to | +26.508 |
Neg logit contributions | |
ogether | -22.141 |
ilde | -19.535 |
alysed | -19.175 |
isan | -19.039 |
adel | -18.438 |
Token | suggest |
Token ID | 1950 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
preferring | +9.995 |
inability | +9.282 |
wanting | +9.075 |
choosing | +8.554 |
confines | +8.410 |
Neg logit contributions | |
ogether | -8.240 |
ilde | -7.506 |
adel | -7.476 |
campaigner | -7.406 |
alysed | -7.362 |
Token | that |
Token ID | 326 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
preferring | +14.591 |
wanting | +13.411 |
inability | +13.335 |
choosing | +12.660 |
forgetting | +12.293 |
Neg logit contributions | |
ogether | -12.271 |
adel | -11.359 |
ilde | -11.200 |
campaigner | -11.176 |
alysed | -10.785 |
Token | the |
Token ID | 262 |
Feature activation | +9.30e+00 |
Pos logit contributions | |
ogether | +0.199 |
adel | +0.190 |
campaigner | +0.190 |
ilde | +0.184 |
journalist | +0.177 |
Neg logit contributions | |
preferring | -0.282 |
inability | -0.263 |
wanting | -0.251 |
choosing | -0.240 |
confines | -0.237 |
Token | Mayor |
Token ID | 10106 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
preferring | +9.353 |
inability | +9.013 |
wanting | +8.493 |
confines | +8.074 |
choosing | +8.067 |
Neg logit contributions | |
ogether | -6.465 |
adel | -6.229 |
ilde | -6.035 |
campaigner | -5.778 |
alysed | -5.722 |
Token | He |
Token ID | 679 |
Feature activation | +7.04e+00 |
Pos logit contributions | |
preferring | +1.180 |
inability | +1.091 |
wanting | +1.047 |
confines | +0.989 |
choosing | +0.988 |
Neg logit contributions | |
ogether | -0.975 |
campaigner | -0.945 |
adel | -0.935 |
ilde | -0.908 |
journalist | -0.878 |
Token | even |
Token ID | 772 |
Feature activation | +9.29e+00 |
Pos logit contributions | |
preferring | +6.776 |
inability | +6.213 |
wanting | +6.048 |
confines | +5.766 |
choosing | +5.727 |
Neg logit contributions | |
ogether | -5.479 |
campaigner | -5.223 |
adel | -5.139 |
ilde | -5.044 |
ér | -4.898 |
Token | went |
Token ID | 1816 |
Feature activation | +7.85e+00 |
Pos logit contributions | |
preferring | +8.594 |
inability | +7.737 |
wanting | +7.632 |
confines | +7.240 |
choosing | +7.214 |
Neg logit contributions | |
ogether | -7.639 |
adel | -7.096 |
campaigner | -7.073 |
ilde | -6.940 |
isan | -6.903 |
Token | so |
Token ID | 523 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
preferring | +7.552 |
inability | +7.000 |
wanting | +6.967 |
choosing | +6.412 |
forgetting | +6.310 |
Neg logit contributions | |
ogether | -5.919 |
campaigner | -5.623 |
ilde | -5.546 |
adel | -5.491 |
ér | -5.362 |
Token | far |
Token ID | 1290 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
preferring | +3.729 |
inability | +3.464 |
wanting | +3.404 |
choosing | +3.184 |
confines | +3.138 |
Neg logit contributions | |
ogether | -2.492 |
adel | -2.372 |
campaigner | -2.354 |
ilde | -2.312 |
ér | -2.240 |
Token | as |
Token ID | 355 |
Feature activation | +4.83e+01 |
Pos logit contributions | |
preferring | +13.991 |
wanting | +12.700 |
inability | +12.688 |
choosing | +11.951 |
forgetting | +11.563 |
Neg logit contributions | |
ogether | -9.377 |
campaigner | -8.917 |
adel | -8.771 |
ilde | -8.710 |
emed | -8.527 |
Token | to |
Token ID | 284 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
preferring | +30.146 |
wanting | +28.212 |
choosing | +27.244 |
to | +26.915 |
to | +26.060 |
Neg logit contributions | |
ogether | -20.841 |
isan | -18.670 |
alysed | -18.408 |
ilde | -18.194 |
campaigner | -18.148 |
Token | announce |
Token ID | 5453 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
preferring | +10.417 |
inability | +9.505 |
wanting | +9.331 |
choosing | +8.916 |
confines | +8.709 |
Neg logit contributions | |
ogether | -8.163 |
ilde | -7.540 |
campaigner | -7.445 |
adel | -7.411 |
isan | -7.369 |
Token | inn |
Token ID | 3527 |
Feature activation | -3.82e+00 |
Pos logit contributions | |
preferring | +15.128 |
inability | +14.183 |
wanting | +13.902 |
choosing | +12.905 |
confines | +12.474 |
Neg logit contributions | |
ogether | -12.045 |
campaigner | -11.525 |
adel | -11.417 |
ilde | -11.258 |
alysed | -10.882 |
Token | ew |
Token ID | 413 |
Feature activation | +2.69e+00 |
Pos logit contributions | |
ogether | +2.766 |
adel | +2.678 |
campaigner | +2.656 |
ilde | +2.580 |
journalist | +2.511 |
Neg logit contributions | |
preferring | -3.975 |
inability | -3.702 |
wanting | -3.532 |
choosing | -3.375 |
confines | -3.349 |
Token | sp |
Token ID | 2777 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
preferring | +2.952 |
inability | +2.776 |
wanting | +2.657 |
choosing | +2.541 |
confines | +2.533 |
Neg logit contributions | |
ogether | -1.764 |
campaigner | -1.736 |
adel | -1.698 |
ilde | -1.619 |
journalist | -1.586 |
Token | saw |
Token ID | 43439 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
preferring | +0.584 |
inability | +0.541 |
wanting | +0.515 |
choosing | +0.489 |
confines | +0.485 |
Neg logit contributions | |
ogether | -0.462 |
campaigner | -0.447 |
adel | -0.444 |
ilde | -0.433 |
journalist | -0.421 |
Token | what |
Token ID | 644 |
Feature activation | -6.52e+00 |
Pos logit contributions | |
ogether | +2.194 |
adel | +2.114 |
campaigner | +2.111 |
ilde | +2.052 |
journalist | +1.999 |
Neg logit contributions | |
preferring | -2.764 |
inability | -2.562 |
wanting | -2.437 |
choosing | -2.315 |
confines | -2.309 |
Token | was |
Token ID | 373 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
ogether | +4.366 |
campaigner | +4.261 |
adel | +4.196 |
journalist | +4.095 |
ilde | +4.049 |
Neg logit contributions | |
preferring | -6.920 |
inability | -6.428 |
wanting | -6.091 |
confines | -5.882 |
choosing | -5.832 |
Token | happening |
Token ID | 5836 |
Feature activation | -4.25e+00 |
Pos logit contributions | |
preferring | +3.175 |
inability | +2.931 |
wanting | +2.860 |
choosing | +2.703 |
confines | +2.603 |
Neg logit contributions | |
ogether | -2.723 |
adel | -2.591 |
campaigner | -2.585 |
ilde | -2.516 |
ér | -2.418 |
Token | with |
Token ID | 351 |
Feature activation | +6.34e+00 |
Pos logit contributions | |
ogether | +3.819 |
adel | +3.707 |
campaigner | +3.699 |
ilde | +3.606 |
journalist | +3.544 |
Neg logit contributions | |
preferring | -3.659 |
inability | -3.369 |
wanting | -3.142 |
confines | -2.987 |
choosing | -2.967 |
Token | regard |
Token ID | 2754 |
Feature activation | +4.65e+01 |
Pos logit contributions | |
preferring | +6.032 |
inability | +5.603 |
wanting | +5.451 |
choosing | +5.113 |
forgetting | +4.936 |
Neg logit contributions | |
ogether | -5.057 |
adel | -4.848 |
campaigner | -4.818 |
ilde | -4.720 |
alysed | -4.552 |
Token | to |
Token ID | 284 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
to | +23.192 |
to | +21.323 |
wanting | +20.491 |
preferring | +20.067 |
To | +18.620 |
Neg logit contributions | |
practition | -30.459 |
earthqu | -30.066 |
exting | -29.820 |
newcom | -28.156 |
ortunately | -28.118 |
Token | the |
Token ID | 262 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
preferring | +11.401 |
inability | +10.503 |
wanting | +10.472 |
choosing | +9.797 |
forgetting | +9.416 |
Neg logit contributions | |
ogether | -8.423 |
ilde | -7.989 |
adel | -7.953 |
campaigner | -7.892 |
alysed | -7.683 |
Token | Civil |
Token ID | 7511 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
preferring | +12.926 |
inability | +12.699 |
wanting | +11.915 |
confines | +11.233 |
choosing | +11.215 |
Neg logit contributions | |
ogether | -11.274 |
adel | -10.984 |
ilde | -10.976 |
campaigner | -10.630 |
ér | -10.442 |
Token | War |
Token ID | 1810 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
preferring | +1.621 |
inability | +1.490 |
wanting | +1.379 |
choosing | +1.283 |
confines | +1.261 |
Neg logit contributions | |
ogether | -2.411 |
campaigner | -2.358 |
adel | -2.331 |
ilde | -2.273 |
ér | -2.229 |
Token | � |
Token ID | 447 |
Feature activation | -5.43e+00 |
Pos logit contributions | |
preferring | +2.867 |
inability | +2.668 |
wanting | +2.569 |
choosing | +2.434 |
confines | +2.395 |
Neg logit contributions | |
ogether | -2.105 |
adel | -2.009 |
campaigner | -2.003 |
ilde | -1.956 |
journalist | -1.872 |
Token | would |
Token ID | 561 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
campaigner | +10.361 |
ogether | +10.324 |
journalist | +10.258 |
adel | +10.086 |
correspond | +9.571 |
Neg logit contributions | |
preferring | -12.438 |
inability | -11.668 |
wanting | -10.876 |
choosing | -10.273 |
forgetting | -10.267 |
Token | not |
Token ID | 407 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
ogether | +9.743 |
campaigner | +9.581 |
adel | +9.487 |
journalist | +9.364 |
occur | +9.208 |
Neg logit contributions | |
preferring | -12.849 |
inability | -11.871 |
wanting | -11.148 |
confines | -10.719 |
choosing | -10.709 |
Token | be |
Token ID | 307 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
ogether | +10.950 |
campaigner | +10.764 |
journalist | +10.664 |
adel | +10.580 |
occur | +10.534 |
Neg logit contributions | |
preferring | -13.877 |
inability | -12.851 |
wanting | -11.783 |
choosing | -11.516 |
confines | -11.372 |
Token | remarkable |
Token ID | 11004 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
ogether | +8.894 |
adel | +8.706 |
campaigner | +8.705 |
journalist | +8.691 |
ilde | +8.317 |
Neg logit contributions | |
preferring | -9.284 |
inability | -8.620 |
confines | -7.757 |
wanting | -7.751 |
choosing | -7.508 |
Token | with |
Token ID | 351 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
ogether | +10.127 |
campaigner | +10.027 |
adel | +9.868 |
journalist | +9.808 |
ér | +9.372 |
Neg logit contributions | |
preferring | -8.646 |
inability | -7.950 |
wanting | -7.251 |
confines | -7.032 |
choosing | -6.783 |
Token | regard |
Token ID | 2754 |
Feature activation | +4.57e+01 |
Pos logit contributions | |
preferring | +1.358 |
inability | +1.265 |
wanting | +1.206 |
choosing | +1.150 |
confines | +1.139 |
Neg logit contributions | |
ogether | -1.056 |
adel | -1.021 |
campaigner | -1.008 |
ilde | -0.992 |
ér | -0.946 |
Token | to |
Token ID | 284 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
to | +23.331 |
to | +21.118 |
preferring | +20.858 |
wanting | +20.826 |
inability | +19.260 |
Neg logit contributions | |
earthqu | -31.119 |
practition | -30.617 |
exting | -30.006 |
pione | -28.500 |
� | -28.060 |
Token | common |
Token ID | 2219 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
preferring | +4.188 |
inability | +3.889 |
wanting | +3.719 |
choosing | +3.566 |
confines | +3.495 |
Neg logit contributions | |
ogether | -3.331 |
adel | -3.233 |
ilde | -3.175 |
campaigner | -3.139 |
ér | -2.999 |
Token | species |
Token ID | 4693 |
Feature activation | +4.75e+00 |
Pos logit contributions | |
ogether | +3.656 |
campaigner | +3.537 |
adel | +3.504 |
ilde | +3.414 |
journalist | +3.391 |
Neg logit contributions | |
preferring | -3.871 |
inability | -3.549 |
wanting | -3.368 |
choosing | -3.177 |
confines | -3.160 |
Token | , |
Token ID | 11 |
Feature activation | -9.42e+00 |
Pos logit contributions | |
preferring | +4.737 |
inability | +4.373 |
wanting | +4.176 |
choosing | +3.968 |
confines | +3.902 |
Neg logit contributions | |
ogether | -3.727 |
adel | -3.605 |
ilde | -3.562 |
campaigner | -3.510 |
ér | -3.351 |
Token | wildlife |
Token ID | 15599 |
Feature activation | -5.71e+00 |
Pos logit contributions | |
ogether | +7.631 |
campaigner | +7.564 |
journalist | +7.364 |
adel | +7.283 |
ilde | +7.052 |
Neg logit contributions | |
preferring | -8.116 |
inability | -7.517 |
wanting | -7.104 |
confines | -6.786 |
choosing | -6.608 |
Token | some |
Token ID | 617 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
preferring | +0.946 |
inability | +0.885 |
wanting | +0.853 |
choosing | +0.813 |
confines | +0.812 |
Neg logit contributions | |
ogether | -0.635 |
campaigner | -0.608 |
adel | -0.602 |
ilde | -0.581 |
ér | -0.558 |
Token | rough |
Token ID | 5210 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
preferring | +0.403 |
inability | +0.375 |
wanting | +0.358 |
choosing | +0.339 |
confines | +0.338 |
Neg logit contributions | |
ogether | -0.329 |
adel | -0.320 |
campaigner | -0.319 |
ilde | -0.310 |
ér | -0.299 |
Token | edges |
Token ID | 13015 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
preferring | +0.773 |
inability | +0.674 |
wanting | +0.616 |
confines | +0.561 |
choosing | +0.552 |
Neg logit contributions | |
ogether | -1.709 |
campaigner | -1.674 |
adel | -1.667 |
ilde | -1.636 |
journalist | -1.610 |
Token | that |
Token ID | 326 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
preferring | +4.969 |
inability | +4.241 |
wanting | +4.090 |
choosing | +3.694 |
forgetting | +3.242 |
Neg logit contributions | |
earthqu | -12.989 |
ogether | -12.952 |
campaigner | -12.516 |
escription | -12.510 |
adel | -12.508 |
Token | you |
Token ID | 345 |
Feature activation | +6.65e+00 |
Pos logit contributions | |
ogether | +1.141 |
campaigner | +1.087 |
adel | +1.085 |
ilde | +1.044 |
journalist | +1.006 |
Neg logit contributions | |
preferring | -2.080 |
inability | -1.952 |
wanting | -1.874 |
choosing | -1.794 |
confines | -1.783 |
Token | have |
Token ID | 423 |
Feature activation | +4.47e+01 |
Pos logit contributions | |
preferring | +6.170 |
inability | +5.867 |
wanting | +5.670 |
choosing | +5.252 |
confines | +5.136 |
Neg logit contributions | |
ogether | -5.495 |
earthqu | -5.385 |
campaigner | -5.149 |
escription | -5.085 |
adel | -5.057 |
Token | to |
Token ID | 284 |
Feature activation | +2.28e+00 |
Pos logit contributions | |
to | +20.680 |
to | +19.355 |
wanting | +17.273 |
To | +16.808 |
preferring | +16.021 |
Neg logit contributions | |
practition | -40.358 |
earthqu | -39.326 |
exting | -38.478 |
pione | -37.306 |
� | -37.170 |
Token | be |
Token ID | 307 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
preferring | +2.562 |
inability | +2.400 |
wanting | +2.333 |
choosing | +2.219 |
confines | +2.192 |
Neg logit contributions | |
ogether | -1.518 |
campaigner | -1.418 |
adel | -1.376 |
ilde | -1.341 |
earthqu | -1.313 |
Token | aware |
Token ID | 3910 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ogether | +5.781 |
adel | +5.636 |
campaigner | +5.518 |
ilde | +5.270 |
journalist | +5.200 |
Neg logit contributions | |
preferring | -14.107 |
inability | -13.470 |
wanting | -12.711 |
confines | -12.405 |
choosing | -12.187 |
Token | of |
Token ID | 286 |
Feature activation | +3.33e+00 |
Pos logit contributions | |
preferring | +1.365 |
inability | +1.247 |
wanting | +1.209 |
choosing | +1.126 |
confines | +1.113 |
Neg logit contributions | |
ogether | -1.468 |
campaigner | -1.406 |
adel | -1.388 |
ilde | -1.355 |
earthqu | -1.319 |
Token | . |
Token ID | 13 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
preferring | +3.403 |
inability | +3.151 |
wanting | +3.063 |
choosing | +2.918 |
confines | +2.852 |
Neg logit contributions | |
ogether | -2.464 |
campaigner | -2.372 |
adel | -2.310 |
earthqu | -2.271 |
ilde | -2.257 |
Token | look |
Token ID | 804 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
preferring | +4.026 |
inability | +3.756 |
wanting | +3.663 |
choosing | +3.438 |
confines | +3.391 |
Neg logit contributions | |
ogether | -3.000 |
campaigner | -2.816 |
adel | -2.798 |
ilde | -2.716 |
isan | -2.615 |
Token | more |
Token ID | 517 |
Feature activation | -6.98e+00 |
Pos logit contributions | |
ogether | +1.597 |
campaigner | +1.531 |
adel | +1.530 |
ilde | +1.480 |
journalist | +1.438 |
Neg logit contributions | |
preferring | -2.476 |
inability | -2.313 |
wanting | -2.208 |
choosing | -2.109 |
confines | -2.101 |
Token | white |
Token ID | 2330 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
ogether | +5.530 |
campaigner | +5.367 |
adel | +5.339 |
journalist | +5.230 |
ilde | +5.201 |
Neg logit contributions | |
preferring | -6.497 |
inability | -6.053 |
wanting | -5.624 |
choosing | -5.403 |
confines | -5.379 |
Token | people |
Token ID | 661 |
Feature activation | +5.57e+00 |
Pos logit contributions | |
ogether | +7.632 |
adel | +7.456 |
campaigner | +7.306 |
journalist | +7.229 |
ilde | +7.147 |
Neg logit contributions | |
preferring | -10.912 |
inability | -10.235 |
wanting | -9.409 |
choosing | -9.187 |
confines | -9.153 |
Token | are |
Token ID | 389 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
preferring | +5.459 |
inability | +4.996 |
wanting | +4.950 |
choosing | +4.601 |
confines | +4.494 |
Neg logit contributions | |
ogether | -4.424 |
campaigner | -4.147 |
adel | -4.134 |
ilde | -4.059 |
alysed | -3.893 |
Token | going |
Token ID | 1016 |
Feature activation | +4.45e+01 |
Pos logit contributions | |
preferring | +10.832 |
wanting | +9.940 |
inability | +9.275 |
choosing | +9.090 |
forgetting | +8.592 |
Neg logit contributions | |
ogether | -14.720 |
adel | -14.077 |
ilde | -13.889 |
campaigner | -13.755 |
isan | -13.416 |
Token | to |
Token ID | 284 |
Feature activation | +4.81e+00 |
Pos logit contributions | |
to | +22.814 |
wanting | +21.453 |
to | +21.391 |
preferring | +19.887 |
inability | +18.840 |
Neg logit contributions | |
practition | -27.528 |
earthqu | -27.397 |
exting | -26.319 |
newcom | -25.616 |
carbohyd | -25.266 |
Token | treat |
Token ID | 2190 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
preferring | +5.438 |
inability | +5.068 |
wanting | +4.978 |
choosing | +4.666 |
confines | +4.634 |
Neg logit contributions | |
ogether | -3.101 |
adel | -2.882 |
campaigner | -2.867 |
ilde | -2.841 |
alysed | -2.713 |
Token | you |
Token ID | 345 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
ogether | +5.276 |
ilde | +4.874 |
campaigner | +4.871 |
adel | +4.868 |
journalist | +4.806 |
Neg logit contributions | |
preferring | -13.177 |
inability | -12.486 |
wanting | -11.683 |
confines | -11.630 |
choosing | -11.439 |
Token | more |
Token ID | 517 |
Feature activation | -4.09e+00 |
Pos logit contributions | |
ogether | +0.472 |
adel | +0.453 |
campaigner | +0.452 |
ilde | +0.438 |
journalist | +0.421 |
Neg logit contributions | |
preferring | -0.722 |
inability | -0.672 |
wanting | -0.646 |
choosing | -0.613 |
confines | -0.609 |
Token | white |
Token ID | 2330 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
ogether | +3.470 |
campaigner | +3.352 |
adel | +3.347 |
ilde | +3.259 |
journalist | +3.213 |
Neg logit contributions | |
preferring | -3.733 |
inability | -3.456 |
wanting | -3.248 |
choosing | -3.083 |
confines | -3.073 |
Token | are |
Token ID | 389 |
Feature activation | +6.93e+00 |
Pos logit contributions | |
preferring | +8.276 |
inability | +7.563 |
wanting | +7.364 |
choosing | +7.044 |
confines | +6.757 |
Neg logit contributions | |
ogether | -6.370 |
adel | -6.007 |
ilde | -5.911 |
campaigner | -5.716 |
earthqu | -5.657 |
Token | forced |
Token ID | 4137 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
preferring | +6.412 |
inability | +5.744 |
wanting | +5.625 |
choosing | +5.431 |
forgetting | +5.197 |
Neg logit contributions | |
ogether | -6.049 |
adel | -5.857 |
ilde | -5.651 |
campaigner | -5.551 |
ér | -5.412 |
Token | by |
Token ID | 416 |
Feature activation | +8.61e+00 |
Pos logit contributions | |
preferring | +15.850 |
inability | +14.399 |
wanting | +14.183 |
choosing | +13.829 |
to | +13.126 |
Neg logit contributions | |
ogether | -12.763 |
ilde | -12.437 |
adel | -12.394 |
campaigner | -11.867 |
emed | -11.495 |
Token | government |
Token ID | 1230 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
preferring | +8.163 |
inability | +7.765 |
wanting | +7.352 |
choosing | +7.053 |
confines | +6.846 |
Neg logit contributions | |
ogether | -6.930 |
adel | -6.643 |
ilde | -6.336 |
campaigner | -6.185 |
ér | -6.077 |
Token | department |
Token ID | 5011 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
preferring | +20.766 |
inability | +19.505 |
wanting | +19.262 |
choosing | +18.216 |
confines | +17.685 |
Neg logit contributions | |
ogether | -17.225 |
adel | -16.225 |
ilde | -15.509 |
earthqu | -15.401 |
quished | -14.922 |
Token | clients |
Token ID | 7534 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
preferring | +17.018 |
wanting | +15.428 |
inability | +15.336 |
choosing | +14.434 |
confines | +13.926 |
Neg logit contributions | |
ogether | -13.679 |
adel | -13.078 |
ilde | -13.053 |
campaigner | -12.977 |
quished | -12.299 |
Token | to |
Token ID | 284 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
preferring | +28.533 |
wanting | +26.762 |
inability | +25.589 |
to | +25.160 |
choosing | +24.682 |
Neg logit contributions | |
ogether | -19.898 |
ilde | -18.686 |
adel | -18.486 |
earthqu | -18.409 |
izoph | -17.761 |
Token | build |
Token ID | 1382 |
Feature activation | -8.44e+00 |
Pos logit contributions | |
preferring | +4.251 |
inability | +3.899 |
wanting | +3.736 |
choosing | +3.611 |
confines | +3.525 |
Neg logit contributions | |
ogether | -3.427 |
adel | -3.251 |
ilde | -3.176 |
campaigner | -3.168 |
ér | -3.010 |
Token | websites |
Token ID | 9293 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
ogether | +6.687 |
campaigner | +6.633 |
adel | +6.578 |
ilde | +6.368 |
journalist | +6.296 |
Neg logit contributions | |
preferring | -7.527 |
inability | -7.000 |
wanting | -6.578 |
confines | -6.277 |
choosing | -6.202 |
Token | for |
Token ID | 329 |
Feature activation | +4.35e+00 |
Pos logit contributions | |
preferring | +1.623 |
inability | +1.486 |
wanting | +1.431 |
choosing | +1.354 |
confines | +1.333 |
Neg logit contributions | |
ogether | -1.358 |
adel | -1.300 |
campaigner | -1.298 |
ilde | -1.271 |
journalist | -1.223 |
Token | IE |
Token ID | 28157 |
Feature activation | +4.91e+00 |
Pos logit contributions | |
preferring | +4.235 |
inability | +3.922 |
wanting | +3.762 |
choosing | +3.582 |
confines | +3.498 |
Neg logit contributions | |
ogether | -3.530 |
adel | -3.373 |
campaigner | -3.298 |
ilde | -3.281 |
ér | -3.168 |
Token | One |
Token ID | 1881 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
ogether | +0.581 |
campaigner | +0.560 |
adel | +0.560 |
ilde | +0.544 |
journalist | +0.530 |
Neg logit contributions | |
preferring | -0.687 |
inability | -0.636 |
wanting | -0.605 |
choosing | -0.573 |
confines | -0.571 |
Token | aim |
Token ID | 4031 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
ogether | +2.599 |
campaigner | +2.546 |
adel | +2.505 |
ilde | +2.443 |
journalist | +2.427 |
Neg logit contributions | |
preferring | -3.045 |
inability | -2.806 |
wanting | -2.670 |
confines | -2.533 |
choosing | -2.526 |
Token | of |
Token ID | 286 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
ogether | +1.716 |
adel | +1.653 |
campaigner | +1.653 |
ilde | +1.603 |
journalist | +1.562 |
Neg logit contributions | |
preferring | -2.234 |
inability | -2.074 |
wanting | -1.973 |
choosing | -1.875 |
confines | -1.867 |
Token | the |
Token ID | 262 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
preferring | +2.745 |
inability | +2.547 |
wanting | +2.443 |
choosing | +2.333 |
confines | +2.284 |
Neg logit contributions | |
ogether | -2.124 |
adel | -2.073 |
campaigner | -2.039 |
ilde | -1.994 |
journalist | -1.919 |
Token | contest |
Token ID | 8414 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
preferring | +1.674 |
inability | +1.569 |
wanting | +1.493 |
choosing | +1.425 |
confines | +1.412 |
Neg logit contributions | |
ogether | -1.243 |
adel | -1.204 |
campaigner | -1.179 |
ilde | -1.162 |
journalist | -1.111 |
Token | is |
Token ID | 318 |
Feature activation | +4.42e+01 |
Pos logit contributions | |
preferring | +5.112 |
inability | +4.787 |
wanting | +4.606 |
choosing | +4.394 |
confines | +4.368 |
Neg logit contributions | |
ogether | -3.773 |
adel | -3.642 |
campaigner | -3.588 |
ilde | -3.577 |
journalist | -3.373 |
Token | to |
Token ID | 284 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
preferring | +26.118 |
inability | +26.001 |
wanting | +25.750 |
to | +25.647 |
to | +24.450 |
Neg logit contributions | |
ogether | -20.769 |
ilde | -20.123 |
adel | -19.412 |
campaigner | -18.295 |
soever | -17.947 |
Token | find |
Token ID | 1064 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
preferring | +1.912 |
inability | +1.798 |
wanting | +1.723 |
choosing | +1.644 |
confines | +1.636 |
Neg logit contributions | |
ogether | -1.318 |
adel | -1.254 |
campaigner | -1.244 |
ilde | -1.233 |
ér | -1.171 |
Token | a |
Token ID | 257 |
Feature activation | -5.74e+00 |
Pos logit contributions | |
ogether | +0.339 |
adel | +0.326 |
campaigner | +0.326 |
ilde | +0.317 |
journalist | +0.306 |
Neg logit contributions | |
preferring | -0.429 |
inability | -0.399 |
wanting | -0.380 |
choosing | -0.361 |
confines | -0.358 |
Token | method |
Token ID | 2446 |
Feature activation | +1.88e+01 |
Pos logit contributions | |
ogether | +4.715 |
campaigner | +4.632 |
adel | +4.547 |
journalist | +4.477 |
ilde | +4.430 |
Neg logit contributions | |
preferring | -5.309 |
inability | -4.833 |
wanting | -4.597 |
confines | -4.358 |
choosing | -4.336 |
Token | that |
Token ID | 326 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
preferring | +15.564 |
wanting | +14.148 |
inability | +14.107 |
choosing | +13.209 |
to | +12.774 |
Neg logit contributions | |
ogether | -13.053 |
campaigner | -12.626 |
ilde | -12.590 |
adel | -12.555 |
isan | -11.805 |
Token | You |
Token ID | 921 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
preferring | +2.688 |
inability | +2.489 |
wanting | +2.407 |
choosing | +2.256 |
confines | +2.242 |
Neg logit contributions | |
ogether | -2.378 |
campaigner | -2.294 |
adel | -2.257 |
ilde | -2.203 |
alysed | -2.098 |
Token | even |
Token ID | 772 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
preferring | +0.351 |
inability | +0.326 |
wanting | +0.311 |
choosing | +0.294 |
confines | +0.291 |
Neg logit contributions | |
ogether | -0.299 |
campaigner | -0.288 |
adel | -0.287 |
ilde | -0.279 |
journalist | -0.270 |
Token | went |
Token ID | 1816 |
Feature activation | +6.83e+00 |
Pos logit contributions | |
preferring | +2.988 |
inability | +2.751 |
wanting | +2.656 |
choosing | +2.499 |
confines | +2.461 |
Neg logit contributions | |
ogether | -2.726 |
campaigner | -2.590 |
adel | -2.584 |
ilde | -2.526 |
isan | -2.443 |
Token | as |
Token ID | 355 |
Feature activation | -9.59e-02 |
Pos logit contributions | |
preferring | +6.718 |
inability | +6.316 |
wanting | +6.255 |
choosing | +5.776 |
forgetting | +5.630 |
Neg logit contributions | |
ogether | -4.983 |
campaigner | -4.774 |
ilde | -4.595 |
adel | -4.578 |
alysed | -4.475 |
Token | far |
Token ID | 1290 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
ogether | +0.064 |
adel | +0.060 |
campaigner | +0.060 |
ilde | +0.058 |
journalist | +0.055 |
Neg logit contributions | |
preferring | -0.107 |
inability | -0.100 |
wanting | -0.097 |
choosing | -0.092 |
confines | -0.091 |
Token | as |
Token ID | 355 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
preferring | +17.849 |
wanting | +16.398 |
inability | +16.124 |
choosing | +15.400 |
refusing | +14.615 |
Neg logit contributions | |
ogether | -12.681 |
adel | -11.448 |
ilde | -11.423 |
campaigner | -11.406 |
isan | -11.118 |
Token | to |
Token ID | 284 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
preferring | +29.798 |
wanting | +28.766 |
choosing | +27.363 |
to | +26.186 |
refusing | +25.935 |
Neg logit contributions | |
ogether | -18.931 |
alysed | -16.749 |
isan | -16.572 |
campaigner | -16.503 |
ilde | -16.069 |
Token | tell |
Token ID | 1560 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
preferring | +9.776 |
inability | +9.035 |
wanting | +8.872 |
choosing | +8.385 |
forgetting | +8.041 |
Neg logit contributions | |
ogether | -8.119 |
campaigner | -7.441 |
ilde | -7.434 |
adel | -7.390 |
alysed | -7.315 |
Token | a |
Token ID | 257 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
ogether | +1.353 |
campaigner | +1.298 |
adel | +1.298 |
ilde | +1.257 |
journalist | +1.221 |
Neg logit contributions | |
preferring | -2.015 |
inability | -1.879 |
wanting | -1.795 |
choosing | -1.712 |
confines | -1.705 |
Token | story |
Token ID | 1621 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
journalist | +7.829 |
campaigner | +7.746 |
ogether | +7.682 |
adel | +7.555 |
ilde | +7.327 |
Neg logit contributions | |
preferring | -10.012 |
inability | -9.268 |
wanting | -8.677 |
confines | -8.425 |
choosing | -8.282 |
Token | – |
Token ID | 784 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
preferring | +2.879 |
inability | +2.624 |
wanting | +2.549 |
choosing | +2.399 |
confines | +2.312 |
Neg logit contributions | |
ogether | -2.786 |
campaigner | -2.644 |
adel | -2.627 |
ilde | -2.584 |
ér | -2.482 |
Token | let |
Token ID | 1616 |
Feature activation | -6.48e+00 |
Pos logit contributions | |
preferring | +9.214 |
inability | +8.481 |
wanting | +8.275 |
choosing | +7.853 |
to | +7.782 |
Neg logit contributions | |
ogether | -7.358 |
campaigner | -7.272 |
adel | -6.981 |
ilde | -6.908 |
journalist | -6.759 |
Token | alone |
Token ID | 3436 |
Feature activation | +4.06e+00 |
Pos logit contributions | |
ogether | +5.174 |
adel | +4.907 |
campaigner | +4.897 |
ilde | +4.742 |
journalist | +4.663 |
Neg logit contributions | |
preferring | -6.260 |
inability | -5.781 |
wanting | -5.449 |
confines | -5.221 |
choosing | -5.158 |
Token | 59 |
Token ID | 7863 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
preferring | +4.101 |
inability | +3.822 |
wanting | +3.684 |
choosing | +3.506 |
confines | +3.495 |
Neg logit contributions | |
ogether | -3.033 |
adel | -2.904 |
campaigner | -2.896 |
ilde | -2.883 |
ér | -2.749 |
Token | community |
Token ID | 2055 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
preferring | +1.651 |
inability | +1.512 |
wanting | +1.442 |
choosing | +1.370 |
confines | +1.350 |
Neg logit contributions | |
ogether | -1.556 |
campaigner | -1.509 |
adel | -1.504 |
ilde | -1.475 |
journalist | -1.425 |
Token | districts |
Token ID | 12815 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
ogether | +0.342 |
adel | +0.333 |
campaigner | +0.333 |
ilde | +0.328 |
journalist | +0.318 |
Neg logit contributions | |
preferring | -0.229 |
inability | -0.207 |
wanting | -0.193 |
choosing | -0.179 |
confines | -0.178 |
Token | — |
Token ID | 960 |
Feature activation | +4.36e+01 |
Pos logit contributions | |
preferring | +12.957 |
wanting | +12.047 |
inability | +11.836 |
choosing | +11.497 |
confines | +10.862 |
Neg logit contributions | |
ogether | -7.782 |
campaigner | -7.604 |
ilde | -7.428 |
adel | -7.319 |
journalist | -7.005 |
Token | that |
Token ID | 5562 |
Feature activation | +8.69e+00 |
Pos logit contributions | |
to | +28.289 |
preferring | +25.249 |
wanting | +23.836 |
whose | +23.820 |
To | +23.776 |
Neg logit contributions | |
campaigner | -19.758 |
earthqu | -19.608 |
ilde | -18.732 |
alysed | -18.324 |
ogether | -18.239 |
Token | his |
Token ID | 465 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
preferring | +8.587 |
inability | +7.946 |
wanting | +7.799 |
choosing | +7.491 |
confines | +7.180 |
Neg logit contributions | |
ogether | -6.470 |
adel | -6.217 |
campaigner | -6.147 |
ilde | -6.060 |
alysed | -5.901 |
Token | housing |
Token ID | 5627 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
preferring | +13.618 |
inability | +13.590 |
wanting | +12.669 |
choosing | +12.017 |
confines | +11.738 |
Neg logit contributions | |
ogether | -11.446 |
adel | -11.269 |
ilde | -10.994 |
earthqu | -10.724 |
alysed | -10.645 |
Token | plan |
Token ID | 1410 |
Feature activation | +9.24e+00 |
Pos logit contributions | |
preferring | +1.436 |
inability | +1.335 |
wanting | +1.262 |
choosing | +1.194 |
confines | +1.181 |
Neg logit contributions | |
ogether | -1.511 |
adel | -1.453 |
ilde | -1.429 |
campaigner | -1.427 |
ér | -1.375 |
Token | will |
Token ID | 481 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
preferring | +8.382 |
inability | +7.871 |
wanting | +7.630 |
confines | +7.354 |
choosing | +7.266 |
Neg logit contributions | |
ogether | -7.249 |
adel | -7.023 |
campaigner | -6.847 |
ilde | -6.829 |
alysed | -6.585 |
Token | do |
Token ID | 466 |
Feature activation | -5.06e+00 |
Pos logit contributions | |
ogether | +1.786 |
campaigner | +1.726 |
adel | +1.726 |
ilde | +1.682 |
journalist | +1.642 |
Neg logit contributions | |
preferring | -1.828 |
inability | -1.683 |
wanting | -1.593 |
choosing | -1.503 |
confines | -1.495 |
Token | on |
Token ID | 319 |
Feature activation | +5.85e+00 |
Pos logit contributions | |
ogether | +3.606 |
campaigner | +3.475 |
adel | +3.460 |
ilde | +3.353 |
journalist | +3.291 |
Neg logit contributions | |
preferring | -5.253 |
inability | -4.884 |
wanting | -4.610 |
confines | -4.421 |
choosing | -4.373 |
Token | a |
Token ID | 257 |
Feature activation | -7.02e+00 |
Pos logit contributions | |
preferring | +5.656 |
inability | +5.251 |
wanting | +5.083 |
choosing | +4.890 |
confines | +4.688 |
Neg logit contributions | |
ogether | -4.527 |
adel | -4.425 |
campaigner | -4.424 |
ilde | -4.286 |
journalist | -4.143 |
Token | sewing |
Token ID | 35356 |
Feature activation | -7.98e+00 |
Pos logit contributions | |
ogether | +7.559 |
campaigner | +7.432 |
adel | +7.349 |
ilde | +7.228 |
journalist | +7.190 |
Neg logit contributions | |
preferring | -4.623 |
inability | -4.089 |
wanting | -3.708 |
confines | -3.465 |
choosing | -3.390 |
Token | machine |
Token ID | 4572 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
ogether | +6.191 |
campaigner | +6.105 |
adel | +6.052 |
journalist | +5.858 |
ilde | +5.815 |
Neg logit contributions | |
preferring | -7.478 |
inability | -6.833 |
wanting | -6.447 |
confines | -6.179 |
choosing | -6.119 |
Token | is |
Token ID | 318 |
Feature activation | +4.32e+01 |
Pos logit contributions | |
preferring | +2.341 |
inability | +2.187 |
wanting | +2.106 |
choosing | +2.003 |
confines | +1.978 |
Neg logit contributions | |
ogether | -1.708 |
adel | -1.648 |
campaigner | -1.640 |
ilde | -1.595 |
journalist | -1.539 |
Token | to |
Token ID | 284 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
preferring | +25.707 |
choosing | +25.454 |
wanting | +25.118 |
to | +24.177 |
inability | +23.934 |
Neg logit contributions | |
adel | -20.311 |
ogether | -20.158 |
campaigner | -18.804 |
earthqu | -18.784 |
ilde | -18.671 |
Token | sew |
Token ID | 34249 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
preferring | +9.290 |
inability | +8.714 |
wanting | +8.521 |
choosing | +8.147 |
confines | +7.874 |
Neg logit contributions | |
ogether | -8.525 |
adel | -8.185 |
campaigner | -8.037 |
ilde | -7.902 |
ér | -7.685 |
Token | a |
Token ID | 257 |
Feature activation | -7.35e+00 |
Pos logit contributions | |
ogether | +2.659 |
adel | +2.548 |
campaigner | +2.547 |
ilde | +2.476 |
journalist | +2.407 |
Neg logit contributions | |
preferring | -3.774 |
inability | -3.507 |
wanting | -3.331 |
confines | -3.174 |
choosing | -3.174 |
Token | straight |
Token ID | 3892 |
Feature activation | -9.20e+00 |
Pos logit contributions | |
ogether | +5.336 |
campaigner | +5.167 |
adel | +5.100 |
ilde | +5.023 |
journalist | +4.933 |
Neg logit contributions | |
preferring | -7.402 |
inability | -6.810 |
wanting | -6.446 |
confines | -6.162 |
choosing | -6.102 |
Token | seam |
Token ID | 15787 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
ogether | +8.210 |
adel | +7.938 |
campaigner | +7.918 |
ilde | +7.834 |
journalist | +7.665 |
Neg logit contributions | |
preferring | -7.598 |
inability | -6.824 |
wanting | -6.385 |
confines | -6.058 |
choosing | -5.960 |
Token | to |
Token ID | 284 |
Feature activation | +2.60e+00 |
Pos logit contributions | |
preferring | +16.786 |
inability | +15.517 |
wanting | +15.402 |
choosing | +14.301 |
to | +13.913 |
Neg logit contributions | |
ogether | -15.317 |
adel | -14.367 |
ilde | -14.109 |
campaigner | -14.049 |
isan | -13.543 |
Token | Fro |
Token ID | 9734 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
preferring | +2.532 |
inability | +2.329 |
wanting | +2.244 |
choosing | +2.129 |
confines | +2.102 |
Neg logit contributions | |
ogether | -2.097 |
adel | -2.008 |
campaigner | -2.000 |
ilde | -1.942 |
ér | -1.887 |
Token | do |
Token ID | 4598 |
Feature activation | +6.26e+00 |
Pos logit contributions | |
ogether | +0.436 |
campaigner | +0.422 |
adel | +0.415 |
ilde | +0.405 |
journalist | +0.396 |
Neg logit contributions | |
preferring | -0.573 |
inability | -0.532 |
wanting | -0.507 |
choosing | -0.483 |
confines | -0.479 |
Token | and |
Token ID | 290 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
preferring | +7.096 |
inability | +6.537 |
wanting | +6.369 |
choosing | +6.116 |
confines | +5.990 |
Neg logit contributions | |
ogether | -3.917 |
campaigner | -3.715 |
adel | -3.684 |
ilde | -3.445 |
journalist | -3.410 |
Token | his |
Token ID | 465 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
preferring | +22.468 |
wanting | +21.477 |
inability | +20.982 |
choosing | +19.513 |
forgetting | +18.825 |
Neg logit contributions | |
ogether | -18.361 |
adel | -17.491 |
earthqu | -16.476 |
ér | -16.243 |
ritten | -16.095 |
Token | desire |
Token ID | 6227 |
Feature activation | +4.32e+01 |
Pos logit contributions | |
inability | +19.988 |
preferring | +19.635 |
wanting | +18.689 |
choosing | +17.589 |
forgetting | +16.642 |
Neg logit contributions | |
ogether | -16.565 |
adel | -15.170 |
earthqu | -14.951 |
ilde | -14.852 |
escription | -14.731 |
Token | for |
Token ID | 329 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
preferring | +25.107 |
to | +24.232 |
wanting | +24.037 |
inability | +23.819 |
to | +22.845 |
Neg logit contributions | |
ogether | -20.979 |
campaigner | -19.768 |
adel | -19.529 |
ilde | -19.332 |
rame | -18.372 |
Token | the |
Token ID | 262 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
preferring | +12.131 |
inability | +11.051 |
wanting | +10.959 |
choosing | +10.389 |
forgetting | +10.137 |
Neg logit contributions | |
ogether | -10.727 |
campaigner | -10.397 |
adel | -10.352 |
ilde | -10.158 |
ér | -10.113 |
Token | Ring |
Token ID | 12569 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
preferring | +11.857 |
inability | +11.341 |
wanting | +10.677 |
choosing | +10.206 |
confines | +10.142 |
Neg logit contributions | |
ogether | -12.042 |
adel | -11.857 |
ilde | -11.589 |
ér | -11.528 |
campaigner | -11.510 |
Token | – |
Token ID | 784 |
Feature activation | +7.83e+00 |
Pos logit contributions | |
preferring | +14.905 |
wanting | +13.251 |
inability | +13.200 |
choosing | +12.516 |
confines | +12.141 |
Neg logit contributions | |
ogether | -13.165 |
campaigner | -12.825 |
adel | -12.336 |
ilde | -12.245 |
earthqu | -12.126 |
Token | bet |
Token ID | 731 |
Feature activation | -7.01e+00 |
Pos logit contributions | |
preferring | +7.374 |
inability | +6.714 |
wanting | +6.572 |
confines | +6.305 |
choosing | +6.227 |
Neg logit contributions | |
ogether | -6.274 |
campaigner | -5.935 |
adel | -5.881 |
ilde | -5.764 |
isan | -5.591 |
Token | capture |
Token ID | 8006 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
preferring | +1.292 |
inability | +1.205 |
wanting | +1.151 |
choosing | +1.096 |
confines | +1.094 |
Neg logit contributions | |
ogether | -0.983 |
adel | -0.945 |
campaigner | -0.945 |
ilde | -0.923 |
ér | -0.885 |
Token | Arts |
Token ID | 11536 |
Feature activation | -9.88e+00 |
Pos logit contributions | |
ogether | +9.971 |
adel | +9.541 |
campaigner | +9.518 |
journalist | +9.493 |
ilde | +9.132 |
Neg logit contributions | |
preferring | -11.359 |
inability | -10.278 |
wanting | -9.781 |
confines | -9.304 |
choosing | -9.261 |
Token | akh |
Token ID | 11322 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
ogether | +3.531 |
adel | +3.472 |
ilde | +3.130 |
isan | +2.966 |
ér | +2.934 |
Neg logit contributions | |
preferring | -13.718 |
inability | -12.927 |
wanting | -12.485 |
confines | -12.081 |
choosing | -12.067 |
Token | ; |
Token ID | 26 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
ogether | +3.321 |
adel | +3.205 |
campaigner | +3.174 |
ilde | +3.076 |
journalist | +3.017 |
Neg logit contributions | |
preferring | -4.824 |
inability | -4.510 |
wanting | -4.281 |
choosing | -4.083 |
confines | -4.076 |
Token |
|
Token ID | 198 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
preferring | +20.348 |
inability | +19.164 |
wanting | +18.678 |
to | +18.420 |
choosing | +17.804 |
Neg logit contributions | |
ilde | -13.906 |
ogether | -13.298 |
campaigner | -13.292 |
emed | -13.129 |
adel | -13.073 |
Token |
|
Token ID | 198 |
Feature activation | +4.30e+01 |
Pos logit contributions | |
preferring | +8.099 |
to | +7.599 |
wanting | +7.588 |
inability | +7.466 |
To | +7.013 |
Neg logit contributions | |
earthqu | -14.689 |
practition | -14.161 |
exting | -14.048 |
carbohyd | -13.875 |
newcom | -13.546 |
Token | To |
Token ID | 2514 |
Feature activation | +4.40e+00 |
Pos logit contributions | |
to | +27.109 |
To | +26.969 |
preferring | +22.623 |
inability | +21.989 |
Which | +21.576 |
Neg logit contributions | |
earthqu | -20.185 |
campaigner | -19.748 |
ilde | -18.997 |
journalist | -18.645 |
ogether | -18.449 |
Token | empty |
Token ID | 6565 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
preferring | +4.345 |
inability | +4.074 |
wanting | +3.901 |
confines | +3.728 |
choosing | +3.716 |
Neg logit contributions | |
ogether | -3.312 |
adel | -3.175 |
campaigner | -3.169 |
ilde | -3.152 |
ér | -3.021 |
Token | our |
Token ID | 674 |
Feature activation | +8.63e+00 |
Pos logit contributions | |
ogether | +4.985 |
adel | +4.788 |
campaigner | +4.759 |
ilde | +4.600 |
journalist | +4.579 |
Neg logit contributions | |
preferring | -6.511 |
inability | -6.030 |
wanting | -5.737 |
choosing | -5.473 |
confines | -5.390 |
Token | homeland |
Token ID | 23184 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
preferring | +7.520 |
inability | +7.148 |
wanting | +6.684 |
confines | +6.487 |
choosing | +6.348 |
Neg logit contributions | |
ogether | -7.258 |
adel | -7.046 |
ilde | -6.971 |
campaigner | -6.833 |
ér | -6.595 |
Token | ; |
Token ID | 26 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
preferring | +3.151 |
inability | +2.893 |
wanting | +2.804 |
choosing | +2.640 |
confines | +2.639 |
Neg logit contributions | |
ogether | -2.625 |
campaigner | -2.508 |
adel | -2.502 |
ilde | -2.478 |
ér | -2.360 |
Token | " |
Token ID | 366 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
preferring | +5.967 |
inability | +5.517 |
wanting | +5.286 |
choosing | +4.900 |
confines | +4.784 |
Neg logit contributions | |
ogether | -6.418 |
adel | -6.178 |
campaigner | -6.082 |
ilde | -6.029 |
ér | -5.824 |
Token | ISIS |
Token ID | 29322 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
preferring | +10.803 |
inability | +10.170 |
wanting | +9.779 |
to | +9.216 |
To | +9.102 |
Neg logit contributions | |
ogether | -11.226 |
campaigner | -10.545 |
adel | -10.523 |
ilde | -10.423 |
ér | -9.978 |
Token | Ur |
Token ID | 8799 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
preferring | +6.556 |
inability | +6.099 |
wanting | +5.915 |
choosing | +5.530 |
confines | +5.469 |
Neg logit contributions | |
ogether | -5.441 |
ilde | -5.096 |
adel | -5.084 |
campaigner | -4.948 |
ér | -4.863 |
Token | ges |
Token ID | 3212 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
preferring | +0.507 |
inability | +0.478 |
wanting | +0.458 |
choosing | +0.438 |
confines | +0.436 |
Neg logit contributions | |
ogether | -0.271 |
campaigner | -0.262 |
adel | -0.257 |
ilde | -0.253 |
journalist | -0.242 |
Token | Jihad |
Token ID | 35243 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
preferring | +13.188 |
inability | +12.445 |
wanting | +12.125 |
choosing | +11.367 |
to | +11.055 |
Neg logit contributions | |
ogether | -11.672 |
adel | -10.636 |
ilde | -10.526 |
ér | -10.221 |
campaigner | -10.181 |
Token | ists |
Token ID | 1023 |
Feature activation | +4.30e+01 |
Pos logit contributions | |
ogether | +2.079 |
campaigner | +1.999 |
adel | +1.999 |
ilde | +1.928 |
journalist | +1.877 |
Neg logit contributions | |
preferring | -3.206 |
inability | -2.995 |
wanting | -2.855 |
choosing | -2.729 |
confines | -2.720 |
Token | To |
Token ID | 1675 |
Feature activation | +8.57e+00 |
Pos logit contributions | |
wanting | +24.247 |
to | +23.984 |
preferring | +23.964 |
To | +23.100 |
to | +23.093 |
Neg logit contributions | |
ogether | -20.735 |
carbohyd | -19.713 |
ilde | -19.553 |
earthqu | -19.027 |
alysed | -18.284 |
Token | Attack |
Token ID | 8307 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
preferring | +7.050 |
inability | +6.473 |
wanting | +6.372 |
confines | +5.919 |
choosing | +5.918 |
Neg logit contributions | |
ogether | -7.631 |
campaigner | -7.068 |
adel | -7.049 |
ilde | -6.985 |
alysed | -6.813 |
Token | Canadians |
Token ID | 14008 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ogether | +3.904 |
campaigner | +3.810 |
adel | +3.809 |
ilde | +3.697 |
journalist | +3.649 |
Neg logit contributions | |
preferring | -4.451 |
inability | -4.108 |
wanting | -3.864 |
choosing | -3.681 |
confines | -3.657 |
Token | ", |
Token ID | 1600 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
preferring | +1.341 |
inability | +1.249 |
wanting | +1.211 |
choosing | +1.151 |
confines | +1.137 |
Neg logit contributions | |
ogether | -0.856 |
adel | -0.814 |
campaigner | -0.814 |
ilde | -0.792 |
journalist | -0.755 |
Token | with |
Token ID | 351 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
preferring | +3.482 |
inability | +3.216 |
wanting | +3.130 |
choosing | +2.988 |
forgetting | +2.912 |
Neg logit contributions | |
ogether | -2.290 |
adel | -2.170 |
campaigner | -2.141 |
ilde | -2.100 |
ér | -2.001 |
Token | of |
Token ID | 286 |
Feature activation | +7.06e+00 |
Pos logit contributions | |
preferring | +7.707 |
inability | +7.023 |
wanting | +6.710 |
choosing | +6.309 |
confines | +6.190 |
Neg logit contributions | |
ogether | -7.971 |
adel | -7.638 |
campaigner | -7.443 |
ilde | -7.304 |
journalist | -7.041 |
Token | passions |
Token ID | 30477 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
preferring | +6.842 |
inability | +6.268 |
wanting | +6.094 |
choosing | +5.804 |
forgetting | +5.615 |
Neg logit contributions | |
ogether | -5.697 |
adel | -5.548 |
ilde | -5.375 |
campaigner | -5.316 |
ér | -5.110 |
Token | and |
Token ID | 290 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
preferring | +4.017 |
inability | +3.717 |
wanting | +3.621 |
choosing | +3.450 |
confines | +3.397 |
Neg logit contributions | |
ogether | -2.303 |
adel | -2.173 |
campaigner | -2.155 |
ilde | -2.096 |
ér | -1.999 |
Token | Kant |
Token ID | 29576 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
preferring | +12.079 |
inability | +11.206 |
wanting | +10.898 |
choosing | +10.199 |
forgetting | +9.940 |
Neg logit contributions | |
ogether | -9.446 |
adel | -9.196 |
ilde | -9.100 |
campaigner | -8.747 |
ér | -8.634 |
Token | 's |
Token ID | 338 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
preferring | +9.998 |
inability | +8.925 |
wanting | +8.708 |
choosing | +8.104 |
forgetting | +7.876 |
Neg logit contributions | |
ogether | -11.675 |
campaigner | -11.325 |
adel | -11.078 |
ilde | -11.013 |
journalist | -10.751 |
Token | commitment |
Token ID | 7901 |
Feature activation | +4.28e+01 |
Pos logit contributions | |
preferring | +18.830 |
inability | +18.550 |
wanting | +17.149 |
forgetting | +15.971 |
choosing | +15.921 |
Neg logit contributions | |
ogether | -14.363 |
ilde | -13.117 |
adel | -12.883 |
earthqu | -12.771 |
ér | -12.417 |
Token | to |
Token ID | 284 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
preferring | +27.356 |
wanting | +25.361 |
inability | +25.201 |
to | +24.912 |
to | +23.835 |
Neg logit contributions | |
ogether | -19.148 |
ilde | -18.987 |
adel | -18.689 |
campaigner | -17.632 |
isan | -17.252 |
Token | the |
Token ID | 262 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
preferring | +12.472 |
inability | +11.340 |
wanting | +11.151 |
choosing | +10.594 |
forgetting | +10.316 |
Neg logit contributions | |
ogether | -9.392 |
adel | -9.032 |
ilde | -8.992 |
campaigner | -8.802 |
ér | -8.420 |
Token | univers |
Token ID | 5820 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
preferring | +14.245 |
inability | +14.114 |
wanting | +12.927 |
confines | +12.332 |
forgetting | +12.189 |
Neg logit contributions | |
ogether | -11.156 |
adel | -11.033 |
ilde | -10.678 |
campaigner | -10.447 |
earthqu | -10.369 |
Token | ality |
Token ID | 1483 |
Feature activation | +9.71e+00 |
Pos logit contributions | |
preferring | +0.257 |
inability | +0.239 |
wanting | +0.228 |
choosing | +0.216 |
confines | +0.216 |
Neg logit contributions | |
ogether | -0.210 |
campaigner | -0.205 |
adel | -0.203 |
ilde | -0.198 |
journalist | -0.193 |
Token | of |
Token ID | 286 |
Feature activation | +2.58e+00 |
Pos logit contributions | |
preferring | +8.122 |
inability | +7.494 |
wanting | +7.102 |
confines | +6.627 |
choosing | +6.622 |
Neg logit contributions | |
ogether | -8.610 |
adel | -8.232 |
ilde | -8.089 |
campaigner | -8.052 |
isan | -7.685 |
Token | loans |
Token ID | 10021 |
Feature activation | +7.52e+00 |
Pos logit contributions | |
preferring | +2.285 |
inability | +2.092 |
wanting | +1.982 |
choosing | +1.875 |
confines | +1.830 |
Neg logit contributions | |
ogether | -2.648 |
campaigner | -2.549 |
adel | -2.545 |
ilde | -2.537 |
ér | -2.410 |
Token | in |
Token ID | 287 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
preferring | +7.689 |
inability | +7.042 |
wanting | +6.913 |
choosing | +6.598 |
confines | +6.297 |
Neg logit contributions | |
ogether | -5.418 |
adel | -5.237 |
campaigner | -5.202 |
ilde | -5.121 |
journalist | -4.765 |
Token | the |
Token ID | 262 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
preferring | +13.943 |
inability | +13.399 |
wanting | +12.785 |
choosing | +12.462 |
refusing | +11.700 |
Neg logit contributions | |
ogether | -13.023 |
ilde | -12.122 |
campaigner | -12.099 |
alysed | -12.061 |
ritten | -12.056 |
Token | lead |
Token ID | 1085 |
Feature activation | +7.11e+00 |
Pos logit contributions | |
inability | +21.050 |
preferring | +19.565 |
confines | +18.578 |
wanting | +18.323 |
choosing | +18.163 |
Neg logit contributions | |
ogether | -18.504 |
ilde | -18.222 |
quished | -17.739 |
ritten | -17.601 |
emed | -17.295 |
Token | - |
Token ID | 12 |
Feature activation | +9.86e+00 |
Pos logit contributions | |
preferring | +7.862 |
inability | +7.553 |
wanting | +7.206 |
choosing | +6.923 |
confines | +6.851 |
Neg logit contributions | |
ogether | -4.275 |
adel | -4.046 |
campaigner | -3.950 |
ilde | -3.947 |
isan | -3.685 |
Token | up |
Token ID | 929 |
Feature activation | +4.27e+01 |
Pos logit contributions | |
preferring | +9.684 |
inability | +9.271 |
wanting | +8.769 |
to | +8.695 |
choosing | +8.548 |
Neg logit contributions | |
ogether | -6.692 |
adel | -6.500 |
campaigner | -6.441 |
ilde | -6.260 |
isan | -5.956 |
Token | to |
Token ID | 284 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
to | +21.789 |
to | +19.684 |
preferring | +18.403 |
wanting | +18.166 |
inability | +17.835 |
Neg logit contributions | |
exting | -28.231 |
earthqu | -28.078 |
practition | -27.670 |
newcom | -26.577 |
carbohyd | -26.368 |
Token | the |
Token ID | 262 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
preferring | +9.265 |
inability | +8.814 |
wanting | +8.327 |
choosing | +8.101 |
forgetting | +7.620 |
Neg logit contributions | |
ogether | -9.206 |
campaigner | -9.018 |
adel | -8.769 |
ilde | -8.562 |
ritten | -8.536 |
Token | financial |
Token ID | 3176 |
Feature activation | +6.17e+00 |
Pos logit contributions | |
inability | +11.216 |
preferring | +10.848 |
wanting | +9.966 |
choosing | +9.694 |
forgetting | +9.211 |
Neg logit contributions | |
ogether | -13.767 |
ilde | -13.733 |
emed | -13.230 |
campaigner | -13.194 |
ouble | -13.194 |
Token | crisis |
Token ID | 4902 |
Feature activation | +9.64e+00 |
Pos logit contributions | |
preferring | +5.519 |
inability | +5.445 |
wanting | +4.979 |
choosing | +4.791 |
confines | +4.753 |
Neg logit contributions | |
ogether | -5.036 |
adel | -4.882 |
campaigner | -4.756 |
ilde | -4.723 |
emed | -4.590 |
Token | — |
Token ID | 960 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
preferring | +8.431 |
inability | +7.726 |
wanting | +7.470 |
choosing | +7.110 |
forgetting | +6.753 |
Neg logit contributions | |
ogether | -7.898 |
adel | -7.710 |
campaigner | -7.667 |
ilde | -7.627 |
journalist | -7.171 |
Token | for |
Token ID | 329 |
Feature activation | -7.15e+00 |
Pos logit contributions | |
preferring | +14.896 |
inability | +13.745 |
wanting | +13.428 |
choosing | +12.805 |
forgetting | +12.396 |
Neg logit contributions | |
ogether | -13.892 |
adel | -13.481 |
ilde | -13.360 |
campaigner | -12.972 |
isan | -12.491 |
Token | countries |
Token ID | 2678 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
ogether | +5.036 |
campaigner | +4.932 |
adel | +4.858 |
journalist | +4.705 |
ilde | +4.637 |
Neg logit contributions | |
preferring | -7.328 |
inability | -6.821 |
wanting | -6.484 |
confines | -6.237 |
choosing | -6.150 |
Token | in |
Token ID | 287 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
preferring | +18.298 |
wanting | +16.943 |
inability | +16.186 |
choosing | +15.728 |
refusing | +14.841 |
Neg logit contributions | |
ogether | -13.739 |
adel | -12.756 |
ilde | -12.679 |
earthqu | -11.996 |
campaigner | -11.931 |
Token | the |
Token ID | 262 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
preferring | +14.947 |
inability | +13.657 |
wanting | +13.314 |
choosing | +12.657 |
refusing | +11.804 |
Neg logit contributions | |
ogether | -13.251 |
adel | -12.611 |
ilde | -12.252 |
campaigner | -12.069 |
ratulations | -12.041 |
Token | Arab |
Token ID | 4498 |
Feature activation | +9.08e+00 |
Pos logit contributions | |
preferring | +13.380 |
inability | +12.478 |
wanting | +11.835 |
confines | +11.431 |
choosing | +11.270 |
Neg logit contributions | |
ogether | -14.474 |
ilde | -14.083 |
adel | -14.004 |
emed | -13.442 |
campaigner | -13.294 |
Token | region |
Token ID | 3814 |
Feature activation | +4.25e+01 |
Pos logit contributions | |
preferring | +7.022 |
inability | +6.378 |
wanting | +6.073 |
choosing | +5.751 |
confines | +5.661 |
Neg logit contributions | |
ogether | -8.587 |
ilde | -8.157 |
adel | -8.127 |
campaigner | -8.036 |
ér | -7.831 |
Token | to |
Token ID | 284 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
preferring | +28.574 |
wanting | +26.560 |
inability | +24.973 |
to | +24.925 |
choosing | +24.458 |
Neg logit contributions | |
ogether | -18.795 |
ilde | -18.272 |
adel | -17.032 |
ratulations | -16.850 |
ritten | -16.759 |
Token | react |
Token ID | 6324 |
Feature activation | -2.44e-01 |
Pos logit contributions | |
ogether | +1.174 |
adel | +1.125 |
campaigner | +1.120 |
ilde | +1.094 |
journalist | +1.054 |
Neg logit contributions | |
preferring | -1.631 |
inability | -1.518 |
wanting | -1.451 |
choosing | -1.383 |
confines | -1.374 |
Token | to |
Token ID | 284 |
Feature activation | -8.36e+00 |
Pos logit contributions | |
ogether | +0.248 |
adel | +0.240 |
campaigner | +0.239 |
ilde | +0.234 |
journalist | +0.229 |
Neg logit contributions | |
preferring | -0.189 |
inability | -0.170 |
wanting | -0.161 |
choosing | -0.150 |
confines | -0.147 |
Token | what |
Token ID | 644 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
ogether | +6.059 |
campaigner | +5.921 |
adel | +5.846 |
journalist | +5.696 |
ilde | +5.644 |
Neg logit contributions | |
preferring | -8.191 |
inability | -7.535 |
wanting | -7.168 |
confines | -6.921 |
choosing | -6.791 |
Token | is |
Token ID | 318 |
Feature activation | -3.93e+00 |
Pos logit contributions | |
campaigner | +10.001 |
ogether | +9.914 |
journalist | +9.693 |
adel | +9.604 |
ilde | +9.243 |
Neg logit contributions | |
preferring | -13.121 |
inability | -11.949 |
wanting | -11.416 |
forgetting | -10.762 |
confines | -10.704 |
Token | Movement |
Token ID | 15477 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
ogether | +3.937 |
adel | +3.825 |
campaigner | +3.816 |
ilde | +3.704 |
journalist | +3.643 |
Neg logit contributions | |
preferring | -4.092 |
inability | -3.764 |
wanting | -3.553 |
choosing | -3.360 |
confines | -3.339 |
Token | ( |
Token ID | 357 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
preferring | +3.507 |
inability | +3.215 |
wanting | +3.126 |
choosing | +2.958 |
confines | +2.910 |
Neg logit contributions | |
ogether | -2.708 |
campaigner | -2.599 |
adel | -2.592 |
ilde | -2.568 |
journalist | -2.432 |
Token | AK |
Token ID | 10206 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
preferring | +2.034 |
inability | +1.884 |
wanting | +1.788 |
choosing | +1.687 |
confines | +1.665 |
Neg logit contributions | |
ogether | -1.846 |
campaigner | -1.784 |
adel | -1.760 |
ilde | -1.753 |
journalist | -1.696 |
Token | ) |
Token ID | 8 |
Feature activation | +6.70e+00 |
Pos logit contributions | |
ogether | +0.017 |
campaigner | +0.016 |
adel | +0.016 |
ilde | +0.016 |
journalist | +0.015 |
Neg logit contributions | |
preferring | -0.015 |
inability | -0.014 |
wanting | -0.013 |
choosing | -0.012 |
confines | -0.012 |
Token | in |
Token ID | 287 |
Feature activation | +8.57e+00 |
Pos logit contributions | |
preferring | +6.949 |
inability | +6.356 |
wanting | +6.280 |
choosing | +5.959 |
confines | +5.748 |
Neg logit contributions | |
ogether | -4.656 |
adel | -4.509 |
ilde | -4.470 |
campaigner | -4.463 |
ér | -4.111 |
Token | relation |
Token ID | 8695 |
Feature activation | +4.25e+01 |
Pos logit contributions | |
preferring | +7.581 |
inability | +6.988 |
wanting | +6.714 |
choosing | +6.432 |
confines | +6.167 |
Neg logit contributions | |
ogether | -7.174 |
adel | -6.858 |
ilde | -6.769 |
campaigner | -6.717 |
ér | -6.456 |
Token | to |
Token ID | 284 |
Feature activation | +7.92e+00 |
Pos logit contributions | |
to | +23.029 |
preferring | +21.770 |
wanting | +21.664 |
to | +21.567 |
inability | +20.211 |
Neg logit contributions | |
earthqu | -25.405 |
exting | -23.716 |
practition | -23.661 |
carbohyd | -22.340 |
ogether | -21.988 |
Token | the |
Token ID | 262 |
Feature activation | +6.98e+00 |
Pos logit contributions | |
preferring | +7.549 |
inability | +7.025 |
wanting | +6.833 |
choosing | +6.422 |
forgetting | +6.241 |
Neg logit contributions | |
ogether | -6.233 |
adel | -5.997 |
ilde | -5.891 |
campaigner | -5.778 |
ouble | -5.576 |
Token | present |
Token ID | 1944 |
Feature activation | -2.19e-01 |
Pos logit contributions | |
preferring | +6.434 |
inability | +6.158 |
wanting | +5.770 |
choosing | +5.451 |
confines | +5.441 |
Neg logit contributions | |
ogether | -5.670 |
adel | -5.525 |
ilde | -5.433 |
campaigner | -5.308 |
ér | -5.108 |
Token | political |
Token ID | 1964 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
ogether | +0.194 |
adel | +0.188 |
campaigner | +0.186 |
ilde | +0.184 |
journalist | +0.177 |
Neg logit contributions | |
preferring | -0.196 |
inability | -0.183 |
wanting | -0.172 |
choosing | -0.162 |
confines | -0.161 |
Token | and |
Token ID | 290 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
ogether | +1.435 |
campaigner | +1.388 |
adel | +1.388 |
ilde | +1.353 |
journalist | +1.321 |
Neg logit contributions | |
preferring | -1.440 |
inability | -1.325 |
wanting | -1.253 |
choosing | -1.182 |
confines | -1.175 |
Token | empty |
Token ID | 6565 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
preferring | +4.345 |
inability | +4.074 |
wanting | +3.901 |
confines | +3.728 |
choosing | +3.716 |
Neg logit contributions | |
ogether | -3.312 |
adel | -3.175 |
campaigner | -3.169 |
ilde | -3.152 |
ér | -3.021 |
Token | our |
Token ID | 674 |
Feature activation | +8.63e+00 |
Pos logit contributions | |
ogether | +4.985 |
adel | +4.788 |
campaigner | +4.759 |
ilde | +4.600 |
journalist | +4.579 |
Neg logit contributions | |
preferring | -6.511 |
inability | -6.030 |
wanting | -5.737 |
choosing | -5.473 |
confines | -5.390 |
Token | homeland |
Token ID | 23184 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
preferring | +7.520 |
inability | +7.148 |
wanting | +6.684 |
confines | +6.487 |
choosing | +6.348 |
Neg logit contributions | |
ogether | -7.258 |
adel | -7.046 |
ilde | -6.971 |
campaigner | -6.833 |
ér | -6.595 |
Token | ; |
Token ID | 26 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
preferring | +3.151 |
inability | +2.893 |
wanting | +2.804 |
choosing | +2.640 |
confines | +2.639 |
Neg logit contributions | |
ogether | -2.625 |
campaigner | -2.508 |
adel | -2.502 |
ilde | -2.478 |
ér | -2.360 |
Token |
|
Token ID | 198 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
preferring | +15.121 |
inability | +14.111 |
wanting | +13.597 |
to | +12.949 |
choosing | +12.828 |
Neg logit contributions | |
ogether | -12.649 |
campaigner | -12.424 |
adel | -12.256 |
ilde | -12.054 |
journalist | -11.581 |
Token |
|
Token ID | 198 |
Feature activation | +4.24e+01 |
Pos logit contributions | |
preferring | +7.330 |
wanting | +6.795 |
inability | +6.772 |
to | +6.613 |
choosing | +6.167 |
Neg logit contributions | |
earthqu | -11.946 |
practition | -11.402 |
exting | -11.304 |
carbohyd | -11.178 |
newcom | -10.943 |
Token | And |
Token ID | 1870 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
To | +25.855 |
to | +24.791 |
preferring | +21.371 |
inability | +20.893 |
Which | +20.289 |
Neg logit contributions | |
campaigner | -21.689 |
ilde | -20.596 |
ogether | -20.493 |
earthqu | -20.379 |
journalist | -20.137 |
Token | to |
Token ID | 284 |
Feature activation | +2.80e+00 |
Pos logit contributions | |
preferring | +18.186 |
inability | +17.312 |
wanting | +16.851 |
to | +16.114 |
forgetting | +15.970 |
Neg logit contributions | |
ogether | -12.453 |
ilde | -12.317 |
campaigner | -12.274 |
adel | -12.226 |
ritten | -11.791 |
Token | destroy |
Token ID | 4117 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
preferring | +2.764 |
inability | +2.586 |
wanting | +2.465 |
confines | +2.347 |
choosing | +2.343 |
Neg logit contributions | |
ogether | -2.170 |
adel | -2.080 |
campaigner | -2.073 |
ilde | -2.045 |
ér | -1.967 |
Token | our |
Token ID | 674 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
ogether | +13.840 |
adel | +12.929 |
journalist | +12.744 |
campaigner | +12.743 |
ér | +12.130 |
Neg logit contributions | |
preferring | -13.055 |
inability | -11.791 |
wanting | -11.015 |
confines | -10.703 |
choosing | -10.585 |
Token | D |
Token ID | 360 |
Feature activation | -6.59e+00 |
Pos logit contributions | |
preferring | +1.435 |
inability | +1.338 |
wanting | +1.262 |
choosing | +1.197 |
confines | +1.187 |
Neg logit contributions | |
ogether | -1.352 |
adel | -1.310 |
campaigner | -1.302 |
ilde | -1.290 |
ér | -1.233 |
Token | ence |
Token ID | 594 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
ogether | +10.267 |
adel | +9.926 |
campaigner | +9.818 |
ér | +9.538 |
ilde | +9.538 |
Neg logit contributions | |
preferring | -10.389 |
inability | -9.518 |
wanting | -8.973 |
confines | -8.544 |
choosing | -8.499 |
Token | or |
Token ID | 393 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
ogether | +9.638 |
campaigner | +9.461 |
adel | +9.365 |
ilde | +9.062 |
journalist | +8.980 |
Neg logit contributions | |
preferring | -9.412 |
inability | -8.701 |
wanting | -8.048 |
confines | -7.595 |
choosing | -7.521 |
Token | not |
Token ID | 407 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
ogether | +1.696 |
campaigner | +1.639 |
adel | +1.638 |
ilde | +1.593 |
journalist | +1.555 |
Neg logit contributions | |
preferring | -1.887 |
inability | -1.742 |
wanting | -1.653 |
choosing | -1.564 |
confines | -1.557 |
Token | will |
Token ID | 481 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
ogether | +8.596 |
adel | +8.372 |
campaigner | +8.282 |
ilde | +7.976 |
journalist | +7.859 |
Neg logit contributions | |
preferring | -11.476 |
inability | -10.633 |
wanting | -9.921 |
choosing | -9.476 |
confines | -9.453 |
Token | be |
Token ID | 307 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
campaigner | +13.947 |
ogether | +13.627 |
inform | +13.460 |
adel | +13.446 |
journalist | +13.387 |
Neg logit contributions | |
preferring | -16.240 |
inability | -14.719 |
wanting | -13.735 |
forgetting | -13.198 |
confines | -13.181 |
Token | decided |
Token ID | 3066 |
Feature activation | -3.63e+01 |
Pos logit contributions | |
campaigner | +15.458 |
ilde | +15.095 |
journalist | +15.057 |
adel | +14.960 |
ogether | +14.818 |
Neg logit contributions | |
preferring | -12.428 |
inability | -11.404 |
wanting | -10.144 |
confines | -9.999 |
forgetting | -9.470 |
Token | by |
Token ID | 416 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
inform | +25.105 |
ogether | +24.335 |
campaigner | +24.332 |
journalist | +23.857 |
adel | +23.804 |
Neg logit contributions | |
preferring | -16.626 |
inability | -16.035 |
confines | -13.487 |
wanting | -13.228 |
forgetting | -12.944 |
Token | our |
Token ID | 674 |
Feature activation | -9.90e+00 |
Pos logit contributions | |
campaigner | +15.728 |
ogether | +15.715 |
adel | +15.433 |
journalist | +15.182 |
isan | +14.701 |
Neg logit contributions | |
preferring | -11.531 |
inability | -10.548 |
wanting | -9.558 |
confines | -9.448 |
forgetting | -8.904 |
Token | citizens |
Token ID | 4290 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
ogether | +8.777 |
campaigner | +8.591 |
adel | +8.443 |
journalist | +8.292 |
ilde | +8.033 |
Neg logit contributions | |
preferring | -7.967 |
inability | -7.126 |
wanting | -6.839 |
confines | -6.441 |
forgetting | -6.279 |
Token | . |
Token ID | 13 |
Feature activation | -8.51e+00 |
Pos logit contributions | |
ogether | +11.016 |
campaigner | +10.791 |
adel | +10.765 |
journalist | +10.337 |
ér | +10.246 |
Neg logit contributions | |
preferring | -9.991 |
inability | -9.291 |
wanting | -8.325 |
confines | -8.245 |
forgetting | -7.972 |
Token | � |
Token ID | 447 |
Feature activation | -5.67e+00 |
Pos logit contributions | |
ogether | +5.888 |
adel | +5.755 |
campaigner | +5.669 |
ilde | +5.547 |
journalist | +5.483 |
Neg logit contributions | |
preferring | -8.748 |
inability | -8.196 |
wanting | -7.629 |
confines | -7.353 |
choosing | -7.308 |
Token | and |
Token ID | 290 |
Feature activation | +8.05e+00 |
Pos logit contributions | |
ogether | +3.017 |
adel | +2.923 |
campaigner | +2.905 |
ilde | +2.799 |
journalist | +2.743 |
Neg logit contributions | |
preferring | -4.215 |
inability | -3.928 |
wanting | -3.721 |
confines | -3.541 |
choosing | -3.539 |
Token | will |
Token ID | 481 |
Feature activation | -6.11e+00 |
Pos logit contributions | |
preferring | +7.690 |
inability | +6.970 |
wanting | +6.946 |
choosing | +6.530 |
confines | +6.336 |
Neg logit contributions | |
ogether | -6.531 |
adel | -6.167 |
ilde | -6.122 |
campaigner | -6.052 |
ér | -5.926 |
Token | try |
Token ID | 1949 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
ogether | +4.217 |
campaigner | +4.152 |
adel | +4.116 |
journalist | +3.927 |
ilde | +3.904 |
Neg logit contributions | |
preferring | -6.337 |
inability | -5.936 |
wanting | -5.581 |
confines | -5.384 |
choosing | -5.328 |
Token | to |
Token ID | 284 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
preferring | +15.283 |
wanting | +14.413 |
inability | +14.087 |
choosing | +13.260 |
to | +12.827 |
Neg logit contributions | |
ogether | -13.643 |
campaigner | -13.049 |
ilde | -12.816 |
alysed | -12.779 |
adel | -12.749 |
Token | remain |
Token ID | 3520 |
Feature activation | -2.69e+01 |
Pos logit contributions | |
campaigner | +6.978 |
ogether | +6.896 |
adel | +6.891 |
journalist | +6.630 |
ilde | +6.447 |
Neg logit contributions | |
preferring | -10.552 |
inability | -9.839 |
wanting | -9.135 |
choosing | -8.746 |
confines | -8.709 |
Token | a |
Token ID | 257 |
Feature activation | -3.42e+01 |
Pos logit contributions | |
campaigner | +20.346 |
journalist | +19.892 |
inform | +19.240 |
adel | +19.183 |
ogether | +18.875 |
Neg logit contributions | |
preferring | -15.746 |
inability | -15.252 |
confines | -12.403 |
forgetting | -12.239 |
ses | -12.056 |
Token | part |
Token ID | 636 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
campaigner | +22.770 |
journalist | +22.499 |
inform | +20.157 |
adel | +20.003 |
ogether | +19.824 |
Neg logit contributions | |
preferring | -18.986 |
inability | -17.679 |
forgetting | -15.132 |
wanting | -14.915 |
confines | -14.822 |
Token | of |
Token ID | 286 |
Feature activation | -7.45e+00 |
Pos logit contributions | |
ogether | +12.379 |
adel | +12.369 |
campaigner | +12.280 |
isan | +12.075 |
journalist | +11.921 |
Neg logit contributions | |
preferring | -12.504 |
inability | -11.889 |
wanting | -10.566 |
confines | -10.375 |
forgetting | -10.199 |
Token | it |
Token ID | 340 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
ogether | +5.601 |
adel | +5.404 |
campaigner | +5.336 |
ilde | +5.182 |
journalist | +5.124 |
Neg logit contributions | |
preferring | -7.229 |
inability | -6.745 |
wanting | -6.278 |
confines | -6.055 |
choosing | -5.961 |
Token | , |
Token ID | 11 |
Feature activation | -5.70e+00 |
Pos logit contributions | |
ogether | +10.535 |
adel | +10.365 |
campaigner | +10.215 |
journalist | +9.906 |
ilde | +9.718 |
Neg logit contributions | |
preferring | -9.966 |
inability | -9.346 |
wanting | -8.311 |
confines | -8.075 |
forgetting | -7.885 |
Token | though |
Token ID | 996 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
ogether | +4.647 |
adel | +4.508 |
campaigner | +4.495 |
ilde | +4.333 |
journalist | +4.317 |
Neg logit contributions | |
preferring | -5.218 |
inability | -4.910 |
wanting | -4.566 |
confines | -4.406 |
choosing | -4.306 |
Token | protests |
Token ID | 8536 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
ogether | +9.053 |
campaigner | +8.898 |
adel | +8.630 |
journalist | +8.542 |
isan | +8.187 |
Neg logit contributions | |
preferring | -8.994 |
inability | -8.001 |
wanting | -7.603 |
choosing | -7.285 |
confines | -7.223 |
Token | were |
Token ID | 547 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
campaigner | +13.508 |
ogether | +13.474 |
adel | +13.044 |
occur | +12.942 |
journalist | +12.867 |
Neg logit contributions | |
preferring | -13.267 |
inability | -11.709 |
confines | -10.806 |
wanting | -10.802 |
choosing | -10.577 |
Token | being |
Token ID | 852 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
ogether | +14.473 |
campaigner | +14.430 |
journalist | +14.188 |
adel | +13.850 |
inform | +13.581 |
Neg logit contributions | |
preferring | -12.477 |
inability | -10.955 |
confines | -10.076 |
wanting | -9.905 |
choosing | -9.600 |
Token | run |
Token ID | 1057 |
Feature activation | -2.78e+01 |
Pos logit contributions | |
campaigner | +15.593 |
journalist | +15.267 |
ogether | +15.209 |
adel | +14.983 |
inform | +14.898 |
Neg logit contributions | |
preferring | -16.973 |
inability | -15.087 |
confines | -13.950 |
wanting | -13.756 |
choosing | -13.586 |
Token | and |
Token ID | 290 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
ogether | +21.837 |
adel | +20.966 |
inform | +20.662 |
campaigner | +20.429 |
journalist | +20.275 |
Neg logit contributions | |
preferring | -14.542 |
inability | -13.693 |
confines | -12.534 |
wanting | -11.559 |
choosing | -11.507 |
Token | organized |
Token ID | 8389 |
Feature activation | -3.41e+01 |
Pos logit contributions | |
campaigner | +13.431 |
ogether | +13.129 |
journalist | +13.017 |
adel | +12.876 |
alysed | +12.587 |
Neg logit contributions | |
preferring | -13.595 |
inability | -12.191 |
wanting | -11.289 |
confines | -11.070 |
choosing | -10.860 |
Token | mostly |
Token ID | 4632 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
ogether | +23.774 |
inform | +22.808 |
campaigner | +22.513 |
adel | +22.195 |
journalist | +22.042 |
Neg logit contributions | |
preferring | -16.288 |
inability | -15.211 |
confines | -13.879 |
wanting | -12.987 |
forgetting | -12.751 |
Token | by |
Token ID | 416 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
ogether | +18.151 |
campaigner | +17.923 |
journalist | +17.461 |
adel | +17.236 |
inform | +17.101 |
Neg logit contributions | |
preferring | -14.046 |
inability | -13.072 |
confines | -11.543 |
wanting | -11.369 |
forgetting | -10.757 |
Token | near |
Token ID | 1474 |
Feature activation | -7.59e+00 |
Pos logit contributions | |
ogether | +10.170 |
campaigner | +10.153 |
journalist | +9.832 |
adel | +9.700 |
isan | +9.370 |
Neg logit contributions | |
preferring | -11.176 |
inability | -10.150 |
wanting | -9.472 |
confines | -9.223 |
choosing | -9.050 |
Token | s |
Token ID | 82 |
Feature activation | -4.23e+00 |
Pos logit contributions | |
ogether | +6.282 |
campaigner | +6.015 |
adel | +5.907 |
ilde | +5.794 |
journalist | +5.735 |
Neg logit contributions | |
preferring | -6.984 |
inability | -6.338 |
wanting | -6.037 |
choosing | -5.719 |
confines | -5.712 |
Token | and |
Token ID | 290 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
ogether | +3.089 |
campaigner | +2.964 |
adel | +2.963 |
ilde | +2.868 |
journalist | +2.794 |
Neg logit contributions | |
preferring | -4.409 |
inability | -4.104 |
wanting | -3.916 |
choosing | -3.732 |
confines | -3.720 |
Token | continue |
Token ID | 2555 |
Feature activation | +9.94e+00 |
Pos logit contributions | |
campaigner | +8.771 |
ogether | +8.616 |
adel | +8.519 |
journalist | +8.499 |
ilde | +8.188 |
Neg logit contributions | |
preferring | -11.741 |
inability | -10.818 |
wanting | -10.231 |
confines | -9.746 |
forgetting | -9.739 |
Token | to |
Token ID | 284 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
preferring | +8.825 |
inability | +8.217 |
wanting | +7.946 |
choosing | +7.557 |
confines | +7.170 |
Neg logit contributions | |
ogether | -8.209 |
adel | -8.016 |
ilde | -7.761 |
campaigner | -7.535 |
ér | -7.392 |
Token | make |
Token ID | 787 |
Feature activation | -2.81e+01 |
Pos logit contributions | |
campaigner | +9.504 |
adel | +9.115 |
ogether | +9.102 |
journalist | +9.058 |
inform | +8.640 |
Neg logit contributions | |
preferring | -13.603 |
inability | -12.527 |
wanting | -11.814 |
confines | -11.387 |
forgetting | -11.350 |
Token | a |
Token ID | 257 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
journalist | +18.252 |
campaigner | +18.076 |
dign | +17.768 |
meaningful | +17.646 |
ogether | +17.290 |
Neg logit contributions | |
preferring | -18.323 |
inability | -16.233 |
confines | -15.061 |
wanting | -15.036 |
forgetting | -14.032 |
Token | sustained |
Token ID | 12605 |
Feature activation | -2.69e+01 |
Pos logit contributions | |
journalist | +18.579 |
campaigner | +18.413 |
dign | +18.153 |
meaningful | +18.084 |
credible | +17.082 |
Neg logit contributions | |
preferring | -19.687 |
inability | -17.845 |
confines | -16.943 |
wanting | -15.805 |
quirks | -15.311 |
Token | and |
Token ID | 290 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
campaigner | +17.506 |
journalist | +17.069 |
ogether | +15.838 |
inform | +15.833 |
dign | +15.814 |
Neg logit contributions | |
preferring | -18.837 |
confines | -15.788 |
inability | -15.727 |
wanting | -15.191 |
quirks | -14.975 |
Token | distinguished |
Token ID | 18876 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
dign | +22.255 |
meaningful | +21.888 |
campaigner | +20.867 |
journalist | +20.727 |
inform | +20.589 |
Neg logit contributions | |
preferring | -17.699 |
inability | -16.309 |
confines | -15.611 |
quirks | -13.913 |
forgetting | -13.540 |
Token | contribution |
Token ID | 10156 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
campaigner | +15.539 |
journalist | +14.954 |
ogether | +14.156 |
adel | +14.020 |
dign | +13.884 |
Neg logit contributions | |
preferring | -18.277 |
inability | -15.488 |
confines | -15.421 |
wanting | -15.383 |
forgetting | -14.332 |
Token | to |
Token ID | 284 |
Feature activation | -6.85e+00 |
Pos logit contributions | |
preferring | +1.103 |
inability | +0.951 |
wanting | +0.883 |
choosing | +0.801 |
confines | +0.766 |
Neg logit contributions | |
ogether | -2.459 |
adel | -2.408 |
campaigner | -2.397 |
ilde | -2.365 |
journalist | -2.306 |
Token | humanitarian |
Token ID | 15706 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
ogether | +5.626 |
campaigner | +5.499 |
adel | +5.445 |
ilde | +5.290 |
journalist | +5.251 |
Neg logit contributions | |
preferring | -6.247 |
inability | -5.769 |
wanting | -5.426 |
confines | -5.162 |
choosing | -5.104 |
Token | causes |
Token ID | 5640 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
campaigner | +8.931 |
ogether | +8.687 |
journalist | +8.530 |
adel | +8.477 |
ilde | +8.099 |
Neg logit contributions | |
preferring | -11.340 |
inability | -10.288 |
wanting | -9.902 |
confines | -9.320 |
choosing | -9.259 |
Token | 13 |
Token ID | 1511 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
preferring | +1.523 |
inability | +1.406 |
wanting | +1.343 |
choosing | +1.268 |
confines | +1.256 |
Neg logit contributions | |
ogether | -1.418 |
campaigner | -1.364 |
adel | -1.358 |
ilde | -1.324 |
journalist | -1.282 |
Token | , |
Token ID | 11 |
Feature activation | -6.93e+00 |
Pos logit contributions | |
ogether | +1.068 |
campaigner | +1.024 |
adel | +1.024 |
ilde | +0.992 |
journalist | +0.962 |
Neg logit contributions | |
preferring | -1.612 |
inability | -1.503 |
wanting | -1.437 |
choosing | -1.371 |
confines | -1.364 |
Token | to |
Token ID | 284 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
ogether | +6.627 |
adel | +6.521 |
campaigner | +6.449 |
ilde | +6.262 |
journalist | +6.259 |
Neg logit contributions | |
preferring | -5.314 |
inability | -4.920 |
wanting | -4.479 |
confines | -4.293 |
choosing | -4.192 |
Token | make |
Token ID | 787 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
campaigner | +8.578 |
ogether | +8.436 |
journalist | +8.189 |
inform | +8.159 |
adel | +8.137 |
Neg logit contributions | |
preferring | -13.284 |
inability | -12.307 |
wanting | -11.597 |
forgetting | -11.155 |
confines | -11.022 |
Token | those |
Token ID | 883 |
Feature activation | -2.76e+00 |
Pos logit contributions | |
ogether | +16.443 |
campaigner | +16.242 |
journalist | +15.840 |
inform | +15.689 |
adel | +15.634 |
Neg logit contributions | |
preferring | -16.779 |
inability | -14.678 |
wanting | -13.860 |
confines | -13.113 |
forgetting | -12.986 |
Token | votes |
Token ID | 5690 |
Feature activation | -3.32e+01 |
Pos logit contributions | |
ogether | +2.424 |
campaigner | +2.352 |
adel | +2.341 |
ilde | +2.280 |
journalist | +2.239 |
Neg logit contributions | |
preferring | -2.455 |
inability | -2.257 |
wanting | -2.129 |
choosing | -2.006 |
confines | -1.999 |
Token | official |
Token ID | 1743 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
happen | +22.857 |
occur | +22.362 |
campaigner | +22.224 |
inform | +22.191 |
ogether | +21.676 |
Neg logit contributions | |
preferring | -18.293 |
inability | -16.322 |
wanting | -14.370 |
forgetting | -14.288 |
confines | -14.076 |
Token | , |
Token ID | 11 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
ogether | +15.991 |
campaigner | +15.707 |
adel | +15.461 |
journalist | +14.898 |
ilde | +14.887 |
Neg logit contributions | |
preferring | -14.157 |
inability | -12.733 |
wanting | -11.961 |
confines | -11.038 |
forgetting | -10.907 |
Token | at |
Token ID | 379 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
adel | +15.699 |
ogether | +15.639 |
journalist | +15.615 |
campaigner | +15.590 |
inform | +15.110 |
Neg logit contributions | |
preferring | -11.017 |
inability | -10.486 |
confines | -9.206 |
wanting | -9.161 |
forgetting | -8.566 |
Token | which |
Token ID | 543 |
Feature activation | -6.68e+00 |
Pos logit contributions | |
preferring | +0.535 |
inability | +0.481 |
wanting | +0.446 |
choosing | +0.414 |
confines | +0.406 |
Neg logit contributions | |
ogether | -0.857 |
adel | -0.836 |
campaigner | -0.834 |
ilde | -0.817 |
ér | -0.799 |
Token | time |
Token ID | 640 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
ogether | +5.065 |
campaigner | +5.021 |
adel | +4.919 |
journalist | +4.802 |
ilde | +4.761 |
Neg logit contributions | |
preferring | -6.467 |
inability | -5.949 |
wanting | -5.661 |
confines | -5.397 |
choosing | -5.314 |
Token | of |
Token ID | 286 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
preferring | +13.251 |
wanting | +11.847 |
inability | +11.630 |
choosing | +10.812 |
confines | +10.423 |
Neg logit contributions | |
ogether | -14.822 |
adel | -14.176 |
ilde | -14.111 |
campaigner | -13.890 |
ér | -13.298 |
Token | ensuring |
Token ID | 13359 |
Feature activation | -8.67e+00 |
Pos logit contributions | |
ogether | +1.273 |
adel | +1.238 |
campaigner | +1.234 |
ilde | +1.214 |
journalist | +1.186 |
Neg logit contributions | |
preferring | -0.797 |
inability | -0.711 |
wanting | -0.665 |
choosing | -0.614 |
confines | -0.605 |
Token | that |
Token ID | 326 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
ogether | +7.785 |
campaigner | +7.728 |
adel | +7.554 |
journalist | +7.477 |
ilde | +7.344 |
Neg logit contributions | |
preferring | -6.960 |
inability | -6.313 |
wanting | -5.834 |
confines | -5.597 |
choosing | -5.459 |
Token | it |
Token ID | 340 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
campaigner | +11.411 |
ogether | +11.180 |
journalist | +10.984 |
adel | +10.784 |
ilde | +10.488 |
Neg logit contributions | |
preferring | -12.170 |
inability | -11.174 |
wanting | -10.314 |
confines | -9.933 |
forgetting | -9.750 |
Token | is |
Token ID | 318 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
campaigner | +11.783 |
ogether | +11.464 |
journalist | +11.239 |
adel | +11.179 |
ilde | +10.896 |
Neg logit contributions | |
preferring | -15.352 |
inability | -14.272 |
wanting | -13.044 |
forgetting | -12.591 |
choosing | -12.373 |
Token | a |
Token ID | 257 |
Feature activation | -3.28e+01 |
Pos logit contributions | |
campaigner | +15.943 |
journalist | +15.370 |
ogether | +15.119 |
inform | +14.622 |
adel | +14.478 |
Neg logit contributions | |
preferring | -14.040 |
inability | -12.722 |
confines | -11.225 |
wanting | -10.957 |
forgetting | -10.466 |
Token | success |
Token ID | 1943 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
campaigner | +22.173 |
journalist | +21.571 |
dign | +20.867 |
happen | +20.435 |
meaningful | +20.346 |
Neg logit contributions | |
preferring | -18.650 |
inability | -16.979 |
addons | -15.247 |
confines | -14.423 |
wanting | -14.218 |
Token | ." |
Token ID | 526 |
Feature activation | +4.76e-01 |
Pos logit contributions | |
campaigner | +15.206 |
ogether | +14.879 |
adel | +14.726 |
journalist | +14.539 |
ilde | +13.747 |
Neg logit contributions | |
preferring | -12.068 |
inability | -11.204 |
confines | -10.181 |
wanting | -9.776 |
forgetting | -9.375 |
Token |
|
Token ID | 198 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
preferring | +0.518 |
inability | +0.484 |
wanting | +0.463 |
choosing | +0.442 |
confines | +0.441 |
Neg logit contributions | |
ogether | -0.326 |
campaigner | -0.313 |
adel | -0.313 |
ilde | -0.302 |
journalist | -0.293 |
Token |
|
Token ID | 198 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
ogether | +1.716 |
adel | +1.658 |
campaigner | +1.652 |
ilde | +1.607 |
journalist | +1.566 |
Neg logit contributions | |
preferring | -2.368 |
inability | -2.203 |
wanting | -2.092 |
choosing | -1.994 |
confines | -1.988 |
Token | F |
Token ID | 37 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
ogether | +1.229 |
campaigner | +1.189 |
adel | +1.188 |
ilde | +1.158 |
journalist | +1.131 |
Neg logit contributions | |
preferring | -1.236 |
inability | -1.137 |
wanting | -1.075 |
choosing | -1.014 |
confines | -1.008 |
Token | results |
Token ID | 2482 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
ogether | +4.516 |
campaigner | +4.453 |
adel | +4.327 |
journalist | +4.203 |
ilde | +4.173 |
Neg logit contributions | |
preferring | -6.211 |
inability | -5.712 |
wanting | -5.502 |
confines | -5.217 |
choosing | -5.179 |
Token | are |
Token ID | 389 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
campaigner | +11.928 |
ogether | +11.717 |
journalist | +11.599 |
adel | +11.556 |
ilde | +11.000 |
Neg logit contributions | |
preferring | -11.054 |
inability | -10.228 |
wanting | -9.403 |
confines | -9.263 |
forgetting | -8.900 |
Token | due |
Token ID | 2233 |
Feature activation | -1.69e+01 |
Pos logit contributions | |
campaigner | +10.279 |
journalist | +10.142 |
ogether | +10.114 |
adel | +9.748 |
ilde | +9.479 |
Neg logit contributions | |
preferring | -9.014 |
inability | -8.367 |
wanting | -7.483 |
confines | -7.441 |
choosing | -7.197 |
Token | to |
Token ID | 284 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
ogether | +16.364 |
campaigner | +16.293 |
journalist | +16.006 |
adel | +15.849 |
isan | +15.355 |
Neg logit contributions | |
preferring | -9.613 |
inability | -8.760 |
wanting | -7.572 |
confines | -7.235 |
forgetting | -7.015 |
Token | be |
Token ID | 307 |
Feature activation | -2.62e+01 |
Pos logit contributions | |
campaigner | +14.643 |
occur | +14.201 |
journalist | +14.163 |
ogether | +13.786 |
adel | +13.649 |
Neg logit contributions | |
preferring | -19.791 |
inability | -17.777 |
wanting | -16.991 |
sacrificing | -16.387 |
forgetting | -16.376 |
Token | announced |
Token ID | 3414 |
Feature activation | -3.23e+01 |
Pos logit contributions | |
campaigner | +16.069 |
journalist | +16.069 |
inform | +15.502 |
correspond | +15.238 |
ogether | +15.090 |
Neg logit contributions | |
preferring | -19.262 |
inability | -17.828 |
confines | -15.977 |
forgetting | -15.828 |
wanting | -15.792 |
Token | on |
Token ID | 319 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
campaigner | +20.725 |
journalist | +20.682 |
inform | +20.242 |
ogether | +20.014 |
shortly | +19.835 |
Neg logit contributions | |
preferring | -18.728 |
inability | -17.263 |
confines | -14.883 |
wanting | -14.785 |
龍契士 | -14.744 |
Token | 14 |
Token ID | 1478 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
campaigner | +8.046 |
ogether | +7.992 |
journalist | +7.803 |
adel | +7.767 |
ilde | +7.262 |
Neg logit contributions | |
preferring | -12.093 |
inability | -11.227 |
wanting | -10.682 |
confines | -10.133 |
forgetting | -10.120 |
Token | May |
Token ID | 1737 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
ogether | +4.997 |
campaigner | +4.780 |
adel | +4.699 |
journalist | +4.601 |
ilde | +4.482 |
Neg logit contributions | |
preferring | -8.229 |
inability | -7.755 |
wanting | -7.277 |
confines | -6.982 |
choosing | -6.947 |
Token | after |
Token ID | 706 |
Feature activation | -9.46e+00 |
Pos logit contributions | |
ogether | +13.396 |
campaigner | +12.979 |
adel | +12.912 |
journalist | +12.671 |
ér | +12.277 |
Neg logit contributions | |
preferring | -13.774 |
inability | -13.211 |
wanting | -11.671 |
confines | -11.661 |
forgetting | -11.475 |
Token | a |
Token ID | 257 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
campaigner | +8.318 |
ogether | +8.317 |
adel | +8.048 |
journalist | +8.003 |
ilde | +7.820 |
Neg logit contributions | |
preferring | -7.559 |
inability | -6.910 |
wanting | -6.549 |
confines | -6.222 |
choosing | -6.008 |
Token | do |
Token ID | 466 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
ogether | +10.786 |
campaigner | +10.626 |
adel | +10.531 |
journalist | +10.297 |
ilde | +9.842 |
Neg logit contributions | |
preferring | -10.223 |
inability | -9.376 |
confines | -8.364 |
wanting | -8.335 |
choosing | -7.985 |
Token | more |
Token ID | 517 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
ogether | +11.955 |
adel | +11.276 |
campaigner | +11.229 |
journalist | +11.051 |
ilde | +10.446 |
Neg logit contributions | |
preferring | -13.499 |
inability | -12.375 |
confines | -11.418 |
wanting | -11.309 |
choosing | -10.877 |
Token | to |
Token ID | 284 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
ogether | +11.266 |
campaigner | +11.067 |
journalist | +10.854 |
adel | +10.784 |
ilde | +10.416 |
Neg logit contributions | |
preferring | -9.603 |
inability | -8.849 |
wanting | -7.922 |
confines | -7.696 |
choosing | -7.516 |
Token | make |
Token ID | 787 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
ogether | +9.646 |
campaigner | +9.448 |
adel | +9.226 |
journalist | +9.209 |
inform | +8.911 |
Neg logit contributions | |
preferring | -12.825 |
inability | -11.796 |
wanting | -10.757 |
confines | -10.638 |
choosing | -10.429 |
Token | it |
Token ID | 340 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
ogether | +12.073 |
adel | +11.413 |
campaigner | +11.127 |
ilde | +11.023 |
journalist | +11.013 |
Neg logit contributions | |
preferring | -13.502 |
inability | -12.616 |
confines | -11.351 |
wanting | -11.111 |
forgetting | -10.640 |
Token | a |
Token ID | 257 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
ogether | +17.903 |
campaigner | +17.416 |
happen | +17.375 |
adel | +17.343 |
journalist | +17.247 |
Neg logit contributions | |
preferring | -16.112 |
inability | -14.835 |
confines | -13.662 |
choosing | -12.432 |
wanting | -12.262 |
Token | truly |
Token ID | 4988 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
journalist | +20.425 |
campaigner | +20.308 |
ogether | +20.124 |
adel | +19.415 |
credible | +18.955 |
Neg logit contributions | |
preferring | -17.991 |
inability | -16.967 |
confines | -14.702 |
forgetting | -14.101 |
choosing | -13.648 |
Token | global |
Token ID | 3298 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
ogether | +18.830 |
journalist | +18.322 |
campaigner | +18.286 |
adel | +17.902 |
inform | +17.383 |
Neg logit contributions | |
preferring | -15.792 |
inability | -14.825 |
confines | -13.146 |
forgetting | -12.387 |
choosing | -12.078 |
Token | title |
Token ID | 3670 |
Feature activation | -9.47e+00 |
Pos logit contributions | |
campaigner | +16.111 |
ogether | +16.010 |
journalist | +15.713 |
adel | +15.453 |
ilde | +14.990 |
Neg logit contributions | |
preferring | -16.642 |
inability | -14.508 |
wanting | -13.011 |
confines | -12.882 |
forgetting | -12.759 |
Token | . |
Token ID | 13 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
ogether | +7.365 |
adel | +7.138 |
campaigner | +7.090 |
journalist | +6.818 |
ilde | +6.641 |
Neg logit contributions | |
preferring | -8.801 |
inability | -8.247 |
wanting | -7.500 |
confines | -7.389 |
choosing | -7.185 |
Token |
|
Token ID | 198 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
ogether | +2.474 |
adel | +2.387 |
campaigner | +2.369 |
ilde | +2.309 |
journalist | +2.264 |
Neg logit contributions | |
preferring | -3.395 |
inability | -3.161 |
wanting | -2.981 |
choosing | -2.851 |
confines | -2.840 |
Token | the |
Token ID | 262 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
ogether | +14.991 |
journalist | +14.754 |
adel | +14.751 |
campaigner | +14.585 |
ilde | +14.565 |
Neg logit contributions | |
preferring | -14.270 |
inability | -12.793 |
wanting | -11.510 |
confines | -11.493 |
forgetting | -11.099 |
Token | public |
Token ID | 1171 |
Feature activation | -4.70e+00 |
Pos logit contributions | |
preferring | +1.276 |
inability | +1.192 |
wanting | +1.134 |
choosing | +1.069 |
confines | +1.065 |
Neg logit contributions | |
ogether | -1.155 |
adel | -1.121 |
campaigner | -1.101 |
ilde | -1.088 |
ér | -1.044 |
Token | imagination |
Token ID | 13843 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
ogether | +4.926 |
campaigner | +4.824 |
adel | +4.805 |
ilde | +4.715 |
journalist | +4.634 |
Neg logit contributions | |
preferring | -3.345 |
inability | -3.002 |
wanting | -2.777 |
choosing | -2.587 |
confines | -2.584 |
Token | to |
Token ID | 284 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
ogether | +11.247 |
campaigner | +10.923 |
adel | +10.916 |
ilde | +10.644 |
journalist | +10.623 |
Neg logit contributions | |
preferring | -10.132 |
inability | -9.535 |
confines | -8.463 |
wanting | -8.321 |
choosing | -8.017 |
Token | become |
Token ID | 1716 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
ogether | +8.081 |
adel | +7.930 |
campaigner | +7.898 |
journalist | +7.721 |
ilde | +7.563 |
Neg logit contributions | |
preferring | -9.814 |
inability | -8.975 |
wanting | -8.388 |
confines | -8.162 |
choosing | -8.037 |
Token | a |
Token ID | 257 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
campaigner | +15.771 |
journalist | +15.617 |
adel | +15.564 |
ogether | +14.987 |
ilde | +14.588 |
Neg logit contributions | |
preferring | -15.561 |
inability | -14.174 |
confines | -12.868 |
wanting | -12.669 |
forgetting | -12.289 |
Token | phenomenon |
Token ID | 10733 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
journalist | +23.348 |
campaigner | +23.185 |
adel | +20.923 |
ilde | +20.258 |
ogether | +19.872 |
Neg logit contributions | |
preferring | -17.077 |
inability | -15.755 |
confines | -13.915 |
wanting | -13.252 |
forgetting | -12.972 |
Token | . |
Token ID | 13 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
campaigner | +13.228 |
adel | +13.159 |
ogether | +13.114 |
journalist | +12.889 |
ilde | +12.477 |
Neg logit contributions | |
preferring | -11.543 |
inability | -10.946 |
confines | -9.702 |
wanting | -9.605 |
choosing | -9.114 |
Token | You |
Token ID | 921 |
Feature activation | -9.71e+00 |
Pos logit contributions | |
ogether | +10.890 |
adel | +10.887 |
journalist | +10.685 |
campaigner | +10.673 |
ilde | +10.590 |
Neg logit contributions | |
preferring | -11.481 |
inability | -10.608 |
wanting | -9.494 |
forgetting | -9.283 |
confines | -9.226 |
Token | see |
Token ID | 766 |
Feature activation | -6.30e+00 |
Pos logit contributions | |
ogether | +7.880 |
campaigner | +7.620 |
adel | +7.604 |
journalist | +7.349 |
ilde | +7.342 |
Neg logit contributions | |
preferring | -8.621 |
inability | -7.940 |
wanting | -7.333 |
confines | -7.197 |
choosing | -6.991 |
Token | that |
Token ID | 326 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
ogether | +4.773 |
campaigner | +4.645 |
adel | +4.635 |
ilde | +4.500 |
journalist | +4.444 |
Neg logit contributions | |
preferring | -6.242 |
inability | -5.757 |
wanting | -5.424 |
confines | -5.222 |
choosing | -5.187 |
Token | matter |
Token ID | 2300 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
campaigner | +10.484 |
journalist | +10.288 |
ogether | +10.197 |
adel | +9.849 |
ilde | +9.498 |
Neg logit contributions | |
preferring | -12.331 |
inability | -11.429 |
wanting | -10.661 |
confines | -10.389 |
choosing | -9.972 |
Token | that |
Token ID | 326 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
ogether | +0.243 |
adel | +0.234 |
campaigner | +0.234 |
ilde | +0.228 |
journalist | +0.222 |
Neg logit contributions | |
preferring | -0.276 |
inability | -0.255 |
wanting | -0.243 |
choosing | -0.230 |
confines | -0.228 |
Token | needs |
Token ID | 2476 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
campaigner | +12.229 |
journalist | +12.030 |
ogether | +12.007 |
adel | +11.771 |
ilde | +11.657 |
Neg logit contributions | |
preferring | -13.244 |
inability | -11.993 |
wanting | -11.127 |
forgetting | -10.589 |
confines | -10.388 |
Token | to |
Token ID | 284 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
preferring | +10.458 |
inability | +9.539 |
wanting | +9.374 |
choosing | +8.930 |
forgetting | +8.491 |
Neg logit contributions | |
ogether | -10.750 |
adel | -10.477 |
ilde | -10.345 |
campaigner | -10.111 |
ér | -9.706 |
Token | be |
Token ID | 307 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
ogether | +8.031 |
campaigner | +7.878 |
adel | +7.540 |
occur | +7.525 |
journalist | +7.422 |
Neg logit contributions | |
preferring | -16.395 |
inability | -15.374 |
wanting | -14.518 |
forgetting | -13.789 |
confines | -13.755 |
Token | handled |
Token ID | 12118 |
Feature activation | -3.04e+01 |
Pos logit contributions | |
campaigner | +14.227 |
ogether | +13.850 |
journalist | +13.806 |
inform | +13.619 |
adel | +13.550 |
Neg logit contributions | |
preferring | -15.446 |
inability | -14.533 |
wanting | -12.811 |
confines | -12.104 |
forgetting | -11.908 |
Token | by |
Token ID | 416 |
Feature activation | -8.58e+00 |
Pos logit contributions | |
inform | +22.619 |
ogether | +21.945 |
campaigner | +21.420 |
journalist | +21.159 |
satisf | +20.838 |
Neg logit contributions | |
inability | -15.996 |
preferring | -15.592 |
confines | -13.029 |
forgetting | -13.005 |
wanting | -12.938 |
Token | parents |
Token ID | 3397 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
ogether | +6.521 |
campaigner | +6.433 |
adel | +6.250 |
journalist | +6.136 |
ilde | +6.033 |
Neg logit contributions | |
preferring | -8.001 |
inability | -7.496 |
wanting | -6.949 |
confines | -6.664 |
forgetting | -6.522 |
Token | in |
Token ID | 287 |
Feature activation | -9.07e-01 |
Pos logit contributions | |
ogether | +3.083 |
campaigner | +2.973 |
adel | +2.965 |
ilde | +2.868 |
journalist | +2.826 |
Neg logit contributions | |
preferring | -3.637 |
inability | -3.398 |
wanting | -3.170 |
confines | -3.039 |
choosing | -3.008 |
Token | a |
Token ID | 257 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
ogether | +0.767 |
campaigner | +0.741 |
adel | +0.741 |
ilde | +0.721 |
journalist | +0.704 |
Neg logit contributions | |
preferring | -0.842 |
inability | -0.778 |
wanting | -0.737 |
choosing | -0.696 |
confines | -0.694 |
Token | careful |
Token ID | 8161 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
campaigner | +10.814 |
ogether | +10.593 |
journalist | +10.553 |
adel | +10.148 |
dign | +9.828 |
Neg logit contributions | |
preferring | -12.686 |
inability | -11.991 |
wanting | -10.880 |
confines | -10.464 |
forgetting | -10.247 |
Token | at |
Token ID | 379 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
ogether | +2.491 |
campaigner | +2.423 |
adel | +2.415 |
ilde | +2.331 |
journalist | +2.312 |
Neg logit contributions | |
preferring | -3.218 |
inability | -2.982 |
wanting | -2.817 |
confines | -2.696 |
choosing | -2.688 |
Token | least |
Token ID | 1551 |
Feature activation | -6.49e+00 |
Pos logit contributions | |
preferring | +1.860 |
inability | +1.758 |
wanting | +1.679 |
choosing | +1.597 |
confines | +1.574 |
Neg logit contributions | |
ogether | -1.289 |
adel | -1.251 |
campaigner | -1.249 |
ilde | -1.194 |
ér | -1.168 |
Token | initially |
Token ID | 7317 |
Feature activation | -8.28e+00 |
Pos logit contributions | |
ogether | +5.000 |
campaigner | +4.951 |
adel | +4.926 |
journalist | +4.819 |
ilde | +4.703 |
Neg logit contributions | |
preferring | -6.090 |
inability | -5.608 |
wanting | -5.273 |
confines | -5.086 |
choosing | -5.036 |
Token | being |
Token ID | 852 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
ogether | +7.284 |
campaigner | +7.254 |
adel | +7.196 |
journalist | +7.121 |
ilde | +6.926 |
Neg logit contributions | |
preferring | -6.646 |
inability | -6.108 |
wanting | -5.556 |
confines | -5.413 |
choosing | -5.306 |
Token | received |
Token ID | 2722 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
campaigner | +9.421 |
journalist | +9.334 |
adel | +9.285 |
ogether | +9.280 |
ilde | +8.934 |
Neg logit contributions | |
preferring | -9.899 |
inability | -9.127 |
wanting | -8.251 |
confines | -8.193 |
choosing | -8.047 |
Token | well |
Token ID | 880 |
Feature activation | -3.02e+01 |
Pos logit contributions | |
journalist | +18.392 |
ogether | +18.176 |
campaigner | +17.936 |
inform | +17.895 |
adel | +17.800 |
Neg logit contributions | |
preferring | -13.979 |
inability | -13.110 |
confines | -11.823 |
forgetting | -11.419 |
choosing | -11.117 |
Token | inside |
Token ID | 2641 |
Feature activation | -7.49e+00 |
Pos logit contributions | |
journalist | +21.434 |
ogether | +21.383 |
campaigner | +20.913 |
inform | +20.856 |
adel | +20.607 |
Neg logit contributions | |
inability | -16.206 |
preferring | -16.128 |
forgetting | -13.387 |
addons | -13.250 |
confines | -13.183 |
Token | of |
Token ID | 286 |
Feature activation | -6.46e+00 |
Pos logit contributions | |
ogether | +5.347 |
campaigner | +5.186 |
adel | +5.153 |
ilde | +4.965 |
journalist | +4.962 |
Neg logit contributions | |
preferring | -7.560 |
inability | -7.078 |
wanting | -6.620 |
choosing | -6.378 |
forgetting | -6.315 |
Token | the |
Token ID | 262 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
ogether | +4.541 |
campaigner | +4.391 |
adel | +4.351 |
ilde | +4.210 |
journalist | +4.189 |
Neg logit contributions | |
preferring | -6.705 |
inability | -6.247 |
wanting | -5.876 |
choosing | -5.641 |
confines | -5.629 |
Token | McCain |
Token ID | 14264 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
preferring | +0.345 |
inability | +0.322 |
wanting | +0.307 |
confines | +0.293 |
choosing | +0.293 |
Neg logit contributions | |
ogether | -0.247 |
adel | -0.237 |
campaigner | -0.236 |
ilde | -0.231 |
ér | -0.222 |
Token | campaign |
Token ID | 1923 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
preferring | +2.583 |
inability | +2.432 |
wanting | +2.340 |
choosing | +2.234 |
confines | +2.231 |
Neg logit contributions | |
ogether | -1.433 |
adel | -1.341 |
campaigner | -1.331 |
ilde | -1.320 |
journalist | -1.255 |
Token | vital |
Token ID | 9204 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
campaigner | +6.692 |
ogether | +6.573 |
journalist | +6.458 |
adel | +6.446 |
ilde | +6.228 |
Neg logit contributions | |
preferring | -9.856 |
inability | -9.193 |
wanting | -8.451 |
confines | -8.446 |
choosing | -8.130 |
Token | to |
Token ID | 284 |
Feature activation | -7.96e+00 |
Pos logit contributions | |
ogether | +3.393 |
campaigner | +3.326 |
adel | +3.303 |
ilde | +3.239 |
journalist | +3.210 |
Neg logit contributions | |
preferring | -1.730 |
inability | -1.525 |
wanting | -1.380 |
choosing | -1.258 |
confines | -1.257 |
Token | building |
Token ID | 2615 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
ogether | +7.671 |
campaigner | +7.667 |
adel | +7.543 |
journalist | +7.371 |
ilde | +7.250 |
Neg logit contributions | |
preferring | -5.849 |
inability | -5.346 |
wanting | -4.799 |
confines | -4.678 |
forgetting | -4.498 |
Token | a |
Token ID | 257 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
campaigner | +15.281 |
journalist | +14.618 |
adel | +14.408 |
ogether | +14.389 |
inform | +13.668 |
Neg logit contributions | |
preferring | -14.889 |
inability | -13.653 |
confines | -12.330 |
wanting | -12.027 |
forgetting | -12.010 |
Token | strong |
Token ID | 1913 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
campaigner | +20.061 |
journalist | +19.354 |
adel | +18.273 |
ogether | +18.145 |
dign | +18.055 |
Neg logit contributions | |
preferring | -17.101 |
inability | -15.710 |
confines | -13.637 |
addons | -13.133 |
forgetting | -13.125 |
Token | , |
Token ID | 11 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
campaigner | +18.203 |
journalist | +16.941 |
ogether | +16.622 |
adel | +16.258 |
isan | +15.717 |
Neg logit contributions | |
preferring | -16.872 |
inability | -14.757 |
forgetting | -13.534 |
wanting | -13.170 |
confines | -12.962 |
Token | sustainable |
Token ID | 13347 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
campaigner | +22.520 |
journalist | +21.950 |
dign | +21.339 |
inform | +21.095 |
credible | +20.771 |
Neg logit contributions | |
preferring | -15.819 |
inability | -14.848 |
confines | -12.539 |
forgetting | -12.535 |
addons | -12.214 |
Token | relationship |
Token ID | 2776 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
campaigner | +15.880 |
journalist | +15.052 |
ogether | +14.717 |
adel | +14.703 |
isan | +13.972 |
Neg logit contributions | |
preferring | -17.079 |
inability | -14.905 |
forgetting | -13.623 |
wanting | -13.563 |
choosing | -13.231 |
Token | with |
Token ID | 351 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
ogether | +10.881 |
campaigner | +10.850 |
adel | +10.501 |
journalist | +10.470 |
ilde | +10.017 |
Neg logit contributions | |
preferring | -11.178 |
inability | -10.624 |
wanting | -9.450 |
confines | -9.401 |
forgetting | -9.111 |
Token | our |
Token ID | 674 |
Feature activation | -7.58e+00 |
Pos logit contributions | |
campaigner | +8.221 |
ogether | +7.998 |
journalist | +7.841 |
adel | +7.815 |
ilde | +7.347 |
Neg logit contributions | |
preferring | -12.687 |
inability | -11.861 |
wanting | -10.920 |
confines | -10.831 |
forgetting | -10.679 |
Token | supporters |
Token ID | 5941 |
Feature activation | -8.31e+00 |
Pos logit contributions | |
ogether | +4.766 |
campaigner | +4.728 |
adel | +4.605 |
journalist | +4.464 |
ilde | +4.338 |
Neg logit contributions | |
preferring | -8.266 |
inability | -7.666 |
wanting | -7.272 |
confines | -6.991 |
choosing | -6.973 |
Token | that |
Token ID | 326 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
ogether | +0.782 |
adel | +0.755 |
campaigner | +0.754 |
ilde | +0.735 |
journalist | +0.715 |
Neg logit contributions | |
preferring | -0.877 |
inability | -0.811 |
wanting | -0.769 |
choosing | -0.728 |
confines | -0.723 |
Token | Trump |
Token ID | 1301 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
campaigner | +13.366 |
ogether | +13.289 |
journalist | +13.035 |
adel | +12.724 |
ilde | +12.537 |
Neg logit contributions | |
preferring | -14.156 |
inability | -12.376 |
wanting | -12.092 |
forgetting | -11.555 |
choosing | -11.415 |
Token | had |
Token ID | 550 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
ogether | +1.334 |
adel | +1.285 |
campaigner | +1.284 |
ilde | +1.250 |
journalist | +1.217 |
Neg logit contributions | |
preferring | -1.582 |
inability | -1.463 |
wanting | -1.392 |
choosing | -1.319 |
confines | -1.312 |
Token | promised |
Token ID | 8072 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
preferring | +1.179 |
inability | +1.081 |
wanting | +1.033 |
choosing | +0.964 |
confines | +0.952 |
Neg logit contributions | |
ogether | -1.221 |
adel | -1.175 |
campaigner | -1.163 |
ilde | -1.145 |
ér | -1.108 |
Token | to |
Token ID | 284 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
ogether | +1.865 |
adel | +1.810 |
campaigner | +1.808 |
ilde | +1.770 |
journalist | +1.732 |
Neg logit contributions | |
preferring | -1.435 |
inability | -1.303 |
wanting | -1.221 |
choosing | -1.138 |
confines | -1.130 |
Token | accomplish |
Token ID | 9989 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
campaigner | +9.635 |
ogether | +9.466 |
adel | +9.205 |
journalist | +9.189 |
ilde | +8.968 |
Neg logit contributions | |
preferring | -12.194 |
inability | -11.163 |
wanting | -10.485 |
confines | -10.148 |
choosing | -10.140 |
Token | . |
Token ID | 13 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
campaigner | +21.317 |
ogether | +20.880 |
adel | +20.580 |
journalist | +20.517 |
inform | +20.337 |
Neg logit contributions | |
preferring | -15.859 |
inability | -15.024 |
confines | -13.212 |
forgetting | -12.780 |
wanting | -12.354 |
Token |
|
Token ID | 198 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
ogether | +1.876 |
adel | +1.809 |
campaigner | +1.796 |
ilde | +1.753 |
journalist | +1.709 |
Neg logit contributions | |
preferring | -2.646 |
inability | -2.465 |
wanting | -2.340 |
choosing | -2.238 |
confines | -2.225 |
Token |
|
Token ID | 198 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
preferring | +1.715 |
inability | +1.587 |
wanting | +1.533 |
choosing | +1.442 |
confines | +1.423 |
Neg logit contributions | |
ogether | -1.534 |
campaigner | -1.479 |
adel | -1.452 |
ilde | -1.418 |
earthqu | -1.387 |
Token | � |
Token ID | 447 |
Feature activation | -4.32e+00 |
Pos logit contributions | |
ogether | +2.121 |
adel | +2.059 |
campaigner | +2.039 |
ilde | +2.003 |
journalist | +1.946 |
Neg logit contributions | |
preferring | -2.282 |
inability | -2.103 |
wanting | -1.985 |
choosing | -1.883 |
confines | -1.878 |
Token | � |
Token ID | 250 |
Feature activation | -5.44e-01 |
Pos logit contributions | |
ogether | +2.918 |
campaigner | +2.797 |
adel | +2.791 |
ilde | +2.699 |
journalist | +2.633 |
Neg logit contributions | |
preferring | -4.644 |
inability | -4.331 |
wanting | -4.139 |
confines | -3.951 |
choosing | -3.951 |
Token | I |
Token ID | 314 |
Feature activation | -8.34e+00 |
Pos logit contributions | |
ogether | +8.853 |
adel | +8.528 |
campaigner | +8.488 |
ilde | +8.285 |
journalist | +8.268 |
Neg logit contributions | |
preferring | -8.483 |
inability | -7.755 |
wanting | -7.107 |
confines | -6.891 |
choosing | -6.729 |
Token | hope |
Token ID | 2911 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
ogether | +5.948 |
adel | +5.724 |
campaigner | +5.667 |
ilde | +5.540 |
journalist | +5.415 |
Neg logit contributions | |
preferring | -8.409 |
inability | -7.710 |
wanting | -7.290 |
confines | -7.074 |
choosing | -7.012 |
Token | we |
Token ID | 356 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
ogether | +12.408 |
campaigner | +12.042 |
journalist | +11.903 |
ilde | +11.792 |
adel | +11.788 |
Neg logit contributions | |
preferring | -8.719 |
inability | -7.692 |
wanting | -7.004 |
confines | -6.769 |
choosing | -6.356 |
Token | will |
Token ID | 481 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
ogether | +9.430 |
campaigner | +9.322 |
adel | +9.112 |
journalist | +8.922 |
ér | +8.885 |
Neg logit contributions | |
preferring | -13.797 |
inability | -12.515 |
wanting | -11.625 |
confines | -11.393 |
choosing | -11.107 |
Token | be |
Token ID | 307 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
campaigner | +12.927 |
ogether | +12.899 |
occur | +12.602 |
inform | +12.577 |
adel | +12.496 |
Neg logit contributions | |
preferring | -16.856 |
inability | -15.080 |
wanting | -13.843 |
confines | -13.593 |
choosing | -13.136 |
Token | judged |
Token ID | 19589 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
campaigner | +17.796 |
ogether | +17.700 |
adel | +17.530 |
journalist | +17.370 |
dign | +16.933 |
Neg logit contributions | |
preferring | -13.834 |
inability | -12.618 |
confines | -11.260 |
wanting | -10.439 |
ses | -9.921 |
Token | on |
Token ID | 319 |
Feature activation | -5.70e+00 |
Pos logit contributions | |
ogether | +21.831 |
inform | +21.592 |
journalist | +21.580 |
adel | +21.478 |
campaigner | +21.354 |
Neg logit contributions | |
preferring | -15.783 |
inability | -14.954 |
confines | -13.373 |
forgetting | -12.355 |
Untitled | -12.268 |
Token | how |
Token ID | 703 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
ogether | +5.078 |
campaigner | +4.911 |
adel | +4.877 |
ilde | +4.726 |
journalist | +4.710 |
Neg logit contributions | |
preferring | -4.901 |
inability | -4.486 |
wanting | -4.166 |
confines | -4.014 |
choosing | -3.917 |
Token | quickly |
Token ID | 2952 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
ogether | +12.978 |
campaigner | +12.976 |
journalist | +12.804 |
ilde | +12.538 |
adel | +12.304 |
Neg logit contributions | |
preferring | -10.638 |
inability | -9.699 |
confines | -8.636 |
wanting | -8.411 |
forgetting | -8.026 |
Token | we |
Token ID | 356 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
ogether | +15.693 |
campaigner | +15.500 |
journalist | +15.242 |
ilde | +15.042 |
ér | +14.934 |
Neg logit contributions | |
preferring | -14.177 |
inability | -12.698 |
wanting | -11.427 |
confines | -11.427 |
choosing | -10.455 |
Token | reacted |
Token ID | 22798 |
Feature activation | -6.04e+00 |
Pos logit contributions | |
ogether | +7.849 |
campaigner | +7.767 |
adel | +7.644 |
journalist | +7.470 |
ilde | +7.408 |
Neg logit contributions | |
preferring | -11.458 |
inability | -10.568 |
wanting | -9.791 |
confines | -9.514 |
choosing | -9.296 |
Token | instead |
Token ID | 2427 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
preferring | +7.474 |
inability | +6.924 |
wanting | +6.624 |
confines | +6.366 |
choosing | +6.351 |
Neg logit contributions | |
ogether | -5.911 |
adel | -5.660 |
ilde | -5.590 |
campaigner | -5.559 |
alysed | -5.235 |
Token | require |
Token ID | 2421 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
preferring | +0.414 |
inability | +0.382 |
wanting | +0.366 |
choosing | +0.348 |
confines | +0.347 |
Neg logit contributions | |
ogether | -0.327 |
adel | -0.314 |
campaigner | -0.313 |
ilde | -0.306 |
journalist | -0.294 |
Token | that |
Token ID | 326 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
ogether | +10.877 |
campaigner | +10.403 |
adel | +10.244 |
journalist | +10.132 |
ilde | +9.915 |
Neg logit contributions | |
preferring | -10.580 |
inability | -9.676 |
wanting | -9.089 |
confines | -8.803 |
forgetting | -8.576 |
Token | complaints |
Token ID | 9687 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
ogether | +13.262 |
campaigner | +12.940 |
journalist | +12.575 |
adel | +12.531 |
ilde | +12.186 |
Neg logit contributions | |
preferring | -12.670 |
inability | -11.468 |
wanting | -10.784 |
confines | -10.485 |
forgetting | -10.201 |
Token | be |
Token ID | 307 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
ogether | +8.614 |
campaigner | +8.521 |
adel | +8.382 |
journalist | +8.261 |
ér | +8.040 |
Neg logit contributions | |
preferring | -9.366 |
inability | -8.583 |
wanting | -7.960 |
forgetting | -7.759 |
confines | -7.679 |
Token | processed |
Token ID | 13686 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
journalist | +17.963 |
inform | +17.743 |
ogether | +17.689 |
campaigner | +17.248 |
correspond | +17.116 |
Neg logit contributions | |
preferring | -17.750 |
inability | -15.798 |
forgetting | -15.033 |
wanting | -14.326 |
sacrificing | -14.049 |
Token | � |
Token ID | 564 |
Feature activation | -8.77e+00 |
Pos logit contributions | |
inform | +21.839 |
ogether | +21.540 |
adel | +20.772 |
journalist | +20.726 |
correspond | +20.634 |
Neg logit contributions | |
preferring | -16.329 |
inability | -14.953 |
forgetting | -13.491 |
confines | -13.267 |
wanting | -13.211 |
Token | � |
Token ID | 250 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
ogether | +5.635 |
adel | +5.375 |
ilde | +5.268 |
campaigner | +5.199 |
journalist | +5.025 |
Neg logit contributions | |
preferring | -9.530 |
inability | -8.906 |
wanting | -8.459 |
confines | -8.098 |
choosing | -8.052 |
Token | prom |
Token ID | 16963 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
ogether | +15.518 |
adel | +15.023 |
ér | +14.385 |
ilde | +14.227 |
campaigner | +14.210 |
Neg logit contributions | |
preferring | -9.827 |
inability | -8.963 |
wanting | -8.057 |
confines | -7.730 |
forgetting | -7.418 |
Token | pt |
Token ID | 457 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
ogether | +12.609 |
adel | +12.027 |
ér | +11.518 |
ilde | +11.296 |
campaigner | +11.160 |
Neg logit contributions | |
preferring | -19.233 |
inability | -18.679 |
wanting | -16.983 |
forgetting | -16.669 |
confines | -16.447 |
Token | ly |
Token ID | 306 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
ogether | +14.320 |
adel | +13.377 |
ilde | +12.898 |
campaigner | +12.836 |
ér | +12.807 |
Neg logit contributions | |
preferring | -15.060 |
inability | -13.932 |
wanting | -12.974 |
forgetting | -12.426 |
confines | -12.324 |
Token | much |
Token ID | 881 |
Feature activation | -6.38e+00 |
Pos logit contributions | |
ogether | +12.927 |
adel | +12.379 |
journalist | +12.013 |
campaigner | +12.009 |
ér | +11.812 |
Neg logit contributions | |
preferring | -13.579 |
inability | -12.386 |
wanting | -11.477 |
confines | -11.326 |
choosing | -10.811 |
Token | more |
Token ID | 517 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
ogether | +4.113 |
adel | +3.976 |
campaigner | +3.954 |
journalist | +3.788 |
ilde | +3.741 |
Neg logit contributions | |
preferring | -6.888 |
inability | -6.511 |
wanting | -6.147 |
confines | -5.999 |
choosing | -5.898 |
Token | , |
Token ID | 11 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
ogether | +15.069 |
adel | +14.726 |
journalist | +14.681 |
campaigner | +14.637 |
ilde | +14.112 |
Neg logit contributions | |
preferring | -11.184 |
inability | -10.166 |
confines | -8.934 |
wanting | -8.886 |
choosing | -8.146 |
Token | and |
Token ID | 290 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
ogether | +11.944 |
adel | +11.737 |
campaigner | +11.690 |
journalist | +11.490 |
ilde | +11.142 |
Neg logit contributions | |
preferring | -9.379 |
inability | -8.852 |
confines | -7.936 |
wanting | -7.768 |
choosing | -7.291 |
Token | do |
Token ID | 466 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
ogether | +3.538 |
campaigner | +3.437 |
adel | +3.431 |
ilde | +3.313 |
journalist | +3.294 |
Neg logit contributions | |
preferring | -3.798 |
inability | -3.503 |
wanting | -3.275 |
confines | -3.131 |
choosing | -3.106 |
Token | it |
Token ID | 340 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
ogether | +12.543 |
adel | +12.086 |
campaigner | +11.885 |
ér | +11.623 |
journalist | +11.604 |
Neg logit contributions | |
preferring | -11.688 |
inability | -10.875 |
confines | -9.932 |
wanting | -9.769 |
choosing | -9.251 |
Token | much |
Token ID | 881 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
ogether | +22.392 |
inform | +21.863 |
adel | +21.582 |
journalist | +21.548 |
campaigner | +21.146 |
Neg logit contributions | |
preferring | -15.474 |
inability | -14.757 |
confines | -13.412 |
Lost | -11.830 |
wanting | -11.810 |
Token | better |
Token ID | 1365 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
adel | +16.223 |
ogether | +16.143 |
campaigner | +15.897 |
journalist | +15.859 |
inform | +15.464 |
Neg logit contributions | |
preferring | -15.190 |
inability | -14.822 |
confines | -13.320 |
wanting | -13.023 |
forgetting | -12.411 |
Token | , |
Token ID | 11 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
ogether | +16.386 |
adel | +15.742 |
campaigner | +15.353 |
journalist | +15.219 |
ér | +15.157 |
Neg logit contributions | |
preferring | -13.770 |
inability | -12.949 |
wanting | -11.091 |
confines | -11.057 |
forgetting | -10.330 |
Token | in |
Token ID | 287 |
Feature activation | -4.52e+00 |
Pos logit contributions | |
ogether | +17.579 |
adel | +16.930 |
journalist | +16.925 |
campaigner | +16.881 |
ér | +16.328 |
Neg logit contributions | |
preferring | -12.517 |
inability | -12.020 |
confines | -10.489 |
wanting | -9.878 |
forgetting | -9.182 |
Token | the |
Token ID | 262 |
Feature activation | +6.89e+00 |
Pos logit contributions | |
ogether | +3.368 |
adel | +3.246 |
campaigner | +3.225 |
ilde | +3.134 |
journalist | +3.094 |
Neg logit contributions | |
preferring | -4.553 |
inability | -4.238 |
wanting | -3.988 |
confines | -3.835 |
choosing | -3.789 |
Token | Volunteers |
Token ID | 45646 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
ogether | +7.517 |
campaigner | +7.356 |
adel | +7.246 |
journalist | +7.064 |
ilde | +7.058 |
Neg logit contributions | |
preferring | -8.513 |
inability | -7.873 |
wanting | -7.394 |
confines | -7.134 |
choosing | -7.042 |
Token | who |
Token ID | 508 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
preferring | +1.849 |
inability | +1.705 |
wanting | +1.640 |
choosing | +1.551 |
confines | +1.521 |
Neg logit contributions | |
ogether | -1.563 |
adel | -1.504 |
campaigner | -1.494 |
ilde | -1.466 |
journalist | -1.407 |
Token | continue |
Token ID | 2555 |
Feature activation | +9.94e+00 |
Pos logit contributions | |
campaigner | +8.771 |
ogether | +8.616 |
adel | +8.519 |
journalist | +8.499 |
ilde | +8.188 |
Neg logit contributions | |
preferring | -11.741 |
inability | -10.818 |
wanting | -10.231 |
confines | -9.746 |
forgetting | -9.739 |
Token | to |
Token ID | 284 |
Feature activation | -1.42e+01 |
Pos logit contributions | |
preferring | +8.825 |
inability | +8.217 |
wanting | +7.946 |
choosing | +7.557 |
confines | +7.170 |
Neg logit contributions | |
ogether | -8.209 |
adel | -8.016 |
ilde | -7.761 |
campaigner | -7.535 |
ér | -7.392 |
Token | make |
Token ID | 787 |
Feature activation | -2.81e+01 |
Pos logit contributions | |
campaigner | +9.504 |
adel | +9.115 |
ogether | +9.102 |
journalist | +9.058 |
inform | +8.640 |
Neg logit contributions | |
preferring | -13.603 |
inability | -12.527 |
wanting | -11.814 |
confines | -11.387 |
forgetting | -11.350 |
Token | a |
Token ID | 257 |
Feature activation | -2.99e+01 |
Pos logit contributions | |
journalist | +18.252 |
campaigner | +18.076 |
dign | +17.768 |
meaningful | +17.646 |
ogether | +17.290 |
Neg logit contributions | |
preferring | -18.323 |
inability | -16.233 |
confines | -15.061 |
wanting | -15.036 |
forgetting | -14.032 |
Token | sustained |
Token ID | 12605 |
Feature activation | -2.69e+01 |
Pos logit contributions | |
journalist | +18.579 |
campaigner | +18.413 |
dign | +18.153 |
meaningful | +18.084 |
credible | +17.082 |
Neg logit contributions | |
preferring | -19.687 |
inability | -17.845 |
confines | -16.943 |
wanting | -15.805 |
quirks | -15.311 |
Token | and |
Token ID | 290 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
campaigner | +17.506 |
journalist | +17.069 |
ogether | +15.838 |
inform | +15.833 |
dign | +15.814 |
Neg logit contributions | |
preferring | -18.837 |
confines | -15.788 |
inability | -15.727 |
wanting | -15.191 |
quirks | -14.975 |
Token | distinguished |
Token ID | 18876 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
dign | +22.255 |
meaningful | +21.888 |
campaigner | +20.867 |
journalist | +20.727 |
inform | +20.589 |
Neg logit contributions | |
preferring | -17.699 |
inability | -16.309 |
confines | -15.611 |
quirks | -13.913 |
forgetting | -13.540 |
Token | contribution |
Token ID | 10156 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
campaigner | +15.539 |
journalist | +14.954 |
ogether | +14.156 |
adel | +14.020 |
dign | +13.884 |
Neg logit contributions | |
preferring | -18.277 |
inability | -15.488 |
confines | -15.421 |
wanting | -15.383 |
forgetting | -14.332 |
Token | to |
Token ID | 284 |
Feature activation | -6.85e+00 |
Pos logit contributions | |
preferring | +1.103 |
inability | +0.951 |
wanting | +0.883 |
choosing | +0.801 |
confines | +0.766 |
Neg logit contributions | |
ogether | -2.459 |
adel | -2.408 |
campaigner | -2.397 |
ilde | -2.365 |
journalist | -2.306 |
Token | well |
Token ID | 880 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
ogether | +18.674 |
campaigner | +18.482 |
journalist | +18.183 |
adel | +18.161 |
inform | +17.455 |
Neg logit contributions | |
preferring | -13.934 |
inability | -12.653 |
confines | -11.551 |
wanting | -10.982 |
choosing | -10.851 |
Token | . |
Token ID | 13 |
Feature activation | -9.89e+00 |
Pos logit contributions | |
ogether | +17.754 |
campaigner | +17.231 |
adel | +16.963 |
journalist | +16.435 |
ilde | +16.173 |
Neg logit contributions | |
preferring | -14.299 |
inability | -13.839 |
confines | -11.653 |
wanting | -11.618 |
forgetting | -11.201 |
Token | Now |
Token ID | 2735 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
ogether | +7.662 |
adel | +7.559 |
journalist | +7.335 |
campaigner | +7.315 |
ilde | +7.268 |
Neg logit contributions | |
preferring | -9.073 |
inability | -8.401 |
wanting | -7.670 |
choosing | -7.456 |
confines | -7.425 |
Token | we |
Token ID | 356 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
ogether | +10.142 |
adel | +10.027 |
campaigner | +9.945 |
journalist | +9.698 |
ilde | +9.633 |
Neg logit contributions | |
preferring | -10.731 |
inability | -9.767 |
wanting | -9.055 |
confines | -8.994 |
choosing | -8.552 |
Token | are |
Token ID | 389 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
ogether | +6.287 |
adel | +6.205 |
campaigner | +6.188 |
ilde | +5.991 |
journalist | +5.851 |
Neg logit contributions | |
preferring | -9.152 |
inability | -8.461 |
wanting | -7.909 |
confines | -7.785 |
choosing | -7.657 |
Token | playing |
Token ID | 2712 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
ogether | +10.792 |
campaigner | +10.669 |
adel | +10.617 |
ilde | +10.349 |
journalist | +10.268 |
Neg logit contributions | |
preferring | -6.921 |
inability | -6.318 |
confines | -5.591 |
wanting | -5.504 |
choosing | -5.133 |
Token | well |
Token ID | 880 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
ogether | +20.732 |
campaigner | +20.541 |
journalist | +20.330 |
adel | +20.242 |
inform | +19.651 |
Neg logit contributions | |
preferring | -15.913 |
inability | -14.352 |
confines | -13.497 |
Untitled | -12.592 |
choosing | -12.584 |
Token | , |
Token ID | 11 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
ogether | +19.344 |
adel | +18.818 |
campaigner | +18.647 |
journalist | +17.983 |
ilde | +17.479 |
Neg logit contributions | |
preferring | -14.635 |
inability | -14.080 |
confines | -12.276 |
wanting | -11.628 |
choosing | -11.407 |
Token | it |
Token ID | 340 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
adel | +18.383 |
ogether | +18.378 |
campaigner | +18.060 |
journalist | +17.717 |
ilde | +17.301 |
Neg logit contributions | |
preferring | -11.996 |
inability | -11.433 |
confines | -10.688 |
wanting | -9.563 |
choosing | -9.145 |
Token | shows |
Token ID | 2523 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
ogether | +8.476 |
adel | +8.187 |
campaigner | +7.997 |
ilde | +7.963 |
ér | +7.668 |
Neg logit contributions | |
preferring | -11.266 |
inability | -10.408 |
wanting | -9.660 |
choosing | -9.269 |
confines | -9.267 |
Token | the |
Token ID | 262 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
ogether | +10.324 |
campaigner | +10.198 |
adel | +10.164 |
journalist | +9.904 |
ilde | +9.746 |
Neg logit contributions | |
preferring | -8.844 |
inability | -7.810 |
confines | -7.227 |
wanting | -7.186 |
choosing | -6.846 |
Token | Newcastle |
Token ID | 22410 |
Feature activation | +4.32e+00 |
Pos logit contributions | |
ogether | +2.359 |
campaigner | +2.292 |
adel | +2.291 |
ilde | +2.240 |
journalist | +2.196 |
Neg logit contributions | |
preferring | -1.773 |
inability | -1.607 |
wanting | -1.503 |
choosing | -1.401 |
confines | -1.392 |
Token | United |
Token ID | 1578 |
Feature activation | +1.36e+01 |
Pos logit contributions | |
preferring | +3.466 |
inability | +3.088 |
wanting | +3.024 |
choosing | +2.807 |
confines | +2.684 |
Neg logit contributions | |
ogether | -4.236 |
adel | -4.095 |
campaigner | -4.039 |
ilde | -4.009 |
ér | -3.874 |
Token | developing |
Token ID | 5922 |
Feature activation | -7.76e+00 |
Pos logit contributions | |
preferring | +11.763 |
wanting | +11.009 |
inability | +10.380 |
choosing | +10.267 |
forgetting | +9.630 |
Neg logit contributions | |
ogether | -11.069 |
adel | -10.468 |
ilde | -10.288 |
earthqu | -10.053 |
quished | -9.889 |
Token | a |
Token ID | 257 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
ogether | +5.651 |
campaigner | +5.563 |
adel | +5.427 |
journalist | +5.240 |
ilde | +5.196 |
Neg logit contributions | |
preferring | -7.778 |
inability | -7.256 |
wanting | -6.783 |
confines | -6.557 |
choosing | -6.502 |
Token | meaningful |
Token ID | 11570 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
campaigner | +16.223 |
journalist | +15.612 |
ogether | +15.206 |
adel | +14.745 |
isan | +14.437 |
Neg logit contributions | |
preferring | -15.440 |
inability | -14.087 |
confines | -12.428 |
wanting | -12.333 |
forgetting | -12.264 |
Token | and |
Token ID | 290 |
Feature activation | -2.95e+01 |
Pos logit contributions | |
campaigner | +14.983 |
journalist | +14.251 |
ogether | +13.966 |
isan | +13.564 |
adel | +13.364 |
Neg logit contributions | |
preferring | -15.196 |
inability | -13.270 |
wanting | -12.319 |
forgetting | -11.980 |
choosing | -11.909 |
Token | structured |
Token ID | 20793 |
Feature activation | -1.55e+01 |
Pos logit contributions | |
campaigner | +21.825 |
journalist | +21.451 |
dign | +21.166 |
inform | +20.815 |
credible | +20.509 |
Neg logit contributions | |
preferring | -16.101 |
inability | -14.984 |
addons | -12.939 |
confines | -12.557 |
forgetting | -12.507 |
Token | relationship |
Token ID | 2776 |
Feature activation | -9.57e+00 |
Pos logit contributions | |
campaigner | +12.380 |
journalist | +11.720 |
ogether | +11.681 |
adel | +11.116 |
isan | +11.046 |
Neg logit contributions | |
preferring | -12.839 |
inability | -11.525 |
wanting | -10.670 |
choosing | -10.227 |
forgetting | -10.211 |
Token | with |
Token ID | 351 |
Feature activation | -8.22e+00 |
Pos logit contributions | |
ogether | +7.016 |
campaigner | +6.882 |
adel | +6.732 |
journalist | +6.582 |
ilde | +6.448 |
Neg logit contributions | |
preferring | -9.132 |
inability | -8.621 |
wanting | -7.928 |
confines | -7.765 |
forgetting | -7.588 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
ogether | +5.690 |
campaigner | +5.672 |
adel | +5.516 |
journalist | +5.358 |
ilde | +5.262 |
Neg logit contributions | |
preferring | -8.309 |
inability | -7.797 |
wanting | -7.277 |
confines | -7.061 |
choosing | -6.957 |
Token | fans |
Token ID | 3296 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
ogether | +0.905 |
adel | +0.870 |
campaigner | +0.868 |
ilde | +0.846 |
journalist | +0.818 |
Neg logit contributions | |
preferring | -1.182 |
inability | -1.098 |
wanting | -1.048 |
choosing | -0.995 |
confines | -0.991 |
Token | quite |
Token ID | 2407 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
ogether | +10.736 |
campaigner | +10.522 |
adel | +10.514 |
journalist | +10.242 |
ilde | +10.204 |
Neg logit contributions | |
preferring | -9.618 |
inability | -8.665 |
confines | -7.944 |
wanting | -7.885 |
choosing | -7.404 |
Token | easy |
Token ID | 2562 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
campaigner | +12.257 |
ogether | +12.154 |
journalist | +12.022 |
adel | +11.960 |
ilde | +11.673 |
Neg logit contributions | |
preferring | -12.573 |
inability | -11.408 |
confines | -10.682 |
wanting | -10.198 |
choosing | -9.833 |
Token | to |
Token ID | 284 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
preferring | +9.681 |
inability | +8.963 |
wanting | +8.893 |
choosing | +8.400 |
forgetting | +8.184 |
Neg logit contributions | |
ogether | -8.268 |
adel | -7.982 |
ilde | -7.802 |
campaigner | -7.792 |
isan | -7.470 |
Token | sort |
Token ID | 3297 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
ogether | +3.587 |
campaigner | +3.501 |
adel | +3.480 |
ilde | +3.356 |
journalist | +3.308 |
Neg logit contributions | |
preferring | -4.951 |
inability | -4.584 |
wanting | -4.363 |
choosing | -4.156 |
confines | -4.150 |
Token | those |
Token ID | 883 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
ogether | +13.478 |
campaigner | +12.842 |
adel | +12.787 |
ilde | +12.652 |
ér | +12.629 |
Neg logit contributions | |
preferring | -14.386 |
inability | -12.897 |
confines | -12.263 |
wanting | -12.035 |
choosing | -11.580 |
Token | issues |
Token ID | 2428 |
Feature activation | -2.93e+01 |
Pos logit contributions | |
ogether | +12.931 |
campaigner | +12.705 |
journalist | +12.297 |
ér | +12.172 |
adel | +12.135 |
Neg logit contributions | |
preferring | -14.412 |
inability | -12.877 |
wanting | -11.909 |
choosing | -11.672 |
confines | -11.531 |
Token | . |
Token ID | 13 |
Feature activation | -6.87e+00 |
Pos logit contributions | |
ogether | +18.997 |
campaigner | +18.282 |
journalist | +18.066 |
adel | +18.012 |
inform | +17.655 |
Neg logit contributions | |
preferring | -19.253 |
inability | -17.931 |
confines | -16.218 |
wanting | -15.617 |
choosing | -14.967 |
Token | � |
Token ID | 447 |
Feature activation | -6.20e+00 |
Pos logit contributions | |
ogether | +4.799 |
adel | +4.646 |
campaigner | +4.580 |
ilde | +4.501 |
journalist | +4.424 |
Neg logit contributions | |
preferring | -7.168 |
inability | -6.700 |
wanting | -6.264 |
choosing | -6.032 |
confines | -6.017 |
Token | � |
Token ID | 251 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
ogether | +3.862 |
adel | +3.678 |
campaigner | +3.669 |
ilde | +3.580 |
journalist | +3.456 |
Neg logit contributions | |
preferring | -6.995 |
inability | -6.548 |
wanting | -6.275 |
choosing | -5.984 |
confines | -5.980 |
Token |
|
Token ID | 198 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
ogether | +2.429 |
campaigner | +2.332 |
adel | +2.331 |
ilde | +2.258 |
journalist | +2.211 |
Neg logit contributions | |
preferring | -3.370 |
inability | -3.141 |
wanting | -2.980 |
choosing | -2.844 |
confines | -2.837 |
Token |
|
Token ID | 198 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
ogether | +1.164 |
campaigner | +1.120 |
adel | +1.118 |
ilde | +1.086 |
journalist | +1.056 |
Neg logit contributions | |
preferring | -1.532 |
inability | -1.423 |
wanting | -1.356 |
choosing | -1.289 |
confines | -1.283 |
Token | to |
Token ID | 284 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
preferring | +9.887 |
inability | +8.977 |
wanting | +8.776 |
choosing | +8.599 |
forgetting | +8.210 |
Neg logit contributions | |
ogether | -8.171 |
adel | -7.741 |
campaigner | -7.719 |
ér | -7.272 |
alysed | -7.215 |
Token | include |
Token ID | 2291 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
preferring | +1.398 |
inability | +1.296 |
wanting | +1.240 |
choosing | +1.181 |
confines | +1.168 |
Neg logit contributions | |
ogether | -1.110 |
adel | -1.069 |
campaigner | -1.065 |
ilde | -1.033 |
journalist | -1.004 |
Token | "\ |
Token ID | 37082 |
Feature activation | +7.10e+00 |
Pos logit contributions | |
preferring | +1.361 |
inability | +1.263 |
wanting | +1.208 |
choosing | +1.151 |
confines | +1.141 |
Neg logit contributions | |
ogether | -1.050 |
adel | -1.007 |
campaigner | -1.006 |
ilde | -0.968 |
journalist | -0.948 |
Token | :" |
Token ID | 11097 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
preferring | +5.969 |
inability | +5.468 |
wanting | +5.249 |
choosing | +4.947 |
confines | +4.888 |
Neg logit contributions | |
ogether | -6.160 |
campaigner | -6.031 |
adel | -5.847 |
ilde | -5.732 |
journalist | -5.722 |
Token | you |
Token ID | 345 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
ogether | +2.285 |
adel | +2.191 |
campaigner | +2.189 |
ilde | +2.128 |
journalist | +2.056 |
Neg logit contributions | |
preferring | -3.562 |
inability | -3.333 |
wanting | -3.177 |
choosing | -3.030 |
confines | -3.021 |
Token | have |
Token ID | 423 |
Feature activation | +3.20e+01 |
Pos logit contributions | |
preferring | +11.085 |
wanting | +10.130 |
inability | +9.984 |
choosing | +9.598 |
confines | +9.132 |
Neg logit contributions | |
ogether | -12.030 |
earthqu | -11.441 |
adel | -11.247 |
campaigner | -11.106 |
alysed | -10.978 |
Token | to |
Token ID | 284 |
Feature activation | +9.25e+00 |
Pos logit contributions | |
preferring | +20.856 |
to | +20.005 |
inability | +19.494 |
wanting | +19.347 |
to | +19.345 |
Neg logit contributions | |
ogether | -18.733 |
campaigner | -18.719 |
adel | -18.644 |
alysed | -17.719 |
ér | -17.338 |
Token | specify |
Token ID | 11986 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
preferring | +8.934 |
inability | +8.186 |
wanting | +8.056 |
choosing | +7.780 |
confines | +7.558 |
Neg logit contributions | |
ogether | -6.775 |
adel | -6.473 |
alysed | -6.419 |
campaigner | -6.402 |
earthqu | -6.061 |
Token | " |
Token ID | 366 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
preferring | +9.260 |
inability | +8.489 |
wanting | +8.292 |
choosing | +7.924 |
confines | +7.706 |
Neg logit contributions | |
ogether | -8.046 |
campaigner | -7.733 |
adel | -7.657 |
ér | -7.357 |
alysed | -7.287 |
Token | \\ |
Token ID | 6852 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
preferring | +10.159 |
inability | +9.372 |
wanting | +8.947 |
choosing | +8.601 |
to | +8.542 |
Neg logit contributions | |
ogether | -9.461 |
campaigner | -9.419 |
adel | -8.906 |
journalist | -8.901 |
ér | -8.751 |
Token | : |
Token ID | 25 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
preferring | +9.487 |
inability | +8.773 |
wanting | +8.490 |
choosing | +8.013 |
to | +7.948 |
Neg logit contributions | |
ogether | -8.280 |
campaigner | -8.231 |
adel | -7.871 |
ér | -7.782 |
journalist | -7.748 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
preferring | +4.466 |
inability | +4.075 |
wanting | +3.994 |
choosing | +3.791 |
confines | +3.660 |
Neg logit contributions | |
ogether | -3.483 |
adel | -3.352 |
campaigner | -3.315 |
ilde | -3.296 |
alysed | -3.107 |
Token | seeking |
Token ID | 6095 |
Feature activation | +8.76e+00 |
Pos logit contributions | |
ogether | +1.313 |
adel | +1.280 |
campaigner | +1.279 |
ilde | +1.258 |
journalist | +1.232 |
Neg logit contributions | |
preferring | -0.665 |
inability | -0.581 |
wanting | -0.538 |
choosing | -0.489 |
confines | -0.474 |
Token | to |
Token ID | 284 |
Feature activation | -6.01e+00 |
Pos logit contributions | |
preferring | +8.448 |
inability | +8.074 |
wanting | +7.647 |
choosing | +7.204 |
confines | +7.025 |
Neg logit contributions | |
ogether | -6.458 |
ilde | -6.224 |
campaigner | -6.175 |
adel | -6.143 |
alysed | -5.818 |
Token | force |
Token ID | 2700 |
Feature activation | -8.62e+00 |
Pos logit contributions | |
ogether | +4.605 |
campaigner | +4.480 |
adel | +4.458 |
ilde | +4.296 |
journalist | +4.270 |
Neg logit contributions | |
preferring | -5.938 |
inability | -5.482 |
wanting | -5.204 |
choosing | -4.953 |
confines | -4.910 |
Token | the |
Token ID | 262 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
ogether | +6.066 |
adel | +5.806 |
campaigner | +5.790 |
ilde | +5.593 |
journalist | +5.483 |
Neg logit contributions | |
preferring | -8.927 |
inability | -8.283 |
wanting | -7.880 |
confines | -7.579 |
choosing | -7.473 |
Token | agency |
Token ID | 4086 |
Feature activation | +3.32e+01 |
Pos logit contributions | |
preferring | +5.081 |
inability | +4.788 |
wanting | +4.451 |
choosing | +4.224 |
confines | +4.176 |
Neg logit contributions | |
ogether | -5.738 |
adel | -5.637 |
campaigner | -5.559 |
ilde | -5.550 |
alysed | -5.410 |
Token | to |
Token ID | 284 |
Feature activation | -6.10e+00 |
Pos logit contributions | |
preferring | +22.089 |
inability | +20.996 |
to | +20.657 |
to | +20.436 |
wanting | +20.273 |
Neg logit contributions | |
ilde | -18.280 |
ogether | -17.689 |
campaigner | -17.219 |
isan | -17.081 |
adel | -16.879 |
Token | finish |
Token ID | 5461 |
Feature activation | -9.44e+00 |
Pos logit contributions | |
ogether | +4.201 |
campaigner | +4.055 |
adel | +4.032 |
ilde | +3.899 |
journalist | +3.858 |
Neg logit contributions | |
preferring | -6.459 |
inability | -6.021 |
wanting | -5.747 |
choosing | -5.452 |
confines | -5.444 |
Token | investigating |
Token ID | 10240 |
Feature activation | -1.52e+01 |
Pos logit contributions | |
ogether | +9.105 |
campaigner | +8.828 |
adel | +8.690 |
ilde | +8.527 |
ér | +8.503 |
Neg logit contributions | |
preferring | -7.002 |
inability | -6.299 |
wanting | -5.866 |
confines | -5.609 |
forgetting | -5.354 |
Token | civil |
Token ID | 3026 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
ogether | +12.271 |
campaigner | +12.097 |
adel | +11.738 |
journalist | +11.681 |
ilde | +11.262 |
Neg logit contributions | |
preferring | -12.104 |
inability | -10.923 |
wanting | -10.306 |
confines | -10.083 |
forgetting | -9.649 |
Token | - |
Token ID | 12 |
Feature activation | -7.77e+00 |
Pos logit contributions | |
ogether | +4.844 |
campaigner | +4.650 |
adel | +4.510 |
journalist | +4.322 |
ilde | +4.214 |
Neg logit contributions | |
preferring | -10.740 |
inability | -9.950 |
wanting | -9.731 |
choosing | -9.316 |
confines | -9.237 |
Token |
|
Token ID | 198 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
ogether | +0.037 |
campaigner | +0.035 |
adel | +0.035 |
ilde | +0.034 |
journalist | +0.033 |
Neg logit contributions | |
preferring | -0.047 |
inability | -0.044 |
wanting | -0.042 |
choosing | -0.039 |
confines | -0.039 |
Token |
|
Token ID | 198 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ogether | +2.433 |
adel | +2.359 |
campaigner | +2.338 |
ilde | +2.281 |
journalist | +2.227 |
Neg logit contributions | |
preferring | -3.504 |
inability | -3.259 |
wanting | -3.089 |
choosing | -2.950 |
confines | -2.943 |
Token | And |
Token ID | 1870 |
Feature activation | -7.99e+00 |
Pos logit contributions | |
preferring | +0.145 |
inability | +0.133 |
wanting | +0.126 |
choosing | +0.119 |
confines | +0.118 |
Neg logit contributions | |
ogether | -0.142 |
campaigner | -0.138 |
adel | -0.137 |
ilde | -0.134 |
journalist | -0.131 |
Token | when |
Token ID | 618 |
Feature activation | +4.19e+00 |
Pos logit contributions | |
ogether | +6.460 |
campaigner | +6.318 |
adel | +6.212 |
ilde | +6.043 |
journalist | +6.041 |
Neg logit contributions | |
preferring | -7.237 |
inability | -6.706 |
wanting | -6.281 |
confines | -6.072 |
choosing | -5.910 |
Token | it |
Token ID | 340 |
Feature activation | +4.77e+00 |
Pos logit contributions | |
preferring | +4.303 |
inability | +3.971 |
wanting | +3.872 |
choosing | +3.723 |
confines | +3.571 |
Neg logit contributions | |
ogether | -3.168 |
adel | -3.043 |
campaigner | -2.960 |
ilde | -2.937 |
ér | -2.855 |
Token | comes |
Token ID | 2058 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
preferring | +4.916 |
inability | +4.616 |
wanting | +4.474 |
choosing | +4.258 |
confines | +4.220 |
Neg logit contributions | |
ogether | -3.471 |
adel | -3.280 |
campaigner | -3.229 |
ilde | -3.190 |
ér | -3.076 |
Token | to |
Token ID | 284 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
preferring | +24.212 |
wanting | +22.416 |
inability | +22.347 |
choosing | +22.042 |
to | +21.476 |
Neg logit contributions | |
ogether | -18.926 |
adel | -18.038 |
ilde | -18.019 |
isan | -17.187 |
ér | -16.707 |
Token | nodding |
Token ID | 47583 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
preferring | +19.395 |
wanting | +17.732 |
inability | +17.383 |
choosing | +17.164 |
forgetting | +16.162 |
Neg logit contributions | |
ogether | -13.757 |
ilde | -13.366 |
adel | -13.216 |
ér | -12.677 |
earthqu | -12.454 |
Token | off |
Token ID | 572 |
Feature activation | +5.27e+00 |
Pos logit contributions | |
ogether | +2.010 |
campaigner | +1.942 |
adel | +1.933 |
ilde | +1.878 |
journalist | +1.835 |
Neg logit contributions | |
preferring | -2.563 |
inability | -2.380 |
wanting | -2.260 |
choosing | -2.152 |
confines | -2.143 |
Token | on |
Token ID | 319 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
preferring | +5.527 |
inability | +5.115 |
wanting | +4.969 |
choosing | +4.697 |
forgetting | +4.602 |
Neg logit contributions | |
ogether | -3.804 |
adel | -3.654 |
campaigner | -3.528 |
ilde | -3.499 |
ér | -3.322 |
Token | the |
Token ID | 262 |
Feature activation | +1.68e+01 |
Pos logit contributions | |
preferring | +14.072 |
inability | +13.000 |
wanting | +12.819 |
choosing | +12.233 |
forgetting | +11.736 |
Neg logit contributions | |
ogether | -10.840 |
adel | -10.685 |
ilde | -10.458 |
ér | -9.928 |
campaigner | -9.841 |
Token | minutes |
Token ID | 2431 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
preferring | +0.502 |
inability | +0.468 |
wanting | +0.448 |
choosing | +0.425 |
confines | +0.420 |
Neg logit contributions | |
ogether | -0.392 |
adel | -0.375 |
campaigner | -0.373 |
ilde | -0.366 |
ér | -0.351 |
Token | . |
Token ID | 13 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
ogether | +2.237 |
campaigner | +2.142 |
adel | +2.134 |
ilde | +2.044 |
journalist | +2.009 |
Neg logit contributions | |
preferring | -3.741 |
inability | -3.513 |
wanting | -3.342 |
confines | -3.200 |
choosing | -3.194 |
Token | From |
Token ID | 3574 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
ogether | +2.666 |
adel | +2.589 |
campaigner | +2.574 |
ilde | +2.504 |
journalist | +2.468 |
Neg logit contributions | |
preferring | -3.539 |
inability | -3.289 |
wanting | -3.097 |
choosing | -2.963 |
confines | -2.953 |
Token | M |
Token ID | 337 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
preferring | +10.141 |
inability | +9.414 |
wanting | +9.273 |
choosing | +8.837 |
forgetting | +8.485 |
Neg logit contributions | |
ogether | -7.884 |
adel | -7.645 |
ilde | -7.558 |
campaigner | -7.302 |
isan | -7.198 |
Token | iley |
Token ID | 9618 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
ogether | +0.737 |
campaigner | +0.707 |
adel | +0.702 |
ilde | +0.679 |
journalist | +0.661 |
Neg logit contributions | |
preferring | -1.186 |
inability | -1.110 |
wanting | -1.061 |
choosing | -1.014 |
confines | -1.009 |
Token | Cyrus |
Token ID | 34305 |
Feature activation | +3.47e+01 |
Pos logit contributions | |
preferring | +6.120 |
inability | +5.594 |
wanting | +5.415 |
choosing | +5.165 |
forgetting | +4.973 |
Neg logit contributions | |
ogether | -5.515 |
ilde | -5.197 |
adel | -5.180 |
campaigner | -5.156 |
isan | -4.929 |
Token | phot |
Token ID | 2825 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
preferring | +25.209 |
wanting | +24.005 |
choosing | +22.698 |
inability | +22.535 |
to | +21.835 |
Neg logit contributions | |
ogether | -17.932 |
ilde | -16.830 |
isan | -15.782 |
owship | -15.570 |
emed | -15.288 |
Token | ob |
Token ID | 672 |
Feature activation | -5.10e+00 |
Pos logit contributions | |
ogether | +1.858 |
adel | +1.761 |
campaigner | +1.732 |
ilde | +1.642 |
journalist | +1.568 |
Neg logit contributions | |
preferring | -5.359 |
inability | -5.062 |
wanting | -4.878 |
confines | -4.698 |
choosing | -4.689 |
Token | omb |
Token ID | 2381 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
ogether | +2.658 |
adel | +2.541 |
campaigner | +2.485 |
ilde | +2.406 |
journalist | +2.288 |
Neg logit contributions | |
preferring | -6.384 |
inability | -6.002 |
wanting | -5.772 |
confines | -5.553 |
choosing | -5.539 |
Token | ing |
Token ID | 278 |
Feature activation | +8.39e+00 |
Pos logit contributions | |
preferring | +14.686 |
wanting | +13.817 |
inability | +13.635 |
choosing | +12.842 |
confines | +12.433 |
Neg logit contributions | |
ogether | -10.583 |
ilde | -10.009 |
campaigner | -9.748 |
isan | -9.526 |
adel | -9.239 |
Token | David |
Token ID | 3271 |
Feature activation | -3.56e-02 |
Pos logit contributions | |
preferring | +8.251 |
inability | +7.691 |
wanting | +7.524 |
choosing | +7.071 |
confines | +6.909 |
Neg logit contributions | |
ogether | -6.171 |
adel | -5.772 |
ilde | -5.694 |
isan | -5.629 |
campaigner | -5.596 |
Token | state |
Token ID | 1181 |
Feature activation | +4.88e+00 |
Pos logit contributions | |
preferring | +6.557 |
inability | +6.174 |
wanting | +5.923 |
choosing | +5.666 |
confines | +5.517 |
Neg logit contributions | |
ogether | -4.988 |
campaigner | -4.572 |
adel | -4.565 |
ilde | -4.560 |
ér | -4.432 |
Token | - |
Token ID | 12 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
preferring | +5.081 |
inability | +4.796 |
wanting | +4.576 |
choosing | +4.398 |
confines | +4.364 |
Neg logit contributions | |
ogether | -3.477 |
campaigner | -3.325 |
adel | -3.297 |
ilde | -3.280 |
ér | -3.053 |
Token | funded |
Token ID | 18246 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
preferring | +0.461 |
inability | +0.429 |
wanting | +0.410 |
choosing | +0.391 |
confines | +0.386 |
Neg logit contributions | |
ogether | -0.354 |
campaigner | -0.346 |
adel | -0.340 |
ilde | -0.335 |
journalist | -0.323 |
Token | private |
Token ID | 2839 |
Feature activation | -5.68e-02 |
Pos logit contributions | |
preferring | +1.718 |
inability | +1.596 |
wanting | +1.516 |
choosing | +1.442 |
confines | +1.429 |
Neg logit contributions | |
ogether | -1.493 |
adel | -1.420 |
campaigner | -1.411 |
ilde | -1.405 |
ér | -1.341 |
Token | adoption |
Token ID | 12695 |
Feature activation | -2.92e+00 |
Pos logit contributions | |
ogether | +0.053 |
adel | +0.051 |
campaigner | +0.051 |
ilde | +0.050 |
ér | +0.048 |
Neg logit contributions | |
preferring | -0.048 |
inability | -0.044 |
wanting | -0.042 |
choosing | -0.040 |
confines | -0.039 |
Token | agencies |
Token ID | 5942 |
Feature activation | +2.92e+01 |
Pos logit contributions | |
ogether | +2.185 |
campaigner | +2.124 |
adel | +2.110 |
ilde | +2.035 |
journalist | +2.003 |
Neg logit contributions | |
preferring | -2.960 |
inability | -2.759 |
wanting | -2.620 |
confines | -2.491 |
choosing | -2.490 |
Token | to |
Token ID | 284 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
preferring | +20.212 |
inability | +19.504 |
wanting | +19.310 |
to | +17.838 |
choosing | +17.783 |
Neg logit contributions | |
ilde | -19.426 |
ogether | -18.681 |
campaigner | -17.721 |
earthqu | -17.195 |
adel | -16.921 |
Token | turn |
Token ID | 1210 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
preferring | +0.127 |
inability | +0.118 |
wanting | +0.112 |
choosing | +0.106 |
confines | +0.105 |
Neg logit contributions | |
ogether | -0.118 |
adel | -0.114 |
campaigner | -0.113 |
ilde | -0.112 |
journalist | -0.107 |
Token | away |
Token ID | 1497 |
Feature activation | -4.27e+00 |
Pos logit contributions | |
ogether | +1.715 |
campaigner | +1.645 |
adel | +1.645 |
ilde | +1.591 |
journalist | +1.546 |
Neg logit contributions | |
preferring | -2.593 |
inability | -2.419 |
wanting | -2.311 |
choosing | -2.204 |
confines | -2.196 |
Token | prospective |
Token ID | 17530 |
Feature activation | -8.16e+00 |
Pos logit contributions | |
ogether | +3.253 |
campaigner | +3.193 |
adel | +3.158 |
ilde | +3.072 |
journalist | +3.045 |
Neg logit contributions | |
preferring | -4.182 |
inability | -3.863 |
wanting | -3.654 |
confines | -3.511 |
choosing | -3.476 |
Token | parents |
Token ID | 3397 |
Feature activation | +8.38e+00 |
Pos logit contributions | |
ogether | +6.104 |
campaigner | +6.097 |
adel | +6.011 |
journalist | +5.861 |
ilde | +5.774 |
Neg logit contributions | |
preferring | -7.677 |
inability | -7.093 |
wanting | -6.653 |
confines | -6.416 |
forgetting | -6.293 |
Token | � |
Token ID | 250 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
ogether | +2.230 |
campaigner | +2.133 |
adel | +2.127 |
ilde | +2.075 |
journalist | +2.009 |
Neg logit contributions | |
preferring | -3.490 |
inability | -3.253 |
wanting | -3.112 |
choosing | -2.964 |
confines | -2.961 |
Token | Early |
Token ID | 20457 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
preferring | +2.807 |
inability | +2.587 |
wanting | +2.455 |
choosing | +2.322 |
confines | +2.296 |
Neg logit contributions | |
ogether | -2.598 |
campaigner | -2.542 |
adel | -2.523 |
ilde | -2.463 |
journalist | -2.390 |
Token | results |
Token ID | 2482 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
ogether | +11.269 |
campaigner | +11.219 |
adel | +10.928 |
journalist | +10.745 |
ilde | +10.626 |
Neg logit contributions | |
preferring | -10.764 |
inability | -9.651 |
wanting | -9.245 |
confines | -8.808 |
forgetting | -8.542 |
Token | from |
Token ID | 422 |
Feature activation | -6.25e+00 |
Pos logit contributions | |
ogether | +10.055 |
adel | +9.969 |
campaigner | +9.871 |
journalist | +9.701 |
ilde | +9.421 |
Neg logit contributions | |
preferring | -11.171 |
inability | -10.438 |
wanting | -9.778 |
confines | -9.502 |
forgetting | -9.351 |
Token | 2017 |
Token ID | 2177 |
Feature activation | -5.08e+00 |
Pos logit contributions | |
ogether | +4.597 |
adel | +4.465 |
campaigner | +4.436 |
journalist | +4.274 |
ilde | +4.245 |
Neg logit contributions | |
preferring | -6.264 |
inability | -5.788 |
wanting | -5.512 |
confines | -5.289 |
choosing | -5.202 |
Token | suggest |
Token ID | 1950 |
Feature activation | +7.22e+00 |
Pos logit contributions | |
ogether | +3.626 |
adel | +3.507 |
campaigner | +3.476 |
ilde | +3.337 |
journalist | +3.311 |
Neg logit contributions | |
preferring | -5.292 |
inability | -4.901 |
wanting | -4.682 |
confines | -4.476 |
choosing | -4.459 |
Token | the |
Token ID | 262 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
preferring | +5.857 |
inability | +5.441 |
wanting | +5.095 |
choosing | +4.851 |
confines | +4.681 |
Neg logit contributions | |
ogether | -6.670 |
campaigner | -6.483 |
adel | -6.389 |
ilde | -6.336 |
ér | -6.084 |
Token | individual |
Token ID | 1981 |
Feature activation | +4.29e+00 |
Pos logit contributions | |
preferring | +9.132 |
inability | +8.987 |
wanting | +8.157 |
choosing | +7.904 |
confines | +7.876 |
Neg logit contributions | |
ogether | -7.650 |
campaigner | -7.446 |
ilde | -7.388 |
adel | -7.382 |
ér | -6.965 |
Token | market |
Token ID | 1910 |
Feature activation | +7.71e+00 |
Pos logit contributions | |
preferring | +4.041 |
inability | +3.801 |
wanting | +3.576 |
choosing | +3.445 |
confines | +3.367 |
Neg logit contributions | |
ogether | -3.500 |
adel | -3.355 |
campaigner | -3.345 |
ilde | -3.333 |
ér | -3.173 |
Token | is |
Token ID | 318 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
preferring | +7.358 |
inability | +7.007 |
wanting | +6.559 |
confines | +6.306 |
choosing | +6.294 |
Neg logit contributions | |
ogether | -5.880 |
adel | -5.619 |
ilde | -5.578 |
campaigner | -5.551 |
isan | -5.238 |
Token | stabil |
Token ID | 14349 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
ogether | +0.982 |
campaigner | +0.949 |
adel | +0.948 |
ilde | +0.925 |
journalist | +0.901 |
Neg logit contributions | |
preferring | -0.997 |
inability | -0.917 |
wanting | -0.868 |
choosing | -0.820 |
confines | -0.812 |
Token | ( |
Token ID | 357 |
Feature activation | +6.39e+00 |
Pos logit contributions | |
preferring | +3.013 |
inability | +2.764 |
wanting | +2.657 |
choosing | +2.495 |
confines | +2.470 |
Neg logit contributions | |
ogether | -2.733 |
campaigner | -2.637 |
adel | -2.617 |
ilde | -2.573 |
journalist | -2.477 |
Token | QL |
Token ID | 9711 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
preferring | +5.331 |
inability | +4.914 |
wanting | +4.695 |
choosing | +4.373 |
confines | +4.346 |
Neg logit contributions | |
ogether | -5.753 |
campaigner | -5.494 |
ilde | -5.373 |
adel | -5.235 |
journalist | -5.204 |
Token | D |
Token ID | 35 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
preferring | +2.105 |
inability | +1.934 |
wanting | +1.820 |
choosing | +1.686 |
confines | +1.677 |
Neg logit contributions | |
ogether | -2.472 |
campaigner | -2.374 |
adel | -2.364 |
ilde | -2.333 |
journalist | -2.256 |
Token | ), |
Token ID | 828 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
preferring | +3.564 |
inability | +3.288 |
wanting | +3.111 |
choosing | +2.947 |
confines | +2.893 |
Neg logit contributions | |
ogether | -3.374 |
adel | -3.207 |
campaigner | -3.197 |
ilde | -3.136 |
ér | -3.030 |
Token | South |
Token ID | 2520 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
preferring | +3.865 |
inability | +3.579 |
wanting | +3.455 |
choosing | +3.257 |
confines | +3.209 |
Neg logit contributions | |
ogether | -3.531 |
adel | -3.319 |
campaigner | -3.311 |
ilde | -3.304 |
alysed | -3.178 |
Token | Australia |
Token ID | 4505 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
ogether | +2.051 |
adel | +1.975 |
campaigner | +1.972 |
ilde | +1.912 |
journalist | +1.863 |
Neg logit contributions | |
preferring | -2.712 |
inability | -2.521 |
wanting | -2.400 |
choosing | -2.283 |
confines | -2.273 |
Token | ( |
Token ID | 357 |
Feature activation | +9.66e+00 |
Pos logit contributions | |
preferring | +6.597 |
inability | +6.009 |
wanting | +5.795 |
choosing | +5.439 |
confines | +5.373 |
Neg logit contributions | |
ogether | -6.444 |
campaigner | -6.192 |
adel | -6.169 |
ilde | -6.074 |
journalist | -5.866 |
Token | SA |
Token ID | 4090 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
preferring | +7.795 |
inability | +7.143 |
wanting | +6.910 |
to | +6.449 |
choosing | +6.288 |
Neg logit contributions | |
ogether | -8.544 |
campaigner | -8.206 |
ilde | -7.922 |
journalist | -7.760 |
alysed | -7.730 |
Token | ), |
Token ID | 828 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
preferring | +0.100 |
inability | +0.092 |
wanting | +0.088 |
choosing | +0.083 |
confines | +0.082 |
Neg logit contributions | |
ogether | -0.084 |
adel | -0.081 |
campaigner | -0.081 |
ilde | -0.079 |
journalist | -0.077 |
Token | Tasmania |
Token ID | 46896 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
preferring | +2.025 |
inability | +1.883 |
wanting | +1.811 |
choosing | +1.721 |
confines | +1.698 |
Neg logit contributions | |
ogether | -1.590 |
adel | -1.503 |
campaigner | -1.503 |
ilde | -1.486 |
ér | -1.415 |
Token | ( |
Token ID | 357 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
preferring | +1.957 |
inability | +1.810 |
wanting | +1.720 |
choosing | +1.629 |
confines | +1.620 |
Neg logit contributions | |
ogether | -1.691 |
campaigner | -1.630 |
adel | -1.629 |
ilde | -1.586 |
journalist | -1.545 |
Token | illegal |
Token ID | 5293 |
Feature activation | -9.07e+00 |
Pos logit contributions | |
ogether | +5.567 |
adel | +5.443 |
campaigner | +5.440 |
journalist | +5.242 |
ilde | +5.179 |
Neg logit contributions | |
preferring | -6.381 |
inability | -5.901 |
wanting | -5.496 |
confines | -5.250 |
choosing | -5.203 |
Token | . |
Token ID | 13 |
Feature activation | -5.15e-01 |
Pos logit contributions | |
ogether | +7.256 |
adel | +7.030 |
campaigner | +7.007 |
journalist | +6.748 |
ilde | +6.641 |
Neg logit contributions | |
preferring | -8.397 |
inability | -7.646 |
wanting | -7.194 |
choosing | -6.837 |
confines | -6.802 |
Token | It |
Token ID | 632 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
ogether | +0.414 |
campaigner | +0.399 |
adel | +0.398 |
ilde | +0.387 |
journalist | +0.375 |
Neg logit contributions | |
preferring | -0.501 |
inability | -0.465 |
wanting | -0.443 |
choosing | -0.420 |
confines | -0.418 |
Token | was |
Token ID | 373 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
ogether | +3.560 |
adel | +3.429 |
campaigner | +3.410 |
ilde | +3.320 |
journalist | +3.239 |
Neg logit contributions | |
preferring | -4.620 |
inability | -4.270 |
wanting | -4.050 |
choosing | -3.849 |
confines | -3.838 |
Token | the |
Token ID | 262 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
ogether | +4.046 |
campaigner | +3.924 |
adel | +3.910 |
ilde | +3.783 |
journalist | +3.770 |
Neg logit contributions | |
preferring | -4.638 |
inability | -4.265 |
wanting | -4.025 |
confines | -3.840 |
choosing | -3.802 |
Token | exact |
Token ID | 2748 |
Feature activation | +8.96e+00 |
Pos logit contributions | |
preferring | +7.400 |
inability | +7.207 |
wanting | +6.663 |
choosing | +6.407 |
confines | +6.391 |
Neg logit contributions | |
ogether | -6.796 |
adel | -6.689 |
ilde | -6.514 |
campaigner | -6.396 |
ér | -6.221 |
Token | opposite |
Token ID | 6697 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
preferring | +7.183 |
inability | +7.092 |
wanting | +6.477 |
confines | +6.198 |
choosing | +6.120 |
Neg logit contributions | |
ogether | -7.969 |
adel | -7.787 |
ilde | -7.612 |
campaigner | -7.548 |
ér | -7.309 |
Token | of |
Token ID | 286 |
Feature activation | +7.34e+00 |
Pos logit contributions | |
preferring | +11.548 |
inability | +10.823 |
wanting | +10.484 |
choosing | +9.814 |
forgetting | +9.683 |
Neg logit contributions | |
ogether | -10.498 |
adel | -10.043 |
ilde | -9.954 |
campaigner | -9.542 |
isan | -9.292 |
Token | The |
Token ID | 383 |
Feature activation | +6.16e+00 |
Pos logit contributions | |
preferring | +6.614 |
inability | +6.066 |
wanting | +5.938 |
choosing | +5.599 |
forgetting | +5.403 |
Neg logit contributions | |
ogether | -6.231 |
adel | -6.053 |
ilde | -5.960 |
campaigner | -5.856 |
ér | -5.631 |
Token | Pur |
Token ID | 9330 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
preferring | +5.398 |
inability | +5.123 |
wanting | +4.740 |
choosing | +4.540 |
confines | +4.528 |
Neg logit contributions | |
ogether | -5.274 |
adel | -5.172 |
campaigner | -5.020 |
ilde | -4.973 |
ér | -4.712 |
Token | ge |
Token ID | 469 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
preferring | +1.268 |
inability | +1.196 |
wanting | +1.148 |
choosing | +1.107 |
confines | +1.084 |
Neg logit contributions | |
ogether | -0.706 |
campaigner | -0.694 |
adel | -0.663 |
ilde | -0.645 |
journalist | -0.630 |
Token | , |
Token ID | 11 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
ogether | +5.921 |
campaigner | +5.778 |
adel | +5.738 |
journalist | +5.576 |
ilde | +5.480 |
Neg logit contributions | |
preferring | -8.365 |
inability | -7.846 |
wanting | -7.270 |
confines | -7.109 |
choosing | -6.963 |
Token | handcuffed |
Token ID | 41529 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
ogether | +2.118 |
campaigner | +2.048 |
adel | +2.046 |
ilde | +1.988 |
journalist | +1.948 |
Neg logit contributions | |
preferring | -2.394 |
inability | -2.213 |
wanting | -2.097 |
choosing | -1.987 |
confines | -1.980 |
Token | , |
Token ID | 11 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
ogether | +1.286 |
campaigner | +1.237 |
adel | +1.237 |
ilde | +1.200 |
journalist | +1.167 |
Neg logit contributions | |
preferring | -1.698 |
inability | -1.577 |
wanting | -1.503 |
choosing | -1.429 |
confines | -1.422 |
Token | and |
Token ID | 290 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
ogether | +1.813 |
campaigner | +1.736 |
adel | +1.735 |
ilde | +1.677 |
journalist | +1.627 |
Neg logit contributions | |
preferring | -2.976 |
inability | -2.783 |
wanting | -2.662 |
choosing | -2.544 |
confines | -2.534 |
Token | detained |
Token ID | 14847 |
Feature activation | -9.92e+00 |
Pos logit contributions | |
ogether | +0.020 |
adel | +0.019 |
campaigner | +0.019 |
ilde | +0.019 |
ér | +0.018 |
Neg logit contributions | |
preferring | -0.021 |
inability | -0.020 |
wanting | -0.019 |
choosing | -0.018 |
confines | -0.018 |
Token | for |
Token ID | 329 |
Feature activation | +7.36e+00 |
Pos logit contributions | |
ogether | +7.320 |
campaigner | +7.116 |
adel | +7.058 |
journalist | +6.901 |
ilde | +6.757 |
Neg logit contributions | |
preferring | -9.386 |
inability | -8.751 |
wanting | -8.092 |
confines | -7.886 |
choosing | -7.746 |
Token | nearly |
Token ID | 3016 |
Feature activation | +7.14e+00 |
Pos logit contributions | |
preferring | +6.957 |
inability | +6.539 |
wanting | +6.274 |
choosing | +5.932 |
forgetting | +5.770 |
Neg logit contributions | |
ogether | -6.060 |
ilde | -5.800 |
adel | -5.771 |
campaigner | -5.612 |
ér | -5.430 |
Token | five |
Token ID | 1936 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
preferring | +6.659 |
inability | +6.297 |
wanting | +6.003 |
choosing | +5.705 |
forgetting | +5.529 |
Neg logit contributions | |
ogether | -5.877 |
ilde | -5.645 |
adel | -5.613 |
campaigner | -5.540 |
ér | -5.284 |
Token | hours |
Token ID | 2250 |
Feature activation | -2.21e+00 |
Pos logit contributions | |
preferring | +2.077 |
inability | +1.937 |
wanting | +1.839 |
choosing | +1.743 |
confines | +1.728 |
Neg logit contributions | |
ogether | -1.897 |
adel | -1.847 |
campaigner | -1.819 |
ilde | -1.797 |
ér | -1.707 |
Token | because |
Token ID | 780 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
ogether | +1.360 |
adel | +1.295 |
campaigner | +1.295 |
ilde | +1.247 |
journalist | +1.204 |
Neg logit contributions | |
preferring | -2.559 |
inability | -2.401 |
wanting | -2.303 |
choosing | -2.206 |
confines | -2.197 |
Token | he |
Token ID | 339 |
Feature activation | +8.17e+00 |
Pos logit contributions | |
preferring | +4.947 |
inability | +4.610 |
wanting | +4.430 |
choosing | +4.215 |
confines | +4.142 |
Neg logit contributions | |
ogether | -3.692 |
adel | -3.490 |
campaigner | -3.443 |
ilde | -3.436 |
ér | -3.216 |
Token | all |
Token ID | 477 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
ogether | +1.996 |
campaigner | +1.922 |
adel | +1.919 |
ilde | +1.869 |
journalist | +1.825 |
Neg logit contributions | |
preferring | -2.494 |
inability | -2.308 |
wanting | -2.190 |
choosing | -2.076 |
confines | -2.067 |
Token | particles |
Token ID | 13166 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
preferring | +0.576 |
inability | +0.531 |
wanting | +0.505 |
choosing | +0.480 |
confines | +0.477 |
Neg logit contributions | |
ogether | -0.530 |
adel | -0.514 |
campaigner | -0.511 |
ilde | -0.498 |
journalist | -0.484 |
Token | .) |
Token ID | 2014 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
preferring | +2.297 |
inability | +2.119 |
wanting | +2.061 |
choosing | +1.972 |
confines | +1.951 |
Neg logit contributions | |
ogether | -1.500 |
campaigner | -1.440 |
adel | -1.427 |
ilde | -1.386 |
journalist | -1.337 |
Token | In |
Token ID | 554 |
Feature activation | +8.54e+00 |
Pos logit contributions | |
preferring | +1.982 |
inability | +1.838 |
wanting | +1.761 |
choosing | +1.674 |
confines | +1.664 |
Neg logit contributions | |
ogether | -1.705 |
campaigner | -1.654 |
adel | -1.644 |
ilde | -1.588 |
journalist | -1.535 |
Token | the |
Token ID | 262 |
Feature activation | +1.47e+01 |
Pos logit contributions | |
preferring | +7.987 |
inability | +7.354 |
wanting | +7.072 |
choosing | +6.954 |
confines | +6.661 |
Neg logit contributions | |
ogether | -6.633 |
adel | -6.523 |
campaigner | -6.407 |
ilde | -6.233 |
isan | -6.042 |
Token | code |
Token ID | 2438 |
Feature activation | +9.77e+00 |
Pos logit contributions | |
preferring | +12.225 |
inability | +11.751 |
wanting | +10.871 |
confines | +10.765 |
choosing | +10.648 |
Neg logit contributions | |
ogether | -11.353 |
adel | -11.178 |
campaigner | -10.659 |
ilde | -10.572 |
alysed | -10.236 |
Token | , |
Token ID | 11 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
preferring | +9.063 |
inability | +8.351 |
wanting | +8.108 |
choosing | +7.790 |
confines | +7.670 |
Neg logit contributions | |
ogether | -7.498 |
campaigner | -7.236 |
ilde | -6.973 |
adel | -6.973 |
ér | -6.694 |
Token | Uniform |
Token ID | 35712 |
Feature activation | +9.35e-01 |
Pos logit contributions | |
ogether | +1.943 |
campaigner | +1.868 |
adel | +1.866 |
ilde | +1.815 |
journalist | +1.768 |
Neg logit contributions | |
preferring | -2.701 |
inability | -2.514 |
wanting | -2.395 |
choosing | -2.270 |
confines | -2.269 |
Token | Grid |
Token ID | 41339 |
Feature activation | +7.49e+00 |
Pos logit contributions | |
preferring | +0.845 |
inability | +0.778 |
wanting | +0.736 |
choosing | +0.696 |
confines | +0.693 |
Neg logit contributions | |
ogether | -0.815 |
campaigner | -0.789 |
adel | -0.788 |
ilde | -0.766 |
journalist | -0.749 |
Token | :: |
Token ID | 3712 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
preferring | +6.979 |
inability | +6.467 |
wanting | +6.200 |
confines | +6.023 |
choosing | +5.913 |
Neg logit contributions | |
ogether | -5.834 |
campaigner | -5.669 |
adel | -5.656 |
ilde | -5.396 |
alysed | -5.255 |
Token | Acc |
Token ID | 17320 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
preferring | +9.554 |
inability | +8.960 |
wanting | +8.453 |
to | +8.387 |
choosing | +8.281 |
Neg logit contributions | |
ogether | -9.832 |
campaigner | -9.803 |
adel | -9.467 |
journalist | -9.346 |
ilde | -9.184 |
Token | br |
Token ID | 865 |
Feature activation | -5.36e+00 |
Pos logit contributions | |
preferring | +1.705 |
inability | +1.585 |
wanting | +1.497 |
choosing | +1.426 |
confines | +1.419 |
Neg logit contributions | |
ogether | -1.447 |
campaigner | -1.384 |
adel | -1.382 |
ilde | -1.364 |
ér | -1.314 |
Token | achy |
Token ID | 35586 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
ogether | +2.102 |
adel | +2.055 |
campaigner | +1.935 |
ilde | +1.888 |
ér | +1.727 |
Neg logit contributions | |
preferring | -7.368 |
inability | -6.986 |
wanting | -6.752 |
choosing | -6.504 |
confines | -6.492 |
Token | ot |
Token ID | 313 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
ogether | +0.739 |
adel | +0.697 |
campaigner | +0.694 |
ilde | +0.661 |
journalist | +0.632 |
Neg logit contributions | |
preferring | -1.925 |
inability | -1.819 |
wanting | -1.752 |
choosing | -1.686 |
confines | -1.679 |
Token | is |
Token ID | 271 |
Feature activation | -6.14e+00 |
Pos logit contributions | |
preferring | +0.392 |
inability | +0.367 |
wanting | +0.350 |
choosing | +0.334 |
confines | +0.332 |
Neg logit contributions | |
ogether | -0.257 |
campaigner | -0.247 |
adel | -0.244 |
ilde | -0.236 |
journalist | -0.232 |
Token | group |
Token ID | 1448 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
ogether | +5.053 |
adel | +4.974 |
campaigner | +4.954 |
ilde | +4.750 |
journalist | +4.698 |
Neg logit contributions | |
preferring | -5.585 |
inability | -5.174 |
wanting | -4.913 |
choosing | -4.639 |
confines | -4.635 |
Token | identifies |
Token ID | 21079 |
Feature activation | -9.75e+00 |
Pos logit contributions | |
preferring | +0.767 |
inability | +0.711 |
wanting | +0.681 |
choosing | +0.651 |
confines | +0.643 |
Neg logit contributions | |
ogether | -0.537 |
campaigner | -0.516 |
adel | -0.510 |
ilde | -0.501 |
journalist | -0.483 |
Token | additional |
Token ID | 3224 |
Feature activation | -8.84e+00 |
Pos logit contributions | |
ogether | +7.533 |
adel | +7.425 |
campaigner | +7.415 |
journalist | +7.055 |
ilde | +6.989 |
Neg logit contributions | |
preferring | -8.797 |
inability | -8.171 |
wanting | -7.725 |
confines | -7.392 |
choosing | -7.300 |
Token | tax |
Token ID | 1687 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
ogether | +7.034 |
campaigner | +6.959 |
adel | +6.910 |
journalist | +6.603 |
ilde | +6.533 |
Neg logit contributions | |
preferring | -7.908 |
inability | -7.312 |
wanting | -6.918 |
confines | -6.539 |
choosing | -6.506 |
Token | a |
Token ID | 64 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
ogether | +6.722 |
adel | +6.627 |
campaigner | +6.359 |
ilde | +6.124 |
journalist | +5.959 |
Neg logit contributions | |
preferring | -10.428 |
inability | -9.769 |
wanting | -9.388 |
confines | -8.858 |
choosing | -8.828 |
Token | . |
Token ID | 13 |
Feature activation | -5.50e+00 |
Pos logit contributions | |
ogether | +1.183 |
campaigner | +1.137 |
adel | +1.136 |
ilde | +1.103 |
journalist | +1.070 |
Neg logit contributions | |
preferring | -1.635 |
inability | -1.521 |
wanting | -1.452 |
choosing | -1.382 |
confines | -1.374 |
Token | Australian |
Token ID | 6638 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
ogether | +4.441 |
adel | +4.372 |
campaigner | +4.327 |
ilde | +4.201 |
journalist | +4.177 |
Neg logit contributions | |
preferring | -5.152 |
inability | -4.779 |
wanting | -4.471 |
choosing | -4.279 |
confines | -4.216 |
Token | He |
Token ID | 679 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
ogether | +4.625 |
adel | +4.495 |
campaigner | +4.486 |
journalist | +4.366 |
ilde | +4.339 |
Neg logit contributions | |
preferring | -5.698 |
inability | -5.296 |
wanting | -4.942 |
choosing | -4.727 |
confines | -4.708 |
Token | said |
Token ID | 531 |
Feature activation | +6.67e+00 |
Pos logit contributions | |
ogether | +0.617 |
campaigner | +0.595 |
adel | +0.594 |
ilde | +0.578 |
journalist | +0.561 |
Neg logit contributions | |
preferring | -0.760 |
inability | -0.704 |
wanting | -0.672 |
choosing | -0.637 |
confines | -0.635 |
Token | that |
Token ID | 326 |
Feature activation | -6.00e+00 |
Pos logit contributions | |
preferring | +6.060 |
inability | +5.659 |
wanting | +5.394 |
choosing | +5.148 |
confines | +4.968 |
Neg logit contributions | |
ogether | -5.524 |
adel | -5.334 |
campaigner | -5.269 |
ilde | -5.221 |
ér | -4.965 |
Token | his |
Token ID | 465 |
Feature activation | +5.15e+00 |
Pos logit contributions | |
ogether | +4.608 |
campaigner | +4.476 |
adel | +4.428 |
journalist | +4.277 |
ilde | +4.268 |
Neg logit contributions | |
preferring | -5.813 |
inability | -5.366 |
wanting | -5.090 |
confines | -4.855 |
choosing | -4.801 |
Token | team |
Token ID | 1074 |
Feature activation | +6.09e+00 |
Pos logit contributions | |
preferring | +5.494 |
inability | +5.271 |
wanting | +4.958 |
choosing | +4.760 |
confines | +4.696 |
Neg logit contributions | |
ogether | -3.559 |
adel | -3.438 |
campaigner | -3.358 |
ilde | -3.356 |
ér | -3.153 |
Token | and |
Token ID | 290 |
Feature activation | -4.93e+00 |
Pos logit contributions | |
preferring | +5.822 |
inability | +5.429 |
wanting | +5.243 |
choosing | +4.926 |
confines | +4.905 |
Neg logit contributions | |
ogether | -4.810 |
adel | -4.631 |
campaigner | -4.595 |
ilde | -4.575 |
ér | -4.328 |
Token | the |
Token ID | 262 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
ogether | +3.727 |
campaigner | +3.618 |
adel | +3.570 |
ilde | +3.466 |
journalist | +3.446 |
Neg logit contributions | |
preferring | -4.946 |
inability | -4.567 |
wanting | -4.345 |
choosing | -4.137 |
confines | -4.134 |
Token | laboratories |
Token ID | 35650 |
Feature activation | +5.23e+00 |
Pos logit contributions | |
ogether | +2.325 |
campaigner | +2.248 |
adel | +2.233 |
ilde | +2.162 |
journalist | +2.139 |
Neg logit contributions | |
preferring | -2.921 |
inability | -2.689 |
wanting | -2.563 |
choosing | -2.438 |
confines | -2.417 |
Token | they |
Token ID | 484 |
Feature activation | -8.36e+00 |
Pos logit contributions | |
preferring | +5.607 |
inability | +5.240 |
wanting | +5.100 |
choosing | +4.832 |
confines | +4.706 |
Neg logit contributions | |
ogether | -3.669 |
adel | -3.508 |
ilde | -3.428 |
campaigner | -3.389 |
isan | -3.182 |
Token | employed |
Token ID | 9322 |
Feature activation | +9.02e+00 |
Pos logit contributions | |
ogether | +5.987 |
campaigner | +5.868 |
adel | +5.866 |
journalist | +5.671 |
ilde | +5.565 |
Neg logit contributions | |
preferring | -8.412 |
inability | -7.813 |
wanting | -7.336 |
forgetting | -7.006 |
choosing | -6.971 |
Token | took |
Token ID | 1718 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
preferring | +8.957 |
inability | +8.326 |
wanting | +8.123 |
choosing | +7.708 |
confines | +7.468 |
Neg logit contributions | |
ogether | -6.618 |
ilde | -6.355 |
adel | -6.326 |
campaigner | -6.179 |
earthqu | -5.933 |
Token | , |
Token ID | 11 |
Feature activation | +8.18e+00 |
Pos logit contributions | |
preferring | +7.303 |
inability | +6.638 |
wanting | +6.605 |
choosing | +6.237 |
confines | +6.003 |
Neg logit contributions | |
ogether | -5.683 |
adel | -5.304 |
campaigner | -5.290 |
ilde | -5.186 |
ér | -5.095 |
Token | saying |
Token ID | 2282 |
Feature activation | +8.27e+00 |
Pos logit contributions | |
preferring | +7.155 |
wanting | +6.317 |
inability | +6.297 |
choosing | +6.012 |
forgetting | +5.696 |
Neg logit contributions | |
ogether | -7.452 |
adel | -6.989 |
campaigner | -6.913 |
ilde | -6.811 |
ér | -6.667 |
Token | he |
Token ID | 339 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
preferring | +7.951 |
inability | +7.557 |
wanting | +7.135 |
choosing | +6.839 |
forgetting | +6.617 |
Neg logit contributions | |
ogether | -6.398 |
adel | -6.087 |
campaigner | -6.053 |
ilde | -5.993 |
ér | -5.774 |
Token | 's |
Token ID | 338 |
Feature activation | +1.23e+01 |
Pos logit contributions | |
preferring | +10.916 |
inability | +10.098 |
wanting | +9.808 |
confines | +9.224 |
choosing | +9.146 |
Neg logit contributions | |
ogether | -11.354 |
earthqu | -11.057 |
campaigner | -10.690 |
adel | -10.651 |
ilde | -10.592 |
Token | now |
Token ID | 783 |
Feature activation | +9.40e+00 |
Pos logit contributions | |
preferring | +10.998 |
inability | +10.056 |
wanting | +9.920 |
choosing | +9.501 |
forgetting | +9.017 |
Neg logit contributions | |
ogether | -10.549 |
adel | -10.021 |
ilde | -9.840 |
ér | -9.552 |
campaigner | -9.533 |
Token | done |
Token ID | 1760 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
preferring | +8.940 |
inability | +8.169 |
wanting | +7.996 |
choosing | +7.656 |
forgetting | +7.258 |
Neg logit contributions | |
ogether | -7.848 |
adel | -7.478 |
ilde | -7.277 |
campaigner | -7.212 |
ér | -7.075 |
Token | everything |
Token ID | 2279 |
Feature activation | +6.56e-01 |
Pos logit contributions | |
ogether | +0.468 |
adel | +0.452 |
campaigner | +0.451 |
ilde | +0.440 |
journalist | +0.427 |
Neg logit contributions | |
preferring | -0.560 |
inability | -0.518 |
wanting | -0.494 |
choosing | -0.470 |
confines | -0.463 |
Token | he |
Token ID | 339 |
Feature activation | +4.99e+00 |
Pos logit contributions | |
preferring | +0.722 |
inability | +0.675 |
wanting | +0.650 |
choosing | +0.620 |
confines | +0.615 |
Neg logit contributions | |
ogether | -0.444 |
adel | -0.431 |
campaigner | -0.425 |
ilde | -0.414 |
ér | -0.395 |
Token | can |
Token ID | 460 |
Feature activation | +2.09e+01 |
Pos logit contributions | |
preferring | +4.510 |
inability | +4.141 |
wanting | +4.076 |
confines | +3.810 |
choosing | +3.789 |
Neg logit contributions | |
ogether | -4.270 |
adel | -4.092 |
campaigner | -4.092 |
ilde | -3.980 |
ér | -3.898 |
Token | do |
Token ID | 466 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
preferring | +15.305 |
wanting | +14.715 |
inability | +14.218 |
to | +13.914 |
to | +13.648 |
Neg logit contributions | |
ogether | -14.662 |
earthqu | -14.572 |
adel | -14.361 |
ilde | -14.284 |
alysed | -14.078 |
Token | to |
Token ID | 284 |
Feature activation | +4.86e+00 |
Pos logit contributions | |
preferring | +15.166 |
wanting | +14.223 |
inability | +13.730 |
choosing | +13.085 |
to | +13.031 |
Neg logit contributions | |
adel | -14.259 |
ilde | -14.230 |
campaigner | -14.121 |
ogether | -14.089 |
earthqu | -13.877 |
Token | a |
Token ID | 257 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
ogether | +3.032 |
campaigner | +2.936 |
adel | +2.921 |
ilde | +2.829 |
journalist | +2.791 |
Neg logit contributions | |
preferring | -4.034 |
inability | -3.740 |
wanting | -3.558 |
choosing | -3.379 |
confines | -3.377 |
Token | humanitarian |
Token ID | 15706 |
Feature activation | -9.65e+00 |
Pos logit contributions | |
campaigner | +8.551 |
ogether | +8.432 |
journalist | +8.353 |
adel | +8.265 |
ilde | +8.051 |
Neg logit contributions | |
preferring | -9.335 |
inability | -8.400 |
wanting | -7.936 |
confines | -7.599 |
choosing | -7.431 |
Token | catastrophe |
Token ID | 27767 |
Feature activation | -5.73e+00 |
Pos logit contributions | |
campaigner | +7.014 |
ogether | +6.760 |
adel | +6.741 |
journalist | +6.703 |
ilde | +6.431 |
Neg logit contributions | |
preferring | -9.314 |
inability | -8.363 |
wanting | -8.146 |
confines | -7.684 |
choosing | -7.662 |
Token | , |
Token ID | 11 |
Feature activation | -7.04e+00 |
Pos logit contributions | |
ogether | +4.470 |
campaigner | +4.416 |
adel | +4.355 |
journalist | +4.194 |
ilde | +4.182 |
Neg logit contributions | |
preferring | -5.427 |
inability | -5.050 |
wanting | -4.724 |
confines | -4.538 |
choosing | -4.483 |
Token | it |
Token ID | 340 |
Feature activation | +4.34e+00 |
Pos logit contributions | |
ogether | +5.593 |
campaigner | +5.491 |
adel | +5.392 |
journalist | +5.345 |
ilde | +5.325 |
Neg logit contributions | |
preferring | -6.447 |
inability | -6.009 |
wanting | -5.653 |
confines | -5.444 |
choosing | -5.323 |
Token | accuses |
Token ID | 35062 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
preferring | +4.244 |
inability | +3.959 |
wanting | +3.796 |
choosing | +3.626 |
confines | +3.615 |
Neg logit contributions | |
ogether | -3.424 |
adel | -3.249 |
campaigner | -3.216 |
ilde | -3.149 |
ér | -3.044 |
Token | Russia |
Token ID | 3284 |
Feature activation | +7.03e+00 |
Pos logit contributions | |
ogether | +7.241 |
campaigner | +7.123 |
journalist | +6.962 |
adel | +6.870 |
ilde | +6.802 |
Neg logit contributions | |
preferring | -9.623 |
inability | -8.893 |
wanting | -8.414 |
confines | -8.152 |
choosing | -8.002 |
Token | without |
Token ID | 1231 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
preferring | +6.376 |
inability | +5.804 |
wanting | +5.655 |
choosing | +5.281 |
confines | +5.142 |
Neg logit contributions | |
ogether | -6.000 |
adel | -5.700 |
ilde | -5.650 |
campaigner | -5.645 |
ér | -5.350 |
Token | proof |
Token ID | 6617 |
Feature activation | +7.07e+00 |
Pos logit contributions | |
ogether | +2.481 |
campaigner | +2.429 |
adel | +2.412 |
ilde | +2.348 |
journalist | +2.330 |
Neg logit contributions | |
preferring | -2.334 |
inability | -2.149 |
wanting | -2.008 |
confines | -1.897 |
choosing | -1.896 |
Token | of |
Token ID | 286 |
Feature activation | +7.99e+00 |
Pos logit contributions | |
preferring | +6.167 |
inability | +5.546 |
wanting | +5.453 |
choosing | +5.065 |
confines | +4.917 |
Neg logit contributions | |
ogether | -6.237 |
adel | -5.926 |
campaigner | -5.906 |
ilde | -5.897 |
ér | -5.591 |
Token | doing |
Token ID | 1804 |
Feature activation | -4.88e+00 |
Pos logit contributions | |
preferring | +7.914 |
inability | +7.362 |
wanting | +7.183 |
choosing | +6.764 |
forgetting | +6.479 |
Neg logit contributions | |
ogether | -6.229 |
ilde | -6.020 |
adel | -6.018 |
campaigner | -5.739 |
ér | -5.613 |
Token | � |
Token ID | 247 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
ogether | +1.213 |
campaigner | +1.157 |
adel | +1.157 |
ilde | +1.115 |
journalist | +1.078 |
Neg logit contributions | |
preferring | -2.190 |
inability | -2.053 |
wanting | -1.968 |
choosing | -1.884 |
confines | -1.876 |
Token | s |
Token ID | 82 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
preferring | +2.471 |
inability | +2.248 |
wanting | +2.119 |
choosing | +1.939 |
confines | +1.929 |
Neg logit contributions | |
ogether | -3.448 |
campaigner | -3.373 |
adel | -3.344 |
ilde | -3.275 |
journalist | -3.221 |
Token | one |
Token ID | 530 |
Feature activation | +4.28e+00 |
Pos logit contributions | |
ogether | +3.330 |
adel | +3.219 |
campaigner | +3.218 |
ilde | +3.126 |
journalist | +3.072 |
Neg logit contributions | |
preferring | -3.643 |
inability | -3.358 |
wanting | -3.166 |
confines | -3.013 |
choosing | -2.987 |
Token | of |
Token ID | 286 |
Feature activation | +6.09e+00 |
Pos logit contributions | |
preferring | +3.873 |
inability | +3.585 |
wanting | +3.426 |
choosing | +3.206 |
confines | +3.148 |
Neg logit contributions | |
ogether | -3.696 |
adel | -3.567 |
campaigner | -3.519 |
ilde | -3.457 |
ér | -3.331 |
Token | the |
Token ID | 262 |
Feature activation | +7.88e+00 |
Pos logit contributions | |
preferring | +5.671 |
inability | +5.250 |
wanting | +5.071 |
choosing | +4.802 |
confines | +4.677 |
Neg logit contributions | |
ogether | -4.966 |
adel | -4.834 |
campaigner | -4.785 |
ilde | -4.666 |
ér | -4.457 |
Token | deleted |
Token ID | 13140 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
preferring | +7.329 |
inability | +6.869 |
wanting | +6.547 |
choosing | +6.275 |
confines | +6.169 |
Neg logit contributions | |
ogether | -6.263 |
adel | -6.182 |
ilde | -5.954 |
campaigner | -5.940 |
ér | -5.670 |
Token | scenes |
Token ID | 8188 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
ogether | +8.358 |
campaigner | +8.102 |
adel | +8.075 |
ilde | +7.816 |
journalist | +7.755 |
Neg logit contributions | |
preferring | -10.347 |
inability | -9.522 |
wanting | -8.939 |
choosing | -8.537 |
confines | -8.454 |
Token | that |
Token ID | 326 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
ogether | +0.351 |
campaigner | +0.337 |
adel | +0.336 |
ilde | +0.327 |
journalist | +0.315 |
Neg logit contributions | |
preferring | -0.491 |
inability | -0.456 |
wanting | -0.437 |
choosing | -0.416 |
confines | -0.413 |
Token | appears |
Token ID | 3568 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
ogether | +9.284 |
campaigner | +9.020 |
adel | +8.984 |
journalist | +8.842 |
ilde | +8.697 |
Neg logit contributions | |
preferring | -10.708 |
inability | -9.809 |
wanting | -9.182 |
choosing | -8.653 |
confines | -8.622 |
Token | on |
Token ID | 319 |
Feature activation | -8.76e-01 |
Pos logit contributions | |
preferring | +2.855 |
inability | +2.663 |
wanting | +2.587 |
choosing | +2.459 |
confines | +2.423 |
Neg logit contributions | |
ogether | -1.692 |
campaigner | -1.622 |
adel | -1.604 |
ilde | -1.551 |
journalist | -1.492 |
Token | the |
Token ID | 262 |
Feature activation | +7.96e+00 |
Pos logit contributions | |
ogether | +0.677 |
adel | +0.653 |
campaigner | +0.652 |
ilde | +0.634 |
journalist | +0.613 |
Neg logit contributions | |
preferring | -0.880 |
inability | -0.818 |
wanting | -0.781 |
choosing | -0.742 |
confines | -0.736 |
Token | cause |
Token ID | 2728 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
preferring | +2.589 |
inability | +2.415 |
wanting | +2.290 |
choosing | +2.185 |
confines | +2.151 |
Neg logit contributions | |
ogether | -2.402 |
adel | -2.318 |
campaigner | -2.305 |
ilde | -2.280 |
ér | -2.181 |
Token | . |
Token ID | 13 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
preferring | +3.463 |
inability | +3.204 |
wanting | +3.118 |
choosing | +2.980 |
confines | +2.916 |
Neg logit contributions | |
ogether | -2.302 |
campaigner | -2.200 |
adel | -2.188 |
ilde | -2.148 |
journalist | -2.061 |
Token |
|
Token ID | 198 |
Feature activation | -5.31e+00 |
Pos logit contributions | |
ogether | +0.859 |
campaigner | +0.827 |
adel | +0.827 |
ilde | +0.802 |
journalist | +0.780 |
Neg logit contributions | |
preferring | -1.151 |
inability | -1.070 |
wanting | -1.019 |
choosing | -0.970 |
confines | -0.965 |
Token |
|
Token ID | 198 |
Feature activation | -5.79e-01 |
Pos logit contributions | |
ogether | +3.520 |
adel | +3.476 |
campaigner | +3.384 |
ilde | +3.342 |
journalist | +3.279 |
Neg logit contributions | |
preferring | -5.762 |
inability | -5.363 |
wanting | -5.050 |
confines | -4.853 |
choosing | -4.848 |
Token | Together |
Token ID | 41631 |
Feature activation | -1.31e+01 |
Pos logit contributions | |
ogether | +0.490 |
campaigner | +0.474 |
adel | +0.472 |
ilde | +0.460 |
journalist | +0.449 |
Neg logit contributions | |
preferring | -0.538 |
inability | -0.497 |
wanting | -0.472 |
choosing | -0.447 |
confines | -0.443 |
Token | , |
Token ID | 11 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
ogether | +9.528 |
campaigner | +9.107 |
adel | +8.976 |
ilde | +8.811 |
ér | +8.662 |
Neg logit contributions | |
preferring | -12.163 |
inability | -11.336 |
wanting | -10.532 |
confines | -10.211 |
forgetting | -9.905 |
Token | as |
Token ID | 355 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
ogether | +14.072 |
campaigner | +13.506 |
journalist | +13.397 |
adel | +13.077 |
ilde | +12.832 |
Neg logit contributions | |
preferring | -12.914 |
inability | -11.912 |
confines | -10.813 |
wanting | -10.785 |
forgetting | -10.061 |
Token | a |
Token ID | 257 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
ogether | +14.243 |
campaigner | +14.121 |
journalist | +13.886 |
adel | +13.447 |
isan | +13.133 |
Neg logit contributions | |
preferring | -12.945 |
inability | -11.839 |
wanting | -10.767 |
confines | -10.618 |
choosing | -10.013 |
Token | di |
Token ID | 2566 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
campaigner | +16.213 |
journalist | +15.954 |
ogether | +15.888 |
adel | +15.606 |
isan | +14.667 |
Neg logit contributions | |
preferring | -15.609 |
inability | -14.086 |
wanting | -12.888 |
confines | -12.571 |
choosing | -11.769 |
Token | as |
Token ID | 292 |
Feature activation | -7.71e+00 |
Pos logit contributions | |
ogether | +6.654 |
adel | +6.603 |
campaigner | +6.249 |
ilde | +6.199 |
journalist | +5.973 |
Neg logit contributions | |
preferring | -12.799 |
inability | -11.880 |
wanting | -11.346 |
confines | -11.010 |
choosing | -10.899 |
Token | pora |
Token ID | 38851 |
Feature activation | -9.77e+00 |
Pos logit contributions | |
ogether | +5.431 |
adel | +5.388 |
campaigner | +5.288 |
ilde | +5.068 |
journalist | +5.049 |
Neg logit contributions | |
preferring | -7.862 |
inability | -7.344 |
wanting | -6.996 |
confines | -6.760 |
choosing | -6.611 |
Token | We |
Token ID | 775 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
ogether | +4.415 |
adel | +4.294 |
campaigner | +4.185 |
ilde | +4.123 |
journalist | +4.110 |
Neg logit contributions | |
preferring | -6.479 |
inability | -6.034 |
wanting | -5.617 |
choosing | -5.422 |
confines | -5.400 |
Token | � |
Token ID | 447 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
ogether | +1.982 |
adel | +1.913 |
campaigner | +1.912 |
ilde | +1.858 |
journalist | +1.813 |
Neg logit contributions | |
preferring | -2.362 |
inability | -2.187 |
wanting | -2.075 |
choosing | -1.969 |
confines | -1.961 |
Token | � |
Token ID | 247 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
ogether | +1.321 |
campaigner | +1.267 |
adel | +1.266 |
ilde | +1.222 |
journalist | +1.189 |
Neg logit contributions | |
preferring | -2.025 |
inability | -1.891 |
wanting | -1.807 |
choosing | -1.725 |
confines | -1.715 |
Token | d |
Token ID | 67 |
Feature activation | -9.13e+00 |
Pos logit contributions | |
preferring | +3.479 |
inability | +3.213 |
wanting | +3.096 |
choosing | +2.936 |
confines | +2.856 |
Neg logit contributions | |
ogether | -2.877 |
campaigner | -2.807 |
adel | -2.746 |
ilde | -2.688 |
journalist | -2.646 |
Token | do |
Token ID | 466 |
Feature activation | -1.54e+01 |
Pos logit contributions | |
ogether | +6.264 |
adel | +6.133 |
campaigner | +6.088 |
journalist | +5.888 |
ilde | +5.738 |
Neg logit contributions | |
preferring | -9.361 |
inability | -8.748 |
wanting | -8.093 |
confines | -7.957 |
choosing | -7.782 |
Token | it |
Token ID | 340 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
ogether | +12.335 |
adel | +11.894 |
campaigner | +11.555 |
journalist | +11.503 |
ér | +11.146 |
Neg logit contributions | |
preferring | -12.672 |
inability | -11.580 |
wanting | -10.522 |
confines | -10.447 |
choosing | -9.933 |
Token | phon |
Token ID | 32896 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
ogether | +17.306 |
adel | +16.739 |
journalist | +16.506 |
campaigner | +16.363 |
inform | +16.029 |
Neg logit contributions | |
preferring | -13.565 |
inability | -12.727 |
confines | -11.264 |
wanting | -10.572 |
choosing | -10.292 |
Token | etically |
Token ID | 16877 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
ogether | +4.642 |
adel | +4.483 |
ilde | +4.012 |
campaigner | +3.917 |
ér | +3.763 |
Neg logit contributions | |
preferring | -14.268 |
inability | -13.531 |
wanting | -13.049 |
confines | -12.509 |
choosing | -12.432 |
Token | and |
Token ID | 290 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
ogether | +11.732 |
adel | +11.445 |
campaigner | +11.091 |
ilde | +11.008 |
journalist | +10.907 |
Neg logit contributions | |
preferring | -10.294 |
inability | -9.725 |
wanting | -8.606 |
confines | -8.526 |
choosing | -8.087 |
Token | I |
Token ID | 314 |
Feature activation | -8.25e+00 |
Pos logit contributions | |
adel | +12.669 |
campaigner | +12.600 |
ogether | +12.531 |
journalist | +12.496 |
ilde | +11.976 |
Neg logit contributions | |
preferring | -11.339 |
inability | -10.432 |
wanting | -9.462 |
confines | -9.373 |
choosing | -8.896 |
Token | � |
Token ID | 447 |
Feature activation | -5.23e+00 |
Pos logit contributions | |
ogether | +6.254 |
adel | +6.089 |
campaigner | +5.982 |
ilde | +5.847 |
journalist | +5.739 |
Neg logit contributions | |
preferring | -7.956 |
inability | -7.428 |
wanting | -6.911 |
confines | -6.708 |
choosing | -6.618 |
Token | such |
Token ID | 884 |
Feature activation | -3.76e+00 |
Pos logit contributions | |
preferring | +2.682 |
inability | +2.458 |
wanting | +2.357 |
choosing | +2.245 |
confines | +2.189 |
Neg logit contributions | |
ogether | -2.536 |
adel | -2.440 |
campaigner | -2.424 |
ilde | -2.398 |
ér | -2.311 |
Token | players |
Token ID | 1938 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
ogether | +3.037 |
campaigner | +2.946 |
adel | +2.936 |
ilde | +2.838 |
journalist | +2.796 |
Neg logit contributions | |
preferring | -3.587 |
inability | -3.320 |
wanting | -3.144 |
confines | -2.975 |
choosing | -2.964 |
Token | that |
Token ID | 326 |
Feature activation | -9.44e+00 |
Pos logit contributions | |
preferring | +5.248 |
inability | +4.772 |
wanting | +4.720 |
choosing | +4.502 |
confines | +4.336 |
Neg logit contributions | |
ogether | -3.877 |
campaigner | -3.663 |
adel | -3.641 |
ilde | -3.635 |
ér | -3.462 |
Token | turned |
Token ID | 2900 |
Feature activation | -5.70e+00 |
Pos logit contributions | |
ogether | +6.759 |
adel | +6.714 |
campaigner | +6.672 |
journalist | +6.470 |
ilde | +6.321 |
Neg logit contributions | |
preferring | -9.091 |
inability | -8.438 |
wanting | -7.885 |
confines | -7.573 |
choosing | -7.505 |
Token | out |
Token ID | 503 |
Feature activation | +3.92e+00 |
Pos logit contributions | |
ogether | +4.250 |
campaigner | +4.113 |
adel | +4.107 |
ilde | +3.983 |
journalist | +3.930 |
Neg logit contributions | |
preferring | -5.715 |
inability | -5.303 |
wanting | -5.029 |
confines | -4.805 |
choosing | -4.782 |
Token | pretty |
Token ID | 2495 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
preferring | +3.815 |
inability | +3.517 |
wanting | +3.402 |
choosing | +3.223 |
confines | +3.136 |
Neg logit contributions | |
ogether | -3.140 |
campaigner | -2.975 |
adel | -2.957 |
ilde | -2.916 |
ér | -2.810 |
Token | okay |
Token ID | 8788 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
campaigner | +10.929 |
adel | +10.698 |
ogether | +10.682 |
journalist | +10.667 |
ilde | +10.158 |
Neg logit contributions | |
preferring | -15.474 |
inability | -14.683 |
confines | -13.714 |
wanting | -13.336 |
choosing | -12.888 |
Token | . |
Token ID | 13 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
ogether | +10.309 |
campaigner | +10.065 |
adel | +10.049 |
journalist | +9.634 |
ilde | +9.535 |
Neg logit contributions | |
preferring | -9.469 |
inability | -8.863 |
wanting | -8.032 |
confines | -7.736 |
forgetting | -7.469 |
Token | Most |
Token ID | 4042 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
ogether | +2.510 |
adel | +2.426 |
campaigner | +2.404 |
ilde | +2.339 |
journalist | +2.303 |
Neg logit contributions | |
preferring | -3.340 |
inability | -3.108 |
wanting | -2.935 |
choosing | -2.801 |
confines | -2.789 |
Token | recently |
Token ID | 2904 |
Feature activation | -2.72e+00 |
Pos logit contributions | |
ogether | +2.200 |
campaigner | +2.120 |
adel | +2.118 |
ilde | +2.048 |
journalist | +2.010 |
Neg logit contributions | |
preferring | -2.914 |
inability | -2.710 |
wanting | -2.576 |
choosing | -2.450 |
confines | -2.449 |
Token | , |
Token ID | 11 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
ogether | +2.023 |
adel | +1.952 |
campaigner | +1.950 |
ilde | +1.888 |
journalist | +1.840 |
Neg logit contributions | |
preferring | -2.797 |
inability | -2.603 |
wanting | -2.479 |
choosing | -2.358 |
confines | -2.353 |
Token | happens |
Token ID | 4325 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
preferring | +2.986 |
inability | +2.789 |
wanting | +2.686 |
confines | +2.563 |
choosing | +2.554 |
Neg logit contributions | |
ogether | -2.321 |
campaigner | -2.215 |
adel | -2.193 |
ilde | -2.146 |
ér | -2.079 |
Token | to |
Token ID | 284 |
Feature activation | -7.61e-01 |
Pos logit contributions | |
preferring | +10.851 |
inability | +10.050 |
wanting | +9.800 |
confines | +9.121 |
choosing | +9.093 |
Neg logit contributions | |
ogether | -12.213 |
adel | -11.685 |
campaigner | -11.630 |
ilde | -11.267 |
isan | -10.969 |
Token | be |
Token ID | 307 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
ogether | +0.423 |
campaigner | +0.402 |
adel | +0.401 |
ilde | +0.384 |
journalist | +0.370 |
Neg logit contributions | |
preferring | -0.928 |
inability | -0.871 |
wanting | -0.838 |
choosing | -0.805 |
confines | -0.801 |
Token | , |
Token ID | 11 |
Feature activation | -4.83e+00 |
Pos logit contributions | |
preferring | +0.220 |
inability | +0.204 |
wanting | +0.196 |
choosing | +0.187 |
confines | +0.185 |
Neg logit contributions | |
ogether | -0.165 |
campaigner | -0.159 |
adel | -0.158 |
ilde | -0.153 |
journalist | -0.149 |
Token | will |
Token ID | 481 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
ogether | +3.435 |
campaigner | +3.318 |
adel | +3.299 |
ilde | +3.194 |
journalist | +3.143 |
Neg logit contributions | |
preferring | -5.032 |
inability | -4.688 |
wanting | -4.457 |
choosing | -4.234 |
confines | -4.201 |
Token | likely |
Token ID | 1884 |
Feature activation | -1.47e+01 |
Pos logit contributions | |
ogether | +10.889 |
campaigner | +10.765 |
occur | +10.571 |
adel | +10.505 |
correspond | +10.374 |
Neg logit contributions | |
preferring | -14.913 |
inability | -13.589 |
wanting | -12.821 |
choosing | -12.129 |
confines | -12.045 |
Token | be |
Token ID | 307 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
ogether | +9.597 |
campaigner | +9.562 |
occur | +9.320 |
adel | +9.295 |
journalist | +9.112 |
Neg logit contributions | |
preferring | -13.822 |
inability | -12.755 |
wanting | -12.018 |
choosing | -11.458 |
confines | -11.333 |
Token | suspended |
Token ID | 9951 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
ogether | +8.158 |
campaigner | +8.066 |
adel | +7.993 |
journalist | +7.972 |
ilde | +7.754 |
Neg logit contributions | |
preferring | -8.998 |
inability | -8.247 |
wanting | -7.607 |
confines | -7.353 |
choosing | -7.239 |
Token | . |
Token ID | 13 |
Feature activation | -2.92e+00 |
Pos logit contributions | |
ogether | +12.260 |
adel | +11.788 |
campaigner | +11.628 |
journalist | +11.415 |
ilde | +11.254 |
Neg logit contributions | |
preferring | -11.153 |
inability | -10.265 |
wanting | -9.370 |
confines | -9.040 |
choosing | -8.831 |
Token | You |
Token ID | 921 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
ogether | +2.266 |
adel | +2.197 |
campaigner | +2.179 |
ilde | +2.127 |
journalist | +2.090 |
Neg logit contributions | |
preferring | -2.903 |
inability | -2.687 |
wanting | -2.541 |
choosing | -2.421 |
confines | -2.406 |
Token | agree |
Token ID | 4236 |
Feature activation | +2.11e+01 |
Pos logit contributions | |
preferring | +2.740 |
inability | +2.559 |
wanting | +2.449 |
choosing | +2.330 |
confines | +2.282 |
Neg logit contributions | |
ogether | -2.361 |
adel | -2.241 |
campaigner | -2.228 |
ilde | -2.214 |
ér | -2.126 |
Token | . |
Token ID | 13 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
preferring | +8.180 |
inability | +7.609 |
wanting | +7.603 |
choosing | +7.178 |
confines | +6.939 |
Neg logit contributions | |
ogether | -5.423 |
campaigner | -5.398 |
adel | -5.196 |
ilde | -5.190 |
ér | -4.930 |
Token | I |
Token ID | 314 |
Feature activation | -4.54e+00 |
Pos logit contributions | |
ogether | +7.937 |
adel | +7.828 |
ilde | +7.709 |
journalist | +7.531 |
campaigner | +7.494 |
Neg logit contributions | |
preferring | -9.698 |
inability | -8.952 |
wanting | -8.129 |
choosing | -7.898 |
confines | -7.772 |
Token | believe |
Token ID | 1975 |
Feature activation | -6.50e+00 |
Pos logit contributions | |
ogether | +3.526 |
adel | +3.424 |
campaigner | +3.391 |
ilde | +3.296 |
journalist | +3.233 |
Neg logit contributions | |
preferring | -4.468 |
inability | -4.148 |
wanting | -3.912 |
choosing | -3.744 |
confines | -3.723 |
Token | they |
Token ID | 484 |
Feature activation | +4.34e+00 |
Pos logit contributions | |
ogether | +5.909 |
adel | +5.754 |
campaigner | +5.713 |
ilde | +5.605 |
journalist | +5.545 |
Neg logit contributions | |
preferring | -5.429 |
inability | -4.943 |
wanting | -4.585 |
confines | -4.361 |
choosing | -4.317 |
Token | will |
Token ID | 481 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
preferring | +3.958 |
inability | +3.660 |
wanting | +3.552 |
choosing | +3.308 |
confines | +3.259 |
Neg logit contributions | |
ogether | -3.668 |
campaigner | -3.538 |
adel | -3.485 |
ilde | -3.475 |
ér | -3.365 |
Token | arrive |
Token ID | 9240 |
Feature activation | -2.86e+01 |
Pos logit contributions | |
ogether | +8.470 |
adel | +8.297 |
campaigner | +8.149 |
journalist | +8.043 |
inform | +7.804 |
Neg logit contributions | |
preferring | -12.206 |
inability | -11.302 |
wanting | -10.400 |
confines | -10.192 |
choosing | -10.081 |
Token | in |
Token ID | 287 |
Feature activation | -8.51e+00 |
Pos logit contributions | |
ogether | +20.791 |
inform | +20.648 |
adel | +20.406 |
journalist | +20.133 |
campaigner | +19.940 |
Neg logit contributions | |
preferring | -16.360 |
inability | -14.898 |
confines | -12.788 |
wanting | -11.870 |
choosing | -11.544 |
Token | an |
Token ID | 281 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
ogether | +6.028 |
adel | +5.922 |
campaigner | +5.797 |
journalist | +5.617 |
ilde | +5.603 |
Neg logit contributions | |
preferring | -8.631 |
inability | -7.845 |
wanting | -7.474 |
confines | -7.074 |
choosing | -7.072 |
Token | hour |
Token ID | 1711 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
ogether | +7.736 |
adel | +7.469 |
campaigner | +7.261 |
journalist | +7.108 |
ilde | +7.085 |
Neg logit contributions | |
preferring | -12.351 |
inability | -10.938 |
wanting | -10.617 |
choosing | -10.199 |
confines | -10.161 |
Token | or |
Token ID | 393 |
Feature activation | -8.72e+00 |
Pos logit contributions | |
ogether | +7.659 |
adel | +7.311 |
campaigner | +7.049 |
journalist | +6.900 |
ilde | +6.881 |
Neg logit contributions | |
preferring | -9.976 |
inability | -9.370 |
wanting | -8.644 |
confines | -8.314 |
choosing | -8.204 |
Token | two |
Token ID | 734 |
Feature activation | -7.20e+00 |
Pos logit contributions | |
ogether | +5.893 |
adel | +5.869 |
campaigner | +5.658 |
journalist | +5.476 |
ilde | +5.383 |
Neg logit contributions | |
preferring | -8.991 |
inability | -8.370 |
wanting | -7.899 |
confines | -7.655 |
choosing | -7.550 |