Token | ang |
Token ID | 3550 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
Filipino | +17.390 |
Manila | +16.965 |
Anaheim | +16.327 |
Huntington | +15.939 |
Hiroshima | +15.809 |
Neg logit contributions | |
Rhod | -13.814 |
crop | -13.195 |
� | -13.149 |
)", | -12.329 |
faces | -11.580 |
Token | kan |
Token ID | 43998 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Filipino | +18.932 |
Manila | +18.265 |
Anaheim | +17.750 |
ILCS | +17.365 |
Huntington | +17.032 |
Neg logit contributions | |
Rhod | -13.942 |
� | -13.454 |
crop | -13.158 |
)", | -12.575 |
faces | -11.387 |
Token | il |
Token ID | 346 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Filipino | +14.120 |
Anaheim | +13.933 |
ILCS | +13.780 |
Manila | +13.740 |
wang | +13.696 |
Neg logit contributions | |
Rhod | -14.887 |
� | -13.356 |
)", | -13.115 |
crop | -13.031 |
scenery | -11.899 |
Token | ang |
Token ID | 648 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Filipino | +13.043 |
wang | +12.629 |
Manila | +12.512 |
Anaheim | +12.503 |
ushi | +12.365 |
Neg logit contributions | |
Rhod | -14.846 |
� | -13.469 |
crop | -13.203 |
)", | -12.993 |
YD | -11.818 |
Token | an |
Token ID | 281 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Filipino | +18.690 |
Manila | +17.869 |
Anaheim | +17.566 |
Huntington | +17.101 |
wang | +17.057 |
Neg logit contributions | |
Rhod | -14.851 |
� | -13.861 |
crop | -13.645 |
)", | -12.306 |
faces | -11.871 |
Token | ak |
Token ID | 461 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
Filipino | +11.277 |
ILCS | +11.116 |
Anaheim | +11.071 |
wang | +10.822 |
Manila | +10.780 |
Neg logit contributions | |
Rhod | -13.101 |
� | -11.911 |
)", | -11.640 |
crop | -11.489 |
scenery | -10.222 |
Token | ay |
Token ID | 38762 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
Filipino | +18.218 |
wang | +18.125 |
Anaheim | +17.816 |
kit | +17.726 |
chant | +17.706 |
Neg logit contributions | |
Rhod | -17.677 |
� | -14.981 |
crop | -14.892 |
)", | -14.760 |
scenery | -13.605 |
Token | n |
Token ID | 299 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Filipino | +18.895 |
Manila | +18.214 |
Anaheim | +17.901 |
ILCS | +17.142 |
Huntington | +17.035 |
Neg logit contributions | |
Rhod | -14.760 |
� | -13.924 |
crop | -13.478 |
)", | -13.052 |
faces | -12.039 |
Token | al |
Token ID | 282 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Filipino | +11.067 |
wang | +10.849 |
endo | +10.843 |
ushi | +10.669 |
eno | +10.634 |
Neg logit contributions | |
Rhod | -14.583 |
)", | -12.930 |
� | -12.849 |
crop | -12.529 |
mileage | -12.067 |
Token | al |
Token ID | 282 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Filipino | +13.138 |
wang | +13.070 |
ushi | +13.008 |
Anaheim | +12.810 |
eno | +12.687 |
Neg logit contributions | |
Rhod | -15.434 |
� | -13.706 |
)", | -13.599 |
crop | -13.306 |
FSA | -12.294 |
Token | ay |
Token ID | 323 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Filipino | +14.396 |
wang | +13.914 |
Anaheim | +13.865 |
ushi | +13.777 |
eno | +13.673 |
Neg logit contributions | |
Rhod | -15.857 |
� | -14.184 |
crop | -13.981 |
)", | -13.846 |
YD | -12.606 |
Token | At |
Token ID | 1629 |
Feature activation | +7.34e-01 |
Pos logit contributions | |
ILCS | +12.580 |
Hiroshima | +12.569 |
Anaheim | +12.251 |
Filipino | +12.235 |
Karachi | +12.073 |
Neg logit contributions | |
Rhod | -13.642 |
)", | -13.102 |
crop | -13.012 |
� | -13.007 |
graded | -12.323 |
Token | the |
Token ID | 262 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Hiroshima | +7.854 |
ILCS | +7.758 |
Anaheim | +7.624 |
Filipino | +7.526 |
endo | +7.437 |
Neg logit contributions | |
Rhod | -7.328 |
� | -6.909 |
)", | -6.673 |
crop | -6.596 |
faces | -5.686 |
Token | end |
Token ID | 886 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Hiroshima | +12.708 |
Filipino | +12.336 |
Anaheim | +12.269 |
Manila | +12.126 |
Saras | +12.078 |
Neg logit contributions | |
Rhod | -9.834 |
� | -9.605 |
)", | -9.310 |
crop | -9.262 |
YD | -7.834 |
Token | of |
Token ID | 286 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
ILCS | +9.900 |
Hiroshima | +9.893 |
Filipino | +9.690 |
chant | +9.647 |
Anaheim | +9.593 |
Neg logit contributions | |
Rhod | -12.212 |
� | -11.753 |
)", | -11.669 |
crop | -11.256 |
YD | -10.298 |
Token | the |
Token ID | 262 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
Hiroshima | +15.310 |
Saras | +14.950 |
Karachi | +14.923 |
Mumbai | +14.696 |
Anaheim | +14.570 |
Neg logit contributions | |
Rhod | -15.248 |
� | -14.709 |
crop | -14.441 |
)", | -14.303 |
YD | -13.162 |
Token | eighth |
Token ID | 16974 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
Hiroshima | +16.125 |
boiler | +15.505 |
Karachi | +15.414 |
Mumbai | +15.394 |
Filipino | +15.383 |
Neg logit contributions | |
� | -15.145 |
crop | -14.927 |
Rhod | -14.886 |
)", | -14.209 |
YD | -13.460 |
Token | over |
Token ID | 625 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
Karachi | +17.398 |
ILCS | +17.162 |
Mumbai | +17.068 |
boiler | +16.893 |
Saras | +16.875 |
Neg logit contributions | |
� | -15.608 |
Rhod | -15.232 |
)", | -14.929 |
crop | -14.460 |
faces | -14.174 |
Token | they |
Token ID | 484 |
Feature activation | +7.90e-01 |
Pos logit contributions | |
Hiroshima | +14.799 |
Filipino | +14.569 |
Karachi | +14.316 |
ILCS | +14.266 |
chant | +14.164 |
Neg logit contributions | |
Rhod | -13.617 |
� | -13.446 |
)", | -13.113 |
crop | -12.384 |
YD | -11.688 |
Token | are |
Token ID | 389 |
Feature activation | +8.17e-01 |
Pos logit contributions | |
Hiroshima | +8.556 |
ILCS | +8.398 |
Filipino | +8.303 |
Anaheim | +8.269 |
Huntington | +8.070 |
Neg logit contributions | |
Rhod | -7.746 |
� | -7.060 |
crop | -6.875 |
)", | -6.823 |
faces | -5.971 |
Token | 43 |
Token ID | 5946 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
Hiroshima | +8.594 |
Filipino | +8.390 |
Anaheim | +8.298 |
ILCS | +8.208 |
Huntington | +8.127 |
Neg logit contributions | |
Rhod | -8.090 |
� | -7.711 |
crop | -7.497 |
)", | -7.398 |
YD | -6.416 |
Token | for |
Token ID | 329 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
ickets | +13.950 |
ILCS | +13.717 |
Hiroshima | +13.682 |
Filipino | +13.392 |
wang | +13.203 |
Neg logit contributions | |
Rhod | -14.594 |
� | -13.502 |
crop | -13.033 |
)", | -12.976 |
YD | -11.211 |
Token | itt |
Token ID | 715 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
ILCS | +1.770 |
Hiroshima | +1.573 |
Anaheim | +1.540 |
Filipino | +1.535 |
chant | +1.497 |
Neg logit contributions | |
Rhod | -5.427 |
� | -5.159 |
)", | -5.081 |
crop | -5.050 |
recapt | -4.645 |
Token | les |
Token ID | 829 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
ILCS | +2.500 |
Hiroshima | +2.352 |
Anaheim | +2.338 |
Filipino | +2.310 |
chant | +2.248 |
Neg logit contributions | |
Rhod | -3.942 |
� | -3.717 |
)", | -3.641 |
crop | -3.579 |
recapt | -3.265 |
Token | ea |
Token ID | 18213 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
Rhod | +1.881 |
� | +1.788 |
crop | +1.655 |
)", | +1.650 |
faces | +1.264 |
Neg logit contributions | |
ILCS | -4.336 |
Hiroshima | -4.207 |
Anaheim | -4.137 |
Filipino | -4.131 |
Huntington | -4.105 |
Token | Community |
Token ID | 8108 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Filipino | +14.557 |
Anaheim | +14.472 |
ILCS | +14.395 |
Hiroshima | +14.322 |
Manila | +14.262 |
Neg logit contributions | |
Rhod | -15.382 |
crop | -14.271 |
)", | -14.125 |
� | -14.125 |
faces | -12.684 |
Token | Connect |
Token ID | 8113 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
ILCS | +10.954 |
Filipino | +10.605 |
Hiroshima | +10.592 |
Manila | +10.494 |
Anaheim | +10.346 |
Neg logit contributions | |
Rhod | -9.525 |
crop | -9.095 |
� | -9.052 |
)", | -8.871 |
faces | -7.564 |
Token | ions |
Token ID | 507 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
ILCS | +3.668 |
Hiroshima | +3.554 |
Anaheim | +3.533 |
Filipino | +3.518 |
Manila | +3.436 |
Neg logit contributions | |
Rhod | -2.744 |
� | -2.544 |
)", | -2.444 |
crop | -2.403 |
recapt | -2.057 |
Token | ' |
Token ID | 6 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
Manila | +15.751 |
Hiroshima | +15.747 |
Filipino | +15.729 |
Anaheim | +15.093 |
Ballard | +14.749 |
Neg logit contributions | |
� | -17.730 |
Rhod | -17.437 |
crop | -17.344 |
)", | -16.790 |
faces | -15.086 |
Token | Emergency |
Token ID | 18154 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Filipino | +14.024 |
Manila | +13.710 |
Hiroshima | +13.481 |
Anaheim | +13.454 |
ILCS | +13.396 |
Neg logit contributions | |
� | -12.761 |
Rhod | -12.686 |
)", | -12.449 |
crop | -12.417 |
YD | -11.060 |
Token | Relief |
Token ID | 30323 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
ILCS | +10.086 |
Filipino | +9.820 |
Hiroshima | +9.817 |
Anaheim | +9.770 |
Manila | +9.559 |
Neg logit contributions | |
Rhod | -10.777 |
� | -10.325 |
crop | -10.159 |
)", | -9.857 |
faces | -8.946 |
Token | , |
Token ID | 11 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
ILCS | +13.467 |
Anaheim | +13.266 |
Hiroshima | +13.265 |
Filipino | +13.252 |
Manila | +13.154 |
Neg logit contributions | |
Rhod | -14.306 |
� | -13.931 |
crop | -13.588 |
)", | -13.318 |
faces | -11.741 |
Token | K |
Token ID | 509 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
Filipino | +13.337 |
Manila | +13.116 |
Hiroshima | +13.109 |
ILCS | +13.068 |
Anaheim | +13.027 |
Neg logit contributions | |
Rhod | -12.613 |
� | -12.539 |
crop | -12.469 |
)", | -12.201 |
faces | -10.966 |
Token | � |
Token ID | 447 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
� | +5.517 |
Rhod | +5.270 |
crop | +4.743 |
)", | +4.716 |
\/ | +3.626 |
Neg logit contributions | |
Hiroshima | -11.625 |
ILCS | -11.556 |
Filipino | -11.249 |
Huntington | -11.123 |
boiler | -11.062 |
Token | � |
Token ID | 247 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
ILCS | +2.706 |
Hiroshima | +2.595 |
Anaheim | +2.582 |
Filipino | +2.571 |
Huntington | +2.506 |
Neg logit contributions | |
Rhod | -2.321 |
� | -2.153 |
)", | -2.097 |
crop | -2.059 |
recapt | -1.780 |
Token | t |
Token ID | 83 |
Feature activation | +8.72e-01 |
Pos logit contributions | |
Rhod | +1.068 |
� | +1.018 |
)", | +0.981 |
crop | +0.969 |
faces | +0.829 |
Neg logit contributions | |
ILCS | -1.222 |
Hiroshima | -1.167 |
Anaheim | -1.162 |
Filipino | -1.158 |
Huntington | -1.120 |
Token | own |
Token ID | 898 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
ILCS | +9.043 |
Anaheim | +8.794 |
Hiroshima | +8.487 |
Filipino | +8.404 |
Huntington | +8.329 |
Neg logit contributions | |
Rhod | -8.899 |
� | -8.037 |
)", | -8.036 |
crop | -7.959 |
YD | -7.072 |
Token | some |
Token ID | 617 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
Anaheim | +12.267 |
Filipino | +12.091 |
Huntington | +11.768 |
ILCS | +11.620 |
Hiroshima | +11.611 |
Neg logit contributions | |
Rhod | -10.663 |
)", | -10.105 |
� | -10.080 |
crop | -10.028 |
faces | -8.366 |
Token | of |
Token ID | 286 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
Anaheim | +13.987 |
ILCS | +13.900 |
Filipino | +13.731 |
Huntington | +13.484 |
Hiroshima | +13.308 |
Neg logit contributions | |
Rhod | -12.155 |
)", | -11.723 |
crop | -11.654 |
� | -11.648 |
YD | -9.466 |
Token | the |
Token ID | 262 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Anaheim | +18.759 |
Huntington | +17.631 |
ILCS | +17.629 |
Filipino | +17.483 |
Manila | +17.421 |
Neg logit contributions | |
)", | -15.179 |
Rhod | -14.826 |
crop | -14.763 |
� | -13.736 |
faces | -12.269 |
Token | necessary |
Token ID | 3306 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Anaheim | +14.823 |
Filipino | +14.470 |
ILCS | +14.274 |
Huntington | +14.228 |
Manila | +14.167 |
Neg logit contributions | |
Rhod | -12.577 |
crop | -12.230 |
)", | -12.229 |
� | -11.922 |
YD | -9.944 |
Token | ID |
Token ID | 4522 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
Anaheim | +14.317 |
ILCS | +13.996 |
Huntington | +13.924 |
Filipino | +13.848 |
boiler | +13.754 |
Neg logit contributions | |
Rhod | -13.195 |
crop | -12.766 |
)", | -12.469 |
� | -12.242 |
�醒 | -10.271 |
Token | cards |
Token ID | 4116 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
ILCS | +7.268 |
Anaheim | +7.216 |
Filipino | +6.865 |
Huntington | +6.806 |
endo | +6.772 |
Neg logit contributions | |
Rhod | -9.426 |
)", | -8.892 |
� | -8.789 |
crop | -8.747 |
recapt | -7.501 |
Token | like |
Token ID | 588 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
Anaheim | +10.197 |
ILCS | +10.157 |
Filipino | +9.679 |
Hiroshima | +9.604 |
Huntington | +9.502 |
Neg logit contributions | |
Rhod | -13.434 |
)", | -12.736 |
crop | -12.415 |
� | -12.314 |
faces | -10.649 |
Token | which |
Token ID | 543 |
Feature activation | +8.82e-01 |
Pos logit contributions | |
ILCS | +7.011 |
Hiroshima | +6.850 |
Anaheim | +6.824 |
Filipino | +6.782 |
Huntington | +6.569 |
Neg logit contributions | |
Rhod | -8.058 |
� | -7.659 |
)", | -7.490 |
crop | -7.353 |
faces | -6.466 |
Token | is |
Token ID | 318 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
Anaheim | +7.998 |
Hiroshima | +7.900 |
Filipino | +7.838 |
ILCS | +7.767 |
Huntington | +7.665 |
Neg logit contributions | |
Rhod | -9.603 |
)", | -9.318 |
� | -9.241 |
crop | -9.148 |
faces | -7.739 |
Token | $ |
Token ID | 720 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
Anaheim | +10.715 |
Hiroshima | +10.608 |
Filipino | +10.528 |
Huntington | +10.313 |
ILCS | +10.139 |
Neg logit contributions | |
Rhod | -11.852 |
� | -11.501 |
)", | -11.268 |
crop | -11.077 |
faces | -9.955 |
Token | 40 |
Token ID | 1821 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
ILCS | +1.442 |
Hiroshima | +1.378 |
Anaheim | +1.366 |
Filipino | +1.360 |
Huntington | +1.322 |
Neg logit contributions | |
Rhod | -1.630 |
� | -1.534 |
)", | -1.489 |
crop | -1.463 |
recapt | -1.299 |
Token | more |
Token ID | 517 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
ILCS | +9.518 |
Hiroshima | +9.085 |
Filipino | +9.019 |
Anaheim | +8.800 |
Huntington | +8.638 |
Neg logit contributions | |
Rhod | -12.097 |
� | -11.414 |
)", | -11.277 |
crop | -10.996 |
faces | -9.912 |
Token | than |
Token ID | 621 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
ILCS | +5.489 |
Hiroshima | +5.394 |
Anaheim | +5.337 |
Filipino | +5.317 |
Huntington | +5.199 |
Neg logit contributions | |
Rhod | -5.787 |
� | -5.497 |
)", | -5.379 |
crop | -5.306 |
faces | -4.676 |
Token | the |
Token ID | 262 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
Anaheim | +16.817 |
Hiroshima | +16.583 |
Huntington | +16.400 |
ILCS | +16.209 |
Filipino | +16.179 |
Neg logit contributions | |
� | -16.691 |
)", | -16.016 |
Rhod | -16.001 |
crop | -15.888 |
faces | -14.100 |
Token | standard |
Token ID | 3210 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
Hiroshima | +12.754 |
Anaheim | +12.684 |
Filipino | +12.662 |
ILCS | +12.512 |
Huntington | +12.473 |
Neg logit contributions | |
Rhod | -12.208 |
� | -12.168 |
crop | -11.789 |
)", | -11.678 |
faces | -10.387 |
Token | game |
Token ID | 983 |
Feature activation | +6.27e-01 |
Pos logit contributions | |
Filipino | +12.079 |
Anaheim | +11.975 |
Hiroshima | +11.844 |
Huntington | +11.708 |
ILCS | +11.565 |
Neg logit contributions | |
� | -12.349 |
Rhod | -12.254 |
crop | -11.630 |
)", | -11.526 |
faces | -10.455 |
Token | . |
Token ID | 13 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
ILCS | +6.131 |
Hiroshima | +5.986 |
Anaheim | +5.978 |
Filipino | +5.884 |
Huntington | +5.713 |
Neg logit contributions | |
Rhod | -6.986 |
� | -6.706 |
)", | -6.517 |
crop | -6.345 |
faces | -5.614 |
Token | It |
Token ID | 632 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
Anaheim | +9.217 |
Filipino | +9.029 |
Hiroshima | +9.001 |
ILCS | +8.992 |
Huntington | +8.883 |
Neg logit contributions | |
Rhod | -10.993 |
� | -10.980 |
)", | -10.695 |
crop | -10.522 |
reconc | -9.744 |
Token | 2 |
Token ID | 362 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
ILCS | +7.543 |
Anaheim | +7.115 |
Filipino | +7.035 |
boiler | +6.903 |
Hiroshima | +6.891 |
Neg logit contributions | |
Rhod | -11.332 |
� | -10.755 |
)", | -10.582 |
crop | -10.330 |
faces | -9.271 |
Token | 3 |
Token ID | 513 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Anaheim | +11.121 |
boiler | +10.974 |
ILCS | +10.761 |
Hiroshima | +10.428 |
quist | +10.341 |
Neg logit contributions | |
Rhod | -17.867 |
)", | -17.711 |
� | -17.174 |
crop | -15.853 |
YD | -14.439 |
Token | 4 |
Token ID | 604 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
ILCS | +12.181 |
boiler | +11.539 |
Anaheim | +11.369 |
Filipino | +11.014 |
Ballard | +10.642 |
Neg logit contributions | |
Rhod | -17.794 |
)", | -17.391 |
� | -17.309 |
crop | -16.081 |
YD | -14.211 |
Token | 5 |
Token ID | 642 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
ILCS | +8.283 |
boiler | +7.696 |
Anaheim | +7.636 |
Hiroshima | +7.577 |
Filipino | +7.548 |
Neg logit contributions | |
Rhod | -13.134 |
� | -12.451 |
)", | -12.295 |
crop | -11.897 |
YD | -10.394 |
Token | 6 |
Token ID | 718 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
ILCS | +7.093 |
Hiroshima | +6.556 |
Anaheim | +6.440 |
Filipino | +6.390 |
boiler | +6.344 |
Neg logit contributions | |
Rhod | -10.279 |
� | -9.798 |
)", | -9.522 |
crop | -9.247 |
YD | -8.420 |
Token | 7 |
Token ID | 767 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
boiler | +12.201 |
Huntington | +11.960 |
Hiroshima | +11.891 |
Anaheim | +11.535 |
ILCS | +11.482 |
Neg logit contributions | |
)", | -20.325 |
� | -19.821 |
Rhod | -19.550 |
crop | -18.439 |
Constantin | -16.485 |
Token | 8 |
Token ID | 807 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
ILCS | +13.948 |
boiler | +12.879 |
Anaheim | +12.300 |
Huntington | +12.224 |
Manila | +12.091 |
Neg logit contributions | |
)", | -20.834 |
� | -20.551 |
Rhod | -20.418 |
crop | -19.383 |
etsk | -17.029 |
Token | 9 |
Token ID | 860 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ILCS | +10.262 |
boiler | +9.962 |
Anaheim | +9.837 |
Hiroshima | +9.727 |
Filipino | +9.534 |
Neg logit contributions | |
Rhod | -16.718 |
)", | -16.637 |
� | -15.654 |
crop | -15.215 |
etsk | -13.625 |
Token | 10 |
Token ID | 838 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ILCS | +8.975 |
boiler | +8.521 |
Anaheim | +8.449 |
Filipino | +8.216 |
Hiroshima | +8.087 |
Neg logit contributions | |
Rhod | -14.572 |
)", | -14.557 |
� | -14.063 |
crop | -13.354 |
etsk | -12.190 |
Token | 11 |
Token ID | 1367 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
ILCS | +8.013 |
Anaheim | +7.677 |
Huntington | +7.623 |
Hiroshima | +7.615 |
chant | +7.555 |
Neg logit contributions | |
Rhod | -13.481 |
)", | -13.241 |
� | -13.202 |
crop | -12.431 |
faces | -11.467 |
Token | 12 |
Token ID | 1105 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
ILCS | +9.172 |
Anaheim | +9.100 |
boiler | +9.021 |
Filipino | +8.889 |
chant | +8.741 |
Neg logit contributions | |
Rhod | -17.072 |
� | -16.922 |
)", | -16.855 |
crop | -15.985 |
faces | -14.392 |
Token | the |
Token ID | 262 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
Anaheim | +5.948 |
ILCS | +5.912 |
Hiroshima | +5.856 |
Filipino | +5.705 |
Huntington | +5.634 |
Neg logit contributions | |
Rhod | -5.779 |
� | -5.453 |
)", | -5.375 |
crop | -5.270 |
faces | -4.527 |
Token | Flyers |
Token ID | 30652 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
Anaheim | +5.167 |
Hiroshima | +5.136 |
ILCS | +5.032 |
Filipino | +4.986 |
Huntington | +4.848 |
Neg logit contributions | |
Rhod | -5.502 |
� | -5.286 |
)", | -5.100 |
crop | -5.054 |
faces | -4.413 |
Token | with |
Token ID | 351 |
Feature activation | +9.04e-01 |
Pos logit contributions | |
ILCS | +4.706 |
Hiroshima | +4.693 |
Anaheim | +4.672 |
Filipino | +4.584 |
Huntington | +4.498 |
Neg logit contributions | |
Rhod | -4.569 |
� | -4.289 |
)", | -4.221 |
crop | -4.144 |
faces | -3.580 |
Token | just |
Token ID | 655 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
Anaheim | +9.623 |
ILCS | +9.323 |
Hiroshima | +9.321 |
Filipino | +9.160 |
Huntington | +9.030 |
Neg logit contributions | |
Rhod | -8.786 |
� | -8.269 |
)", | -8.244 |
crop | -8.163 |
YD | -6.878 |
Token | over |
Token ID | 625 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
Anaheim | +6.671 |
ILCS | +6.617 |
Hiroshima | +6.606 |
Filipino | +6.512 |
Manila | +6.326 |
Neg logit contributions | |
Rhod | -6.067 |
� | -5.695 |
crop | -5.688 |
)", | -5.653 |
faces | -4.743 |
Token | six |
Token ID | 2237 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
Anaheim | +9.945 |
Hiroshima | +9.864 |
Filipino | +9.462 |
Manila | +9.271 |
ILCS | +9.239 |
Neg logit contributions | |
Rhod | -9.271 |
� | -8.887 |
)", | -8.740 |
crop | -8.657 |
YD | -7.342 |
Token | minutes |
Token ID | 2431 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
Anaheim | +13.466 |
Hiroshima | +12.487 |
ILCS | +11.816 |
Filipino | +11.570 |
boiler | +11.390 |
Neg logit contributions | |
crop | -21.435 |
Rhod | -20.857 |
)", | -20.265 |
� | -20.217 |
vre | -17.655 |
Token | remaining |
Token ID | 5637 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
Hiroshima | +10.656 |
Anaheim | +10.624 |
Filipino | +10.452 |
ILCS | +10.329 |
boiler | +10.155 |
Neg logit contributions | |
Rhod | -16.148 |
crop | -15.549 |
� | -15.505 |
)", | -14.939 |
YD | -13.530 |
Token | gave |
Token ID | 2921 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
Hiroshima | +5.120 |
Anaheim | +5.099 |
ILCS | +5.097 |
Filipino | +5.013 |
Huntington | +4.884 |
Neg logit contributions | |
Rhod | -5.232 |
� | -4.891 |
)", | -4.811 |
crop | -4.751 |
faces | -4.076 |
Token | them |
Token ID | 606 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Anaheim | +9.467 |
Hiroshima | +9.087 |
ILCS | +8.872 |
Filipino | +8.803 |
Huntington | +8.730 |
Neg logit contributions | |
Rhod | -9.928 |
� | -9.504 |
)", | -9.345 |
crop | -9.135 |
faces | -7.981 |
Token | an |
Token ID | 281 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
ILCS | +6.077 |
Hiroshima | +6.059 |
Anaheim | +6.053 |
Filipino | +5.958 |
Huntington | +5.819 |
Neg logit contributions | |
Rhod | -5.491 |
� | -5.142 |
)", | -5.096 |
crop | -5.001 |
faces | -4.322 |
Token | that |
Token ID | 326 |
Feature activation | +6.39e-01 |
Pos logit contributions | |
Hiroshima | +8.178 |
Anaheim | +8.061 |
Filipino | +7.892 |
ILCS | +7.852 |
Huntington | +7.718 |
Neg logit contributions | |
Rhod | -10.050 |
� | -9.653 |
)", | -9.598 |
crop | -9.412 |
YD | -8.118 |
Token | scored |
Token ID | 7781 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
Hiroshima | +7.185 |
Anaheim | +7.096 |
Filipino | +7.005 |
ILCS | +6.903 |
Huntington | +6.887 |
Neg logit contributions | |
Rhod | -6.163 |
� | -5.911 |
)", | -5.831 |
crop | -5.775 |
faces | -4.875 |
Token | Michael |
Token ID | 3899 |
Feature activation | +9.60e-01 |
Pos logit contributions | |
Hiroshima | +12.081 |
Anaheim | +11.836 |
Filipino | +11.665 |
Huntington | +11.409 |
Manila | +11.128 |
Neg logit contributions | |
� | -10.051 |
Rhod | -9.906 |
)", | -9.748 |
crop | -9.651 |
YD | -8.173 |
Token | Morse |
Token ID | 44049 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
Hiroshima | +9.346 |
ILCS | +9.331 |
Huntington | +9.323 |
Anaheim | +9.196 |
Filipino | +9.098 |
Neg logit contributions | |
Rhod | -9.437 |
� | -9.292 |
crop | -9.208 |
)", | -9.108 |
grading | -7.924 |
Token | to |
Token ID | 284 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
Hiroshima | +7.740 |
Anaheim | +7.627 |
ILCS | +7.612 |
Filipino | +7.393 |
Huntington | +7.335 |
Neg logit contributions | |
Rhod | -9.189 |
)", | -8.685 |
� | -8.664 |
crop | -8.516 |
faces | -7.552 |
Token | tie |
Token ID | 9839 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
Hiroshima | +8.889 |
Anaheim | +8.833 |
Filipino | +8.636 |
Huntington | +8.416 |
Manila | +8.377 |
Neg logit contributions | |
Rhod | -8.166 |
� | -7.727 |
)", | -7.478 |
crop | -7.314 |
faces | -6.548 |
Token | and |
Token ID | 290 |
Feature activation | +8.00e-01 |
Pos logit contributions | |
Anaheim | +15.776 |
Hiroshima | +15.422 |
Filipino | +14.656 |
Huntington | +14.349 |
Manila | +14.220 |
Neg logit contributions | |
)", | -18.798 |
� | -18.242 |
Rhod | -18.219 |
crop | -17.782 |
faces | -15.696 |
Token | Ian |
Token ID | 12930 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
Hiroshima | +8.725 |
Anaheim | +8.696 |
Filipino | +8.569 |
ILCS | +8.305 |
Huntington | +8.301 |
Neg logit contributions | |
Rhod | -7.570 |
� | -7.256 |
)", | -7.091 |
crop | -7.005 |
faces | -6.044 |
Token | Desmond |
Token ID | 41045 |
Feature activation | +8.76e-01 |
Pos logit contributions | |
Filipino | +7.582 |
Huntington | +7.515 |
Anaheim | +7.377 |
Manila | +7.233 |
Hiroshima | +7.196 |
Neg logit contributions | |
Rhod | -11.717 |
crop | -11.713 |
� | -11.445 |
)", | -11.089 |
YD | -10.296 |
Token | to |
Token ID | 284 |
Feature activation | +8.59e-01 |
Pos logit contributions | |
Hiroshima | +8.664 |
Anaheim | +8.493 |
Filipino | +8.475 |
ILCS | +8.127 |
Huntington | +8.124 |
Neg logit contributions | |
Rhod | -9.047 |
� | -8.693 |
crop | -8.631 |
)", | -8.578 |
faces | -7.445 |
Token | take |
Token ID | 1011 |
Feature activation | +8.45e-01 |
Pos logit contributions | |
Hiroshima | +9.161 |
Anaheim | +9.107 |
Filipino | +8.974 |
Huntington | +8.737 |
Manila | +8.678 |
Neg logit contributions | |
Rhod | -8.321 |
� | -8.008 |
)", | -7.704 |
crop | -7.546 |
faces | -6.626 |
Token | n |
Token ID | 299 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Filipino | +16.955 |
Manila | +16.435 |
Anaheim | +16.122 |
Huntington | +15.652 |
Hiroshima | +15.621 |
Neg logit contributions | |
Rhod | -14.622 |
crop | -13.513 |
� | -13.042 |
)", | -12.398 |
faces | -11.847 |
Token | atin |
Token ID | 10680 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Filipino | +12.210 |
endo | +11.827 |
wang | +11.825 |
Manila | +11.620 |
Anaheim | +11.571 |
Neg logit contributions | |
Rhod | -15.739 |
)", | -14.287 |
crop | -13.946 |
� | -13.717 |
mileage | -12.990 |
Token | ang |
Token ID | 3550 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
Filipino | +14.921 |
Manila | +14.389 |
Anaheim | +14.237 |
Hiroshima | +13.858 |
Huntington | +13.811 |
Neg logit contributions | |
Rhod | -13.642 |
crop | -12.417 |
� | -12.220 |
)", | -11.670 |
faces | -10.862 |
Token | at |
Token ID | 379 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Filipino | +16.493 |
Manila | +16.050 |
Anaheim | +15.880 |
ILCS | +15.405 |
Hiroshima | +15.243 |
Neg logit contributions | |
Rhod | -12.847 |
crop | -12.187 |
� | -11.953 |
)", | -11.709 |
faces | -10.486 |
Token | ing |
Token ID | 278 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
Filipino | +15.044 |
Anaheim | +14.650 |
Manila | +14.545 |
ILCS | +14.263 |
wang | +14.222 |
Neg logit contributions | |
Rhod | -14.299 |
� | -12.859 |
)", | -12.682 |
crop | -12.427 |
faces | -11.122 |
Token | k |
Token ID | 479 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
Filipino | +15.765 |
Manila | +15.279 |
Hiroshima | +15.233 |
Anaheim | +15.064 |
Huntington | +14.593 |
Neg logit contributions | |
Rhod | -13.166 |
� | -12.285 |
crop | -12.255 |
)", | -11.685 |
faces | -10.812 |
Token | amp |
Token ID | 696 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
endo | +16.945 |
eno | +16.869 |
wang | +16.862 |
ushi | +16.603 |
chant | +16.051 |
Neg logit contributions | |
Rhod | -17.599 |
)", | -15.040 |
crop | -14.972 |
mileage | -14.305 |
� | -14.262 |
Token | anya |
Token ID | 34183 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
ushi | +9.882 |
endo | +9.820 |
Filipino | +9.761 |
ILCS | +9.753 |
Anaheim | +9.707 |
Neg logit contributions | |
Rhod | -11.891 |
� | -10.597 |
)", | -10.522 |
crop | -10.360 |
YD | -9.438 |
Token | bast |
Token ID | 19918 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
Filipino | +13.818 |
Anaheim | +13.493 |
Manila | +13.365 |
Hiroshima | +13.098 |
ILCS | +13.081 |
Neg logit contributions | |
Rhod | -13.490 |
crop | -12.562 |
� | -12.101 |
)", | -11.572 |
faces | -11.250 |
Token | a |
Token ID | 64 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
ILCS | +9.111 |
Filipino | +9.066 |
ushi | +9.014 |
Anaheim | +8.971 |
wang | +8.913 |
Neg logit contributions | |
Rhod | -10.794 |
� | -9.871 |
crop | -9.580 |
)", | -9.568 |
YD | -8.495 |
Token | l |
Token ID | 300 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
Filipino | +13.106 |
Anaheim | +12.821 |
Manila | +12.793 |
ILCS | +12.528 |
Hiroshima | +12.476 |
Neg logit contributions | |
Rhod | -12.457 |
crop | -11.516 |
� | -10.885 |
)", | -10.747 |
faces | -10.137 |
Token | ild |
Token ID | 688 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
ILCS | +2.461 |
Hiroshima | +2.332 |
Anaheim | +2.322 |
Filipino | +2.314 |
Huntington | +2.234 |
Neg logit contributions | |
Rhod | -3.331 |
� | -3.133 |
)", | -3.062 |
crop | -3.028 |
recapt | -2.703 |
Token | on |
Token ID | 261 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ILCS | +0.152 |
Hiroshima | +0.145 |
Anaheim | +0.143 |
Filipino | +0.143 |
Huntington | +0.139 |
Neg logit contributions | |
Rhod | -0.172 |
� | -0.162 |
)", | -0.157 |
crop | -0.155 |
recapt | -0.137 |
Token | an |
Token ID | 272 |
Feature activation | +9.71e-01 |
Pos logit contributions | |
Rhod | +1.213 |
� | +1.145 |
)", | +1.102 |
crop | +1.092 |
faces | +0.947 |
Neg logit contributions | |
ILCS | -1.269 |
Hiroshima | -1.212 |
Filipino | -1.186 |
Anaheim | -1.184 |
Huntington | -1.161 |
Token | Un |
Token ID | 791 |
Feature activation | +9.54e-01 |
Pos logit contributions | |
ILCS | +9.175 |
Filipino | +8.887 |
Anaheim | +8.780 |
Hiroshima | +8.714 |
Manila | +8.688 |
Neg logit contributions | |
Rhod | -10.325 |
crop | -9.690 |
� | -9.627 |
)", | -9.393 |
faces | -8.479 |
Token | iting |
Token ID | 1780 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
ILCS | +4.767 |
quist | +4.296 |
chant | +4.288 |
endo | +4.229 |
ushi | +4.132 |
Neg logit contributions | |
Rhod | -14.506 |
� | -13.519 |
)", | -13.453 |
crop | -13.429 |
YD | -12.565 |
Token | Care |
Token ID | 7276 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
ILCS | +6.918 |
Anaheim | +6.733 |
Hiroshima | +6.726 |
Filipino | +6.693 |
Manila | +6.539 |
Neg logit contributions | |
Rhod | -4.934 |
� | -4.605 |
crop | -4.416 |
)", | -4.389 |
faces | -3.746 |
Token | 's |
Token ID | 338 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Filipino | +15.632 |
Manila | +15.477 |
Anaheim | +15.360 |
Hiroshima | +15.358 |
ILCS | +14.922 |
Neg logit contributions | |
Rhod | -16.202 |
crop | -16.064 |
� | -15.562 |
)", | -15.410 |
faces | -13.602 |
Token | financial |
Token ID | 3176 |
Feature activation | +8.67e-01 |
Pos logit contributions | |
Filipino | +14.437 |
ILCS | +14.170 |
Manila | +14.037 |
Hiroshima | +13.961 |
Anaheim | +13.873 |
Neg logit contributions | |
� | -12.730 |
Rhod | -12.698 |
)", | -12.201 |
crop | -12.125 |
YD | -10.962 |
Token | counselling |
Token ID | 47586 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
ILCS | +8.105 |
Filipino | +7.706 |
Anaheim | +7.502 |
Hiroshima | +7.495 |
Manila | +7.400 |
Neg logit contributions | |
Rhod | -9.814 |
� | -9.314 |
)", | -8.954 |
crop | -8.793 |
YD | -8.001 |
Token | service |
Token ID | 2139 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ILCS | +10.304 |
Filipino | +10.202 |
boiler | +10.094 |
Hiroshima | +10.046 |
Anaheim | +10.036 |
Neg logit contributions | |
Rhod | -11.858 |
� | -11.602 |
crop | -11.335 |
)", | -10.977 |
faces | -9.913 |
Token | or |
Token ID | 393 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
Hiroshima | +12.645 |
ILCS | +12.637 |
Filipino | +12.594 |
Anaheim | +12.391 |
Manila | +12.298 |
Neg logit contributions | |
� | -14.875 |
Rhod | -14.664 |
crop | -14.369 |
)", | -14.138 |
faces | -12.953 |
Token | kan |
Token ID | 43998 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Filipino | +18.932 |
Manila | +18.265 |
Anaheim | +17.750 |
ILCS | +17.365 |
Huntington | +17.032 |
Neg logit contributions | |
Rhod | -13.942 |
� | -13.454 |
crop | -13.158 |
)", | -12.575 |
faces | -11.387 |
Token | il |
Token ID | 346 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Filipino | +14.120 |
Anaheim | +13.933 |
ILCS | +13.780 |
Manila | +13.740 |
wang | +13.696 |
Neg logit contributions | |
Rhod | -14.887 |
� | -13.356 |
)", | -13.115 |
crop | -13.031 |
scenery | -11.899 |
Token | ang |
Token ID | 648 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Filipino | +13.043 |
wang | +12.629 |
Manila | +12.512 |
Anaheim | +12.503 |
ushi | +12.365 |
Neg logit contributions | |
Rhod | -14.846 |
� | -13.469 |
crop | -13.203 |
)", | -12.993 |
YD | -11.818 |
Token | an |
Token ID | 281 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Filipino | +18.690 |
Manila | +17.869 |
Anaheim | +17.566 |
Huntington | +17.101 |
wang | +17.057 |
Neg logit contributions | |
Rhod | -14.851 |
� | -13.861 |
crop | -13.645 |
)", | -12.306 |
faces | -11.871 |
Token | ak |
Token ID | 461 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
Filipino | +11.277 |
ILCS | +11.116 |
Anaheim | +11.071 |
wang | +10.822 |
Manila | +10.780 |
Neg logit contributions | |
Rhod | -13.101 |
� | -11.911 |
)", | -11.640 |
crop | -11.489 |
scenery | -10.222 |
Token | ay |
Token ID | 38762 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
Filipino | +18.218 |
wang | +18.125 |
Anaheim | +17.816 |
kit | +17.726 |
chant | +17.706 |
Neg logit contributions | |
Rhod | -17.677 |
� | -14.981 |
crop | -14.892 |
)", | -14.760 |
scenery | -13.605 |
Token | n |
Token ID | 299 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Filipino | +18.895 |
Manila | +18.214 |
Anaheim | +17.901 |
ILCS | +17.142 |
Huntington | +17.035 |
Neg logit contributions | |
Rhod | -14.760 |
� | -13.924 |
crop | -13.478 |
)", | -13.052 |
faces | -12.039 |
Token | al |
Token ID | 282 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Filipino | +11.067 |
wang | +10.849 |
endo | +10.843 |
ushi | +10.669 |
eno | +10.634 |
Neg logit contributions | |
Rhod | -14.583 |
)", | -12.930 |
� | -12.849 |
crop | -12.529 |
mileage | -12.067 |
Token | al |
Token ID | 282 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Filipino | +13.138 |
wang | +13.070 |
ushi | +13.008 |
Anaheim | +12.810 |
eno | +12.687 |
Neg logit contributions | |
Rhod | -15.434 |
� | -13.706 |
)", | -13.599 |
crop | -13.306 |
FSA | -12.294 |
Token | ay |
Token ID | 323 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Filipino | +14.396 |
wang | +13.914 |
Anaheim | +13.865 |
ushi | +13.777 |
eno | +13.673 |
Neg logit contributions | |
Rhod | -15.857 |
� | -14.184 |
crop | -13.981 |
)", | -13.846 |
YD | -12.606 |
Token | o |
Token ID | 78 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
Filipino | +13.963 |
Anaheim | +13.479 |
eno | +13.347 |
Manila | +13.235 |
endo | +13.210 |
Neg logit contributions | |
Rhod | -14.496 |
� | -12.904 |
crop | -12.759 |
)", | -12.468 |
YD | -11.521 |
Token | wa |
Token ID | 10247 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Filipino | +13.501 |
Manila | +13.115 |
Anaheim | +13.024 |
wang | +12.988 |
Huntington | +12.619 |
Neg logit contributions | |
Rhod | -13.174 |
crop | -12.038 |
� | -11.567 |
)", | -11.321 |
faces | -10.522 |
Token | na |
Token ID | 12385 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
Filipino | +14.227 |
Manila | +13.722 |
Anaheim | +13.480 |
Hiroshima | +13.205 |
wang | +13.111 |
Neg logit contributions | |
Rhod | -14.311 |
crop | -13.468 |
� | -12.653 |
)", | -12.112 |
faces | -11.638 |
Token | ang |
Token ID | 3550 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
Filipino | +17.390 |
Manila | +16.965 |
Anaheim | +16.327 |
Huntington | +15.939 |
Hiroshima | +15.809 |
Neg logit contributions | |
Rhod | -13.814 |
crop | -13.195 |
� | -13.149 |
)", | -12.329 |
faces | -11.580 |
Token | kan |
Token ID | 43998 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Filipino | +18.932 |
Manila | +18.265 |
Anaheim | +17.750 |
ILCS | +17.365 |
Huntington | +17.032 |
Neg logit contributions | |
Rhod | -13.942 |
� | -13.454 |
crop | -13.158 |
)", | -12.575 |
faces | -11.387 |
Token | il |
Token ID | 346 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Filipino | +14.120 |
Anaheim | +13.933 |
ILCS | +13.780 |
Manila | +13.740 |
wang | +13.696 |
Neg logit contributions | |
Rhod | -14.887 |
� | -13.356 |
)", | -13.115 |
crop | -13.031 |
scenery | -11.899 |
Token | ang |
Token ID | 648 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Filipino | +13.043 |
wang | +12.629 |
Manila | +12.512 |
Anaheim | +12.503 |
ushi | +12.365 |
Neg logit contributions | |
Rhod | -14.846 |
� | -13.469 |
crop | -13.203 |
)", | -12.993 |
YD | -11.818 |
Token | an |
Token ID | 281 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Filipino | +18.690 |
Manila | +17.869 |
Anaheim | +17.566 |
Huntington | +17.101 |
wang | +17.057 |
Neg logit contributions | |
Rhod | -14.851 |
� | -13.861 |
crop | -13.645 |
)", | -12.306 |
faces | -11.871 |
Token | ak |
Token ID | 461 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
Filipino | +11.277 |
ILCS | +11.116 |
Anaheim | +11.071 |
wang | +10.822 |
Manila | +10.780 |
Neg logit contributions | |
Rhod | -13.101 |
� | -11.911 |
)", | -11.640 |
crop | -11.489 |
scenery | -10.222 |
Token | ay |
Token ID | 38762 |
Feature activation | +2.00e+00 |
Pos logit contributions | |
Filipino | +18.218 |
wang | +18.125 |
Anaheim | +17.816 |
kit | +17.726 |
chant | +17.706 |
Neg logit contributions | |
Rhod | -17.677 |
� | -14.981 |
crop | -14.892 |
)", | -14.760 |
scenery | -13.605 |
Token | n |
Token ID | 299 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Filipino | +18.895 |
Manila | +18.214 |
Anaheim | +17.901 |
ILCS | +17.142 |
Huntington | +17.035 |
Neg logit contributions | |
Rhod | -14.760 |
� | -13.924 |
crop | -13.478 |
)", | -13.052 |
faces | -12.039 |
Token | al |
Token ID | 282 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
Filipino | +11.067 |
wang | +10.849 |
endo | +10.843 |
ushi | +10.669 |
eno | +10.634 |
Neg logit contributions | |
Rhod | -14.583 |
)", | -12.930 |
� | -12.849 |
crop | -12.529 |
mileage | -12.067 |
Token | � |
Token ID | 247 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
ILCS | +1.696 |
Hiroshima | +1.630 |
Anaheim | +1.617 |
Filipino | +1.613 |
Huntington | +1.574 |
Neg logit contributions | |
Rhod | -1.397 |
� | -1.300 |
)", | -1.256 |
crop | -1.233 |
recapt | -1.062 |
Token | ve |
Token ID | 303 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
Rhod | +2.242 |
� | +2.149 |
)", | +2.047 |
crop | +2.030 |
faces | +1.733 |
Neg logit contributions | |
ILCS | -2.721 |
Hiroshima | -2.604 |
Filipino | -2.572 |
Anaheim | -2.570 |
Huntington | -2.488 |
Token | had |
Token ID | 550 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
Anaheim | +8.985 |
ILCS | +8.834 |
Hiroshima | +8.832 |
Filipino | +8.781 |
Huntington | +8.598 |
Neg logit contributions | |
Rhod | -9.126 |
crop | -8.608 |
� | -8.552 |
)", | -8.525 |
faces | -7.509 |
Token | a |
Token ID | 257 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
Anaheim | +13.457 |
Hiroshima | +12.969 |
Filipino | +12.887 |
ILCS | +12.837 |
Huntington | +12.837 |
Neg logit contributions | |
Rhod | -12.186 |
crop | -12.160 |
)", | -11.745 |
� | -11.411 |
faces | -9.846 |
Token | lot |
Token ID | 1256 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Filipino | +15.011 |
Anaheim | +14.719 |
Hiroshima | +14.675 |
Huntington | +14.642 |
Manila | +14.343 |
Neg logit contributions | |
Rhod | -13.733 |
crop | -13.515 |
)", | -13.439 |
� | -13.250 |
faces | -11.932 |
Token | of |
Token ID | 286 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
ILCS | +9.505 |
Anaheim | +9.216 |
Hiroshima | +8.802 |
chant | +8.722 |
Filipino | +8.682 |
Neg logit contributions | |
Rhod | -13.119 |
)", | -12.411 |
crop | -12.089 |
� | -11.996 |
YD | -10.639 |
Token | practice |
Token ID | 3357 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
Anaheim | +17.307 |
Filipino | +16.810 |
boiler | +16.451 |
ILCS | +16.299 |
Huntington | +16.271 |
Neg logit contributions | |
crop | -15.128 |
Rhod | -14.682 |
)", | -14.491 |
� | -14.046 |
�醒 | -12.928 |
Token | with |
Token ID | 351 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Anaheim | +13.539 |
Hiroshima | +13.107 |
Filipino | +13.071 |
Huntington | +13.060 |
Manila | +12.831 |
Neg logit contributions | |
Rhod | -12.686 |
)", | -12.360 |
crop | -12.256 |
� | -11.779 |
�醒 | -9.909 |
Token | it |
Token ID | 340 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
Anaheim | +14.390 |
Filipino | +14.143 |
Huntington | +13.826 |
Hiroshima | +13.815 |
ILCS | +13.769 |
Neg logit contributions | |
Rhod | -11.918 |
crop | -11.686 |
)", | -11.670 |
� | -11.516 |
faces | -9.442 |
Token | , |
Token ID | 11 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
ILCS | +3.880 |
Anaheim | +3.724 |
Hiroshima | +3.710 |
Filipino | +3.666 |
Huntington | +3.582 |
Neg logit contributions | |
Rhod | -3.980 |
� | -3.692 |
)", | -3.653 |
crop | -3.570 |
faces | -3.108 |
Token | since |
Token ID | 1201 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
ILCS | +4.826 |
Hiroshima | +4.671 |
Anaheim | +4.670 |
Filipino | +4.616 |
Huntington | +4.511 |
Neg logit contributions | |
Rhod | -4.409 |
� | -4.105 |
)", | -4.054 |
crop | -3.961 |
faces | -3.428 |
Token | 's |
Token ID | 338 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Filipino | +15.632 |
Manila | +15.477 |
Anaheim | +15.360 |
Hiroshima | +15.358 |
ILCS | +14.922 |
Neg logit contributions | |
Rhod | -16.202 |
crop | -16.064 |
� | -15.562 |
)", | -15.410 |
faces | -13.602 |
Token | financial |
Token ID | 3176 |
Feature activation | +8.67e-01 |
Pos logit contributions | |
Filipino | +14.437 |
ILCS | +14.170 |
Manila | +14.037 |
Hiroshima | +13.961 |
Anaheim | +13.873 |
Neg logit contributions | |
� | -12.730 |
Rhod | -12.698 |
)", | -12.201 |
crop | -12.125 |
YD | -10.962 |
Token | counselling |
Token ID | 47586 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
ILCS | +8.105 |
Filipino | +7.706 |
Anaheim | +7.502 |
Hiroshima | +7.495 |
Manila | +7.400 |
Neg logit contributions | |
Rhod | -9.814 |
� | -9.314 |
)", | -8.954 |
crop | -8.793 |
YD | -8.001 |
Token | service |
Token ID | 2139 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
ILCS | +10.304 |
Filipino | +10.202 |
boiler | +10.094 |
Hiroshima | +10.046 |
Anaheim | +10.036 |
Neg logit contributions | |
Rhod | -11.858 |
� | -11.602 |
crop | -11.335 |
)", | -10.977 |
faces | -9.913 |
Token | or |
Token ID | 393 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
Hiroshima | +12.645 |
ILCS | +12.637 |
Filipino | +12.594 |
Anaheim | +12.391 |
Manila | +12.298 |
Neg logit contributions | |
� | -14.875 |
Rhod | -14.664 |
crop | -14.369 |
)", | -14.138 |
faces | -12.953 |
Token | call |
Token ID | 869 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
Filipino | +15.120 |
Hiroshima | +14.919 |
Huntington | +14.845 |
Anaheim | +14.813 |
Manila | +14.675 |
Neg logit contributions | |
� | -13.693 |
)", | -12.645 |
crop | -12.595 |
Rhod | -12.560 |
YD | -11.679 |
Token | K |
Token ID | 509 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
Filipino | +14.561 |
Anaheim | +14.192 |
Manila | +13.956 |
Chinatown | +13.882 |
Hiroshima | +13.755 |
Neg logit contributions | |
� | -16.823 |
crop | -16.401 |
)", | -15.955 |
Rhod | -15.855 |
YD | -14.875 |
Token | ild |
Token ID | 688 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
ILCS | +3.610 |
Anaheim | +3.401 |
Hiroshima | +3.400 |
Filipino | +3.389 |
chant | +3.267 |
Neg logit contributions | |
Rhod | -5.217 |
� | -4.889 |
)", | -4.811 |
crop | -4.757 |
recapt | -4.268 |
Token | on |
Token ID | 261 |
Feature activation | -1.21e-04 |
Pos logit contributions | |
ILCS | +2.315 |
Anaheim | +2.207 |
Hiroshima | +2.201 |
Filipino | +2.187 |
endo | +2.125 |
Neg logit contributions | |
Rhod | -2.957 |
� | -2.782 |
)", | -2.712 |
crop | -2.659 |
recapt | -2.375 |
Token | an |
Token ID | 272 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
Rhod | +0.001 |
� | +0.001 |
)", | +0.001 |
crop | +0.001 |
recapt | +0.001 |
Neg logit contributions | |
ILCS | -0.001 |
Hiroshima | -0.001 |
Anaheim | -0.001 |
Filipino | -0.001 |
Huntington | -0.001 |
Token | for |
Token ID | 329 |
Feature activation | +7.46e-01 |
Pos logit contributions | |
Filipino | +13.586 |
Anaheim | +13.411 |
ILCS | +13.279 |
Manila | +13.219 |
Hiroshima | +13.201 |
Neg logit contributions | |
Rhod | -13.832 |
crop | -13.200 |
)", | -12.724 |
� | -12.676 |
faces | -11.472 |
Token | Ireland |
Token ID | 7517 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
ILCS | +0.680 |
Hiroshima | +0.650 |
Anaheim | +0.645 |
Filipino | +0.642 |
Huntington | +0.625 |
Neg logit contributions | |
Rhod | -0.671 |
� | -0.629 |
)", | -0.607 |
crop | -0.597 |
recapt | -0.524 |
Token | in |
Token ID | 287 |
Feature activation | +8.10e-01 |
Pos logit contributions | |
ILCS | +1.323 |
Hiroshima | +1.266 |
Anaheim | +1.255 |
Filipino | +1.251 |
Huntington | +1.218 |
Neg logit contributions | |
Rhod | -1.321 |
� | -1.240 |
)", | -1.199 |
crop | -1.180 |
recapt | -1.036 |
Token | front |
Token ID | 2166 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
Hiroshima | +7.718 |
Anaheim | +7.610 |
ILCS | +7.579 |
Filipino | +7.450 |
Manila | +7.402 |
Neg logit contributions | |
Rhod | -8.673 |
)", | -8.277 |
crop | -8.243 |
� | -8.100 |
faces | -7.162 |
Token | just |
Token ID | 655 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
Hiroshima | +9.394 |
Anaheim | +9.188 |
ILCS | +8.885 |
Filipino | +8.765 |
Huntington | +8.740 |
Neg logit contributions | |
Rhod | -11.336 |
)", | -11.156 |
� | -10.761 |
crop | -10.734 |
YD | -9.484 |
Token | two |
Token ID | 734 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
ILCS | +2.070 |
Hiroshima | +1.995 |
Anaheim | +1.971 |
Filipino | +1.968 |
Huntington | +1.911 |
Neg logit contributions | |
Rhod | -2.188 |
� | -2.060 |
)", | -2.007 |
crop | -1.976 |
faces | -1.727 |
Token | minutes |
Token ID | 2431 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
Hiroshima | +12.187 |
ILCS | +11.612 |
Anaheim | +11.555 |
Filipino | +11.212 |
boiler | +11.078 |
Neg logit contributions | |
crop | -18.080 |
Rhod | -18.075 |
)", | -17.749 |
� | -17.199 |
faces | -15.045 |
Token | earlier |
Token ID | 2961 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ILCS | +12.640 |
Hiroshima | +12.376 |
Filipino | +11.532 |
Huntington | +11.383 |
boiler | +11.308 |
Neg logit contributions | |
� | -19.589 |
crop | -19.194 |
Rhod | -19.077 |
)", | -18.670 |
YD | -16.469 |
Token | when |
Token ID | 618 |
Feature activation | +9.15e-01 |
Pos logit contributions | |
Hiroshima | +10.059 |
ILCS | +9.962 |
Anaheim | +9.921 |
Filipino | +9.451 |
Huntington | +9.391 |
Neg logit contributions | |
)", | -13.371 |
Rhod | -13.157 |
crop | -12.972 |
� | -12.807 |
YD | -11.117 |
Token | Danny |
Token ID | 15105 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
Hiroshima | +8.992 |
ILCS | +8.943 |
Anaheim | +8.845 |
Filipino | +8.799 |
Huntington | +8.566 |
Neg logit contributions | |
Rhod | -9.202 |
� | -8.867 |
)", | -8.837 |
crop | -8.827 |
faces | -7.705 |
Token | Kane |
Token ID | 20055 |
Feature activation | +9.55e-01 |
Pos logit contributions | |
ILCS | +5.148 |
Hiroshima | +4.986 |
Anaheim | +4.917 |
Filipino | +4.912 |
Huntington | +4.849 |
Neg logit contributions | |
Rhod | -4.688 |
� | -4.452 |
)", | -4.349 |
crop | -4.295 |
recapt | -3.711 |
Token | hit |
Token ID | 2277 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ILCS | +9.964 |
Hiroshima | +9.940 |
Anaheim | +9.701 |
Filipino | +9.620 |
Huntington | +9.554 |
Neg logit contributions | |
Rhod | -9.012 |
)", | -8.456 |
crop | -8.277 |
� | -8.099 |
YD | -7.010 |
Token | gave |
Token ID | 2921 |
Feature activation | +9.46e-01 |
Pos logit contributions | |
Hiroshima | +5.120 |
Anaheim | +5.099 |
ILCS | +5.097 |
Filipino | +5.013 |
Huntington | +4.884 |
Neg logit contributions | |
Rhod | -5.232 |
� | -4.891 |
)", | -4.811 |
crop | -4.751 |
faces | -4.076 |
Token | them |
Token ID | 606 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
Anaheim | +9.467 |
Hiroshima | +9.087 |
ILCS | +8.872 |
Filipino | +8.803 |
Huntington | +8.730 |
Neg logit contributions | |
Rhod | -9.928 |
� | -9.504 |
)", | -9.345 |
crop | -9.135 |
faces | -7.981 |
Token | an |
Token ID | 281 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
ILCS | +6.077 |
Hiroshima | +6.059 |
Anaheim | +6.053 |
Filipino | +5.958 |
Huntington | +5.819 |
Neg logit contributions | |
Rhod | -5.491 |
� | -5.142 |
)", | -5.096 |
crop | -5.001 |
faces | -4.322 |
Token | opportunity |
Token ID | 3663 |
Feature activation | +4.37e-01 |
Pos logit contributions | |
Anaheim | +11.787 |
Hiroshima | +11.148 |
ILCS | +10.913 |
Huntington | +10.533 |
Filipino | +10.499 |
Neg logit contributions | |
Rhod | -13.274 |
)", | -12.456 |
� | -12.161 |
crop | -12.127 |
YD | -10.680 |
Token | to |
Token ID | 284 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
ILCS | +4.159 |
Hiroshima | +4.046 |
Anaheim | +4.041 |
Filipino | +3.944 |
Huntington | +3.847 |
Neg logit contributions | |
Rhod | -5.216 |
� | -4.922 |
)", | -4.885 |
crop | -4.754 |
faces | -4.203 |
Token | tie |
Token ID | 9839 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
ILCS | +4.311 |
Hiroshima | +4.281 |
Anaheim | +4.257 |
Filipino | +4.202 |
Huntington | +4.104 |
Neg logit contributions | |
Rhod | -3.755 |
� | -3.501 |
)", | -3.371 |
crop | -3.303 |
faces | -2.882 |
Token | the |
Token ID | 262 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Anaheim | +15.814 |
Hiroshima | +14.530 |
Huntington | +13.979 |
Filipino | +13.698 |
Manila | +13.577 |
Neg logit contributions | |
Rhod | -18.458 |
)", | -17.864 |
� | -16.991 |
crop | -16.674 |
vre | -14.645 |
Token | game |
Token ID | 983 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Anaheim | +9.444 |
Hiroshima | +9.034 |
Filipino | +8.764 |
Huntington | +8.411 |
Chinatown | +8.347 |
Neg logit contributions | |
Rhod | -12.528 |
� | -12.384 |
crop | -12.190 |
)", | -12.104 |
YD | -10.512 |
Token | and |
Token ID | 290 |
Feature activation | +3.38e-01 |
Pos logit contributions | |
Anaheim | +9.821 |
Hiroshima | +9.588 |
Filipino | +9.120 |
Manila | +9.113 |
Huntington | +8.998 |
Neg logit contributions | |
Rhod | -12.622 |
)", | -11.852 |
� | -11.812 |
crop | -11.483 |
YD | -9.953 |
Token | they |
Token ID | 484 |
Feature activation | -3.60e-02 |
Pos logit contributions | |
ILCS | +3.864 |
Anaheim | +3.843 |
Hiroshima | +3.827 |
Filipino | +3.768 |
Huntington | +3.693 |
Neg logit contributions | |
Rhod | -3.377 |
� | -3.172 |
)", | -3.085 |
crop | -3.014 |
faces | -2.618 |
Token | did |
Token ID | 750 |
Feature activation | +5.25e-01 |
Pos logit contributions | |
Rhod | +0.357 |
� | +0.334 |
)", | +0.321 |
crop | +0.314 |
recapt | +0.279 |
Neg logit contributions | |
ILCS | -0.435 |
Hiroshima | -0.410 |
Anaheim | -0.408 |
Filipino | -0.408 |
Huntington | -0.398 |
Token | over |
Token ID | 625 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
Karachi | +13.495 |
Hiroshima | +13.453 |
boiler | +13.431 |
Mumbai | +13.399 |
ILCS | +13.266 |
Neg logit contributions | |
Rhod | -14.184 |
� | -13.793 |
)", | -13.133 |
crop | -12.874 |
faces | -11.983 |
Token | of |
Token ID | 286 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
Hiroshima | +13.948 |
ILCS | +13.454 |
Filipino | +13.333 |
Karachi | +13.176 |
Anaheim | +13.086 |
Neg logit contributions | |
Rhod | -13.906 |
)", | -13.183 |
� | -13.084 |
crop | -11.727 |
YD | -11.492 |
Token | the |
Token ID | 262 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
Hiroshima | +13.201 |
Filipino | +12.927 |
Anaheim | +12.732 |
Karachi | +12.661 |
Saras | +12.620 |
Neg logit contributions | |
� | -11.760 |
Rhod | -11.751 |
)", | -11.036 |
crop | -10.974 |
YD | -10.264 |
Token | reply |
Token ID | 10971 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
Hiroshima | +15.267 |
Filipino | +14.982 |
Anaheim | +14.556 |
Saras | +14.527 |
Karachi | +14.500 |
Neg logit contributions | |
� | -11.767 |
Rhod | -11.202 |
crop | -10.882 |
)", | -10.768 |
YD | -9.921 |
Token | for |
Token ID | 329 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Filipino | +13.183 |
Hiroshima | +13.140 |
boiler | +12.918 |
ILCS | +12.588 |
Huntington | +12.482 |
Neg logit contributions | |
Rhod | -13.076 |
� | -12.536 |
)", | -12.281 |
crop | -11.811 |
YD | -10.681 |
Token | four |
Token ID | 1440 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
Hiroshima | +10.399 |
Anaheim | +10.037 |
ILCS | +10.025 |
Filipino | +9.966 |
Karachi | +9.803 |
Neg logit contributions | |
Rhod | -10.343 |
� | -10.056 |
crop | -9.602 |
)", | -9.434 |
YD | -8.516 |
Token | . |
Token ID | 13 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
Hiroshima | +16.103 |
ickets | +15.825 |
Karachi | +15.777 |
ILCS | +15.594 |
boiler | +15.587 |
Neg logit contributions | |
Rhod | -15.666 |
� | -14.771 |
crop | -14.445 |
)", | -14.050 |
YD | -12.556 |
Token | Cher |
Token ID | 19305 |
Feature activation | -1.74e-01 |
Pos logit contributions | |
ILCS | +11.754 |
Hiroshima | +11.724 |
Filipino | +11.558 |
Anaheim | +11.370 |
Karachi | +11.356 |
Neg logit contributions | |
Rhod | -12.705 |
� | -12.257 |
crop | -11.950 |
)", | -11.867 |
graded | -11.336 |
Token | rene |
Token ID | 25924 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Rhod | +2.045 |
� | +1.947 |
)", | +1.856 |
crop | +1.832 |
faces | +1.631 |
Neg logit contributions | |
ILCS | -1.778 |
Hiroshima | -1.702 |
Filipino | -1.679 |
Anaheim | -1.677 |
Huntington | -1.619 |
Token | and |
Token ID | 290 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
Hiroshima | +12.821 |
Huntington | +12.557 |
ILCS | +12.477 |
Anaheim | +12.453 |
Filipino | +12.347 |
Neg logit contributions | |
Rhod | -12.411 |
)", | -11.938 |
� | -11.834 |
crop | -11.757 |
YD | -10.330 |
Token | I |
Token ID | 314 |
Feature activation | +5.41e-01 |
Pos logit contributions | |
ILCS | +4.455 |
Hiroshima | +4.337 |
Filipino | +4.279 |
Anaheim | +4.269 |
Huntington | +4.148 |
Neg logit contributions | |
Rhod | -4.586 |
� | -4.383 |
)", | -4.228 |
crop | -4.183 |
faces | -3.632 |
Token | nat |
Token ID | 34664 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Filipino | +18.826 |
Manila | +18.244 |
Anaheim | +17.645 |
Huntington | +17.031 |
ILCS | +16.918 |
Neg logit contributions | |
Rhod | -13.940 |
� | -13.700 |
crop | -13.524 |
)", | -12.513 |
faces | -11.523 |
Token | ut |
Token ID | 315 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
Filipino | +10.833 |
ushi | +10.741 |
wang | +10.741 |
endo | +10.624 |
Anaheim | +10.584 |
Neg logit contributions | |
Rhod | -13.083 |
)", | -11.905 |
� | -11.539 |
crop | -11.375 |
YD | -10.421 |
Token | u |
Token ID | 84 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Filipino | +9.420 |
ILCS | +9.222 |
Anaheim | +9.067 |
Manila | +9.063 |
wang | +8.977 |
Neg logit contributions | |
Rhod | -10.625 |
� | -9.773 |
)", | -9.644 |
crop | -9.621 |
faces | -8.299 |
Token | wa |
Token ID | 10247 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Filipino | +13.501 |
Manila | +13.115 |
Anaheim | +13.024 |
wang | +12.988 |
Huntington | +12.619 |
Neg logit contributions | |
Rhod | -13.174 |
crop | -12.038 |
� | -11.567 |
)", | -11.321 |
faces | -10.522 |
Token | na |
Token ID | 12385 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
Filipino | +14.227 |
Manila | +13.722 |
Anaheim | +13.480 |
Hiroshima | +13.205 |
wang | +13.111 |
Neg logit contributions | |
Rhod | -14.311 |
crop | -13.468 |
� | -12.653 |
)", | -12.112 |
faces | -11.638 |
Token | ang |
Token ID | 3550 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
Filipino | +17.390 |
Manila | +16.965 |
Anaheim | +16.327 |
Huntington | +15.939 |
Hiroshima | +15.809 |
Neg logit contributions | |
Rhod | -13.814 |
crop | -13.195 |
� | -13.149 |
)", | -12.329 |
faces | -11.580 |
Token | kan |
Token ID | 43998 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Filipino | +18.932 |
Manila | +18.265 |
Anaheim | +17.750 |
ILCS | +17.365 |
Huntington | +17.032 |
Neg logit contributions | |
Rhod | -13.942 |
� | -13.454 |
crop | -13.158 |
)", | -12.575 |
faces | -11.387 |
Token | il |
Token ID | 346 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
Filipino | +14.120 |
Anaheim | +13.933 |
ILCS | +13.780 |
Manila | +13.740 |
wang | +13.696 |
Neg logit contributions | |
Rhod | -14.887 |
� | -13.356 |
)", | -13.115 |
crop | -13.031 |
scenery | -11.899 |
Token | ang |
Token ID | 648 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Filipino | +13.043 |
wang | +12.629 |
Manila | +12.512 |
Anaheim | +12.503 |
ushi | +12.365 |
Neg logit contributions | |
Rhod | -14.846 |
� | -13.469 |
crop | -13.203 |
)", | -12.993 |
YD | -11.818 |
Token | an |
Token ID | 281 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Filipino | +18.690 |
Manila | +17.869 |
Anaheim | +17.566 |
Huntington | +17.101 |
wang | +17.057 |
Neg logit contributions | |
Rhod | -14.851 |
� | -13.861 |
crop | -13.645 |
)", | -12.306 |
faces | -11.871 |
Token | ak |
Token ID | 461 |
Feature activation | +2.23e+00 |
Pos logit contributions | |
Filipino | +11.277 |
ILCS | +11.116 |
Anaheim | +11.071 |
wang | +10.822 |
Manila | +10.780 |
Neg logit contributions | |
Rhod | -13.101 |
� | -11.911 |
)", | -11.640 |
crop | -11.489 |
scenery | -10.222 |
Token | 1 |
Token ID | 16 |
Feature activation | +9.26e-01 |
Pos logit contributions | |
ILCS | +7.033 |
chant | +6.603 |
Anaheim | +6.594 |
Filipino | +6.587 |
Hiroshima | +6.585 |
Neg logit contributions | |
Rhod | -8.419 |
)", | -7.651 |
� | -7.561 |
crop | -7.121 |
graded | -6.575 |
Token | 2 |
Token ID | 362 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
ILCS | +7.543 |
Anaheim | +7.115 |
Filipino | +7.035 |
boiler | +6.903 |
Hiroshima | +6.891 |
Neg logit contributions | |
Rhod | -11.332 |
� | -10.755 |
)", | -10.582 |
crop | -10.330 |
faces | -9.271 |
Token | 3 |
Token ID | 513 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Anaheim | +11.121 |
boiler | +10.974 |
ILCS | +10.761 |
Hiroshima | +10.428 |
quist | +10.341 |
Neg logit contributions | |
Rhod | -17.867 |
)", | -17.711 |
� | -17.174 |
crop | -15.853 |
YD | -14.439 |
Token | 4 |
Token ID | 604 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
ILCS | +12.181 |
boiler | +11.539 |
Anaheim | +11.369 |
Filipino | +11.014 |
Ballard | +10.642 |
Neg logit contributions | |
Rhod | -17.794 |
)", | -17.391 |
� | -17.309 |
crop | -16.081 |
YD | -14.211 |
Token | 5 |
Token ID | 642 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
ILCS | +8.283 |
boiler | +7.696 |
Anaheim | +7.636 |
Hiroshima | +7.577 |
Filipino | +7.548 |
Neg logit contributions | |
Rhod | -13.134 |
� | -12.451 |
)", | -12.295 |
crop | -11.897 |
YD | -10.394 |
Token | 6 |
Token ID | 718 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
ILCS | +7.093 |
Hiroshima | +6.556 |
Anaheim | +6.440 |
Filipino | +6.390 |
boiler | +6.344 |
Neg logit contributions | |
Rhod | -10.279 |
� | -9.798 |
)", | -9.522 |
crop | -9.247 |
YD | -8.420 |
Token | 7 |
Token ID | 767 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
boiler | +12.201 |
Huntington | +11.960 |
Hiroshima | +11.891 |
Anaheim | +11.535 |
ILCS | +11.482 |
Neg logit contributions | |
)", | -20.325 |
� | -19.821 |
Rhod | -19.550 |
crop | -18.439 |
Constantin | -16.485 |
Token | 8 |
Token ID | 807 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
ILCS | +13.948 |
boiler | +12.879 |
Anaheim | +12.300 |
Huntington | +12.224 |
Manila | +12.091 |
Neg logit contributions | |
)", | -20.834 |
� | -20.551 |
Rhod | -20.418 |
crop | -19.383 |
etsk | -17.029 |
Token | 9 |
Token ID | 860 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ILCS | +10.262 |
boiler | +9.962 |
Anaheim | +9.837 |
Hiroshima | +9.727 |
Filipino | +9.534 |
Neg logit contributions | |
Rhod | -16.718 |
)", | -16.637 |
� | -15.654 |
crop | -15.215 |
etsk | -13.625 |
Token | 10 |
Token ID | 838 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ILCS | +8.975 |
boiler | +8.521 |
Anaheim | +8.449 |
Filipino | +8.216 |
Hiroshima | +8.087 |
Neg logit contributions | |
Rhod | -14.572 |
)", | -14.557 |
� | -14.063 |
crop | -13.354 |
etsk | -12.190 |
Token | 11 |
Token ID | 1367 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
ILCS | +8.013 |
Anaheim | +7.677 |
Huntington | +7.623 |
Hiroshima | +7.615 |
chant | +7.555 |
Neg logit contributions | |
Rhod | -13.481 |
)", | -13.241 |
� | -13.202 |
crop | -12.431 |
faces | -11.467 |
Token | dug |
Token ID | 18735 |
Feature activation | +6.06e-01 |
Pos logit contributions | |
Hiroshima | +13.906 |
Anaheim | +13.820 |
Filipino | +13.573 |
Huntington | +13.221 |
Manila | +13.154 |
Neg logit contributions | |
� | -11.414 |
Rhod | -11.139 |
)", | -11.134 |
crop | -10.701 |
YD | -9.107 |
Token | out |
Token ID | 448 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
Hiroshima | +4.619 |
ILCS | +4.593 |
Anaheim | +4.552 |
Filipino | +4.444 |
endo | +4.425 |
Neg logit contributions | |
Rhod | -8.082 |
� | -7.657 |
)", | -7.446 |
crop | -7.353 |
YD | -6.501 |
Token | , |
Token ID | 11 |
Feature activation | +7.66e-01 |
Pos logit contributions | |
Hiroshima | +11.133 |
Anaheim | +11.022 |
Filipino | +10.621 |
boiler | +10.520 |
Manila | +10.349 |
Neg logit contributions | |
Rhod | -13.100 |
)", | -12.934 |
� | -12.523 |
crop | -12.112 |
YD | -10.704 |
Token | then |
Token ID | 788 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
Anaheim | +8.041 |
Hiroshima | +8.006 |
ILCS | +7.970 |
Filipino | +7.850 |
Huntington | +7.650 |
Neg logit contributions | |
Rhod | -7.656 |
� | -7.307 |
)", | -7.286 |
crop | -7.132 |
YD | -6.121 |
Token | walked |
Token ID | 6807 |
Feature activation | +9.17e-01 |
Pos logit contributions | |
ILCS | +5.301 |
Hiroshima | +5.288 |
Anaheim | +5.247 |
Filipino | +5.187 |
Huntington | +5.104 |
Neg logit contributions | |
Rhod | -4.551 |
� | -4.267 |
)", | -4.221 |
crop | -4.156 |
faces | -3.542 |
Token | into |
Token ID | 656 |
Feature activation | +1.94e+00 |
Pos logit contributions | |
Hiroshima | +9.437 |
Anaheim | +9.232 |
Filipino | +9.211 |
Huntington | +9.083 |
ILCS | +8.957 |
Neg logit contributions | |
Rhod | -8.854 |
� | -8.826 |
)", | -8.598 |
crop | -8.403 |
YD | -7.202 |
Token | the |
Token ID | 262 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
Anaheim | +17.599 |
Hiroshima | +17.507 |
Huntington | +17.098 |
Filipino | +16.594 |
Saras | +16.478 |
Neg logit contributions | |
)", | -14.291 |
Rhod | -13.972 |
� | -13.961 |
crop | -13.563 |
YD | -12.149 |
Token | clubhouse |
Token ID | 48018 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Hiroshima | +13.868 |
Anaheim | +13.831 |
Filipino | +13.437 |
Huntington | +13.332 |
Manila | +13.013 |
Neg logit contributions | |
� | -11.841 |
Rhod | -11.593 |
)", | -11.571 |
crop | -11.101 |
YD | -9.767 |
Token | , |
Token ID | 11 |
Feature activation | +8.49e-01 |
Pos logit contributions | |
Hiroshima | +12.382 |
Anaheim | +12.215 |
Filipino | +11.781 |
boiler | +11.718 |
Manila | +11.501 |
Neg logit contributions | |
Rhod | -13.378 |
)", | -13.214 |
� | -12.991 |
crop | -12.785 |
etsk | -10.856 |
Token | which |
Token ID | 543 |
Feature activation | +4.92e-01 |
Pos logit contributions | |
Anaheim | +8.836 |
Hiroshima | +8.796 |
ILCS | +8.694 |
Filipino | +8.577 |
Huntington | +8.395 |
Neg logit contributions | |
Rhod | -8.353 |
)", | -7.981 |
� | -7.955 |
crop | -7.827 |
YD | -6.684 |
Token | was |
Token ID | 373 |
Feature activation | +6.32e-01 |
Pos logit contributions | |
ILCS | +5.363 |
Hiroshima | +5.350 |
Anaheim | +5.306 |
Filipino | +5.247 |
Huntington | +5.153 |
Neg logit contributions | |
Rhod | -5.005 |
� | -4.718 |
)", | -4.714 |
crop | -4.611 |
faces | -3.898 |
Token | two |
Token ID | 734 |
Feature activation | -9.99e-01 |
Pos logit contributions | |
Rhod | +8.977 |
� | +7.546 |
grading | +7.115 |
crop | +7.024 |
graded | +6.980 |
Neg logit contributions | |
ILCS | -16.468 |
endo | -15.344 |
chant | -15.343 |
wang | -15.327 |
ushi | -14.947 |
Token | seasons |
Token ID | 7028 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
Rhod | +6.632 |
� | +5.954 |
crop | +5.169 |
)", | +5.145 |
grading | +5.085 |
Neg logit contributions | |
ILCS | -13.217 |
chant | -12.715 |
endo | -12.617 |
wang | -12.593 |
Filipino | -12.406 |
Token | . |
Token ID | 13 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
Rhod | +3.271 |
� | +3.061 |
crop | +2.871 |
)", | +2.849 |
graded | +2.570 |
Neg logit contributions | |
ILCS | -3.855 |
Filipino | -3.683 |
Hiroshima | -3.679 |
Anaheim | -3.620 |
Huntington | -3.561 |
Token |
|
Token ID | 198 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Rhod | +14.611 |
� | +12.028 |
Tate | +11.965 |
)", | +11.787 |
crop | +11.736 |
Neg logit contributions | |
ILCS | -14.049 |
endo | -13.615 |
ushi | -13.418 |
roxy | -13.384 |
chant | -13.362 |
Token |
|
Token ID | 198 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
Rhod | +5.834 |
� | +5.554 |
crop | +5.345 |
)", | +5.255 |
faces | +4.442 |
Neg logit contributions | |
ILCS | -10.063 |
Hiroshima | -9.257 |
boiler | -9.248 |
Filipino | -9.114 |
ushi | -8.996 |
Token | After |
Token ID | 3260 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
� | +13.207 |
crop | +13.160 |
Rhod | +12.738 |
)", | +12.463 |
YD | +12.241 |
Neg logit contributions | |
ILCS | -16.185 |
boiler | -15.512 |
Hiroshima | -15.413 |
Filipino | -15.348 |
Manila | -15.159 |
Token | Oklahoma |
Token ID | 10433 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
Rhod | +19.889 |
grading | +18.478 |
recapt | +17.632 |
� | +17.531 |
graded | +17.354 |
Neg logit contributions | |
ILCS | -16.391 |
chant | -13.845 |
endo | -13.823 |
Japanese | -13.710 |
quist | -13.530 |
Token | 's |
Token ID | 338 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
Rhod | +17.123 |
graded | +16.263 |
recapt | +15.991 |
� | +15.426 |
grading | +15.012 |
Neg logit contributions | |
ILCS | -17.859 |
chant | -16.084 |
Japanese | -15.787 |
wang | -15.728 |
endo | -15.717 |
Token | failure |
Token ID | 5287 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Rhod | +15.668 |
recapt | +13.317 |
grading | +13.091 |
tire | +13.000 |
� | +12.883 |
Neg logit contributions | |
ILCS | -15.235 |
wang | -14.005 |
chant | -13.862 |
endo | -13.672 |
quist | -13.348 |
Token | , |
Token ID | 11 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Rhod | +9.645 |
� | +8.608 |
crop | +8.161 |
grading | +8.041 |
)", | +7.787 |
Neg logit contributions | |
ILCS | -15.394 |
Filipino | -14.141 |
wang | -13.802 |
endo | -13.736 |
Hiroshima | -13.491 |
Token | the |
Token ID | 262 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Rhod | +15.146 |
� | +13.078 |
Tate | +12.678 |
crop | +12.646 |
graded | +12.580 |
Neg logit contributions | |
ILCS | -13.810 |
endo | -12.829 |
wang | -12.467 |
Japanese | -12.410 |
ushi | -12.404 |
Token | - |
Token ID | 12 |
Feature activation | -2.89e-01 |
Pos logit contributions | |
Rhod | +4.595 |
� | +4.241 |
)", | +4.106 |
crop | +4.063 |
recapt | +3.648 |
Neg logit contributions | |
ILCS | -5.391 |
Hiroshima | -5.092 |
Anaheim | -4.949 |
Filipino | -4.920 |
endo | -4.888 |
Token | read |
Token ID | 961 |
Feature activation | -3.14e-01 |
Pos logit contributions | |
Rhod | +3.024 |
� | +2.896 |
crop | +2.877 |
)", | +2.801 |
faces | +2.530 |
Neg logit contributions | |
ILCS | -3.225 |
Hiroshima | -3.055 |
Filipino | -3.001 |
Anaheim | -2.972 |
Huntington | -2.930 |
Token | : |
Token ID | 25 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Rhod | +3.283 |
� | +3.058 |
crop | +2.947 |
)", | +2.903 |
recapt | +2.570 |
Neg logit contributions | |
ILCS | -3.525 |
Hiroshima | -3.352 |
Filipino | -3.292 |
Anaheim | -3.275 |
Huntington | -3.239 |
Token |
|
Token ID | 198 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
Rhod | +9.857 |
� | +9.109 |
crop | +8.701 |
)", | +8.170 |
graded | +7.733 |
Neg logit contributions | |
ILCS | -11.812 |
Hiroshima | -11.106 |
Filipino | -10.866 |
ushi | -10.702 |
chant | -10.630 |
Token |
|
Token ID | 198 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
Rhod | +4.327 |
� | +4.096 |
crop | +3.953 |
)", | +3.932 |
faces | +3.352 |
Neg logit contributions | |
ILCS | -6.067 |
Hiroshima | -5.656 |
Filipino | -5.557 |
boiler | -5.511 |
Anaheim | -5.509 |
Token | If |
Token ID | 1532 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
� | +13.596 |
crop | +13.203 |
Rhod | +12.769 |
)", | +12.122 |
YD | +11.838 |
Neg logit contributions | |
ILCS | -14.423 |
Hiroshima | -13.732 |
Filipino | -13.677 |
Manila | -13.619 |
boiler | -13.340 |
Token | all |
Token ID | 477 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
Rhod | +19.512 |
� | +17.533 |
graded | +16.757 |
Buc | +16.595 |
Tate | +16.558 |
Neg logit contributions | |
ILCS | -16.105 |
chant | -15.035 |
Japanese | -14.276 |
endo | -14.110 |
Filipino | -13.975 |
Token | that |
Token ID | 326 |
Feature activation | -7.20e-01 |
Pos logit contributions | |
Rhod | +9.354 |
� | +7.916 |
crop | +7.228 |
graded | +7.223 |
)", | +7.072 |
Neg logit contributions | |
ILCS | -13.798 |
ushi | -12.735 |
chant | -12.700 |
Hiroshima | -12.324 |
Filipino | -12.269 |
Token | wasn |
Token ID | 2492 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
Rhod | +7.034 |
� | +6.377 |
crop | +5.921 |
)", | +5.907 |
recapt | +5.623 |
Neg logit contributions | |
ILCS | -8.475 |
chant | -7.558 |
Hiroshima | -7.502 |
ushi | -7.440 |
Filipino | -7.386 |
Token | 't |
Token ID | 470 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
Rhod | +4.261 |
� | +3.744 |
crop | +3.643 |
)", | +3.629 |
YD | +2.290 |
Neg logit contributions | |
ILCS | -16.512 |
Hiroshima | -15.430 |
boiler | -15.236 |
Huntington | -14.969 |
unden | -14.965 |
Token | enough |
Token ID | 1576 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
Rhod | +3.511 |
� | +3.157 |
)", | +3.007 |
crop | +2.970 |
recapt | +2.675 |
Neg logit contributions | |
ILCS | -4.634 |
Hiroshima | -4.303 |
Anaheim | -4.250 |
chant | -4.245 |
Filipino | -4.229 |
Token | , |
Token ID | 11 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Rhod | +4.327 |
� | +4.081 |
)", | +3.711 |
crop | +3.690 |
recapt | +3.310 |
Neg logit contributions | |
ILCS | -5.522 |
Hiroshima | -5.146 |
Anaheim | -5.146 |
Filipino | -5.079 |
chant | -5.038 |
Token | warned |
Token ID | 7728 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Rhod | +4.958 |
� | +4.527 |
)", | +4.223 |
crop | +4.138 |
recapt | +3.991 |
Neg logit contributions | |
ILCS | -5.856 |
Anaheim | -5.253 |
Hiroshima | -5.230 |
Filipino | -5.210 |
chant | -5.165 |
Token | the |
Token ID | 262 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Rhod | +11.408 |
� | +10.037 |
crop | +9.450 |
)", | +9.391 |
recapt | +9.177 |
Neg logit contributions | |
ILCS | -15.254 |
chant | -12.555 |
endo | -12.429 |
API | -12.183 |
eno | -12.076 |
Token | Syrians |
Token ID | 26648 |
Feature activation | -6.68e-01 |
Pos logit contributions | |
Rhod | +11.829 |
� | +10.132 |
)", | +9.837 |
regime | +9.752 |
FSA | +9.721 |
Neg logit contributions | |
ILCS | -12.415 |
chant | -10.825 |
endo | -10.575 |
wang | -10.373 |
ushi | -10.364 |
Token | that |
Token ID | 326 |
Feature activation | -9.93e-01 |
Pos logit contributions | |
Rhod | +5.947 |
� | +5.169 |
)", | +5.028 |
crop | +4.899 |
recapt | +4.623 |
Neg logit contributions | |
ILCS | -8.445 |
Anaheim | -7.598 |
endo | -7.567 |
Hiroshima | -7.549 |
Filipino | -7.457 |
Token | if |
Token ID | 611 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
Rhod | +8.949 |
� | +8.047 |
)", | +7.776 |
recapt | +7.652 |
crop | +7.386 |
Neg logit contributions | |
ILCS | -11.632 |
chant | -10.212 |
endo | -10.145 |
wang | -9.772 |
ickets | -9.759 |
Token | they |
Token ID | 484 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Rhod | +17.682 |
recapt | +16.329 |
regime | +16.327 |
FSA | +16.282 |
� | +15.567 |
Neg logit contributions | |
ILCS | -19.558 |
chant | -16.690 |
endo | -15.966 |
quist | -15.171 |
wang | -15.123 |
Token | did |
Token ID | 750 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
Rhod | +9.130 |
� | +8.441 |
recapt | +8.383 |
)", | +7.898 |
tire | +7.752 |
Neg logit contributions | |
ILCS | -14.431 |
wang | -12.591 |
endo | -12.495 |
API | -12.379 |
ushi | -12.344 |
Token | not |
Token ID | 407 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
Rhod | +9.656 |
� | +8.459 |
recapt | +8.334 |
)", | +8.057 |
crop | +7.926 |
Neg logit contributions | |
ILCS | -16.635 |
wang | -14.714 |
chant | -14.480 |
Anaheim | -14.413 |
endo | -14.316 |
Token | take |
Token ID | 1011 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
Rhod | +5.263 |
� | +4.916 |
)", | +4.828 |
crop | +4.609 |
recapt | +4.594 |
Neg logit contributions | |
ILCS | -7.580 |
Anaheim | -6.999 |
Filipino | -6.916 |
Hiroshima | -6.894 |
Huntington | -6.864 |
Token | measures |
Token ID | 5260 |
Feature activation | -4.21e-01 |
Pos logit contributions | |
Rhod | +9.718 |
� | +8.922 |
)", | +8.309 |
recapt | +8.019 |
crop | +7.995 |
Neg logit contributions | |
ILCS | -12.171 |
endo | -10.986 |
chant | -10.856 |
quist | -10.717 |
wang | -10.694 |
Token | seasons |
Token ID | 7028 |
Feature activation | -3.31e-01 |
Pos logit contributions | |
Rhod | +6.632 |
� | +5.954 |
crop | +5.169 |
)", | +5.145 |
grading | +5.085 |
Neg logit contributions | |
ILCS | -13.217 |
chant | -12.715 |
endo | -12.617 |
wang | -12.593 |
Filipino | -12.406 |
Token | . |
Token ID | 13 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
Rhod | +3.271 |
� | +3.061 |
crop | +2.871 |
)", | +2.849 |
graded | +2.570 |
Neg logit contributions | |
ILCS | -3.855 |
Filipino | -3.683 |
Hiroshima | -3.679 |
Anaheim | -3.620 |
Huntington | -3.561 |
Token |
|
Token ID | 198 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Rhod | +14.611 |
� | +12.028 |
Tate | +11.965 |
)", | +11.787 |
crop | +11.736 |
Neg logit contributions | |
ILCS | -14.049 |
endo | -13.615 |
ushi | -13.418 |
roxy | -13.384 |
chant | -13.362 |
Token |
|
Token ID | 198 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
Rhod | +5.834 |
� | +5.554 |
crop | +5.345 |
)", | +5.255 |
faces | +4.442 |
Neg logit contributions | |
ILCS | -10.063 |
Hiroshima | -9.257 |
boiler | -9.248 |
Filipino | -9.114 |
ushi | -8.996 |
Token | After |
Token ID | 3260 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
� | +13.207 |
crop | +13.160 |
Rhod | +12.738 |
)", | +12.463 |
YD | +12.241 |
Neg logit contributions | |
ILCS | -16.185 |
boiler | -15.512 |
Hiroshima | -15.413 |
Filipino | -15.348 |
Manila | -15.159 |
Token | Oklahoma |
Token ID | 10433 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
Rhod | +19.889 |
grading | +18.478 |
recapt | +17.632 |
� | +17.531 |
graded | +17.354 |
Neg logit contributions | |
ILCS | -16.391 |
chant | -13.845 |
endo | -13.823 |
Japanese | -13.710 |
quist | -13.530 |
Token | 's |
Token ID | 338 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
Rhod | +17.123 |
graded | +16.263 |
recapt | +15.991 |
� | +15.426 |
grading | +15.012 |
Neg logit contributions | |
ILCS | -17.859 |
chant | -16.084 |
Japanese | -15.787 |
wang | -15.728 |
endo | -15.717 |
Token | failure |
Token ID | 5287 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Rhod | +15.668 |
recapt | +13.317 |
grading | +13.091 |
tire | +13.000 |
� | +12.883 |
Neg logit contributions | |
ILCS | -15.235 |
wang | -14.005 |
chant | -13.862 |
endo | -13.672 |
quist | -13.348 |
Token | , |
Token ID | 11 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Rhod | +9.645 |
� | +8.608 |
crop | +8.161 |
grading | +8.041 |
)", | +7.787 |
Neg logit contributions | |
ILCS | -15.394 |
Filipino | -14.141 |
wang | -13.802 |
endo | -13.736 |
Hiroshima | -13.491 |
Token | the |
Token ID | 262 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Rhod | +15.146 |
� | +13.078 |
Tate | +12.678 |
crop | +12.646 |
graded | +12.580 |
Neg logit contributions | |
ILCS | -13.810 |
endo | -12.829 |
wang | -12.467 |
Japanese | -12.410 |
ushi | -12.404 |
Token | Oklahoma |
Token ID | 10433 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
Rhod | +15.238 |
Buc | +13.223 |
Cycl | +13.077 |
� | +13.030 |
crop | +12.802 |
Neg logit contributions | |
ILCS | -14.398 |
endo | -14.086 |
chant | -13.828 |
wang | -13.644 |
Japanese | -13.497 |
Token | Syrians |
Token ID | 26648 |
Feature activation | -6.37e-01 |
Pos logit contributions | |
Rhod | +11.044 |
� | +9.409 |
)", | +9.319 |
crop | +9.101 |
borders | +9.048 |
Neg logit contributions | |
ILCS | -13.610 |
ushi | -12.567 |
eno | -12.357 |
Anaheim | -12.154 |
chant | -12.129 |
Token | in |
Token ID | 287 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Rhod | +5.642 |
)", | +5.065 |
� | +4.944 |
crop | +4.569 |
recapt | +4.368 |
Neg logit contributions | |
ILCS | -7.890 |
Anaheim | -7.357 |
endo | -7.290 |
Hiroshima | -7.267 |
Filipino | -7.211 |
Token | a |
Token ID | 257 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
Rhod | +11.315 |
� | +10.190 |
)", | +9.945 |
recapt | +9.349 |
FSA | +9.156 |
Neg logit contributions | |
ILCS | -13.083 |
endo | -11.954 |
wang | -11.849 |
Japanese | -11.832 |
chant | -11.807 |
Token | free |
Token ID | 1479 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
Rhod | +13.837 |
)", | +11.943 |
� | +11.877 |
regime | +11.850 |
graded | +11.601 |
Neg logit contributions | |
ILCS | -16.648 |
chant | -15.463 |
endo | -15.165 |
ushi | -14.970 |
ickets | -14.868 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Rhod | +13.528 |
� | +12.379 |
regime | +11.664 |
borders | +11.657 |
)", | +11.149 |
Neg logit contributions | |
ushi | -18.176 |
ickets | -18.132 |
ILCS | -17.904 |
quist | -17.107 |
Japanese | -17.008 |
Token | democratic |
Token ID | 10518 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
Rhod | +10.169 |
� | +8.151 |
)", | +7.898 |
graded | +7.882 |
borders | +7.774 |
Neg logit contributions | |
ILCS | -16.738 |
ickets | -16.059 |
endo | -15.988 |
chant | -15.975 |
quist | -15.812 |
Token | country |
Token ID | 1499 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
Rhod | +15.543 |
regime | +14.877 |
borders | +13.909 |
� | +13.715 |
direction | +13.460 |
Neg logit contributions | |
ickets | -19.595 |
ILCS | -19.487 |
ushi | -19.225 |
quist | -18.757 |
eno | -18.425 |
Token | that |
Token ID | 326 |
Feature activation | -7.63e-01 |
Pos logit contributions | |
Rhod | +10.071 |
)", | +8.945 |
� | +8.474 |
recapt | +7.864 |
borders | +7.609 |
Neg logit contributions | |
ILCS | -17.228 |
ushi | -16.026 |
ickets | -15.935 |
endo | -15.891 |
Ballard | -15.651 |
Token | ensures |
Token ID | 19047 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
Rhod | +7.345 |
� | +6.766 |
)", | +6.357 |
recapt | +5.961 |
borders | +5.904 |
Neg logit contributions | |
ILCS | -8.732 |
chant | -8.020 |
Hiroshima | -7.975 |
endo | -7.918 |
Anaheim | -7.885 |
Token | equal |
Token ID | 4961 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
Rhod | +14.864 |
freedoms | +13.638 |
borders | +13.429 |
� | +13.417 |
regime | +12.926 |
Neg logit contributions | |
ILCS | -19.132 |
quist | -16.999 |
chant | -16.411 |
endo | -16.142 |
ickets | -16.062 |
Token | and |
Token ID | 290 |
Feature activation | -6.81e-01 |
Pos logit contributions | |
Rhod | +6.718 |
� | +6.129 |
borders | +5.586 |
freedoms | +5.537 |
)", | +5.397 |
Neg logit contributions | |
ILCS | -13.666 |
endo | -13.117 |
chant | -12.991 |
quist | -12.951 |
eno | -12.802 |
Token | . |
Token ID | 13 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
Rhod | +7.226 |
� | +6.627 |
crop | +6.335 |
recapt | +5.619 |
)", | +5.583 |
Neg logit contributions | |
ILCS | -10.263 |
Filipino | -9.377 |
Hiroshima | -9.254 |
wang | -9.131 |
endo | -9.000 |
Token | Expect |
Token ID | 23600 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
Rhod | +13.087 |
� | +11.338 |
crop | +10.734 |
)", | +10.398 |
Tate | +10.333 |
Neg logit contributions | |
ILCS | -13.702 |
chant | -13.296 |
boiler | -13.060 |
ushi | -12.861 |
roxy | -12.760 |
Token | it |
Token ID | 340 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Rhod | +15.506 |
� | +14.274 |
crop | +13.466 |
)", | +13.117 |
Tate | +12.722 |
Neg logit contributions | |
ILCS | -12.886 |
chant | -12.172 |
Filipino | -12.141 |
Hiroshima | -11.930 |
Japanese | -11.741 |
Token | to |
Token ID | 284 |
Feature activation | -8.48e-01 |
Pos logit contributions | |
Rhod | +9.659 |
� | +8.844 |
crop | +8.175 |
)", | +8.010 |
recapt | +7.929 |
Neg logit contributions | |
ILCS | -13.995 |
Filipino | -12.648 |
Hiroshima | -12.494 |
chant | -12.191 |
Japanese | -12.111 |
Token | return |
Token ID | 1441 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
Rhod | +6.478 |
� | +6.239 |
)", | +6.011 |
crop | +5.932 |
recapt | +5.796 |
Neg logit contributions | |
ILCS | -11.127 |
Hiroshima | -9.952 |
Filipino | -9.923 |
endo | -9.657 |
Anaheim | -9.654 |
Token | for |
Token ID | 329 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
Rhod | +10.280 |
� | +9.318 |
crop | +8.655 |
)", | +8.573 |
recapt | +8.555 |
Neg logit contributions | |
ILCS | -13.597 |
chant | -12.458 |
Filipino | -12.110 |
wang | -11.989 |
Japanese | -11.945 |
Token | Round |
Token ID | 10485 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
Rhod | +17.552 |
� | +15.747 |
crop | +15.539 |
recapt | +15.377 |
Tate | +15.304 |
Neg logit contributions | |
ILCS | -17.208 |
chant | -15.529 |
wang | -15.396 |
Japanese | -15.213 |
quist | -14.819 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Rhod | +7.834 |
� | +7.252 |
crop | +6.872 |
)", | +6.604 |
faces | +5.868 |
Neg logit contributions | |
ILCS | -9.080 |
chant | -8.192 |
Filipino | -8.182 |
boiler | -8.017 |
Hiroshima | -7.997 |
Token | , |
Token ID | 11 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
Rhod | +9.251 |
� | +8.537 |
crop | +8.185 |
)", | +7.798 |
grading | +7.539 |
Neg logit contributions | |
ILCS | -13.192 |
Filipino | -12.481 |
chant | -12.232 |
Hiroshima | -12.164 |
wang | -12.151 |
Token | as |
Token ID | 355 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Rhod | +8.049 |
� | +7.277 |
)", | +6.975 |
crop | +6.892 |
graded | +6.550 |
Neg logit contributions | |
ILCS | -8.648 |
chant | -8.036 |
Filipino | -8.026 |
endo | -7.978 |
wang | -7.925 |
Token | the |
Token ID | 262 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
Rhod | +14.116 |
� | +12.436 |
crop | +12.006 |
)", | +11.938 |
graded | +11.561 |
Neg logit contributions | |
ILCS | -12.792 |
chant | -12.178 |
quist | -11.732 |
Filipino | -11.658 |
ushi | -11.596 |
Token | that |
Token ID | 326 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Rhod | +4.206 |
� | +3.828 |
)", | +3.663 |
crop | +3.643 |
recapt | +3.267 |
Neg logit contributions | |
ILCS | -4.811 |
Hiroshima | -4.452 |
endo | -4.396 |
Anaheim | -4.385 |
chant | -4.384 |
Token | could |
Token ID | 714 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
Rhod | +11.047 |
� | +9.555 |
)", | +8.744 |
crop | +8.718 |
borders | +8.475 |
Neg logit contributions | |
ILCS | -13.181 |
endo | -11.914 |
chant | -11.635 |
ushi | -11.627 |
Hiroshima | -11.490 |
Token | have |
Token ID | 423 |
Feature activation | +3.97e-02 |
Pos logit contributions | |
ILCS | +1.773 |
Hiroshima | +1.704 |
Anaheim | +1.689 |
Filipino | +1.685 |
Huntington | +1.642 |
Neg logit contributions | |
Rhod | -1.585 |
� | -1.482 |
)", | -1.431 |
crop | -1.406 |
faces | -1.220 |
Token | helped |
Token ID | 4193 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
ILCS | +0.491 |
Hiroshima | +0.472 |
Anaheim | +0.468 |
Filipino | +0.466 |
Huntington | +0.455 |
Neg logit contributions | |
Rhod | -0.379 |
� | -0.351 |
)", | -0.339 |
crop | -0.331 |
recapt | -0.287 |
Token | to |
Token ID | 284 |
Feature activation | -8.24e-01 |
Pos logit contributions | |
Rhod | +12.887 |
� | +11.800 |
)", | +11.035 |
crop | +10.950 |
recapt | +10.681 |
Neg logit contributions | |
ILCS | -13.423 |
endo | -12.416 |
chant | -11.935 |
quist | -11.817 |
ushi | -11.762 |
Token | push |
Token ID | 4574 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
Rhod | +7.538 |
� | +6.976 |
)", | +6.650 |
recapt | +6.524 |
crop | +6.509 |
Neg logit contributions | |
ILCS | -9.361 |
endo | -8.808 |
chant | -8.669 |
Hiroshima | -8.669 |
Anaheim | -8.612 |
Token | the |
Token ID | 262 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Rhod | +18.472 |
� | +16.213 |
borders | +15.139 |
boundaries | +14.982 |
recapt | +14.926 |
Neg logit contributions | |
ILCS | -17.908 |
endo | -15.864 |
quist | -15.778 |
chant | -15.660 |
ushi | -14.949 |
Token | island |
Token ID | 7022 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
Rhod | +17.208 |
� | +14.881 |
boundaries | +14.591 |
borders | +14.532 |
regime | +14.496 |
Neg logit contributions | |
ILCS | -15.860 |
endo | -14.897 |
chant | -14.478 |
ushi | -14.114 |
quist | -13.911 |
Token | 's |
Token ID | 338 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
Rhod | +11.132 |
� | +10.007 |
crop | +9.358 |
)", | +9.263 |
boundaries | +8.575 |
Neg logit contributions | |
ILCS | -13.857 |
Hiroshima | -13.049 |
endo | -12.411 |
Anaheim | -12.404 |
ushi | -12.386 |
Token | territorial |
Token ID | 22414 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Rhod | +11.437 |
� | +9.881 |
)", | +9.594 |
borders | +9.373 |
boundaries | +9.299 |
Neg logit contributions | |
ILCS | -12.749 |
endo | -12.274 |
chant | -12.182 |
Hiroshima | -12.028 |
Anaheim | -11.605 |
Token | conflict |
Token ID | 5358 |
Feature activation | -8.84e-01 |
Pos logit contributions | |
Rhod | +10.208 |
boundaries | +8.906 |
� | +8.763 |
)", | +8.717 |
recapt | +8.491 |
Neg logit contributions | |
ILCS | -13.318 |
endo | -13.137 |
Hiroshima | -13.085 |
chant | -12.727 |
Anaheim | -12.546 |
Token | rate |
Token ID | 2494 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
Rhod | +4.555 |
� | +4.491 |
crop | +3.788 |
recapt | +3.606 |
)", | +3.560 |
Neg logit contributions | |
ILCS | -10.251 |
Filipino | -9.824 |
Hiroshima | -9.792 |
endo | -9.742 |
wang | -9.674 |
Token | , |
Token ID | 11 |
Feature activation | +8.15e-02 |
Pos logit contributions | |
Rhod | +2.794 |
� | +2.657 |
crop | +2.493 |
)", | +2.464 |
recapt | +2.222 |
Neg logit contributions | |
ILCS | -3.298 |
Hiroshima | -3.161 |
Filipino | -3.147 |
Anaheim | -3.093 |
Huntington | -3.051 |
Token | the |
Token ID | 262 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
ILCS | +0.931 |
Hiroshima | +0.891 |
Filipino | +0.881 |
Anaheim | +0.881 |
Huntington | +0.857 |
Neg logit contributions | |
Rhod | -0.855 |
� | -0.802 |
)", | -0.771 |
crop | -0.758 |
recapt | -0.666 |
Token | second |
Token ID | 1218 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ILCS | +3.175 |
Hiroshima | +3.079 |
Anaheim | +3.054 |
Filipino | +3.027 |
Huntington | +2.935 |
Neg logit contributions | |
Rhod | -3.742 |
� | -3.539 |
)", | -3.465 |
crop | -3.424 |
faces | -3.032 |
Token | best |
Token ID | 1266 |
Feature activation | -7.34e-01 |
Pos logit contributions | |
ILCS | +2.239 |
Hiroshima | +2.162 |
Anaheim | +2.146 |
Filipino | +2.137 |
Huntington | +2.066 |
Neg logit contributions | |
Rhod | -2.840 |
� | -2.679 |
)", | -2.626 |
crop | -2.574 |
faces | -2.301 |
Token | among |
Token ID | 1871 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Rhod | +6.137 |
� | +5.750 |
graded | +5.238 |
crop | +5.192 |
)", | +5.184 |
Neg logit contributions | |
ILCS | -9.094 |
Hiroshima | -8.420 |
ushi | -8.367 |
endo | -8.304 |
wang | -8.269 |
Token | the |
Token ID | 262 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
Rhod | +16.203 |
graded | +15.438 |
perimeter | +15.081 |
� | +14.854 |
Buc | +14.727 |
Neg logit contributions | |
ILCS | -17.270 |
Hiroshima | -16.034 |
chant | -15.886 |
Japanese | -15.583 |
wang | -15.579 |
Token | prospects |
Token ID | 13285 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
Rhod | +15.776 |
� | +14.707 |
Buc | +14.055 |
Cycl | +13.839 |
crop | +13.760 |
Neg logit contributions | |
ILCS | -15.431 |
chant | -15.401 |
endo | -15.383 |
wang | -14.923 |
Hiroshima | -14.612 |
Token | chart |
Token ID | 8262 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
Rhod | +8.024 |
� | +7.343 |
graded | +6.802 |
crop | +6.693 |
grading | +6.637 |
Neg logit contributions | |
ILCS | -9.346 |
Filipino | -8.749 |
chant | -8.726 |
endo | -8.724 |
Hiroshima | -8.694 |
Token | ed |
Token ID | 276 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
Rhod | +2.202 |
� | +2.066 |
crop | +1.944 |
)", | +1.913 |
graded | +1.708 |
Neg logit contributions | |
ILCS | -2.965 |
Hiroshima | -2.862 |
Filipino | -2.851 |
Anaheim | -2.823 |
Huntington | -2.771 |
Token | for |
Token ID | 329 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
Rhod | +5.881 |
� | +5.639 |
crop | +5.231 |
)", | +5.051 |
graded | +4.735 |
Neg logit contributions | |
ILCS | -7.062 |
Filipino | -6.888 |
Hiroshima | -6.817 |
Anaheim | -6.661 |
Manila | -6.614 |
Token | and |
Token ID | 290 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Rhod | +5.520 |
� | +5.127 |
crop | +4.789 |
)", | +4.627 |
graded | +4.355 |
Neg logit contributions | |
ILCS | -7.138 |
Filipino | -6.689 |
Hiroshima | -6.642 |
Anaheim | -6.542 |
chant | -6.431 |
Token | Bell |
Token ID | 7459 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
Rhod | +13.429 |
)", | +11.664 |
� | +11.581 |
crop | +11.461 |
recapt | +11.122 |
Neg logit contributions | |
ILCS | -11.644 |
chant | -10.892 |
Hiroshima | -10.305 |
endo | -10.157 |
ushi | -10.144 |
Token | . |
Token ID | 13 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
Rhod | +6.938 |
� | +6.471 |
crop | +6.210 |
)", | +5.908 |
recapt | +5.547 |
Neg logit contributions | |
ILCS | -8.535 |
Hiroshima | -8.096 |
Filipino | -8.026 |
Anaheim | -7.869 |
chant | -7.649 |
Token |
|
Token ID | 198 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
Rhod | +14.211 |
� | +12.148 |
crop | +11.797 |
)", | +11.375 |
Cycl | +11.358 |
Neg logit contributions | |
chant | -13.751 |
ILCS | -13.593 |
endo | -13.291 |
ushi | -13.119 |
boiler | -13.023 |
Token |
|
Token ID | 198 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
Rhod | +5.596 |
� | +5.296 |
crop | +5.141 |
)", | +5.049 |
faces | +4.298 |
Neg logit contributions | |
ILCS | -9.215 |
Hiroshima | -8.544 |
boiler | -8.444 |
Filipino | -8.407 |
Anaheim | -8.262 |
Token | Should |
Token ID | 19926 |
Feature activation | -2.11e+00 |
Pos logit contributions | |
� | +14.021 |
crop | +13.740 |
Rhod | +13.079 |
YD | +12.663 |
)", | +12.482 |
Neg logit contributions | |
ILCS | -14.714 |
Filipino | -14.460 |
Hiroshima | -14.409 |
boiler | -14.299 |
Manila | -14.247 |
Token | Oklahoma |
Token ID | 10433 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
Rhod | +18.595 |
� | +16.746 |
crop | +16.653 |
)", | +15.979 |
graded | +15.665 |
Neg logit contributions | |
ILCS | -14.194 |
chant | -13.956 |
Japanese | -13.279 |
Filipino | -13.271 |
ushi | -12.842 |
Token | use |
Token ID | 779 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Rhod | +12.187 |
recapt | +11.206 |
� | +11.187 |
)", | +10.816 |
crop | +10.639 |
Neg logit contributions | |
ILCS | -14.086 |
chant | -12.729 |
Filipino | -12.305 |
Hiroshima | -12.147 |
Japanese | -12.009 |
Token | its |
Token ID | 663 |
Feature activation | -6.78e-01 |
Pos logit contributions | |
Rhod | +14.863 |
� | +13.260 |
Tate | +12.564 |
)", | +12.540 |
crop | +12.481 |
Neg logit contributions | |
ILCS | -13.465 |
chant | -12.372 |
Japanese | -12.258 |
wang | -12.217 |
ushi | -12.113 |
Token | personnel |
Token ID | 8213 |
Feature activation | -6.36e-01 |
Pos logit contributions | |
Rhod | +6.817 |
� | +6.155 |
)", | +5.960 |
crop | +5.925 |
graded | +5.438 |
Neg logit contributions | |
ILCS | -7.312 |
chant | -6.866 |
Filipino | -6.816 |
endo | -6.814 |
Hiroshima | -6.801 |
Token | optim |
Token ID | 6436 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
Rhod | +5.927 |
� | +5.387 |
crop | +5.076 |
)", | +4.980 |
recapt | +4.727 |
Neg logit contributions | |
ILCS | -7.503 |
Filipino | -6.992 |
Hiroshima | -6.988 |
endo | -6.978 |
chant | -6.969 |
Token | performance |
Token ID | 2854 |
Feature activation | -9.99e-01 |
Pos logit contributions | |
Rhod | +9.240 |
� | +8.569 |
)", | +7.908 |
crop | +7.797 |
recapt | +7.727 |
Neg logit contributions | |
ILCS | -9.997 |
Hiroshima | -9.134 |
Filipino | -8.952 |
endo | -8.911 |
chant | -8.903 |
Token | was |
Token ID | 373 |
Feature activation | -3.04e-01 |
Pos logit contributions | |
Rhod | +8.324 |
� | +7.911 |
graded | +7.269 |
recapt | +7.266 |
)", | +7.039 |
Neg logit contributions | |
ILCS | -11.782 |
Filipino | -10.676 |
Hiroshima | -10.654 |
endo | -10.525 |
Huntington | -10.440 |
Token | a |
Token ID | 257 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
Rhod | +3.086 |
� | +2.859 |
)", | +2.765 |
crop | +2.687 |
recapt | +2.457 |
Neg logit contributions | |
ILCS | -3.559 |
Hiroshima | -3.352 |
Filipino | -3.297 |
Anaheim | -3.272 |
chant | -3.244 |
Token | signature |
Token ID | 9877 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Rhod | +4.781 |
� | +4.349 |
)", | +4.204 |
crop | +4.101 |
recapt | +3.802 |
Neg logit contributions | |
ILCS | -5.372 |
Anaheim | -4.951 |
Hiroshima | -4.943 |
Filipino | -4.911 |
endo | -4.894 |
Token | game |
Token ID | 983 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Rhod | +10.258 |
� | +9.426 |
crop | +8.786 |
)", | +8.615 |
recapt | +8.545 |
Neg logit contributions | |
ILCS | -12.356 |
ushi | -11.437 |
Hiroshima | -11.437 |
wang | -11.407 |
endo | -11.290 |
Token | for |
Token ID | 329 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
Rhod | +8.728 |
� | +8.464 |
crop | +7.713 |
)", | +7.313 |
recapt | +7.276 |
Neg logit contributions | |
ILCS | -11.959 |
Hiroshima | -11.050 |
Filipino | -10.881 |
wang | -10.745 |
Huntington | -10.720 |
Token | the |
Token ID | 262 |
Feature activation | -1.93e+00 |
Pos logit contributions | |
Rhod | +18.142 |
� | +15.452 |
recapt | +15.300 |
Cycl | +15.068 |
)", | +15.001 |
Neg logit contributions | |
ILCS | -15.479 |
Japanese | -14.161 |
wang | -14.005 |
chant | -13.845 |
ushi | -13.643 |
Token | H |
Token ID | 367 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Rhod | +17.183 |
Cycl | +15.250 |
� | +14.780 |
Buc | +14.657 |
recapt | +14.263 |
Neg logit contributions | |
ILCS | -15.135 |
wang | -14.272 |
Japanese | -14.138 |
endo | -14.065 |
chant | -13.971 |
Token | ogs |
Token ID | 18463 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
� | +10.185 |
Rhod | +9.918 |
)", | +9.136 |
YD | +9.073 |
crop | +8.960 |
Neg logit contributions | |
ILCS | -13.382 |
Hiroshima | -12.612 |
Manila | -12.468 |
Filipino | -12.445 |
Anaheim | -12.211 |
Token | � |
Token ID | 447 |
Feature activation | -4.26e-01 |
Pos logit contributions | |
Rhod | +10.863 |
� | +10.165 |
crop | +9.319 |
recapt | +9.164 |
)", | +8.917 |
Neg logit contributions | |
ILCS | -13.982 |
Filipino | -13.403 |
Hiroshima | -13.174 |
Manila | -12.934 |
wang | -12.737 |
Token | � |
Token ID | 247 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
Rhod | +3.518 |
� | +3.219 |
)", | +3.028 |
crop | +2.914 |
graded | +2.535 |
Neg logit contributions | |
ILCS | -5.664 |
Hiroshima | -5.482 |
Filipino | -5.394 |
Anaheim | -5.362 |
Manila | -5.286 |
Token | in |
Token ID | 287 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
Rhod | +8.500 |
� | +7.855 |
)", | +7.527 |
crop | +7.084 |
recapt | +7.050 |
Neg logit contributions | |
ILCS | -12.364 |
endo | -11.409 |
Filipino | -11.156 |
chant | -11.118 |
Hiroshima | -11.028 |
Token | the |
Token ID | 262 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
Rhod | +10.448 |
� | +9.346 |
recapt | +8.882 |
)", | +8.836 |
crop | +8.779 |
Neg logit contributions | |
ILCS | -12.507 |
chant | -11.216 |
endo | -11.120 |
API | -11.108 |
Japanese | -11.105 |
Token | revolution |
Token ID | 5854 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
Rhod | +13.276 |
� | +11.395 |
recapt | +11.119 |
regime | +10.630 |
FSA | +10.467 |
Neg logit contributions | |
ILCS | -15.296 |
API | -13.705 |
chant | -13.672 |
wang | -13.231 |
quist | -13.212 |
Token | - |
Token ID | 12 |
Feature activation | -5.56e-01 |
Pos logit contributions | |
Rhod | +10.782 |
� | +10.381 |
crop | +9.358 |
)", | +9.352 |
recapt | +9.045 |
Neg logit contributions | |
ILCS | -13.081 |
Filipino | -11.689 |
Anaheim | -11.467 |
chant | -11.438 |
API | -11.383 |
Token | wr |
Token ID | 18351 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
Rhod | +5.287 |
� | +5.047 |
crop | +4.921 |
)", | +4.727 |
faces | +4.356 |
Neg logit contributions | |
ILCS | -6.656 |
Filipino | -6.037 |
Hiroshima | -5.999 |
Ballard | -5.967 |
Anaheim | -5.915 |
Token | acked |
Token ID | 6021 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
Rhod | +3.189 |
� | +3.096 |
)", | +2.876 |
crop | +2.772 |
recapt | +2.428 |
Neg logit contributions | |
ILCS | -5.296 |
Filipino | -5.037 |
Huntington | -4.982 |
Hiroshima | -4.921 |
Anaheim | -4.866 |
Token | nation |
Token ID | 3277 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Rhod | +17.160 |
regime | +14.853 |
� | +14.717 |
recapt | +14.587 |
countryside | +14.521 |
Neg logit contributions | |
ILCS | -17.309 |
API | -16.214 |
chant | -15.923 |
Japanese | -15.853 |
deck | -15.605 |
Token | , |
Token ID | 11 |
Feature activation | -7.04e-01 |
Pos logit contributions | |
Rhod | +12.190 |
� | +11.825 |
)", | +11.266 |
crop | +10.455 |
recapt | +10.357 |
Neg logit contributions | |
ILCS | -15.954 |
Filipino | -14.954 |
endo | -14.509 |
boiler | -14.442 |
Anaheim | -14.304 |
Token | a |
Token ID | 257 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
Rhod | +7.511 |
� | +6.736 |
)", | +6.422 |
crop | +6.252 |
recapt | +6.047 |
Neg logit contributions | |
ILCS | -7.509 |
chant | -6.877 |
endo | -6.837 |
Anaheim | -6.717 |
Hiroshima | -6.647 |
Token | senior |
Token ID | 4664 |
Feature activation | -5.09e-01 |
Pos logit contributions | |
Rhod | +3.062 |
� | +2.784 |
)", | +2.693 |
crop | +2.624 |
recapt | +2.412 |
Neg logit contributions | |
ILCS | -3.214 |
Anaheim | -2.987 |
Hiroshima | -2.968 |
chant | -2.942 |
endo | -2.913 |
Token | U |
Token ID | 471 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
Rhod | +5.276 |
� | +4.650 |
)", | +4.474 |
crop | +4.373 |
FSA | +4.098 |
Neg logit contributions | |
ILCS | -5.845 |
chant | -5.350 |
Hiroshima | -5.289 |
Anaheim | -5.276 |
endo | -5.275 |
Token | season |
Token ID | 1622 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
Rhod | +9.761 |
� | +8.595 |
recapt | +7.488 |
)", | +7.471 |
crop | +7.424 |
Neg logit contributions | |
ILCS | -14.871 |
chant | -13.734 |
wang | -13.429 |
Hiroshima | -13.087 |
Filipino | -13.058 |
Token | with |
Token ID | 351 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
Rhod | +3.694 |
� | +3.412 |
)", | +3.233 |
crop | +3.159 |
graded | +3.001 |
Neg logit contributions | |
ILCS | -3.806 |
Hiroshima | -3.476 |
Filipino | -3.408 |
chant | -3.403 |
Anaheim | -3.361 |
Token | 10 |
Token ID | 838 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Rhod | +8.486 |
� | +7.778 |
)", | +7.297 |
crop | +7.091 |
graded | +7.013 |
Neg logit contributions | |
ILCS | -9.875 |
chant | -8.694 |
Hiroshima | -8.639 |
Filipino | -8.598 |
wang | -8.493 |
Token | 26 |
Token ID | 2075 |
Feature activation | -9.48e-01 |
Pos logit contributions | |
Rhod | +9.908 |
� | +9.604 |
)", | +8.598 |
crop | +8.529 |
graded | +8.359 |
Neg logit contributions | |
ILCS | -12.684 |
Hiroshima | -11.605 |
Huntington | -11.328 |
Filipino | -11.305 |
Anaheim | -11.260 |
Token | yards |
Token ID | 5695 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
Rhod | +6.833 |
� | +6.493 |
crop | +5.686 |
)", | +5.538 |
graded | +5.489 |
Neg logit contributions | |
ILCS | -11.976 |
Hiroshima | -11.476 |
ushi | -11.300 |
Anaheim | -11.190 |
Filipino | -11.170 |
Token | at |
Token ID | 379 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
Rhod | +4.412 |
� | +4.112 |
)", | +3.741 |
crop | +3.691 |
recapt | +3.481 |
Neg logit contributions | |
ILCS | -5.880 |
Hiroshima | -5.555 |
Filipino | -5.462 |
Anaheim | -5.416 |
Huntington | -5.411 |
Token | 5 |
Token ID | 642 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Rhod | +17.055 |
� | +14.914 |
)", | +14.495 |
Ole | +14.428 |
recapt | +14.354 |
Neg logit contributions | |
ILCS | -15.836 |
quist | -14.215 |
Japanese | -14.207 |
endo | -13.849 |
ushi | -13.747 |
Token | . |
Token ID | 13 |
Feature activation | -6.36e-01 |
Pos logit contributions | |
Rhod | +9.252 |
� | +8.813 |
)", | +7.938 |
crop | +7.915 |
YD | +7.354 |
Neg logit contributions | |
ILCS | -11.229 |
Filipino | -10.892 |
Anaheim | -10.736 |
Hiroshima | -10.584 |
endo | -10.497 |
Token | 4 |
Token ID | 19 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Rhod | +6.079 |
� | +5.731 |
crop | +5.506 |
)", | +5.444 |
YD | +4.774 |
Neg logit contributions | |
ILCS | -7.153 |
Hiroshima | -6.859 |
Filipino | -6.847 |
boiler | -6.742 |
Anaheim | -6.629 |
Token | yards |
Token ID | 5695 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
Rhod | +7.386 |
� | +7.361 |
crop | +6.045 |
)", | +5.948 |
graded | +5.880 |
Neg logit contributions | |
ILCS | -13.925 |
ushi | -13.040 |
Filipino | -12.947 |
Anaheim | -12.888 |
Manila | -12.832 |
Token | per |
Token ID | 583 |
Feature activation | -8.81e-01 |
Pos logit contributions | |
Rhod | +6.344 |
� | +6.076 |
)", | +5.622 |
crop | +5.545 |
graded | +5.304 |
Neg logit contributions | |
ILCS | -7.544 |
chant | -6.944 |
endo | -6.927 |
Hiroshima | -6.922 |
Filipino | -6.880 |
Token | scene |
Token ID | 3715 |
Feature activation | -7.82e-01 |
Pos logit contributions | |
Rhod | +8.577 |
� | +7.573 |
crop | +7.069 |
scenery | +6.916 |
)", | +6.635 |
Neg logit contributions | |
ILCS | -12.391 |
wang | -12.270 |
Hiroshima | -12.050 |
ushi | -11.653 |
Filipino | -11.622 |
Token | to |
Token ID | 284 |
Feature activation | -7.44e-01 |
Pos logit contributions | |
Rhod | +6.898 |
� | +6.630 |
crop | +6.007 |
)", | +5.862 |
recapt | +5.683 |
Neg logit contributions | |
ILCS | -9.236 |
Hiroshima | -8.620 |
Filipino | -8.511 |
Huntington | -8.346 |
chant | -8.342 |
Token | become |
Token ID | 1716 |
Feature activation | -9.68e-01 |
Pos logit contributions | |
Rhod | +6.780 |
� | +6.296 |
crop | +5.934 |
)", | +5.924 |
recapt | +5.773 |
Neg logit contributions | |
ILCS | -8.967 |
chant | -8.042 |
Hiroshima | -8.018 |
Filipino | -7.944 |
wang | -7.800 |
Token | the |
Token ID | 262 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Rhod | +8.184 |
� | +7.634 |
crop | +7.226 |
)", | +6.993 |
recapt | +6.369 |
Neg logit contributions | |
ILCS | -11.019 |
Hiroshima | -10.290 |
Filipino | -10.289 |
chant | -10.128 |
wang | -10.091 |
Token | first |
Token ID | 717 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
Rhod | +11.490 |
� | +10.362 |
crop | +9.564 |
)", | +9.467 |
Cycl | +9.467 |
Neg logit contributions | |
ILCS | -12.090 |
chant | -11.113 |
wang | -11.097 |
endo | -11.075 |
Filipino | -10.709 |
Token | freshman |
Token ID | 18621 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
Rhod | +18.054 |
� | +16.217 |
crop | +15.739 |
Cycl | +15.281 |
graded | +15.240 |
Neg logit contributions | |
ILCS | -14.851 |
chant | -12.850 |
wang | -12.784 |
Hiroshima | -12.739 |
endo | -12.736 |
Token | in |
Token ID | 287 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
Rhod | +15.808 |
� | +14.643 |
graded | +14.311 |
recapt | +13.892 |
crop | +13.850 |
Neg logit contributions | |
ILCS | -17.261 |
wang | -14.919 |
chant | -14.862 |
Hiroshima | -14.824 |
endo | -14.659 |
Token | SEC |
Token ID | 10729 |
Feature activation | -9.69e-01 |
Pos logit contributions | |
Rhod | +13.561 |
� | +12.875 |
recapt | +11.816 |
crop | +11.543 |
Grey | +11.411 |
Neg logit contributions | |
ILCS | -14.102 |
endo | -12.552 |
wang | -12.398 |
Hiroshima | -12.300 |
Filipino | -12.295 |
Token | history |
Token ID | 2106 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
Rhod | +7.597 |
� | +7.051 |
)", | +6.503 |
crop | +6.469 |
recapt | +6.113 |
Neg logit contributions | |
ILCS | -11.744 |
Hiroshima | -11.364 |
Filipino | -11.158 |
chant | -10.936 |
Anaheim | -10.780 |
Token | to |
Token ID | 284 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
Rhod | +5.900 |
� | +5.774 |
crop | +5.166 |
)", | +5.124 |
recapt | +4.850 |
Neg logit contributions | |
ILCS | -7.109 |
Filipino | -6.615 |
Hiroshima | -6.600 |
Anaheim | -6.439 |
endo | -6.428 |
Token | gain |
Token ID | 4461 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Rhod | +9.833 |
recapt | +9.531 |
� | +9.529 |
graded | +8.774 |
sack | +8.680 |
Neg logit contributions | |
ILCS | -15.065 |
chant | -12.947 |
Filipino | -12.736 |
ushi | -12.601 |
Hiroshima | -12.446 |
Token | passing |
Token ID | 6427 |
Feature activation | -4.12e-01 |
Pos logit contributions | |
Rhod | +5.358 |
� | +4.982 |
crop | +4.750 |
)", | +4.589 |
recapt | +4.261 |
Neg logit contributions | |
ILCS | -6.809 |
Hiroshima | -6.505 |
endo | -6.325 |
Anaheim | -6.313 |
Filipino | -6.285 |
Token | game |
Token ID | 983 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
Rhod | +4.252 |
� | +3.957 |
crop | +3.751 |
)", | +3.683 |
recapt | +3.393 |
Neg logit contributions | |
ILCS | -4.731 |
Hiroshima | -4.305 |
endo | -4.273 |
Filipino | -4.267 |
Anaheim | -4.220 |
Token | . |
Token ID | 13 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
Rhod | +4.657 |
� | +4.314 |
crop | +4.060 |
)", | +3.949 |
recapt | +3.695 |
Neg logit contributions | |
ILCS | -5.825 |
Filipino | -5.458 |
Hiroshima | -5.400 |
Anaheim | -5.321 |
endo | -5.250 |
Token |
|
Token ID | 198 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
Rhod | +13.127 |
� | +11.200 |
crop | +11.001 |
)", | +10.729 |
Cycl | +10.559 |
Neg logit contributions | |
ILCS | -13.157 |
chant | -12.855 |
endo | -12.612 |
ushi | -12.454 |
boiler | -12.369 |
Token |
|
Token ID | 198 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Rhod | +5.233 |
� | +4.934 |
crop | +4.802 |
)", | +4.729 |
faces | +4.021 |
Neg logit contributions | |
ILCS | -8.223 |
Hiroshima | -7.646 |
Filipino | -7.528 |
boiler | -7.515 |
Anaheim | -7.406 |
Token | Can |
Token ID | 6090 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
crop | +13.343 |
� | +13.336 |
Rhod | +12.464 |
YD | +12.118 |
)", | +11.933 |
Neg logit contributions | |
ILCS | -14.457 |
Filipino | -14.305 |
Manila | -14.076 |
Hiroshima | -14.062 |
boiler | -13.924 |
Token | Baylor |
Token ID | 28245 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
Rhod | +17.959 |
crop | +16.101 |
)", | +15.682 |
� | +15.669 |
Tate | +15.197 |
Neg logit contributions | |
ILCS | -14.412 |
Filipino | -13.113 |
Hiroshima | -12.840 |
chant | -12.799 |
boiler | -12.670 |
Token | beat |
Token ID | 4405 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
Rhod | +8.647 |
� | +7.736 |
)", | +7.647 |
recapt | +7.560 |
crop | +7.481 |
Neg logit contributions | |
ILCS | -9.607 |
chant | -8.806 |
endo | -8.679 |
Hiroshima | -8.609 |
Filipino | -8.581 |
Token | this |
Token ID | 428 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Rhod | +14.253 |
� | +12.688 |
crop | +12.132 |
)", | +12.018 |
Cycl | +11.665 |
Neg logit contributions | |
ILCS | -13.736 |
chant | -13.113 |
wang | -12.851 |
Japanese | -12.758 |
endo | -12.670 |
Token | style |
Token ID | 3918 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
Rhod | +10.946 |
� | +9.667 |
crop | +9.575 |
)", | +9.142 |
graded | +8.841 |
Neg logit contributions | |
ILCS | -10.859 |
endo | -9.834 |
chant | -9.761 |
wang | -9.730 |
Filipino | -9.606 |
Token | of |
Token ID | 286 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Rhod | +5.476 |
� | +5.048 |
crop | +4.753 |
)", | +4.529 |
recapt | +4.242 |
Neg logit contributions | |
ILCS | -7.716 |
Filipino | -7.008 |
Hiroshima | -6.952 |
Anaheim | -6.879 |
wang | -6.851 |
Token | for |
Token ID | 329 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
Rhod | +10.280 |
� | +9.318 |
crop | +8.655 |
)", | +8.573 |
recapt | +8.555 |
Neg logit contributions | |
ILCS | -13.597 |
chant | -12.458 |
Filipino | -12.110 |
wang | -11.989 |
Japanese | -11.945 |
Token | Round |
Token ID | 10485 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
Rhod | +17.552 |
� | +15.747 |
crop | +15.539 |
recapt | +15.377 |
Tate | +15.304 |
Neg logit contributions | |
ILCS | -17.208 |
chant | -15.529 |
wang | -15.396 |
Japanese | -15.213 |
quist | -14.819 |
Token | 2 |
Token ID | 362 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Rhod | +7.834 |
� | +7.252 |
crop | +6.872 |
)", | +6.604 |
faces | +5.868 |
Neg logit contributions | |
ILCS | -9.080 |
chant | -8.192 |
Filipino | -8.182 |
boiler | -8.017 |
Hiroshima | -7.997 |
Token | , |
Token ID | 11 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
Rhod | +9.251 |
� | +8.537 |
crop | +8.185 |
)", | +7.798 |
grading | +7.539 |
Neg logit contributions | |
ILCS | -13.192 |
Filipino | -12.481 |
chant | -12.232 |
Hiroshima | -12.164 |
wang | -12.151 |
Token | as |
Token ID | 355 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Rhod | +8.049 |
� | +7.277 |
)", | +6.975 |
crop | +6.892 |
graded | +6.550 |
Neg logit contributions | |
ILCS | -8.648 |
chant | -8.036 |
Filipino | -8.026 |
endo | -7.978 |
wang | -7.925 |
Token | the |
Token ID | 262 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
Rhod | +14.116 |
� | +12.436 |
crop | +12.006 |
)", | +11.938 |
graded | +11.561 |
Neg logit contributions | |
ILCS | -12.792 |
chant | -12.178 |
quist | -11.732 |
Filipino | -11.658 |
ushi | -11.596 |
Token | Soon |
Token ID | 15894 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
Rhod | +16.763 |
Buc | +15.168 |
Cycl | +14.874 |
� | +14.739 |
)", | +13.996 |
Neg logit contributions | |
ILCS | -15.997 |
chant | -15.644 |
endo | -15.414 |
wang | -14.789 |
eno | -14.516 |
Token | ers |
Token ID | 364 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
Rhod | +0.144 |
� | +0.137 |
)", | +0.133 |
crop | +0.132 |
faces | +0.118 |
Neg logit contributions | |
ILCS | -0.101 |
Hiroshima | -0.096 |
Anaheim | -0.094 |
Filipino | -0.094 |
Huntington | -0.091 |
Token | re |
Token ID | 302 |
Feature activation | -6.81e-01 |
Pos logit contributions | |
Rhod | +7.647 |
� | +6.878 |
recapt | +6.711 |
)", | +6.693 |
crop | +6.443 |
Neg logit contributions | |
ILCS | -10.668 |
Filipino | -9.523 |
chant | -9.519 |
endo | -9.400 |
Hiroshima | -9.369 |
Token | - |
Token ID | 12 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Rhod | +6.648 |
� | +6.565 |
crop | +6.520 |
)", | +6.141 |
faces | +5.623 |
Neg logit contributions | |
ILCS | -7.604 |
Filipino | -7.055 |
Hiroshima | -6.906 |
Manila | -6.759 |
Huntington | -6.749 |
Token | em |
Token ID | 368 |
Feature activation | +2.22e-02 |
Pos logit contributions | |
crop | +11.655 |
� | +10.791 |
Rhod | +10.484 |
)", | +10.301 |
faces | +10.233 |
Neg logit contributions | |
ILCS | -10.061 |
Filipino | -9.042 |
Ballard | -8.657 |
Hiroshima | -8.625 |
Manila | -8.578 |
Token | extremely |
Token ID | 4457 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
Rhod | +8.817 |
� | +8.339 |
crop | +7.787 |
)", | +7.666 |
recapt | +7.476 |
Neg logit contributions | |
ILCS | -9.820 |
Hiroshima | -8.744 |
chant | -8.694 |
Filipino | -8.626 |
endo | -8.528 |
Token | successful |
Token ID | 4388 |
Feature activation | -7.74e-01 |
Pos logit contributions | |
Rhod | +5.775 |
� | +5.362 |
)", | +5.056 |
crop | +4.945 |
graded | +4.612 |
Neg logit contributions | |
ILCS | -7.774 |
Hiroshima | -7.313 |
chant | -7.134 |
Anaheim | -7.091 |
endo | -7.059 |
Token | in |
Token ID | 287 |
Feature activation | -6.97e-01 |
Pos logit contributions | |
Rhod | +7.057 |
� | +6.596 |
crop | +6.135 |
recapt | +6.057 |
)", | +5.880 |
Neg logit contributions | |
ILCS | -8.992 |
Hiroshima | -8.399 |
Filipino | -8.286 |
endo | -8.166 |
wang | -8.018 |
Token | similar |
Token ID | 2092 |
Feature activation | -9.66e-01 |
Pos logit contributions | |
Rhod | +7.130 |
� | +6.605 |
crop | +6.301 |
recapt | +6.174 |
)", | +6.159 |
Neg logit contributions | |
ILCS | -7.728 |
Hiroshima | -6.929 |
endo | -6.826 |
Filipino | -6.777 |
chant | -6.744 |
Token | situations |
Token ID | 7445 |
Feature activation | -6.24e-01 |
Pos logit contributions | |
Rhod | +7.150 |
� | +6.771 |
crop | +6.176 |
)", | +5.977 |
recapt | +5.710 |
Neg logit contributions | |
ILCS | -12.132 |
Hiroshima | -11.515 |
wang | -11.103 |
chant | -11.079 |
Filipino | -11.076 |
Token | at |
Token ID | 379 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Rhod | +5.790 |
� | +5.517 |
crop | +5.026 |
)", | +4.825 |
recapt | +4.674 |
Neg logit contributions | |
ILCS | -7.376 |
Filipino | -6.891 |
Hiroshima | -6.869 |
endo | -6.726 |
Anaheim | -6.665 |
Token | Ole |
Token ID | 30093 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
Rhod | +17.999 |
� | +16.310 |
Ole | +15.488 |
Tate | +15.109 |
recapt | +15.089 |
Neg logit contributions | |
ILCS | -14.706 |
chant | -13.638 |
Japanese | -13.572 |
quist | -13.438 |
wang | -13.370 |
Token | Miss |
Token ID | 4544 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
Rhod | +4.333 |
� | +3.857 |
crop | +3.593 |
)", | +3.589 |
YD | +2.523 |
Neg logit contributions | |
ILCS | -12.850 |
Hiroshima | -12.303 |
Filipino | -12.253 |
chant | -12.228 |
endo | -12.167 |
Token | . |
Token ID | 13 |
Feature activation | -8.79e-01 |
Pos logit contributions | |
Rhod | +8.388 |
� | +8.231 |
crop | +7.417 |
)", | +6.682 |
grading | +6.561 |
Neg logit contributions | |
ILCS | -12.097 |
Filipino | -11.634 |
Hiroshima | -11.313 |
endo | -11.134 |
wang | -11.077 |
Token |
|
Token ID | 198 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
Rhod | +8.744 |
� | +8.045 |
crop | +7.389 |
)", | +7.326 |
Cycl | +6.716 |
Neg logit contributions | |
ILCS | -9.208 |
chant | -8.608 |
boiler | -8.576 |
endo | -8.529 |
ushi | -8.478 |
Token |
|
Token ID | 198 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
Rhod | +2.705 |
� | +2.562 |
)", | +2.465 |
crop | +2.455 |
faces | +2.112 |
Neg logit contributions | |
ILCS | -3.196 |
Hiroshima | -3.020 |
Filipino | -2.965 |
Anaheim | -2.949 |
Huntington | -2.893 |
Token | ving |
Token ID | 1075 |
Feature activation | -8.62e-01 |
Pos logit contributions | |
Rhod | +2.580 |
� | +2.485 |
crop | +2.360 |
)", | +2.345 |
faces | +2.123 |
Neg logit contributions | |
ILCS | -1.950 |
Hiroshima | -1.871 |
Anaheim | -1.835 |
Filipino | -1.830 |
Huntington | -1.775 |
Token | the |
Token ID | 262 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
Rhod | +7.905 |
� | +6.963 |
crop | +6.781 |
)", | +6.656 |
graded | +6.131 |
Neg logit contributions | |
ILCS | -9.789 |
Hiroshima | -9.092 |
chant | -9.072 |
Filipino | -8.979 |
endo | -8.882 |
Token | flats |
Token ID | 38157 |
Feature activation | -7.64e-01 |
Pos logit contributions | |
Rhod | +10.920 |
� | +9.511 |
perimeter | +9.271 |
crop | +9.205 |
)", | +9.166 |
Neg logit contributions | |
ILCS | -12.839 |
chant | -12.174 |
ushi | -12.100 |
Hiroshima | -12.040 |
endo | -11.956 |
Token | : |
Token ID | 25 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Rhod | +6.866 |
� | +6.378 |
crop | +6.077 |
)", | +5.788 |
graded | +5.548 |
Neg logit contributions | |
ILCS | -8.722 |
Hiroshima | -8.396 |
Filipino | -8.370 |
Anaheim | -8.239 |
Huntington | -8.094 |
Token |
|
Token ID | 198 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
Rhod | +12.619 |
crop | +11.395 |
� | +11.372 |
)", | +10.325 |
graded | +10.070 |
Neg logit contributions | |
ILCS | -13.748 |
Hiroshima | -12.695 |
Filipino | -12.642 |
endo | -12.465 |
ushi | -12.383 |
Token |
|
Token ID | 198 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Rhod | +4.652 |
� | +4.405 |
crop | +4.259 |
)", | +4.223 |
faces | +3.616 |
Neg logit contributions | |
ILCS | -6.856 |
Hiroshima | -6.358 |
Filipino | -6.262 |
boiler | -6.229 |
Anaheim | -6.183 |
Token | This |
Token ID | 1212 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
crop | +14.889 |
� | +14.645 |
YD | +13.989 |
Rhod | +13.642 |
)", | +13.514 |
Neg logit contributions | |
ILCS | -17.106 |
Hiroshima | -16.585 |
Filipino | -16.256 |
Manila | -16.198 |
boiler | -16.135 |
Token | has |
Token ID | 468 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
Rhod | +13.610 |
� | +12.185 |
grading | +11.896 |
graded | +11.867 |
crop | +11.837 |
Neg logit contributions | |
ILCS | -15.402 |
endo | -13.735 |
wang | -13.202 |
ickets | -13.109 |
Hiroshima | -12.913 |
Token | proven |
Token ID | 9157 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
Rhod | +5.437 |
� | +5.039 |
)", | +4.749 |
crop | +4.663 |
graded | +4.450 |
Neg logit contributions | |
ILCS | -6.497 |
Hiroshima | -5.928 |
Filipino | -5.878 |
endo | -5.870 |
chant | -5.860 |
Token | vex |
Token ID | 41548 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
Rhod | +4.458 |
� | +4.172 |
crop | +3.971 |
)", | +3.958 |
recapt | +3.537 |
Neg logit contributions | |
ILCS | -5.185 |
Hiroshima | -4.787 |
Filipino | -4.707 |
Anaheim | -4.663 |
endo | -4.638 |
Token | ing |
Token ID | 278 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Rhod | +5.634 |
� | +5.216 |
crop | +5.123 |
)", | +5.003 |
recapt | +4.438 |
Neg logit contributions | |
ILCS | -4.626 |
Hiroshima | -4.420 |
Filipino | -4.337 |
Anaheim | -4.314 |
Huntington | -4.167 |
Token | These |
Token ID | 2312 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
Rhod | +12.491 |
� | +10.539 |
crop | +9.959 |
)", | +9.815 |
Cycl | +9.622 |
Neg logit contributions | |
ILCS | -12.526 |
chant | -12.217 |
boiler | -11.933 |
ushi | -11.911 |
wang | -11.880 |
Token | two |
Token ID | 734 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
Rhod | +11.110 |
� | +9.747 |
)", | +9.504 |
graded | +9.323 |
crop | +8.993 |
Neg logit contributions | |
ILCS | -13.393 |
endo | -12.905 |
chant | -12.792 |
Hiroshima | -12.652 |
ushi | -12.327 |
Token | lead |
Token ID | 1085 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
Rhod | +9.421 |
� | +8.303 |
)", | +8.168 |
graded | +7.887 |
crop | +7.769 |
Neg logit contributions | |
ILCS | -10.450 |
chant | -10.028 |
Hiroshima | -9.922 |
endo | -9.867 |
ushi | -9.688 |
Token | the |
Token ID | 262 |
Feature activation | -1.88e+00 |
Pos logit contributions | |
Rhod | +11.731 |
� | +10.580 |
crop | +10.272 |
)", | +9.650 |
graded | +9.393 |
Neg logit contributions | |
ILCS | -12.785 |
Hiroshima | -11.350 |
chant | -11.224 |
wang | -11.190 |
Filipino | -11.168 |
Token | team |
Token ID | 1074 |
Feature activation | -8.02e-01 |
Pos logit contributions | |
Rhod | +15.704 |
Buc | +13.380 |
Cycl | +13.337 |
perimeter | +13.262 |
� | +13.187 |
Neg logit contributions | |
ILCS | -16.227 |
wang | -15.975 |
chant | -15.798 |
endo | -15.184 |
ushi | -15.019 |
Token | in |
Token ID | 287 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
Rhod | +7.424 |
� | +6.371 |
crop | +6.228 |
)", | +6.177 |
graded | +5.910 |
Neg logit contributions | |
ILCS | -9.556 |
chant | -8.596 |
Hiroshima | -8.580 |
Filipino | -8.567 |
wang | -8.510 |
Token | tackles |
Token ID | 18034 |
Feature activation | -9.39e-01 |
Pos logit contributions | |
Rhod | +15.900 |
sack | +15.095 |
graded | +14.992 |
recapt | +14.623 |
grading | +14.610 |
Neg logit contributions | |
ILCS | -16.368 |
endo | -15.406 |
ushi | -14.924 |
chant | -14.908 |
wang | -14.706 |
Token | at |
Token ID | 379 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Rhod | +8.490 |
� | +7.565 |
graded | +7.071 |
crop | +7.066 |
recapt | +6.844 |
Neg logit contributions | |
ILCS | -10.950 |
Filipino | -9.858 |
Hiroshima | -9.848 |
endo | -9.777 |
ushi | -9.720 |
Token | 61 |
Token ID | 8454 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Rhod | +15.358 |
graded | +13.499 |
)", | +13.375 |
� | +13.064 |
recapt | +13.029 |
Neg logit contributions | |
ILCS | -15.407 |
ushi | -13.766 |
endo | -13.705 |
chant | -13.501 |
quist | -13.457 |
Token | and |
Token ID | 290 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
Rhod | +10.811 |
� | +10.215 |
graded | +9.504 |
crop | +9.484 |
grading | +9.161 |
Neg logit contributions | |
ILCS | -15.114 |
ushi | -14.598 |
Hiroshima | -14.516 |
Filipino | -14.365 |
Manila | -14.299 |
Token | 60 |
Token ID | 3126 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Rhod | +12.677 |
graded | +10.922 |
� | +10.798 |
)", | +10.599 |
recapt | +10.344 |
Neg logit contributions | |
ILCS | -13.183 |
chant | -11.855 |
ushi | -11.851 |
Hiroshima | -11.704 |
Filipino | -11.483 |
Token | dé |
Token ID | 39073 |
Feature activation | -8.75e-01 |
Pos logit contributions | |
Rhod | +15.546 |
� | +15.282 |
)", | +14.519 |
crop | +13.831 |
recapt | +13.456 |
Neg logit contributions | |
ILCS | -12.923 |
Anaheim | -12.164 |
Huntington | -12.061 |
Hiroshima | -12.055 |
Filipino | -11.916 |
Token | ser |
Token ID | 2655 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
Rhod | +9.501 |
� | +9.375 |
crop | +9.123 |
)", | +8.896 |
faces | +8.279 |
Neg logit contributions | |
ILCS | -8.066 |
Huntington | -7.666 |
Hiroshima | -7.645 |
Filipino | -7.579 |
Anaheim | -7.454 |
Token | te |
Token ID | 660 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
� | +6.729 |
Rhod | +6.673 |
)", | +6.295 |
crop | +6.156 |
faces | +5.744 |
Neg logit contributions | |
ILCS | -7.424 |
Hiroshima | -6.993 |
Huntington | -6.944 |
Filipino | -6.892 |
Anaheim | -6.885 |
Token | ur |
Token ID | 333 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
� | +14.139 |
Rhod | +13.758 |
)", | +12.880 |
crop | +12.788 |
recapt | +11.853 |
Neg logit contributions | |
ILCS | -11.818 |
Huntington | -11.179 |
Anaheim | -10.953 |
Hiroshima | -10.826 |
Filipino | -10.628 |
Token | du |
Token ID | 7043 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Rhod | +15.015 |
� | +14.841 |
)", | +14.175 |
crop | +13.336 |
tire | +13.078 |
Neg logit contributions | |
ILCS | -13.014 |
Huntington | -12.486 |
Anaheim | -12.200 |
Hiroshima | -12.134 |
Filipino | -12.051 |
Token | programme |
Token ID | 11383 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
Rhod | +11.491 |
� | +11.054 |
)", | +10.767 |
crop | +10.481 |
recapt | +9.966 |
Neg logit contributions | |
ILCS | -10.008 |
Hiroshima | -9.230 |
Japanese | -8.949 |
Anaheim | -8.909 |
Filipino | -8.886 |
Token | C |
Token ID | 327 |
Feature activation | -5.13e-01 |
Pos logit contributions | |
Rhod | +17.549 |
)", | +17.184 |
� | +16.758 |
Cycl | +15.903 |
crop | +15.850 |
Neg logit contributions | |
ILCS | -13.627 |
Japanese | -12.687 |
wang | -12.457 |
Huntington | -12.438 |
ushi | -12.385 |
Token | . |
Token ID | 13 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
Rhod | +4.602 |
� | +4.455 |
)", | +4.235 |
crop | +4.108 |
YD | +3.614 |
Neg logit contributions | |
ILCS | -6.030 |
Hiroshima | -5.965 |
Filipino | -5.820 |
Anaheim | -5.793 |
Huntington | -5.741 |
Token | O |
Token ID | 46 |
Feature activation | -5.20e-01 |
Pos logit contributions | |
Rhod | +4.126 |
� | +3.824 |
)", | +3.774 |
crop | +3.653 |
YD | +3.156 |
Neg logit contributions | |
ILCS | -5.394 |
Hiroshima | -5.231 |
Filipino | -5.073 |
Anaheim | -5.069 |
chant | -5.043 |
Token | . |
Token ID | 13 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
Rhod | +4.723 |
� | +4.408 |
)", | +4.230 |
crop | +4.124 |
YD | +3.530 |
Neg logit contributions | |
ILCS | -6.326 |
Hiroshima | -6.127 |
Anaheim | -6.002 |
Filipino | -5.932 |
boiler | -5.923 |
Token | R |
Token ID | 49 |
Feature activation | -5.81e-01 |
Pos logit contributions | |
Rhod | +4.674 |
� | +4.284 |
)", | +4.094 |
crop | +3.965 |
YD | +3.465 |
Neg logit contributions | |
ILCS | -6.116 |
Hiroshima | -5.899 |
Anaheim | -5.751 |
Filipino | -5.684 |
boiler | -5.646 |
Token | -- |
Token ID | 1377 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
Rhod | +9.349 |
� | +8.597 |
crop | +8.199 |
graded | +7.697 |
grading | +7.675 |
Neg logit contributions | |
ILCS | -13.080 |
Filipino | -12.246 |
Hiroshima | -12.244 |
wang | -12.059 |
chant | -11.941 |
Token | the |
Token ID | 262 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
Rhod | +8.946 |
� | +8.264 |
crop | +7.745 |
)", | +7.689 |
recapt | +7.445 |
Neg logit contributions | |
ILCS | -9.228 |
Filipino | -8.481 |
endo | -8.395 |
chant | -8.378 |
wang | -8.350 |
Token | fourth |
Token ID | 5544 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
Rhod | +16.396 |
Buc | +14.794 |
� | +14.534 |
Cycl | +14.191 |
recapt | +14.005 |
Neg logit contributions | |
ILCS | -15.999 |
endo | -15.053 |
chant | -14.567 |
wang | -14.560 |
eno | -14.222 |
Token | - |
Token ID | 12 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
Rhod | +14.843 |
� | +13.422 |
recapt | +12.381 |
graded | +12.095 |
crop | +12.033 |
Neg logit contributions | |
ILCS | -17.323 |
endo | -16.440 |
chant | -15.478 |
roxy | -15.417 |
wang | -15.303 |
Token | low |
Token ID | 9319 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Rhod | +7.323 |
� | +7.252 |
crop | +7.207 |
)", | +6.620 |
faces | +6.211 |
Neg logit contributions | |
ILCS | -8.925 |
Hiroshima | -8.224 |
Filipino | -8.105 |
Anaheim | -7.991 |
Manila | -7.983 |
Token | est |
Token ID | 395 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
Rhod | +7.139 |
� | +6.759 |
crop | +6.167 |
)", | +5.948 |
graded | +5.895 |
Neg logit contributions | |
ILCS | -13.229 |
Hiroshima | -13.069 |
Filipino | -12.829 |
Anaheim | -12.689 |
Huntington | -12.522 |
Token | yards |
Token ID | 5695 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
Rhod | +15.773 |
graded | +15.586 |
sack | +15.071 |
grading | +14.959 |
recapt | +14.459 |
Neg logit contributions | |
ILCS | -15.604 |
chant | -15.508 |
wang | -15.284 |
quist | -15.001 |
endo | -14.922 |
Token | - |
Token ID | 12 |
Feature activation | -7.43e-01 |
Pos logit contributions | |
Rhod | +6.427 |
� | +5.969 |
)", | +5.698 |
crop | +5.629 |
graded | +5.369 |
Neg logit contributions | |
ILCS | -7.641 |
Hiroshima | -7.112 |
endo | -7.088 |
Filipino | -7.084 |
chant | -7.016 |
Token | per |
Token ID | 525 |
Feature activation | -7.60e-01 |
Pos logit contributions | |
Rhod | +7.497 |
� | +7.295 |
crop | +7.179 |
)", | +6.862 |
faces | +6.470 |
Neg logit contributions | |
ILCS | -7.958 |
Filipino | -7.367 |
Hiroshima | -7.225 |
Huntington | -7.089 |
Manila | -7.083 |
Token | - |
Token ID | 12 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
Rhod | +6.830 |
� | +6.560 |
crop | +6.214 |
)", | +6.195 |
recapt | +5.729 |
Neg logit contributions | |
ILCS | -8.784 |
Filipino | -8.308 |
Hiroshima | -8.300 |
Huntington | -8.156 |
Anaheim | -8.080 |
Token | play |
Token ID | 1759 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
crop | +9.951 |
� | +9.916 |
Rhod | +9.292 |
faces | +8.907 |
recapt | +8.753 |
Neg logit contributions | |
ILCS | -12.576 |
Filipino | -11.615 |
Huntington | -11.458 |
Hiroshima | -11.408 |
Anaheim | -11.011 |
Token |
|
Token ID | 198 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
Rhod | +1.308 |
� | +1.232 |
)", | +1.196 |
crop | +1.181 |
faces | +1.026 |
Neg logit contributions | |
ILCS | -1.403 |
Hiroshima | -1.325 |
Filipino | -1.303 |
Anaheim | -1.301 |
Huntington | -1.271 |
Token | Ice |
Token ID | 23709 |
Feature activation | -5.38e-01 |
Pos logit contributions | |
ILCS | +3.022 |
Hiroshima | +2.906 |
Anaheim | +2.884 |
Filipino | +2.872 |
chant | +2.796 |
Neg logit contributions | |
Rhod | -2.930 |
� | -2.713 |
)", | -2.628 |
crop | -2.570 |
recapt | -2.266 |
Token | Fields |
Token ID | 23948 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
Rhod | +4.437 |
� | +4.214 |
crop | +4.084 |
)", | +3.926 |
faces | +3.506 |
Neg logit contributions | |
ILCS | -6.949 |
Hiroshima | -6.611 |
Filipino | -6.525 |
Anaheim | -6.419 |
Huntington | -6.413 |
Token | was |
Token ID | 373 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Rhod | +0.190 |
� | +0.178 |
)", | +0.171 |
crop | +0.169 |
recapt | +0.150 |
Neg logit contributions | |
ILCS | -0.195 |
Hiroshima | -0.184 |
Filipino | -0.183 |
Anaheim | -0.182 |
Huntington | -0.178 |
Token | one |
Token ID | 530 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
ILCS | +2.151 |
Hiroshima | +2.075 |
Anaheim | +2.062 |
Filipino | +2.051 |
Huntington | +2.000 |
Neg logit contributions | |
Rhod | -1.834 |
� | -1.716 |
)", | -1.657 |
crop | -1.627 |
faces | -1.402 |
Token | of |
Token ID | 286 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ILCS | +3.575 |
Hiroshima | +3.435 |
Anaheim | +3.421 |
Filipino | +3.384 |
Huntington | +3.304 |
Neg logit contributions | |
Rhod | -3.940 |
� | -3.723 |
)", | -3.635 |
crop | -3.542 |
faces | -3.138 |
Token | the |
Token ID | 262 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
Anaheim | +11.206 |
Hiroshima | +10.897 |
ILCS | +10.879 |
Ballard | +10.833 |
Filipino | +10.714 |
Neg logit contributions | |
� | -12.195 |
Rhod | -12.098 |
)", | -11.897 |
crop | -11.585 |
faces | -10.011 |
Token | maps |
Token ID | 8739 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
ILCS | +7.824 |
Anaheim | +7.737 |
Hiroshima | +7.710 |
Filipino | +7.654 |
Huntington | +7.432 |
Neg logit contributions | |
Rhod | -7.452 |
� | -7.155 |
)", | -6.972 |
crop | -6.874 |
YD | -5.788 |
Token | exclusive |
Token ID | 8568 |
Feature activation | -2.80e-01 |
Pos logit contributions | |
ILCS | +4.789 |
Anaheim | +4.719 |
Hiroshima | +4.713 |
Filipino | +4.665 |
Huntington | +4.550 |
Neg logit contributions | |
Rhod | -4.285 |
� | -4.087 |
)", | -3.962 |
crop | -3.903 |
faces | -3.292 |
Token | to |
Token ID | 284 |
Feature activation | +5.39e-01 |
Pos logit contributions | |
Rhod | +2.963 |
� | +2.727 |
)", | +2.634 |
crop | +2.626 |
recapt | +2.355 |
Neg logit contributions | |
ILCS | -3.170 |
Hiroshima | -2.967 |
Filipino | -2.922 |
Anaheim | -2.891 |
chant | -2.888 |
Token | Halo |
Token ID | 18597 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
ILCS | +4.574 |
Hiroshima | +4.449 |
Anaheim | +4.441 |
Filipino | +4.412 |
Huntington | +4.275 |
Neg logit contributions | |
Rhod | -6.840 |
� | -6.638 |
)", | -6.428 |
crop | -6.292 |
faces | -5.697 |
Token | around |
Token ID | 1088 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
ILCS | +0.229 |
Hiroshima | +0.218 |
Anaheim | +0.216 |
Filipino | +0.216 |
Huntington | +0.211 |
Neg logit contributions | |
Rhod | -0.219 |
� | -0.207 |
)", | -0.199 |
crop | -0.195 |
recapt | -0.171 |
Token | 23 |
Token ID | 2242 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
ILCS | +7.178 |
Hiroshima | +7.173 |
Anaheim | +7.063 |
Filipino | +7.040 |
Manila | +6.837 |
Neg logit contributions | |
Rhod | -7.703 |
� | -7.210 |
)", | -7.170 |
crop | -7.041 |
faces | -6.311 |
Token | : |
Token ID | 25 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
ILCS | +5.140 |
Hiroshima | +4.936 |
Anaheim | +4.866 |
Filipino | +4.865 |
Huntington | +4.734 |
Neg logit contributions | |
Rhod | -5.900 |
� | -5.491 |
)", | -5.335 |
crop | -5.323 |
faces | -4.730 |
Token | 30 |
Token ID | 1270 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
ILCS | +4.511 |
Hiroshima | +4.289 |
Filipino | +4.238 |
Anaheim | +4.237 |
Manila | +4.029 |
Neg logit contributions | |
Rhod | -8.348 |
� | -7.883 |
)", | -7.738 |
crop | -7.688 |
recapt | -7.009 |
Token | on |
Token ID | 319 |
Feature activation | +1.29e-01 |
Pos logit contributions | |
ILCS | +3.000 |
Hiroshima | +2.882 |
Anaheim | +2.843 |
Filipino | +2.842 |
Huntington | +2.747 |
Neg logit contributions | |
Rhod | -3.266 |
� | -3.039 |
)", | -2.972 |
crop | -2.931 |
faces | -2.587 |
Token | Thursday |
Token ID | 3635 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ILCS | +1.486 |
Hiroshima | +1.428 |
Anaheim | +1.416 |
Filipino | +1.411 |
Huntington | +1.376 |
Neg logit contributions | |
Rhod | -1.338 |
� | -1.251 |
)", | -1.209 |
crop | -1.188 |
recapt | -1.032 |
Token | , |
Token ID | 11 |
Feature activation | +6.78e-01 |
Pos logit contributions | |
ILCS | +10.796 |
Anaheim | +10.616 |
Hiroshima | +10.505 |
Filipino | +10.196 |
Manila | +10.105 |
Neg logit contributions | |
Rhod | -13.211 |
crop | -12.267 |
)", | -12.196 |
� | -11.814 |
faces | -10.814 |
Token | March |
Token ID | 2805 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
ILCS | +6.270 |
Hiroshima | +6.262 |
Anaheim | +6.254 |
Filipino | +6.190 |
Manila | +6.003 |
Neg logit contributions | |
Rhod | -7.759 |
� | -7.290 |
)", | -7.226 |
crop | -7.169 |
faces | -6.402 |
Token | 24 |
Token ID | 1987 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
ILCS | +2.436 |
Hiroshima | +2.341 |
Anaheim | +2.327 |
Filipino | +2.317 |
Huntington | +2.236 |
Neg logit contributions | |
Rhod | -3.420 |
� | -3.249 |
)", | -3.163 |
crop | -3.135 |
recapt | -2.807 |
Token | th |
Token ID | 400 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
ILCS | +8.733 |
Hiroshima | +8.464 |
Anaheim | +8.381 |
Filipino | +8.205 |
Manila | +7.915 |
Neg logit contributions | |
Rhod | -12.284 |
)", | -11.326 |
� | -11.101 |
crop | -10.886 |
recapt | -9.807 |
Token | . |
Token ID | 13 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
ILCS | +9.276 |
Anaheim | +9.147 |
Hiroshima | +9.095 |
Filipino | +8.765 |
Manila | +8.591 |
Neg logit contributions | |
Rhod | -12.164 |
)", | -11.161 |
� | -11.007 |
crop | -10.999 |
faces | -9.703 |
Token | for |
Token ID | 329 |
Feature activation | +5.35e-02 |
Pos logit contributions | |
Rhod | +0.006 |
� | +0.006 |
)", | +0.006 |
crop | +0.006 |
recapt | +0.005 |
Neg logit contributions | |
ILCS | -0.006 |
Hiroshima | -0.006 |
Anaheim | -0.006 |
Filipino | -0.006 |
Huntington | -0.006 |
Token | power |
Token ID | 1176 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
ILCS | +0.623 |
Hiroshima | +0.596 |
Anaheim | +0.590 |
Filipino | +0.589 |
Huntington | +0.574 |
Neg logit contributions | |
Rhod | -0.550 |
� | -0.515 |
)", | -0.496 |
crop | -0.485 |
recapt | -0.425 |
Token | and |
Token ID | 290 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
Rhod | +1.294 |
� | +1.231 |
)", | +1.176 |
crop | +1.157 |
recapt | +1.023 |
Neg logit contributions | |
ILCS | -1.357 |
Hiroshima | -1.307 |
Filipino | -1.295 |
Anaheim | -1.284 |
Huntington | -1.255 |
Token | position |
Token ID | 2292 |
Feature activation | -2.79e-01 |
Pos logit contributions | |
Rhod | +2.394 |
� | +2.231 |
)", | +2.143 |
crop | +2.080 |
recapt | +1.892 |
Neg logit contributions | |
ILCS | -2.891 |
Hiroshima | -2.785 |
Filipino | -2.731 |
Anaheim | -2.728 |
chant | -2.685 |
Token | , |
Token ID | 11 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
Rhod | +2.842 |
� | +2.745 |
)", | +2.525 |
crop | +2.504 |
recapt | +2.233 |
Neg logit contributions | |
ILCS | -3.193 |
Hiroshima | -3.066 |
Filipino | -3.035 |
Anaheim | -2.987 |
chant | -2.966 |
Token | as |
Token ID | 355 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
ILCS | +4.201 |
Hiroshima | +4.039 |
Anaheim | +4.029 |
Filipino | +3.988 |
Huntington | +3.899 |
Neg logit contributions | |
Rhod | -5.193 |
� | -4.890 |
)", | -4.840 |
crop | -4.757 |
faces | -4.205 |
Token | the |
Token ID | 262 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
ILCS | +11.256 |
Anaheim | +11.236 |
Hiroshima | +11.080 |
Huntington | +10.870 |
Ballard | +10.752 |
Neg logit contributions | |
Rhod | -10.069 |
� | -9.689 |
)", | -9.527 |
crop | -9.370 |
YD | -8.032 |
Token | city |
Token ID | 1748 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
ILCS | +5.860 |
Anaheim | +5.667 |
Hiroshima | +5.651 |
Filipino | +5.598 |
Huntington | +5.489 |
Neg logit contributions | |
Rhod | -5.046 |
� | -4.802 |
)", | -4.650 |
crop | -4.556 |
faces | -3.895 |
Token | hall |
Token ID | 6899 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
ILCS | +3.207 |
Hiroshima | +3.086 |
Anaheim | +3.074 |
Filipino | +3.047 |
Huntington | +2.976 |
Neg logit contributions | |
Rhod | -3.207 |
� | -3.001 |
)", | -2.947 |
crop | -2.891 |
recapt | -2.494 |
Token | is |
Token ID | 318 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
ILCS | +3.549 |
Hiroshima | +3.388 |
Anaheim | +3.384 |
Filipino | +3.353 |
Huntington | +3.262 |
Neg logit contributions | |
Rhod | -3.353 |
� | -3.119 |
)", | -3.068 |
crop | -3.006 |
faces | -2.579 |
Token | being |
Token ID | 852 |
Feature activation | +6.24e-02 |
Pos logit contributions | |
ILCS | +3.255 |
Hiroshima | +3.150 |
Anaheim | +3.136 |
Filipino | +3.115 |
Huntington | +3.041 |
Neg logit contributions | |
Rhod | -3.018 |
� | -2.813 |
)", | -2.744 |
crop | -2.702 |
faces | -2.352 |
Token | and |
Token ID | 290 |
Feature activation | +7.44e-01 |
Pos logit contributions | |
ILCS | +7.704 |
Hiroshima | +7.605 |
Anaheim | +7.463 |
Filipino | +7.245 |
Chinatown | +7.110 |
Neg logit contributions | |
Rhod | -9.226 |
)", | -8.765 |
� | -8.540 |
crop | -8.434 |
faces | -7.348 |
Token | Barcelona |
Token ID | 15142 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
Hiroshima | +7.653 |
Anaheim | +7.557 |
ILCS | +7.345 |
Filipino | +7.339 |
Manila | +7.332 |
Neg logit contributions | |
Rhod | -7.948 |
� | -7.516 |
)", | -7.366 |
crop | -7.317 |
YD | -6.431 |
Token | . |
Token ID | 13 |
Feature activation | -8.94e-02 |
Pos logit contributions | |
ILCS | +4.514 |
Hiroshima | +4.339 |
Anaheim | +4.309 |
Filipino | +4.234 |
Huntington | +4.147 |
Neg logit contributions | |
Rhod | -5.165 |
)", | -4.804 |
� | -4.775 |
crop | -4.664 |
faces | -4.085 |
Token | It |
Token ID | 632 |
Feature activation | -4.51e-02 |
Pos logit contributions | |
Rhod | +1.010 |
� | +0.950 |
)", | +0.908 |
crop | +0.899 |
recapt | +0.790 |
Neg logit contributions | |
ILCS | -0.952 |
Hiroshima | -0.896 |
Anaheim | -0.885 |
Filipino | -0.884 |
endo | -0.865 |
Token | took |
Token ID | 1718 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Rhod | +0.477 |
� | +0.454 |
)", | +0.431 |
crop | +0.427 |
recapt | +0.379 |
Neg logit contributions | |
ILCS | -0.511 |
Hiroshima | -0.485 |
Filipino | -0.482 |
Anaheim | -0.479 |
Huntington | -0.466 |
Token | centuries |
Token ID | 10675 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
Rhod | +4.696 |
� | +4.462 |
)", | +4.207 |
crop | +4.124 |
recapt | +3.702 |
Neg logit contributions | |
ILCS | -5.898 |
Hiroshima | -5.377 |
Anaheim | -5.294 |
Filipino | -5.279 |
chant | -5.244 |
Token | for |
Token ID | 329 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
ILCS | +10.639 |
Hiroshima | +10.502 |
Filipino | +10.409 |
Anaheim | +10.165 |
chant | +9.885 |
Neg logit contributions | |
Rhod | -15.006 |
)", | -14.286 |
crop | -13.671 |
� | -13.349 |
faces | -12.122 |
Token | Bangkok |
Token ID | 35007 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
ILCS | +3.066 |
Hiroshima | +2.991 |
Anaheim | +2.965 |
Filipino | +2.965 |
Huntington | +2.890 |
Neg logit contributions | |
Rhod | -2.905 |
� | -2.729 |
)", | -2.651 |
crop | -2.590 |
faces | -2.250 |
Token | to |
Token ID | 284 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
ILCS | +1.710 |
Hiroshima | +1.636 |
Anaheim | +1.621 |
Filipino | +1.617 |
Huntington | +1.571 |
Neg logit contributions | |
Rhod | -1.859 |
� | -1.748 |
)", | -1.698 |
crop | -1.670 |
recapt | -1.470 |
Token | develop |
Token ID | 1205 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
Hiroshima | +6.098 |
ILCS | +6.056 |
Filipino | +5.997 |
Anaheim | +5.990 |
Huntington | +5.868 |
Neg logit contributions | |
Rhod | -6.282 |
� | -5.781 |
)", | -5.609 |
crop | -5.492 |
YD | -4.844 |
Token | its |
Token ID | 663 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
ILCS | +2.127 |
Hiroshima | +2.054 |
Anaheim | +2.038 |
Filipino | +2.037 |
Huntington | +1.983 |
Neg logit contributions | |
Rhod | -1.994 |
� | -1.861 |
)", | -1.813 |
crop | -1.769 |
faces | -1.540 |
Token | different |
Token ID | 1180 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
ILCS | +2.252 |
Hiroshima | +2.172 |
Filipino | +2.164 |
Anaheim | +2.157 |
Huntington | +2.106 |
Neg logit contributions | |
Rhod | -2.212 |
� | -2.088 |
)", | -2.009 |
crop | -1.982 |
faces | -1.735 |
Token | from |
Token ID | 422 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
ILCS | +2.683 |
Hiroshima | +2.587 |
Anaheim | +2.561 |
Filipino | +2.551 |
Huntington | +2.480 |
Neg logit contributions | |
Rhod | -3.074 |
� | -2.900 |
)", | -2.814 |
crop | -2.780 |
faces | -2.451 |
Token | what |
Token ID | 644 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
Hiroshima | +11.348 |
Anaheim | +11.088 |
Filipino | +10.808 |
Manila | +10.624 |
Huntington | +10.423 |
Neg logit contributions | |
Rhod | -10.598 |
� | -10.285 |
crop | -10.253 |
)", | -10.209 |
faces | -8.818 |
Token | it |
Token ID | 340 |
Feature activation | -5.23e-02 |
Pos logit contributions | |
Hiroshima | +8.712 |
Anaheim | +8.524 |
Filipino | +8.442 |
Manila | +8.223 |
ILCS | +8.167 |
Neg logit contributions | |
Rhod | -8.282 |
� | -7.941 |
crop | -7.924 |
)", | -7.862 |
faces | -6.693 |
Token | was |
Token ID | 373 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
Rhod | +0.515 |
� | +0.482 |
)", | +0.459 |
crop | +0.449 |
recapt | +0.396 |
Neg logit contributions | |
ILCS | -0.636 |
Hiroshima | -0.604 |
Filipino | -0.598 |
Anaheim | -0.597 |
chant | -0.582 |
Token | in |
Token ID | 287 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Rhod | +1.357 |
� | +1.275 |
)", | +1.226 |
crop | +1.187 |
recapt | +1.061 |
Neg logit contributions | |
ILCS | -1.431 |
Hiroshima | -1.345 |
Filipino | -1.345 |
Anaheim | -1.340 |
chant | -1.308 |
Token | the |
Token ID | 262 |
Feature activation | +9.49e-01 |
Pos logit contributions | |
Hiroshima | +13.719 |
Anaheim | +13.035 |
Manila | +12.304 |
Filipino | +12.073 |
Japan | +11.955 |
Neg logit contributions | |
� | -14.240 |
Rhod | -14.201 |
crop | -14.100 |
)", | -13.545 |
faces | -12.541 |
Token | ' |
Token ID | 705 |
Feature activation | +5.41e-01 |
Pos logit contributions | |
Hiroshima | +9.882 |
Anaheim | +9.656 |
Filipino | +9.493 |
Manila | +9.270 |
Huntington | +9.075 |
Neg logit contributions | |
Rhod | -9.201 |
crop | -9.144 |
� | -9.134 |
)", | -8.856 |
faces | -7.720 |
Token | 80 |
Token ID | 1795 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
ILCS | +5.011 |
Hiroshima | +4.892 |
Anaheim | +4.801 |
Filipino | +4.785 |
chant | +4.674 |
Neg logit contributions | |
Rhod | -6.500 |
� | -6.131 |
)", | -5.969 |
crop | -5.791 |
recapt | -5.232 |
Token | s |
Token ID | 82 |
Feature activation | +5.25e-01 |
Pos logit contributions | |
ILCS | +3.895 |
Hiroshima | +3.766 |
Anaheim | +3.738 |
Filipino | +3.737 |
Manila | +3.589 |
Neg logit contributions | |
Rhod | -5.752 |
� | -5.388 |
)", | -5.226 |
crop | -5.141 |
recapt | -4.600 |
Token | , |
Token ID | 11 |
Feature activation | +8.71e-01 |
Pos logit contributions | |
ILCS | +5.347 |
Hiroshima | +5.219 |
Anaheim | +5.194 |
Filipino | +5.100 |
Huntington | +4.972 |
Neg logit contributions | |
Rhod | -5.868 |
� | -5.439 |
crop | -5.341 |
)", | -5.312 |
faces | -4.679 |
Token | flight |
Token ID | 22560 |
Feature activation | +9.84e-02 |
Pos logit contributions | |
ILCS | +1.740 |
Hiroshima | +1.668 |
Anaheim | +1.657 |
Filipino | +1.652 |
Huntington | +1.606 |
Neg logit contributions | |
Rhod | -1.753 |
� | -1.645 |
)", | -1.595 |
crop | -1.565 |
faces | -1.369 |
Token | to |
Token ID | 284 |
Feature activation | -7.41e-03 |
Pos logit contributions | |
ILCS | +1.108 |
Hiroshima | +1.061 |
Anaheim | +1.051 |
Filipino | +1.048 |
Huntington | +1.021 |
Neg logit contributions | |
Rhod | -1.049 |
� | -0.982 |
)", | -0.949 |
crop | -0.933 |
recapt | -0.816 |
Token | support |
Token ID | 1104 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
Rhod | +0.076 |
� | +0.070 |
)", | +0.068 |
crop | +0.067 |
recapt | +0.058 |
Neg logit contributions | |
ILCS | -0.088 |
Hiroshima | -0.083 |
Anaheim | -0.082 |
Filipino | -0.082 |
Huntington | -0.080 |
Token | the |
Token ID | 262 |
Feature activation | +7.29e-02 |
Pos logit contributions | |
ILCS | +3.578 |
Hiroshima | +3.540 |
Filipino | +3.506 |
Anaheim | +3.481 |
Huntington | +3.396 |
Neg logit contributions | |
Rhod | -3.494 |
� | -3.322 |
)", | -3.206 |
crop | -3.129 |
faces | -2.762 |
Token | ISS |
Token ID | 33805 |
Feature activation | -6.14e-02 |
Pos logit contributions | |
ILCS | +0.831 |
Hiroshima | +0.795 |
Anaheim | +0.789 |
Filipino | +0.786 |
Huntington | +0.766 |
Neg logit contributions | |
Rhod | -0.769 |
� | -0.717 |
)", | -0.694 |
crop | -0.683 |
recapt | -0.596 |
Token | and |
Token ID | 290 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
Rhod | +0.637 |
� | +0.595 |
)", | +0.571 |
crop | +0.566 |
recapt | +0.496 |
Neg logit contributions | |
ILCS | -0.716 |
Hiroshima | -0.680 |
Anaheim | -0.671 |
Filipino | -0.669 |
Huntington | -0.653 |
Token | the |
Token ID | 262 |
Feature activation | -8.24e-02 |
Pos logit contributions | |
ILCS | +3.588 |
Hiroshima | +3.526 |
Filipino | +3.486 |
Anaheim | +3.478 |
Huntington | +3.385 |
Neg logit contributions | |
Rhod | -3.626 |
� | -3.471 |
)", | -3.338 |
crop | -3.265 |
faces | -2.900 |
Token | development |
Token ID | 2478 |
Feature activation | -3.44e-02 |
Pos logit contributions | |
Rhod | +0.875 |
� | +0.801 |
)", | +0.780 |
crop | +0.772 |
recapt | +0.683 |
Neg logit contributions | |
ILCS | -0.946 |
Hiroshima | -0.890 |
Anaheim | -0.884 |
Filipino | -0.877 |
chant | -0.862 |
Token | of |
Token ID | 286 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
Rhod | +0.362 |
� | +0.336 |
)", | +0.325 |
crop | +0.321 |
recapt | +0.282 |
Neg logit contributions | |
ILCS | -0.393 |
Hiroshima | -0.376 |
Anaheim | -0.372 |
Filipino | -0.371 |
Huntington | -0.361 |
Token | next |
Token ID | 1306 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
ILCS | +4.112 |
Hiroshima | +4.067 |
Filipino | +4.039 |
Anaheim | +4.010 |
Huntington | +3.926 |
Neg logit contributions | |
Rhod | -3.883 |
� | -3.748 |
)", | -3.590 |
crop | -3.494 |
faces | -3.080 |
Token | - |
Token ID | 12 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
ILCS | +3.336 |
Hiroshima | +3.208 |
Filipino | +3.186 |
Anaheim | +3.185 |
Huntington | +3.078 |
Neg logit contributions | |
Rhod | -4.040 |
� | -3.808 |
)", | -3.716 |
crop | -3.621 |
faces | -3.220 |
Token | I |
Token ID | 314 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
ILCS | +1.429 |
Hiroshima | +1.372 |
Anaheim | +1.360 |
Filipino | +1.355 |
Huntington | +1.319 |
Neg logit contributions | |
Rhod | -1.501 |
� | -1.411 |
)", | -1.369 |
crop | -1.345 |
faces | -1.180 |
Token | � |
Token ID | 447 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
Rhod | +2.415 |
� | +2.321 |
)", | +2.182 |
crop | +2.146 |
recapt | +1.901 |
Neg logit contributions | |
ILCS | -3.023 |
Hiroshima | -2.849 |
Filipino | -2.834 |
Anaheim | -2.817 |
Huntington | -2.748 |
Token | � |
Token ID | 247 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
Rhod | +2.040 |
� | +1.954 |
)", | +1.821 |
crop | +1.774 |
faces | +1.497 |
Neg logit contributions | |
ILCS | -3.017 |
Hiroshima | -2.940 |
Anaheim | -2.898 |
Filipino | -2.885 |
Huntington | -2.829 |
Token | d |
Token ID | 67 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
Rhod | +4.028 |
� | +3.933 |
crop | +3.717 |
)", | +3.710 |
faces | +3.134 |
Neg logit contributions | |
ILCS | -5.059 |
Hiroshima | -4.852 |
Anaheim | -4.822 |
Filipino | -4.822 |
Huntington | -4.658 |
Token | argue |
Token ID | 7267 |
Feature activation | -3.96e-01 |
Pos logit contributions | |
ILCS | +0.406 |
Hiroshima | +0.391 |
Anaheim | +0.388 |
Filipino | +0.387 |
Huntington | +0.378 |
Neg logit contributions | |
Rhod | -0.323 |
� | -0.300 |
)", | -0.289 |
crop | -0.284 |
recapt | -0.244 |
Token | that |
Token ID | 326 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
Rhod | +3.323 |
� | +3.140 |
crop | +2.914 |
)", | +2.865 |
recapt | +2.520 |
Neg logit contributions | |
ILCS | -5.302 |
Hiroshima | -4.912 |
Filipino | -4.886 |
Anaheim | -4.813 |
chant | -4.748 |
Token | it |
Token ID | 340 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
ILCS | +4.030 |
Hiroshima | +3.962 |
Anaheim | +3.949 |
Filipino | +3.911 |
Huntington | +3.835 |
Neg logit contributions | |
Rhod | -4.095 |
� | -3.833 |
)", | -3.739 |
crop | -3.660 |
faces | -3.202 |
Token | � |
Token ID | 447 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
Rhod | +1.171 |
� | +1.128 |
)", | +1.062 |
crop | +1.058 |
recapt | +0.926 |
Neg logit contributions | |
ILCS | -1.399 |
Hiroshima | -1.331 |
Filipino | -1.320 |
Anaheim | -1.312 |
Huntington | -1.280 |
Token | � |
Token ID | 247 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
ILCS | +4.065 |
Hiroshima | +3.875 |
Anaheim | +3.860 |
Filipino | +3.859 |
Huntington | +3.747 |
Neg logit contributions | |
Rhod | -3.820 |
� | -3.511 |
)", | -3.456 |
crop | -3.399 |
recapt | -2.979 |
Token | s |
Token ID | 82 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
ILCS | +2.132 |
Hiroshima | +2.036 |
Anaheim | +2.015 |
Filipino | +2.008 |
Huntington | +1.951 |
Neg logit contributions | |
Rhod | -2.525 |
� | -2.377 |
)", | -2.309 |
crop | -2.273 |
recapt | -2.016 |
Token | a |
Token ID | 257 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ILCS | +1.778 |
Hiroshima | +1.716 |
Anaheim | +1.703 |
Filipino | +1.697 |
Huntington | +1.656 |
Neg logit contributions | |
Rhod | -1.583 |
� | -1.477 |
)", | -1.427 |
crop | -1.400 |
faces | -1.213 |
Token | the |
Token ID | 262 |
Feature activation | +8.00e-02 |
Pos logit contributions | |
Rhod | +3.112 |
� | +2.798 |
)", | +2.750 |
crop | +2.693 |
recapt | +2.460 |
Neg logit contributions | |
ILCS | -3.138 |
Hiroshima | -2.882 |
Filipino | -2.864 |
endo | -2.832 |
Anaheim | -2.829 |
Token | paper |
Token ID | 3348 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
ILCS | +0.906 |
Hiroshima | +0.867 |
Anaheim | +0.858 |
Filipino | +0.857 |
Huntington | +0.834 |
Neg logit contributions | |
Rhod | -0.850 |
� | -0.793 |
)", | -0.767 |
crop | -0.754 |
recapt | -0.659 |
Token | asked |
Token ID | 1965 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
Rhod | +2.066 |
� | +1.910 |
)", | +1.838 |
crop | +1.838 |
recapt | +1.642 |
Neg logit contributions | |
ILCS | -2.321 |
Hiroshima | -2.160 |
Filipino | -2.138 |
Anaheim | -2.124 |
endo | -2.084 |
Token | artist |
Token ID | 6802 |
Feature activation | +5.04e-02 |
Pos logit contributions | |
Rhod | +1.959 |
� | +1.794 |
)", | +1.762 |
crop | +1.703 |
recapt | +1.534 |
Neg logit contributions | |
ILCS | -1.977 |
Hiroshima | -1.827 |
Filipino | -1.811 |
Anaheim | -1.796 |
chant | -1.787 |
Token | Mary |
Token ID | 5335 |
Feature activation | -3.76e-02 |
Pos logit contributions | |
ILCS | +0.493 |
Hiroshima | +0.463 |
Anaheim | +0.460 |
Filipino | +0.458 |
chant | +0.443 |
Neg logit contributions | |
Rhod | -0.618 |
� | -0.579 |
)", | -0.563 |
crop | -0.554 |
recapt | -0.496 |
Token | Anne |
Token ID | 15397 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
Rhod | +0.413 |
� | +0.383 |
)", | +0.369 |
crop | +0.364 |
faces | +0.319 |
Neg logit contributions | |
ILCS | -0.417 |
Hiroshima | -0.395 |
Anaheim | -0.393 |
Filipino | -0.390 |
chant | -0.377 |
Token | Bark |
Token ID | 20511 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
ILCS | +2.296 |
Hiroshima | +2.205 |
Anaheim | +2.186 |
Filipino | +2.179 |
Huntington | +2.127 |
Neg logit contributions | |
Rhod | -2.133 |
� | -2.000 |
)", | -1.935 |
crop | -1.902 |
recapt | -1.656 |
Token | house |
Token ID | 4803 |
Feature activation | -3.96e-02 |
Pos logit contributions | |
Rhod | +0.228 |
� | +0.215 |
)", | +0.208 |
crop | +0.206 |
faces | +0.182 |
Neg logit contributions | |
ILCS | -0.198 |
Hiroshima | -0.187 |
Anaheim | -0.186 |
Filipino | -0.184 |
Huntington | -0.178 |
Token | why |
Token ID | 1521 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
Rhod | +0.444 |
� | +0.416 |
)", | +0.401 |
crop | +0.395 |
recapt | +0.350 |
Neg logit contributions | |
ILCS | -0.431 |
Hiroshima | -0.404 |
Anaheim | -0.402 |
Filipino | -0.400 |
chant | -0.388 |
Token | the |
Token ID | 262 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
Rhod | +4.156 |
� | +3.666 |
)", | +3.637 |
crop | +3.580 |
recapt | +3.224 |
Neg logit contributions | |
ILCS | -4.207 |
Filipino | -3.822 |
Hiroshima | -3.811 |
chant | -3.793 |
endo | -3.773 |
Token | squirrel |
Token ID | 33039 |
Feature activation | -5.09e-01 |
Pos logit contributions | |
Rhod | +3.053 |
� | +2.767 |
)", | +2.688 |
crop | +2.638 |
recapt | +2.351 |
Neg logit contributions | |
ILCS | -3.392 |
Hiroshima | -3.139 |
Filipino | -3.093 |
chant | -3.061 |
Anaheim | -3.057 |
Token | other |
Token ID | 584 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
ILCS | +2.844 |
Hiroshima | +2.763 |
Filipino | +2.742 |
Anaheim | +2.741 |
Huntington | +2.647 |
Neg logit contributions | |
Rhod | -2.757 |
� | -2.596 |
)", | -2.526 |
crop | -2.501 |
faces | -2.141 |
Token | hand |
Token ID | 1021 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
ILCS | +2.457 |
Hiroshima | +2.358 |
Anaheim | +2.338 |
Filipino | +2.333 |
Huntington | +2.250 |
Neg logit contributions | |
Rhod | -3.402 |
� | -3.217 |
)", | -3.151 |
crop | -3.095 |
recapt | -2.763 |
Token | , |
Token ID | 11 |
Feature activation | +9.82e-02 |
Pos logit contributions | |
Rhod | +3.151 |
� | +2.930 |
)", | +2.739 |
crop | +2.689 |
recapt | +2.346 |
Neg logit contributions | |
ILCS | -4.256 |
Hiroshima | -3.976 |
Filipino | -3.968 |
Anaheim | -3.945 |
chant | -3.917 |
Token | shouldn |
Token ID | 6584 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
ILCS | +1.031 |
Hiroshima | +0.988 |
Anaheim | +0.979 |
Filipino | +0.976 |
Huntington | +0.949 |
Neg logit contributions | |
Rhod | -1.118 |
� | -1.053 |
)", | -1.021 |
crop | -1.006 |
recapt | -0.884 |
Token | � |
Token ID | 447 |
Feature activation | -9.41e-02 |
Pos logit contributions | |
Rhod | +3.295 |
� | +3.066 |
)", | +2.755 |
crop | +2.735 |
recapt | +2.305 |
Neg logit contributions | |
ILCS | -6.059 |
Hiroshima | -5.795 |
Filipino | -5.713 |
Anaheim | -5.695 |
Huntington | -5.685 |
Token | � |
Token ID | 247 |
Feature activation | +8.88e-03 |
Pos logit contributions | |
Rhod | +0.897 |
� | +0.849 |
)", | +0.800 |
crop | +0.781 |
faces | +0.672 |
Neg logit contributions | |
ILCS | -1.159 |
Hiroshima | -1.119 |
Anaheim | -1.104 |
Filipino | -1.102 |
Huntington | -1.080 |
Token | t |
Token ID | 83 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ILCS | +0.096 |
Hiroshima | +0.091 |
Anaheim | +0.091 |
Filipino | +0.090 |
Huntington | +0.087 |
Neg logit contributions | |
Rhod | -0.099 |
� | -0.094 |
)", | -0.090 |
crop | -0.089 |
faces | -0.078 |
Token | we |
Token ID | 356 |
Feature activation | +2.99e-02 |
Pos logit contributions | |
ILCS | +1.542 |
Hiroshima | +1.478 |
Anaheim | +1.464 |
Filipino | +1.461 |
Huntington | +1.420 |
Neg logit contributions | |
Rhod | -1.621 |
� | -1.525 |
)", | -1.480 |
crop | -1.456 |
recapt | -1.279 |
Token | always |
Token ID | 1464 |
Feature activation | +4.12e-01 |
Pos logit contributions | |
ILCS | +0.357 |
Hiroshima | +0.342 |
Anaheim | +0.340 |
Filipino | +0.339 |
Huntington | +0.330 |
Neg logit contributions | |
Rhod | -0.298 |
� | -0.277 |
)", | -0.268 |
crop | -0.263 |
recapt | -0.227 |
Token | � |
Token ID | 564 |
Feature activation | -3.64e-03 |
Pos logit contributions | |
ILCS | +4.788 |
Hiroshima | +4.692 |
Anaheim | +4.621 |
Filipino | +4.590 |
Huntington | +4.506 |
Neg logit contributions | |
Rhod | -4.102 |
� | -3.789 |
)", | -3.650 |
crop | -3.646 |
faces | -3.128 |
Token | � |
Token ID | 246 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
Rhod | +0.035 |
� | +0.033 |
)", | +0.032 |
crop | +0.031 |
faces | +0.027 |
Neg logit contributions | |
ILCS | -0.044 |
Hiroshima | -0.043 |
Anaheim | -0.042 |
Filipino | -0.042 |
Huntington | -0.041 |
Token | Amy |
Token ID | 14235 |
Feature activation | -4.90e-01 |
Pos logit contributions | |
Rhod | +3.748 |
� | +3.415 |
)", | +3.332 |
crop | +3.242 |
faces | +2.877 |
Neg logit contributions | |
ILCS | -3.349 |
Hiroshima | -3.077 |
Filipino | -3.043 |
Anaheim | -3.040 |
chant | -2.986 |
Token | Sed |
Token ID | 22710 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
Rhod | +4.883 |
� | +4.455 |
crop | +4.214 |
)", | +4.185 |
recapt | +3.785 |
Neg logit contributions | |
ILCS | -5.710 |
Filipino | -5.403 |
Hiroshima | -5.398 |
Anaheim | -5.377 |
chant | -5.241 |
Token | aris |
Token ID | 20066 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
ILCS | +0.127 |
Hiroshima | +0.121 |
Anaheim | +0.120 |
Filipino | +0.120 |
Huntington | +0.116 |
Neg logit contributions | |
Rhod | -0.146 |
� | -0.138 |
)", | -0.134 |
crop | -0.132 |
recapt | -0.117 |
Token | is |
Token ID | 318 |
Feature activation | -8.40e-02 |
Pos logit contributions | |
Rhod | +1.550 |
� | +1.454 |
)", | +1.391 |
crop | +1.372 |
recapt | +1.228 |
Neg logit contributions | |
ILCS | -1.652 |
Hiroshima | -1.561 |
Anaheim | -1.548 |
Filipino | -1.541 |
Huntington | -1.498 |
Token | pleasantly |
Token ID | 42683 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Rhod | +0.855 |
� | +0.793 |
)", | +0.767 |
crop | +0.754 |
recapt | +0.668 |
Neg logit contributions | |
ILCS | -0.991 |
Hiroshima | -0.938 |
Anaheim | -0.928 |
Filipino | -0.925 |
chant | -0.903 |
Token | der |
Token ID | 4587 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
Rhod | +1.141 |
� | +1.059 |
)", | +1.035 |
crop | +1.013 |
recapt | +0.912 |
Neg logit contributions | |
ILCS | -1.176 |
Hiroshima | -1.111 |
Anaheim | -1.102 |
Filipino | -1.094 |
Huntington | -1.070 |
Token | anged |
Token ID | 5102 |
Feature activation | -6.71e-02 |
Pos logit contributions | |
ILCS | +3.184 |
Hiroshima | +3.029 |
Anaheim | +3.012 |
Filipino | +2.998 |
Huntington | +2.893 |
Neg logit contributions | |
Rhod | -4.493 |
� | -4.251 |
)", | -4.150 |
crop | -4.063 |
recapt | -3.658 |
Token | . |
Token ID | 13 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
Rhod | +0.719 |
� | +0.668 |
)", | +0.643 |
crop | +0.638 |
recapt | +0.565 |
Neg logit contributions | |
ILCS | -0.756 |
Hiroshima | -0.713 |
Anaheim | -0.708 |
Filipino | -0.706 |
Huntington | -0.690 |
Token | There |
Token ID | 1318 |
Feature activation | -1.24e-03 |
Pos logit contributions | |
ILCS | +0.325 |
Hiroshima | +0.307 |
Filipino | +0.304 |
Anaheim | +0.304 |
Huntington | +0.295 |
Neg logit contributions | |
Rhod | -0.364 |
� | -0.340 |
)", | -0.330 |
crop | -0.325 |
faces | -0.286 |
Token | � |
Token ID | 447 |
Feature activation | -4.05e-01 |
Pos logit contributions | |
Rhod | +0.014 |
� | +0.013 |
)", | +0.013 |
crop | +0.013 |
faces | +0.011 |
Neg logit contributions | |
ILCS | -0.013 |
Hiroshima | -0.013 |
Anaheim | -0.012 |
Filipino | -0.012 |
Huntington | -0.012 |
Token | � |
Token ID | 247 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Rhod | +4.032 |
� | +3.883 |
)", | +3.602 |
crop | +3.570 |
faces | +3.162 |
Neg logit contributions | |
ILCS | -4.609 |
Hiroshima | -4.447 |
Filipino | -4.415 |
Anaheim | -4.402 |
Huntington | -4.335 |
Token | new |
Token ID | 649 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
Rhod | +1.500 |
� | +1.367 |
)", | +1.339 |
crop | +1.302 |
recapt | +1.148 |
Neg logit contributions | |
ILCS | -1.749 |
Anaheim | -1.643 |
Hiroshima | -1.639 |
Filipino | -1.605 |
endo | -1.590 |
Token | fair |
Token ID | 3148 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
Rhod | +2.451 |
� | +2.188 |
)", | +2.164 |
crop | +2.096 |
graded | +1.790 |
Neg logit contributions | |
ILCS | -3.785 |
Hiroshima | -3.507 |
Anaheim | -3.506 |
endo | -3.462 |
wang | -3.427 |
Token | one |
Token ID | 530 |
Feature activation | -7.12e-02 |
Pos logit contributions | |
Rhod | +3.401 |
� | +3.212 |
)", | +3.063 |
crop | +3.012 |
grading | +2.629 |
Neg logit contributions | |
ILCS | -4.183 |
Hiroshima | -3.994 |
Anaheim | -3.964 |
Huntington | -3.899 |
Filipino | -3.879 |
Token | based |
Token ID | 1912 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
Rhod | +0.704 |
� | +0.656 |
)", | +0.639 |
crop | +0.620 |
recapt | +0.543 |
Neg logit contributions | |
ILCS | -0.853 |
Hiroshima | -0.814 |
Anaheim | -0.809 |
Filipino | -0.800 |
Huntington | -0.789 |
Token | on |
Token ID | 319 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
Rhod | +1.004 |
� | +0.922 |
)", | +0.896 |
crop | +0.864 |
recapt | +0.746 |
Neg logit contributions | |
ILCS | -1.421 |
Hiroshima | -1.352 |
Anaheim | -1.339 |
Filipino | -1.333 |
Huntington | -1.317 |
Token | the |
Token ID | 262 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
Rhod | +1.057 |
� | +0.970 |
)", | +0.947 |
crop | +0.921 |
recapt | +0.814 |
Neg logit contributions | |
ILCS | -1.193 |
Hiroshima | -1.113 |
Anaheim | -1.111 |
Filipino | -1.094 |
chant | -1.076 |
Token | principles |
Token ID | 7811 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
Rhod | +3.085 |
� | +2.773 |
)", | +2.723 |
crop | +2.627 |
recapt | +2.378 |
Neg logit contributions | |
ILCS | -3.566 |
Anaheim | -3.283 |
Hiroshima | -3.268 |
endo | -3.231 |
chant | -3.227 |
Token | of |
Token ID | 286 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
ILCS | +2.057 |
Hiroshima | +1.971 |
Anaheim | +1.953 |
Filipino | +1.949 |
Huntington | +1.897 |
Neg logit contributions | |
Rhod | -2.029 |
� | -1.903 |
)", | -1.841 |
crop | -1.813 |
recapt | -1.584 |
Token | independence |
Token ID | 10404 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
Rhod | +2.234 |
� | +2.024 |
)", | +1.981 |
crop | +1.920 |
recapt | +1.692 |
Neg logit contributions | |
ILCS | -2.682 |
Anaheim | -2.472 |
Hiroshima | -2.464 |
Filipino | -2.428 |
chant | -2.402 |
Token | , |
Token ID | 11 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
Rhod | +2.827 |
� | +2.649 |
)", | +2.565 |
crop | +2.455 |
recapt | +2.214 |
Neg logit contributions | |
ILCS | -3.713 |
Hiroshima | -3.528 |
Anaheim | -3.513 |
Filipino | -3.430 |
Huntington | -3.414 |
Token | equality |
Token ID | 10537 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
Rhod | +3.710 |
� | +3.345 |
)", | +3.243 |
crop | +3.149 |
recapt | +2.817 |
Neg logit contributions | |
ILCS | -5.047 |
Anaheim | -4.684 |
Hiroshima | -4.669 |
endo | -4.557 |
Filipino | -4.553 |
Token | are |
Token ID | 389 |
Feature activation | -8.28e-02 |
Pos logit contributions | |
ILCS | +1.007 |
Hiroshima | +0.955 |
Anaheim | +0.944 |
Filipino | +0.944 |
Huntington | +0.916 |
Neg logit contributions | |
Rhod | -1.068 |
� | -1.004 |
)", | -0.970 |
crop | -0.960 |
recapt | -0.846 |
Token | six |
Token ID | 2237 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
Rhod | +0.876 |
� | +0.809 |
)", | +0.784 |
crop | +0.776 |
recapt | +0.686 |
Neg logit contributions | |
ILCS | -0.945 |
Hiroshima | -0.894 |
Filipino | -0.887 |
Anaheim | -0.885 |
chant | -0.865 |
Token | preset |
Token ID | 38266 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
ILCS | +0.154 |
Hiroshima | +0.147 |
Filipino | +0.146 |
Anaheim | +0.146 |
Huntington | +0.142 |
Neg logit contributions | |
Rhod | -0.142 |
� | -0.132 |
)", | -0.128 |
crop | -0.126 |
recapt | -0.110 |
Token | modes |
Token ID | 12881 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
Rhod | +5.091 |
� | +4.637 |
crop | +4.437 |
)", | +4.435 |
tire | +4.078 |
Neg logit contributions | |
ILCS | -5.781 |
Filipino | -5.475 |
Hiroshima | -5.405 |
Anaheim | -5.325 |
wang | -5.317 |
Token | for |
Token ID | 329 |
Feature activation | -6.32e-01 |
Pos logit contributions | |
ILCS | +2.387 |
Hiroshima | +2.297 |
Anaheim | +2.281 |
Filipino | +2.267 |
Huntington | +2.210 |
Neg logit contributions | |
Rhod | -2.491 |
� | -2.350 |
)", | -2.280 |
crop | -2.238 |
faces | -1.955 |
Token | the |
Token ID | 262 |
Feature activation | -8.37e-01 |
Pos logit contributions | |
Rhod | +6.160 |
� | +5.380 |
crop | +5.281 |
)", | +5.135 |
recapt | +4.841 |
Neg logit contributions | |
ILCS | -7.433 |
Hiroshima | -6.832 |
Filipino | -6.772 |
chant | -6.770 |
wang | -6.660 |
Token | truck |
Token ID | 7779 |
Feature activation | -5.27e-01 |
Pos logit contributions | |
Rhod | +7.891 |
� | +6.964 |
crop | +6.873 |
)", | +6.597 |
tire | +6.385 |
Neg logit contributions | |
ILCS | -9.517 |
wang | -8.597 |
Hiroshima | -8.586 |
Filipino | -8.581 |
chant | -8.564 |
Token | depending |
Token ID | 6906 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
Rhod | +5.102 |
� | +4.600 |
crop | +4.545 |
)", | +4.453 |
recapt | +4.043 |
Neg logit contributions | |
ILCS | -6.335 |
Filipino | -5.748 |
Hiroshima | -5.742 |
Anaheim | -5.652 |
chant | -5.634 |
Token | on |
Token ID | 319 |
Feature activation | -7.67e-01 |
Pos logit contributions | |
Rhod | +4.332 |
� | +3.937 |
crop | +3.722 |
)", | +3.621 |
graded | +3.124 |
Neg logit contributions | |
ILCS | -7.861 |
Hiroshima | -7.401 |
Anaheim | -7.317 |
Filipino | -7.306 |
Huntington | -7.220 |
Token | terrain |
Token ID | 15510 |
Feature activation | -8.77e-01 |
Pos logit contributions | |
Rhod | +8.099 |
� | +7.347 |
crop | +7.112 |
tire | +6.945 |
)", | +6.889 |
Neg logit contributions | |
ILCS | -7.918 |
Hiroshima | -7.387 |
Filipino | -7.219 |
ushi | -7.156 |
endo | -7.125 |
Token | and |
Token ID | 290 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
Rhod | +7.362 |
� | +6.654 |
crop | +6.315 |
)", | +5.947 |
grading | +5.936 |
Neg logit contributions | |
ILCS | -10.996 |
Hiroshima | -10.070 |
Filipino | -9.990 |
chant | -9.911 |
endo | -9.910 |
Token | and |
Token ID | 290 |
Feature activation | -7.44e-01 |
Pos logit contributions | |
Rhod | +0.797 |
� | +0.746 |
)", | +0.719 |
crop | +0.712 |
faces | +0.622 |
Neg logit contributions | |
ILCS | -0.787 |
Hiroshima | -0.751 |
Anaheim | -0.745 |
Filipino | -0.744 |
Huntington | -0.722 |
Token | First |
Token ID | 3274 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
Rhod | +8.048 |
� | +6.961 |
)", | +6.896 |
crop | +6.729 |
recapt | +6.511 |
Neg logit contributions | |
ILCS | -7.766 |
Filipino | -7.053 |
chant | -6.973 |
endo | -6.968 |
Hiroshima | -6.955 |
Token | Strike |
Token ID | 12282 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
Rhod | +1.632 |
� | +1.530 |
)", | +1.475 |
crop | +1.470 |
faces | +1.298 |
Neg logit contributions | |
ILCS | -1.375 |
Hiroshima | -1.296 |
Filipino | -1.294 |
Anaheim | -1.288 |
chant | -1.250 |
Token | within |
Token ID | 1626 |
Feature activation | +1.81e-02 |
Pos logit contributions | |
Rhod | +2.284 |
� | +2.120 |
)", | +2.037 |
crop | +1.991 |
recapt | +1.781 |
Neg logit contributions | |
ILCS | -2.468 |
Hiroshima | -2.319 |
Anaheim | -2.287 |
Filipino | -2.284 |
endo | -2.240 |
Token | days |
Token ID | 1528 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
ILCS | +0.218 |
Hiroshima | +0.208 |
Filipino | +0.207 |
Anaheim | +0.207 |
Huntington | +0.202 |
Neg logit contributions | |
Rhod | -0.179 |
� | -0.165 |
)", | -0.159 |
crop | -0.156 |
recapt | -0.135 |
Token | . |
Token ID | 13 |
Feature activation | -5.36e-01 |
Pos logit contributions | |
ILCS | +4.021 |
Hiroshima | +3.896 |
Filipino | +3.821 |
Anaheim | +3.809 |
Huntington | +3.704 |
Neg logit contributions | |
Rhod | -4.438 |
� | -4.212 |
)", | -4.071 |
crop | -4.030 |
faces | -3.547 |
Token | Fin |
Token ID | 4463 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
Rhod | +5.798 |
� | +5.210 |
)", | +5.022 |
crop | +4.904 |
recapt | +4.351 |
Neg logit contributions | |
ILCS | -5.795 |
Hiroshima | -5.297 |
Filipino | -5.295 |
Anaheim | -5.257 |
chant | -5.253 |
Token | ishing |
Token ID | 3929 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
ILCS | +1.519 |
Hiroshima | +1.449 |
Anaheim | +1.438 |
Filipino | +1.433 |
Huntington | +1.392 |
Neg logit contributions | |
Rhod | -1.716 |
� | -1.615 |
)", | -1.569 |
crop | -1.544 |
recapt | -1.365 |
Token | The |
Token ID | 383 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
Rhod | +2.905 |
� | +2.662 |
)", | +2.586 |
crop | +2.508 |
recapt | +2.249 |
Neg logit contributions | |
ILCS | -3.008 |
Hiroshima | -2.818 |
Filipino | -2.809 |
Anaheim | -2.799 |
Huntington | -2.717 |
Token | Flood |
Token ID | 25588 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
Rhod | +9.091 |
� | +7.965 |
crop | +7.771 |
)", | +7.638 |
Grey | +7.077 |
Neg logit contributions | |
ILCS | -11.300 |
Hiroshima | -10.380 |
boiler | -10.164 |
Filipino | -10.115 |
Anaheim | -10.095 |
Token | perhaps |
Token ID | 3737 |
Feature activation | -1.61e-01 |
Pos logit contributions | |
Rhod | +3.697 |
� | +3.406 |
)", | +3.297 |
crop | +3.233 |
recapt | +2.865 |
Neg logit contributions | |
ILCS | -3.944 |
Hiroshima | -3.793 |
Anaheim | -3.737 |
Filipino | -3.730 |
Huntington | -3.629 |
Token | correspondent |
Token ID | 21076 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
Filipino | +5.533 |
Hiroshima | +5.493 |
ILCS | +5.439 |
Anaheim | +5.330 |
Manila | +5.277 |
Neg logit contributions | |
Rhod | -5.425 |
� | -5.148 |
)", | -4.982 |
crop | -4.892 |
faces | -4.281 |
Token | in |
Token ID | 287 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
Rhod | +1.822 |
� | +1.679 |
)", | +1.592 |
crop | +1.564 |
recapt | +1.431 |
Neg logit contributions | |
ILCS | -2.044 |
Anaheim | -1.927 |
Hiroshima | -1.927 |
Filipino | -1.896 |
Huntington | -1.863 |
Token | Somalia |
Token ID | 23918 |
Feature activation | -5.35e-01 |
Pos logit contributions | |
Rhod | +3.244 |
� | +2.998 |
)", | +2.923 |
crop | +2.840 |
recapt | +2.608 |
Neg logit contributions | |
ILCS | -3.220 |
Filipino | -2.954 |
Hiroshima | -2.946 |
chant | -2.942 |
Anaheim | -2.927 |
Token | says |
Token ID | 1139 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
Rhod | +5.393 |
� | +4.937 |
)", | +4.557 |
crop | +4.527 |
recapt | +4.322 |
Neg logit contributions | |
ILCS | -6.213 |
Anaheim | -5.825 |
Hiroshima | -5.738 |
chant | -5.723 |
Filipino | -5.619 |
Token | the |
Token ID | 262 |
Feature activation | -5.73e-01 |
Pos logit contributions | |
Rhod | +4.603 |
� | +4.170 |
)", | +4.044 |
crop | +3.908 |
recapt | +3.764 |
Neg logit contributions | |
ILCS | -5.516 |
Hiroshima | -5.034 |
chant | -4.996 |
Anaheim | -4.954 |
endo | -4.886 |
Token | Ethiop |
Token ID | 23230 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
Rhod | +5.793 |
� | +5.236 |
)", | +5.070 |
crop | +4.901 |
recapt | +4.860 |
Neg logit contributions | |
ILCS | -6.519 |
Hiroshima | -6.050 |
chant | -6.044 |
Anaheim | -5.922 |
endo | -5.853 |
Token | ians |
Token ID | 1547 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
Rhod | +3.489 |
� | +3.164 |
)", | +3.110 |
crop | +2.992 |
recapt | +2.637 |
Neg logit contributions | |
ILCS | -4.988 |
Hiroshima | -4.746 |
Anaheim | -4.718 |
Huntington | -4.649 |
Filipino | -4.591 |
Token | have |
Token ID | 423 |
Feature activation | -3.19e-01 |
Pos logit contributions | |
Rhod | +4.175 |
� | +3.823 |
)", | +3.670 |
crop | +3.515 |
recapt | +3.466 |
Neg logit contributions | |
ILCS | -5.282 |
Hiroshima | -4.860 |
Anaheim | -4.859 |
Filipino | -4.768 |
endo | -4.734 |
Token | captured |
Token ID | 7907 |
Feature activation | -9.28e-01 |
Pos logit contributions | |
Rhod | +3.327 |
� | +3.056 |
)", | +2.963 |
crop | +2.828 |
recapt | +2.780 |
Neg logit contributions | |
ILCS | -3.716 |
Anaheim | -3.386 |
Hiroshima | -3.385 |
chant | -3.326 |
endo | -3.295 |
Token | a |
Token ID | 257 |
Feature activation | -5.44e-01 |
Pos logit contributions | |
Rhod | +8.583 |
� | +7.667 |
recapt | +7.296 |
)", | +7.256 |
crop | +7.174 |
Neg logit contributions | |
ILCS | -10.676 |
chant | -9.689 |
endo | -9.488 |
eno | -9.272 |
Hiroshima | -9.266 |
Token | key |
Token ID | 1994 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
Rhod | +5.189 |
� | +4.657 |
crop | +4.488 |
)", | +4.456 |
recapt | +4.270 |
Neg logit contributions | |
ILCS | -6.541 |
endo | -6.027 |
chant | -6.026 |
Anaheim | -5.996 |
Hiroshima | -5.952 |
Token | a |
Token ID | 257 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
ILCS | +5.204 |
Filipino | +5.199 |
Hiroshima | +5.191 |
Anaheim | +5.131 |
Manila | +5.073 |
Neg logit contributions | |
Rhod | -4.125 |
� | -3.875 |
)", | -3.792 |
crop | -3.672 |
faces | -3.195 |
Token | statement |
Token ID | 2643 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
ILCS | +2.588 |
Hiroshima | +2.520 |
Filipino | +2.503 |
Anaheim | +2.482 |
Manila | +2.413 |
Neg logit contributions | |
Rhod | -2.716 |
� | -2.572 |
)", | -2.499 |
crop | -2.446 |
faces | -2.163 |
Token | . |
Token ID | 13 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
ILCS | +1.145 |
Hiroshima | +1.092 |
Anaheim | +1.083 |
Filipino | +1.076 |
Huntington | +1.051 |
Neg logit contributions | |
Rhod | -1.157 |
� | -1.086 |
)", | -1.048 |
crop | -1.030 |
recapt | -0.910 |
Token | � |
Token ID | 564 |
Feature activation | -5.74e-02 |
Pos logit contributions | |
ILCS | +3.598 |
Hiroshima | +3.459 |
Anaheim | +3.445 |
Filipino | +3.444 |
Huntington | +3.308 |
Neg logit contributions | |
Rhod | -4.317 |
� | -4.043 |
)", | -3.972 |
crop | -3.909 |
faces | -3.475 |
Token | � |
Token ID | 250 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
Rhod | +0.657 |
� | +0.624 |
)", | +0.599 |
crop | +0.589 |
faces | +0.524 |
Neg logit contributions | |
ILCS | -0.600 |
Hiroshima | -0.570 |
Anaheim | -0.561 |
Filipino | -0.558 |
Huntington | -0.548 |
Token | The |
Token ID | 464 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
ILCS | +3.208 |
Hiroshima | +3.072 |
Filipino | +3.061 |
Anaheim | +3.055 |
Huntington | +2.936 |
Neg logit contributions | |
Rhod | -3.862 |
� | -3.602 |
)", | -3.512 |
crop | -3.462 |
faces | -3.079 |
Token | United |
Token ID | 1578 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
Rhod | +1.738 |
� | +1.613 |
)", | +1.565 |
crop | +1.538 |
recapt | +1.381 |
Neg logit contributions | |
ILCS | -1.737 |
Hiroshima | -1.626 |
Anaheim | -1.616 |
chant | -1.589 |
Filipino | -1.583 |
Token | States |
Token ID | 1829 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
ILCS | +1.829 |
Hiroshima | +1.765 |
Anaheim | +1.753 |
Filipino | +1.747 |
Huntington | +1.711 |
Neg logit contributions | |
Rhod | -1.125 |
� | -1.033 |
)", | -0.990 |
crop | -0.968 |
recapt | -0.804 |
Token | intends |
Token ID | 19582 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
ILCS | +1.846 |
Hiroshima | +1.772 |
Anaheim | +1.756 |
Filipino | +1.752 |
Huntington | +1.703 |
Neg logit contributions | |
Rhod | -1.812 |
� | -1.702 |
)", | -1.647 |
crop | -1.622 |
faces | -1.412 |
Token | to |
Token ID | 284 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
Rhod | +1.833 |
� | +1.729 |
)", | +1.675 |
crop | +1.632 |
recapt | +1.465 |
Neg logit contributions | |
ILCS | -1.822 |
Hiroshima | -1.706 |
Anaheim | -1.693 |
Filipino | -1.681 |
Huntington | -1.661 |
Token | remain |
Token ID | 3520 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
ILCS | +1.397 |
Hiroshima | +1.348 |
Anaheim | +1.334 |
Filipino | +1.333 |
Huntington | +1.297 |
Neg logit contributions | |
Rhod | -1.174 |
� | -1.094 |
)", | -1.055 |
crop | -1.037 |
faces | -0.893 |
Token | among |
Token ID | 1871 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Rhod | +6.137 |
� | +5.750 |
graded | +5.238 |
crop | +5.192 |
)", | +5.184 |
Neg logit contributions | |
ILCS | -9.094 |
Hiroshima | -8.420 |
ushi | -8.367 |
endo | -8.304 |
wang | -8.269 |
Token | the |
Token ID | 262 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
Rhod | +16.203 |
graded | +15.438 |
perimeter | +15.081 |
� | +14.854 |
Buc | +14.727 |
Neg logit contributions | |
ILCS | -17.270 |
Hiroshima | -16.034 |
chant | -15.886 |
Japanese | -15.583 |
wang | -15.579 |
Token | prospects |
Token ID | 13285 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
Rhod | +15.776 |
� | +14.707 |
Buc | +14.055 |
Cycl | +13.839 |
crop | +13.760 |
Neg logit contributions | |
ILCS | -15.431 |
chant | -15.401 |
endo | -15.383 |
wang | -14.923 |
Hiroshima | -14.612 |
Token | chart |
Token ID | 8262 |
Feature activation | -2.40e-01 |
Pos logit contributions | |
Rhod | +8.024 |
� | +7.343 |
graded | +6.802 |
crop | +6.693 |
grading | +6.637 |
Neg logit contributions | |
ILCS | -9.346 |
Filipino | -8.749 |
chant | -8.726 |
endo | -8.724 |
Hiroshima | -8.694 |
Token | ed |
Token ID | 276 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
Rhod | +2.202 |
� | +2.066 |
crop | +1.944 |
)", | +1.913 |
graded | +1.708 |
Neg logit contributions | |
ILCS | -2.965 |
Hiroshima | -2.862 |
Filipino | -2.851 |
Anaheim | -2.823 |
Huntington | -2.771 |
Token | for |
Token ID | 329 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
Rhod | +5.881 |
� | +5.639 |
crop | +5.231 |
)", | +5.051 |
graded | +4.735 |
Neg logit contributions | |
ILCS | -7.062 |
Filipino | -6.888 |
Hiroshima | -6.817 |
Anaheim | -6.661 |
Manila | -6.614 |
Token | Harmon |
Token ID | 39712 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
Rhod | +15.495 |
� | +14.818 |
crop | +14.445 |
grading | +14.384 |
graded | +14.219 |
Neg logit contributions | |
ILCS | -14.261 |
chant | -13.445 |
Hiroshima | -13.200 |
Japanese | -13.123 |
quist | -13.007 |
Token | � |
Token ID | 447 |
Feature activation | +2.84e-02 |
Pos logit contributions | |
Rhod | +9.648 |
� | +9.293 |
crop | +8.627 |
)", | +8.192 |
graded | +8.110 |
Neg logit contributions | |
Hiroshima | -8.087 |
Filipino | -7.915 |
ILCS | -7.750 |
Manila | -7.706 |
Anaheim | -7.646 |
Token | � |
Token ID | 247 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
ILCS | +0.350 |
Hiroshima | +0.338 |
Anaheim | +0.334 |
Filipino | +0.334 |
Huntington | +0.326 |
Neg logit contributions | |
Rhod | -0.273 |
� | -0.254 |
)", | -0.243 |
crop | -0.238 |
faces | -0.204 |
Token | s |
Token ID | 82 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
Rhod | +9.722 |
� | +9.443 |
crop | +9.246 |
)", | +8.596 |
graded | +7.997 |
Neg logit contributions | |
ILCS | -10.653 |
Hiroshima | -10.389 |
Filipino | -10.235 |
Anaheim | -9.868 |
Manila | -9.831 |
Token | Re |
Token ID | 797 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
Rhod | +15.701 |
� | +14.465 |
crop | +14.293 |
grading | +14.222 |
graded | +13.926 |
Neg logit contributions | |
ILCS | -12.285 |
chant | -12.119 |
Japanese | -11.843 |
endo | -11.725 |
Hiroshima | -11.700 |
Token | . |
Token ID | 13 |
Feature activation | -8.47e-01 |
Pos logit contributions | |
Rhod | +3.295 |
� | +3.159 |
)", | +2.980 |
crop | +2.909 |
recapt | +2.652 |
Neg logit contributions | |
ILCS | -3.392 |
Filipino | -3.255 |
Anaheim | -3.218 |
Hiroshima | -3.211 |
chant | -3.145 |
Token |
|
Token ID | 198 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
Rhod | +8.450 |
� | +7.772 |
crop | +7.196 |
)", | +7.161 |
Carbon | +6.479 |
Neg logit contributions | |
ILCS | -9.123 |
chant | -8.449 |
Filipino | -8.413 |
Anaheim | -8.197 |
endo | -8.143 |
Token |
|
Token ID | 198 |
Feature activation | -9.67e-01 |
Pos logit contributions | |
Rhod | +2.688 |
� | +2.540 |
)", | +2.448 |
crop | +2.434 |
faces | +2.100 |
Neg logit contributions | |
ILCS | -3.155 |
Hiroshima | -2.964 |
Filipino | -2.916 |
Anaheim | -2.906 |
Huntington | -2.847 |
Token | The |
Token ID | 464 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
� | +9.287 |
Rhod | +9.060 |
crop | +8.944 |
)", | +8.679 |
faces | +7.916 |
Neg logit contributions | |
ILCS | -10.066 |
Filipino | -9.512 |
Anaheim | -9.443 |
Manila | -9.297 |
Hiroshima | -9.286 |
Token | values |
Token ID | 3815 |
Feature activation | -5.08e-01 |
Pos logit contributions | |
Rhod | +5.676 |
� | +5.184 |
)", | +5.058 |
crop | +4.900 |
recapt | +4.501 |
Neg logit contributions | |
ILCS | -6.024 |
Filipino | -5.625 |
chant | -5.547 |
Anaheim | -5.521 |
Hiroshima | -5.479 |
Token | of |
Token ID | 286 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Rhod | +4.963 |
� | +4.607 |
)", | +4.345 |
crop | +4.275 |
recapt | +3.901 |
Neg logit contributions | |
ILCS | -5.979 |
Filipino | -5.575 |
Anaheim | -5.557 |
chant | -5.507 |
Hiroshima | -5.439 |
Token | the |
Token ID | 262 |
Feature activation | -8.18e-01 |
Pos logit contributions | |
Rhod | +12.559 |
� | +11.867 |
crop | +10.620 |
)", | +10.608 |
recapt | +10.183 |
Neg logit contributions | |
ILCS | -14.164 |
ushi | -13.630 |
Filipino | -13.197 |
chant | -13.188 |
Japanese | -12.816 |
Token | first |
Token ID | 717 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
Rhod | +7.962 |
� | +7.357 |
)", | +7.026 |
crop | +6.872 |
recapt | +6.422 |
Neg logit contributions | |
ILCS | -8.827 |
ushi | -8.319 |
Filipino | -8.275 |
chant | -8.143 |
endo | -8.091 |
Token | two |
Token ID | 734 |
Feature activation | -7.68e-01 |
Pos logit contributions | |
Rhod | +8.628 |
� | +7.851 |
)", | +7.435 |
crop | +7.227 |
graded | +6.841 |
Neg logit contributions | |
ILCS | -12.036 |
ushi | -11.079 |
endo | -10.917 |
Anaheim | -10.900 |
chant | -10.855 |
Token | of |
Token ID | 286 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
Rhod | +6.380 |
� | +5.882 |
)", | +5.623 |
crop | +5.360 |
graded | +4.986 |
Neg logit contributions | |
ILCS | -9.308 |
Filipino | -8.759 |
ushi | -8.714 |
chant | -8.665 |
Hiroshima | -8.615 |
Token | the |
Token ID | 262 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
Rhod | +7.441 |
� | +6.853 |
)", | +6.095 |
crop | +5.860 |
graded | +5.325 |
Neg logit contributions | |
ILCS | -12.969 |
ushi | -12.441 |
Filipino | -12.307 |
chant | -12.045 |
Japanese | -12.041 |
Token | addition |
Token ID | 3090 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
Rhod | +9.360 |
� | +8.385 |
crop | +8.007 |
)", | +7.988 |
scenery | +7.416 |
Neg logit contributions | |
ILCS | -10.013 |
chant | -9.134 |
Hiroshima | -8.842 |
endo | -8.802 |
wang | -8.766 |
Token | of |
Token ID | 286 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Rhod | +4.148 |
� | +3.806 |
)", | +3.618 |
crop | +3.610 |
recapt | +3.155 |
Neg logit contributions | |
ILCS | -5.170 |
Hiroshima | -4.840 |
Filipino | -4.789 |
Anaheim | -4.787 |
Huntington | -4.657 |
Token | Boise |
Token ID | 38830 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Rhod | +12.402 |
� | +10.954 |
crop | +10.499 |
)", | +10.288 |
graded | +9.722 |
Neg logit contributions | |
ILCS | -12.781 |
chant | -11.331 |
Japanese | -11.081 |
wang | -11.077 |
quist | -10.991 |
Token | State |
Token ID | 1812 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
Rhod | +6.379 |
� | +5.818 |
)", | +4.611 |
crop | +4.458 |
scenery | +3.800 |
Neg logit contributions | |
ILCS | -16.888 |
Hiroshima | -15.840 |
wang | -15.792 |
chant | -15.731 |
endo | -15.656 |
Token | after |
Token ID | 706 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
Rhod | +6.421 |
� | +5.924 |
crop | +5.442 |
)", | +5.359 |
graded | +4.818 |
Neg logit contributions | |
ILCS | -8.586 |
Filipino | -7.803 |
Hiroshima | -7.797 |
chant | -7.761 |
wang | -7.673 |
Token | the |
Token ID | 262 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
Rhod | +10.838 |
� | +9.850 |
)", | +9.178 |
grading | +9.043 |
crop | +8.974 |
Neg logit contributions | |
ILCS | -11.634 |
chant | -10.302 |
Japanese | -10.184 |
quist | -10.098 |
wang | -9.961 |
Token | season |
Token ID | 1622 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
Rhod | +14.301 |
� | +12.763 |
crop | +11.980 |
Cycl | +11.647 |
)", | +11.613 |
Neg logit contributions | |
ILCS | -13.164 |
chant | -12.460 |
wang | -12.368 |
Japanese | -12.050 |
eno | -11.752 |
Token | . |
Token ID | 13 |
Feature activation | -8.52e-01 |
Pos logit contributions | |
Rhod | +1.179 |
� | +1.100 |
)", | +1.046 |
crop | +1.037 |
recapt | +0.920 |
Neg logit contributions | |
ILCS | -1.345 |
Hiroshima | -1.267 |
Filipino | -1.254 |
Anaheim | -1.247 |
chant | -1.226 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
Rhod | +8.955 |
� | +7.884 |
crop | +7.474 |
)", | +7.265 |
Carbon | +6.662 |
Neg logit contributions | |
ILCS | -8.986 |
chant | -8.466 |
ushi | -8.194 |
endo | -8.169 |
wang | -8.097 |
Token |
|
Token ID | 198 |
Feature activation | -7.49e-01 |
Pos logit contributions | |
Rhod | +1.426 |
� | +1.345 |
)", | +1.298 |
crop | +1.287 |
faces | +1.119 |
Neg logit contributions | |
ILCS | -1.525 |
Hiroshima | -1.441 |
Filipino | -1.420 |
Anaheim | -1.418 |
Huntington | -1.383 |
Token | Last |
Token ID | 5956 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
Rhod | +7.047 |
� | +7.039 |
crop | +6.769 |
)", | +6.414 |
YD | +6.008 |
Neg logit contributions | |
ILCS | -8.424 |
Hiroshima | -7.984 |
Filipino | -7.861 |
Manila | -7.726 |
Anaheim | -7.722 |
Token | class |
Token ID | 1398 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
Rhod | +5.204 |
� | +4.685 |
crop | +4.573 |
)", | +4.413 |
graded | +3.936 |
Neg logit contributions | |
ILCS | -7.808 |
Hiroshima | -7.463 |
Anaheim | -7.334 |
wang | -7.271 |
Filipino | -7.229 |
Token | that |
Token ID | 326 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
Rhod | +8.733 |
� | +7.857 |
crop | +7.517 |
)", | +7.234 |
graded | +7.229 |
Neg logit contributions | |
ILCS | -11.326 |
Hiroshima | -10.664 |
Filipino | -10.445 |
endo | -10.371 |
wang | -10.356 |
Token | includes |
Token ID | 3407 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
Rhod | +7.756 |
� | +7.226 |
crop | +6.740 |
)", | +6.715 |
graded | +6.513 |
Neg logit contributions | |
ILCS | -8.365 |
Hiroshima | -7.820 |
chant | -7.715 |
Filipino | -7.582 |
endo | -7.569 |
Token | Theo |
Token ID | 43999 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
Rhod | +18.037 |
� | +16.335 |
crop | +15.701 |
)", | +15.289 |
graded | +14.791 |
Neg logit contributions | |
ILCS | -12.567 |
chant | -12.019 |
ushi | -11.652 |
endo | -11.501 |
quist | -11.494 |
Token | Howard |
Token ID | 8442 |
Feature activation | -8.30e-01 |
Pos logit contributions | |
Rhod | +7.151 |
� | +6.141 |
)", | +5.758 |
crop | +5.302 |
recapt | +4.983 |
Neg logit contributions | |
ILCS | -9.560 |
Hiroshima | -8.966 |
endo | -8.930 |
chant | -8.817 |
Japanese | -8.695 |
Token | , |
Token ID | 11 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
Rhod | +7.227 |
� | +6.878 |
crop | +6.125 |
)", | +6.015 |
recapt | +5.613 |
Neg logit contributions | |
ILCS | -9.640 |
Hiroshima | -9.358 |
Filipino | -9.056 |
chant | -8.972 |
Anaheim | -8.837 |
Token | D |
Token ID | 360 |
Feature activation | -9.30e-01 |
Pos logit contributions | |
Rhod | +18.031 |
� | +15.375 |
crop | +14.909 |
)", | +14.488 |
Miles | +14.238 |
Neg logit contributions | |
ILCS | -11.980 |
chant | -11.594 |
ushi | -11.457 |
quist | -11.400 |
endo | -11.349 |
Token | ym |
Token ID | 4948 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
Rhod | +9.965 |
� | +9.679 |
crop | +9.039 |
)", | +8.860 |
YD | +8.160 |
Neg logit contributions | |
ILCS | -8.982 |
Hiroshima | -8.610 |
Filipino | -8.270 |
Anaheim | -8.213 |
boiler | -8.096 |
Token | ond |
Token ID | 623 |
Feature activation | -7.20e-01 |
Pos logit contributions | |
Rhod | +1.828 |
� | +1.738 |
)", | +1.682 |
crop | +1.676 |
recapt | +1.510 |
Neg logit contributions | |
ILCS | -1.132 |
Hiroshima | -1.062 |
Anaheim | -1.052 |
Filipino | -1.033 |
Huntington | -0.996 |
Token | Lee |
Token ID | 5741 |
Feature activation | -6.75e-01 |
Pos logit contributions | |
Rhod | +8.143 |
� | +7.227 |
)", | +7.082 |
crop | +6.947 |
Tate | +6.098 |
Neg logit contributions | |
ILCS | -7.323 |
boiler | -6.586 |
Hiroshima | -6.567 |
Anaheim | -6.536 |
Filipino | -6.502 |
Token | , |
Token ID | 11 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
Rhod | +6.174 |
� | +5.670 |
crop | +5.275 |
)", | +5.135 |
graded | +4.412 |
Neg logit contributions | |
ILCS | -8.152 |
Hiroshima | -7.585 |
Filipino | -7.583 |
Anaheim | -7.478 |
chant | -7.456 |
Token | sorts |
Token ID | 10524 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Rhod | +7.202 |
� | +6.392 |
crop | +6.228 |
)", | +6.052 |
recapt | +5.650 |
Neg logit contributions | |
ILCS | -8.108 |
chant | -7.643 |
Filipino | -7.504 |
wang | -7.458 |
Hiroshima | -7.412 |
Token | in |
Token ID | 287 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Rhod | +10.752 |
� | +9.805 |
crop | +9.147 |
graded | +8.983 |
grading | +8.830 |
Neg logit contributions | |
ILCS | -15.301 |
Filipino | -14.301 |
Hiroshima | -13.895 |
wang | -13.776 |
ushi | -13.763 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
Rhod | +14.555 |
crop | +12.634 |
grading | +12.546 |
graded | +12.351 |
� | +12.332 |
Neg logit contributions | |
ILCS | -14.875 |
chant | -12.888 |
wang | -12.746 |
endo | -12.722 |
Japanese | -12.617 |
Token | blow |
Token ID | 6611 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
Rhod | +14.097 |
graded | +11.687 |
� | +11.588 |
grading | +11.568 |
tire | +11.422 |
Neg logit contributions | |
ILCS | -14.757 |
chant | -13.023 |
endo | -12.763 |
wang | -12.748 |
quist | -12.496 |
Token | out |
Token ID | 448 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
Rhod | +4.898 |
� | +4.463 |
crop | +4.423 |
)", | +4.232 |
recapt | +3.861 |
Neg logit contributions | |
ILCS | -5.616 |
Hiroshima | -5.126 |
Filipino | -5.122 |
Anaheim | -5.093 |
Huntington | -4.942 |
Token | victory |
Token ID | 5373 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
Rhod | +12.705 |
� | +10.437 |
grading | +10.056 |
)", | +9.947 |
crop | +9.923 |
Neg logit contributions | |
ILCS | -17.593 |
chant | -16.170 |
wang | -16.115 |
quist | -15.682 |
Filipino | -15.470 |
Token | . |
Token ID | 13 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
Rhod | +11.516 |
� | +9.715 |
recapt | +9.232 |
crop | +9.084 |
graded | +9.051 |
Neg logit contributions | |
ILCS | -18.065 |
wang | -16.703 |
Filipino | -16.352 |
chant | -16.076 |
API | -15.841 |
Token | In |
Token ID | 554 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
Rhod | +14.436 |
Tate | +11.967 |
)", | +11.827 |
� | +11.766 |
crop | +11.654 |
Neg logit contributions | |
ILCS | -14.419 |
endo | -13.663 |
chant | -13.544 |
roxy | -13.505 |
ushi | -13.499 |
Token | 2014 |
Token ID | 1946 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
Rhod | +14.884 |
crop | +13.060 |
� | +12.965 |
grading | +12.724 |
)", | +12.672 |
Neg logit contributions | |
ILCS | -14.497 |
wang | -12.478 |
Japanese | -12.438 |
Filipino | -12.165 |
endo | -11.996 |
Token | , |
Token ID | 11 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
Rhod | +8.404 |
� | +7.197 |
crop | +6.786 |
)", | +6.672 |
graded | +6.450 |
Neg logit contributions | |
ILCS | -13.235 |
Filipino | -12.155 |
wang | -12.073 |
ushi | -11.891 |
Hiroshima | -11.860 |
Token | Texas |
Token ID | 3936 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
Rhod | +13.987 |
� | +11.705 |
)", | +11.623 |
Tate | +11.525 |
graded | +11.513 |
Neg logit contributions | |
ILCS | -15.136 |
endo | -13.685 |
wang | -13.474 |
ushi | -13.430 |
Japanese | -13.164 |