Token | , |
Token ID | 11 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
BT | +0.192 |
Dollar | +0.188 |
cour | +0.182 |
FW | +0.179 |
rentals | +0.173 |
Neg logit contributions | |
idious | -0.266 |
urnal | -0.252 |
ocate | -0.252 |
onential | -0.249 |
enary | -0.247 |
Token | Nick |
Token ID | 8047 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
idious | +4.973 |
urnal | +4.682 |
ocate | +4.656 |
enary | +4.555 |
onential | +4.552 |
Neg logit contributions | |
BT | -3.693 |
Dollar | -3.534 |
cour | -3.471 |
FW | -3.449 |
rentals | -3.303 |
Token | y |
Token ID | 88 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
Dollar | +5.713 |
BT | +5.432 |
cour | +5.165 |
FW | +5.038 |
fav | +4.745 |
Neg logit contributions | |
idious | -13.086 |
ocate | -12.575 |
onential | -12.540 |
urnal | -12.317 |
enary | -12.257 |
Token | Butt |
Token ID | 36041 |
Feature activation | -5.57e+00 |
Pos logit contributions | |
Dollar | +4.209 |
BT | +4.025 |
cour | +3.653 |
fav | +3.537 |
FW | +3.523 |
Neg logit contributions | |
idious | -13.000 |
ocate | -12.378 |
urnal | -12.332 |
enary | -12.243 |
onential | -12.227 |
Token | , |
Token ID | 11 |
Feature activation | -4.88e+00 |
Pos logit contributions | |
idious | +5.372 |
urnal | +5.041 |
ocate | +5.027 |
onential | +4.968 |
enary | +4.940 |
Neg logit contributions | |
BT | -4.287 |
Dollar | -4.186 |
cour | -4.062 |
FW | -4.014 |
rentals | -3.900 |
Token | David |
Token ID | 3271 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
idious | +4.884 |
urnal | +4.600 |
ocate | +4.585 |
enary | +4.477 |
onential | +4.472 |
Neg logit contributions | |
BT | -3.646 |
Dollar | -3.476 |
cour | -3.427 |
FW | -3.392 |
rentals | -3.252 |
Token | Beckham |
Token ID | 37244 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
Dollar | +9.998 |
Stub | +8.761 |
BT | +8.582 |
cour | +7.950 |
FW | +7.926 |
Neg logit contributions | |
idious | -20.732 |
onential | -20.716 |
urnal | -20.323 |
enary | -20.176 |
ocate | -19.662 |
Token | , |
Token ID | 11 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
BT | +0.920 |
Dollar | +0.897 |
cour | +0.868 |
FW | +0.856 |
rentals | +0.826 |
Neg logit contributions | |
idious | -1.299 |
urnal | -1.232 |
ocate | -1.231 |
onential | -1.217 |
enary | -1.207 |
Token | Robbie |
Token ID | 34855 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
idious | +4.681 |
urnal | +4.411 |
ocate | +4.411 |
enary | +4.297 |
onential | +4.292 |
Neg logit contributions | |
BT | -3.402 |
Dollar | -3.243 |
cour | -3.201 |
FW | -3.157 |
rentals | -3.029 |
Token | Savage |
Token ID | 22287 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
BT | +0.613 |
Dollar | +0.595 |
cour | +0.572 |
FW | +0.562 |
fav | +0.537 |
Neg logit contributions | |
idious | -1.162 |
urnal | -1.106 |
ocate | -1.106 |
onential | -1.096 |
enary | -1.089 |
Token | , |
Token ID | 11 |
Feature activation | -4.11e+00 |
Pos logit contributions | |
idious | +3.031 |
urnal | +2.854 |
ocate | +2.851 |
onential | +2.812 |
enary | +2.805 |
Neg logit contributions | |
BT | -2.300 |
Dollar | -2.251 |
cour | -2.177 |
FW | -2.157 |
rentals | -2.087 |
Token | Cyrus |
Token ID | 34305 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
BT | +2.902 |
Dollar | +2.879 |
cour | +2.746 |
FW | +2.697 |
fav | +2.615 |
Neg logit contributions | |
idious | -6.503 |
urnal | -6.280 |
onential | -6.224 |
enary | -6.190 |
ocate | -6.125 |
Token | phot |
Token ID | 2825 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
idious | +4.230 |
ocate | +4.001 |
urnal | +3.986 |
onential | +3.925 |
enary | +3.906 |
Neg logit contributions | |
BT | -3.555 |
Dollar | -3.425 |
cour | -3.338 |
FW | -3.306 |
rentals | -3.172 |
Token | ob |
Token ID | 672 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
idious | +0.929 |
ocate | +0.863 |
urnal | +0.863 |
onential | +0.849 |
enary | +0.841 |
Neg logit contributions | |
BT | -1.174 |
Dollar | -1.152 |
cour | -1.125 |
FW | -1.114 |
rentals | -1.086 |
Token | omb |
Token ID | 2381 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
idious | +0.901 |
ocate | +0.821 |
urnal | +0.818 |
onential | +0.799 |
enary | +0.788 |
Neg logit contributions | |
BT | -1.755 |
Dollar | -1.730 |
cour | -1.690 |
FW | -1.681 |
rentals | -1.646 |
Token | ing |
Token ID | 278 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
idious | +2.011 |
urnal | +1.903 |
ocate | +1.900 |
onential | +1.880 |
enary | +1.870 |
Neg logit contributions | |
BT | -1.484 |
Dollar | -1.438 |
cour | -1.395 |
FW | -1.378 |
rentals | -1.325 |
Token | David |
Token ID | 3271 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
BT | +0.886 |
Dollar | +0.878 |
cour | +0.835 |
FW | +0.826 |
fav | +0.810 |
Neg logit contributions | |
idious | -1.194 |
urnal | -1.131 |
ocate | -1.127 |
onential | -1.118 |
enary | -1.108 |
Token | Cameron |
Token ID | 10821 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
Dollar | +10.941 |
BT | +9.741 |
Stub | +9.241 |
cour | +9.018 |
FW | +8.989 |
Neg logit contributions | |
idious | -19.703 |
onential | -19.344 |
enary | -19.205 |
urnal | -18.907 |
ocate | -18.854 |
Token | at |
Token ID | 379 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
BT | +0.953 |
Dollar | +0.940 |
cour | +0.905 |
FW | +0.889 |
fav | +0.872 |
Neg logit contributions | |
idious | -1.290 |
urnal | -1.226 |
ocate | -1.222 |
onential | -1.215 |
enary | -1.199 |
Token | Wim |
Token ID | 39999 |
Feature activation | +7.19e+00 |
Pos logit contributions | |
BT | +2.326 |
Dollar | +2.319 |
cour | +2.183 |
FW | +2.156 |
fav | +2.131 |
Neg logit contributions | |
idious | -3.194 |
urnal | -3.021 |
ocate | -3.005 |
onential | -3.000 |
enary | -2.945 |
Token | bledon |
Token ID | 49258 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
BT | +2.079 |
Dollar | +1.851 |
cour | +1.796 |
FW | +1.628 |
FB | +1.323 |
Neg logit contributions | |
idious | -10.521 |
urnal | -10.193 |
ocate | -10.131 |
onential | -10.056 |
enary | -9.863 |
Token | , |
Token ID | 11 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
BT | +1.487 |
Dollar | +1.465 |
cour | +1.419 |
FW | +1.387 |
rentals | +1.357 |
Neg logit contributions | |
idious | -2.113 |
urnal | -1.996 |
ocate | -1.981 |
onential | -1.975 |
enary | -1.944 |
Token | certain |
Token ID | 1728 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
Dollar | +2.341 |
BT | +2.339 |
cour | +2.238 |
FW | +2.200 |
fav | +2.167 |
Neg logit contributions | |
idious | -3.126 |
urnal | -2.965 |
onential | -2.947 |
ocate | -2.940 |
enary | -2.898 |
Token | guys |
Token ID | 3730 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
BT | +1.861 |
Dollar | +1.839 |
cour | +1.775 |
FW | +1.734 |
fav | +1.716 |
Neg logit contributions | |
idious | -2.781 |
urnal | -2.642 |
ocate | -2.636 |
onential | -2.635 |
enary | -2.589 |
Token | , |
Token ID | 11 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
BT | +1.170 |
Dollar | +1.147 |
cour | +1.115 |
FW | +1.090 |
fav | +1.064 |
Neg logit contributions | |
idious | -1.719 |
urnal | -1.635 |
ocate | -1.629 |
onential | -1.624 |
enary | -1.598 |
Token | � |
Token ID | 447 |
Feature activation | +2.48e+00 |
Pos logit contributions | |
Dollar | +4.364 |
BT | +4.329 |
cour | +4.179 |
FW | +4.087 |
fav | +4.044 |
Neg logit contributions | |
idious | -6.185 |
urnal | -5.923 |
onential | -5.852 |
enary | -5.800 |
ocate | -5.799 |
Token | � |
Token ID | 251 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
BT | +2.012 |
Dollar | +1.967 |
cour | +1.915 |
FW | +1.883 |
rentals | +1.835 |
Neg logit contributions | |
idious | -2.366 |
ocate | -2.236 |
urnal | -2.216 |
onential | -2.191 |
enary | -2.169 |
Token | David |
Token ID | 3271 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
BT | +1.686 |
Dollar | +1.632 |
cour | +1.607 |
FW | +1.574 |
fav | +1.516 |
Neg logit contributions | |
idious | -2.093 |
urnal | -1.992 |
ocate | -1.977 |
onential | -1.968 |
enary | -1.940 |
Token | Clarkson |
Token ID | 40524 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
Dollar | +11.425 |
BT | +10.095 |
Stub | +10.038 |
cour | +9.317 |
FW | +9.081 |
Neg logit contributions | |
idious | -19.913 |
onential | -19.489 |
urnal | -18.951 |
enary | -18.498 |
ocate | -18.247 |
Token | said |
Token ID | 531 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
idious | +2.363 |
ocate | +2.228 |
urnal | +2.218 |
onential | +2.187 |
enary | +2.180 |
Neg logit contributions | |
BT | -1.997 |
Dollar | -1.959 |
cour | -1.896 |
FW | -1.882 |
rentals | -1.820 |
Token | . |
Token ID | 13 |
Feature activation | -6.89e-01 |
Pos logit contributions | |
idious | +2.113 |
urnal | +1.995 |
ocate | +1.993 |
onential | +1.967 |
enary | +1.958 |
Neg logit contributions | |
BT | -1.568 |
Dollar | -1.532 |
cour | -1.478 |
FW | -1.465 |
rentals | -1.413 |
Token | � |
Token ID | 564 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
idious | +0.750 |
ocate | +0.713 |
urnal | +0.712 |
onential | +0.704 |
enary | +0.700 |
Neg logit contributions | |
BT | -0.464 |
Dollar | -0.452 |
cour | -0.435 |
FW | -0.430 |
rentals | -0.414 |
Token | � |
Token ID | 250 |
Feature activation | -2.63e+00 |
Pos logit contributions | |
BT | +0.289 |
Dollar | +0.283 |
cour | +0.275 |
FW | +0.272 |
rentals | +0.264 |
Neg logit contributions | |
idious | -0.324 |
ocate | -0.305 |
urnal | -0.304 |
onential | -0.300 |
enary | -0.298 |
Token | his |
Token ID | 465 |
Feature activation | -9.19e-01 |
Pos logit contributions | |
idious | +4.756 |
ocate | +4.490 |
urnal | +4.477 |
onential | +4.414 |
enary | +4.398 |
Neg logit contributions | |
BT | -3.359 |
Dollar | -3.201 |
cour | -3.142 |
FW | -3.118 |
rentals | -2.976 |
Token | highly |
Token ID | 4047 |
Feature activation | +4.47e+00 |
Pos logit contributions | |
idious | +0.914 |
urnal | +0.864 |
ocate | +0.862 |
onential | +0.853 |
enary | +0.846 |
Neg logit contributions | |
BT | -0.710 |
Dollar | -0.695 |
cour | -0.673 |
FW | -0.664 |
rentals | -0.644 |
Token | paid |
Token ID | 3432 |
Feature activation | +7.04e+00 |
Pos logit contributions | |
BT | +2.673 |
Dollar | +2.616 |
cour | +2.529 |
FW | +2.471 |
fav | +2.399 |
Neg logit contributions | |
idious | -5.140 |
urnal | -4.898 |
ocate | -4.893 |
onential | -4.885 |
enary | -4.819 |
Token | linem |
Token ID | 22774 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
Dollar | +5.153 |
BT | +4.976 |
cour | +4.847 |
rentals | +4.779 |
fav | +4.762 |
Neg logit contributions | |
idious | -6.896 |
onential | -6.641 |
urnal | -6.624 |
ocate | -6.468 |
enary | -6.452 |
Token | ates |
Token ID | 689 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
BT | +1.475 |
Dollar | +1.428 |
cour | +1.413 |
FW | +1.385 |
fav | +1.354 |
Neg logit contributions | |
idious | -1.185 |
urnal | -1.098 |
onential | -1.096 |
ocate | -1.082 |
enary | -1.064 |
Token | David |
Token ID | 3271 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
BT | +1.200 |
Dollar | +1.169 |
cour | +1.131 |
FW | +1.115 |
rentals | +1.076 |
Neg logit contributions | |
idious | -1.751 |
urnal | -1.659 |
ocate | -1.658 |
onential | -1.640 |
enary | -1.628 |
Token | De |
Token ID | 1024 |
Feature activation | +8.03e+00 |
Pos logit contributions | |
Dollar | +10.045 |
BT | +9.113 |
Stub | +8.802 |
FW | +8.507 |
cour | +8.102 |
Neg logit contributions | |
idious | -20.585 |
onential | -20.049 |
urnal | -19.811 |
enary | -19.591 |
ocate | -18.997 |
Token | Cast |
Token ID | 19248 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
BT | +4.805 |
Dollar | +4.321 |
cour | +4.259 |
FW | +4.219 |
rentals | +4.154 |
Neg logit contributions | |
idious | -9.412 |
enary | -8.869 |
ocate | -8.864 |
onential | -8.820 |
urnal | -8.798 |
Token | ro |
Token ID | 305 |
Feature activation | -6.50e-02 |
Pos logit contributions | |
BT | +1.378 |
Dollar | +1.376 |
cour | +1.327 |
FW | +1.299 |
fav | +1.269 |
Neg logit contributions | |
idious | -1.805 |
ocate | -1.685 |
urnal | -1.683 |
onential | -1.678 |
enary | -1.649 |
Token | and |
Token ID | 290 |
Feature activation | -3.76e+00 |
Pos logit contributions | |
idious | +0.064 |
ocate | +0.061 |
urnal | +0.061 |
onential | +0.060 |
enary | +0.060 |
Neg logit contributions | |
BT | -0.050 |
Dollar | -0.049 |
cour | -0.048 |
FW | -0.047 |
rentals | -0.046 |
Token | Maur |
Token ID | 18867 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
idious | +3.861 |
ocate | +3.637 |
urnal | +3.620 |
onential | +3.564 |
enary | +3.555 |
Neg logit contributions | |
BT | -2.765 |
Dollar | -2.639 |
cour | -2.573 |
FW | -2.562 |
fav | -2.436 |
Token | had |
Token ID | 550 |
Feature activation | +2.26e-01 |
Pos logit contributions | |
BT | +2.338 |
Dollar | +2.274 |
cour | +2.164 |
FW | +2.142 |
fav | +2.100 |
Neg logit contributions | |
idious | -4.222 |
ocate | -4.022 |
urnal | -4.020 |
onential | -4.005 |
enary | -3.960 |
Token | Paul |
Token ID | 3362 |
Feature activation | +7.89e+00 |
Pos logit contributions | |
BT | +0.150 |
Dollar | +0.146 |
cour | +0.141 |
FW | +0.139 |
rentals | +0.133 |
Neg logit contributions | |
idious | -0.248 |
urnal | -0.236 |
ocate | -0.236 |
onential | -0.233 |
enary | -0.232 |
Token | Sch |
Token ID | 3059 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
Dollar | +4.869 |
BT | +4.731 |
cour | +4.570 |
FW | +4.547 |
fav | +4.342 |
Neg logit contributions | |
idious | -8.536 |
urnal | -8.274 |
onential | -8.180 |
ocate | -8.110 |
enary | -7.965 |
Token | oles |
Token ID | 4316 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
idious | +1.202 |
ocate | +1.111 |
urnal | +1.108 |
onential | +1.094 |
enary | +1.075 |
Neg logit contributions | |
BT | -1.792 |
Dollar | -1.759 |
cour | -1.729 |
FW | -1.707 |
rentals | -1.665 |
Token | , |
Token ID | 11 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
idious | +1.217 |
ocate | +1.150 |
urnal | +1.149 |
onential | +1.135 |
enary | +1.129 |
Neg logit contributions | |
BT | -0.846 |
Dollar | -0.825 |
cour | -0.796 |
FW | -0.786 |
rentals | -0.757 |
Token | David |
Token ID | 3271 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
idious | +0.582 |
urnal | +0.550 |
ocate | +0.549 |
onential | +0.542 |
enary | +0.539 |
Neg logit contributions | |
BT | -0.436 |
Dollar | -0.425 |
cour | -0.412 |
FW | -0.407 |
rentals | -0.393 |
Token | Beckham |
Token ID | 37244 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
Dollar | +11.023 |
Stub | +9.641 |
BT | +9.065 |
FW | +8.581 |
cour | +8.435 |
Neg logit contributions | |
idious | -19.469 |
onential | -19.260 |
urnal | -18.677 |
enary | -18.307 |
ocate | -17.956 |
Token | and |
Token ID | 290 |
Feature activation | -6.49e+00 |
Pos logit contributions | |
BT | +1.224 |
Dollar | +1.195 |
cour | +1.156 |
FW | +1.141 |
fav | +1.103 |
Neg logit contributions | |
idious | -1.734 |
urnal | -1.647 |
ocate | -1.647 |
onential | -1.628 |
enary | -1.613 |
Token | Nick |
Token ID | 8047 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
idious | +6.507 |
ocate | +6.123 |
urnal | +6.117 |
enary | +5.919 |
onential | +5.904 |
Neg logit contributions | |
BT | -4.745 |
Dollar | -4.449 |
cour | -4.439 |
FW | -4.425 |
FB | -4.159 |
Token | y |
Token ID | 88 |
Feature activation | +6.60e+00 |
Pos logit contributions | |
Dollar | +6.399 |
BT | +6.057 |
cour | +5.717 |
FW | +5.696 |
fav | +5.455 |
Neg logit contributions | |
idious | -11.877 |
onential | -11.416 |
ocate | -11.245 |
enary | -11.017 |
urnal | -10.921 |
Token | Butt |
Token ID | 36041 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
Dollar | +3.035 |
BT | +2.922 |
cour | +2.802 |
FW | +2.624 |
fav | +2.534 |
Neg logit contributions | |
idious | -8.551 |
ocate | -8.175 |
enary | -8.152 |
onential | -8.140 |
urnal | -8.099 |
Token | as |
Token ID | 355 |
Feature activation | -9.23e+00 |
Pos logit contributions | |
idious | +5.232 |
urnal | +4.896 |
ocate | +4.879 |
onential | +4.807 |
enary | +4.798 |
Neg logit contributions | |
BT | -4.026 |
Dollar | -3.820 |
cour | -3.790 |
FW | -3.761 |
rentals | -3.609 |
Token | individuals |
Token ID | 3925 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
idious | +8.253 |
urnal | +7.680 |
ocate | +7.552 |
enary | +7.446 |
onential | +7.410 |
Neg logit contributions | |
BT | -7.477 |
cour | -7.054 |
FW | -7.044 |
Dollar | -7.034 |
FB | -6.752 |
Token | . |
Token ID | 13 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
idious | +4.419 |
urnal | +4.135 |
ocate | +4.129 |
enary | +4.087 |
onential | +4.065 |
Neg logit contributions | |
BT | -3.460 |
Dollar | -3.361 |
cour | -3.276 |
FW | -3.242 |
rentals | -3.137 |
Token |
|
Token ID | 198 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
BT | +0.222 |
Dollar | +0.217 |
cour | +0.210 |
FW | +0.207 |
rentals | +0.199 |
Neg logit contributions | |
idious | -0.305 |
urnal | -0.289 |
ocate | -0.289 |
onential | -0.285 |
enary | -0.283 |
Token |
|
Token ID | 198 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
BT | +2.917 |
Dollar | +2.807 |
cour | +2.775 |
FW | +2.699 |
fav | +2.579 |
Neg logit contributions | |
idious | -4.391 |
urnal | -4.157 |
onential | -4.143 |
ocate | -4.113 |
enary | -4.055 |
Token | David |
Token ID | 11006 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
BT | +2.868 |
FW | +2.636 |
cour | +2.565 |
Dollar | +2.547 |
FB | +2.454 |
Neg logit contributions | |
idious | -6.115 |
onential | -5.855 |
ocate | -5.846 |
urnal | -5.842 |
enary | -5.732 |
Token | : |
Token ID | 25 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
Dollar | +9.170 |
BT | +8.865 |
cour | +8.111 |
FW | +8.013 |
fav | +7.492 |
Neg logit contributions | |
idious | -20.585 |
onential | -20.022 |
urnal | -19.992 |
ocate | -19.555 |
enary | -19.106 |
Token | I |
Token ID | 314 |
Feature activation | +4.10e+00 |
Pos logit contributions | |
idious | +0.348 |
urnal | +0.330 |
ocate | +0.329 |
onential | +0.326 |
enary | +0.323 |
Neg logit contributions | |
BT | -0.231 |
Dollar | -0.224 |
cour | -0.217 |
FW | -0.214 |
rentals | -0.206 |
Token | noticed |
Token ID | 6810 |
Feature activation | +8.97e-01 |
Pos logit contributions | |
BT | +2.801 |
Dollar | +2.690 |
cour | +2.591 |
FW | +2.531 |
fav | +2.486 |
Neg logit contributions | |
idious | -4.450 |
urnal | -4.223 |
ocate | -4.195 |
onential | -4.187 |
enary | -4.128 |
Token | that |
Token ID | 326 |
Feature activation | -2.58e+00 |
Pos logit contributions | |
BT | +0.631 |
Dollar | +0.621 |
cour | +0.592 |
FW | +0.584 |
rentals | +0.566 |
Neg logit contributions | |
idious | -0.951 |
ocate | -0.905 |
urnal | -0.904 |
onential | -0.896 |
enary | -0.888 |
Token | everyone |
Token ID | 2506 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
idious | +2.635 |
urnal | +2.480 |
ocate | +2.479 |
onential | +2.446 |
enary | +2.435 |
Neg logit contributions | |
BT | -1.919 |
Dollar | -1.848 |
cour | -1.813 |
FW | -1.790 |
rentals | -1.721 |
Token | ki |
Token ID | 4106 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
idious | +4.533 |
ocate | +4.225 |
urnal | +4.194 |
onential | +4.142 |
enary | +4.071 |
Neg logit contributions | |
BT | -5.163 |
Dollar | -5.032 |
cour | -4.927 |
FW | -4.874 |
rentals | -4.742 |
Token | , |
Token ID | 11 |
Feature activation | -4.23e+00 |
Pos logit contributions | |
BT | +3.294 |
Dollar | +3.193 |
cour | +3.093 |
FW | +3.023 |
fav | +2.952 |
Neg logit contributions | |
idious | -4.629 |
ocate | -4.387 |
urnal | -4.361 |
onential | -4.348 |
enary | -4.332 |
Token | Keith |
Token ID | 14926 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
idious | +4.274 |
urnal | +4.032 |
ocate | +4.017 |
onential | +3.927 |
enary | +3.924 |
Neg logit contributions | |
BT | -3.141 |
Dollar | -3.008 |
cour | -2.957 |
FW | -2.931 |
rentals | -2.812 |
Token | Gillespie |
Token ID | 45078 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
Dollar | +5.926 |
BT | +5.923 |
cour | +5.506 |
Stub | +5.279 |
FW | +5.177 |
Neg logit contributions | |
idious | -11.407 |
ocate | -10.898 |
onential | -10.835 |
urnal | -10.546 |
enary | -10.541 |
Token | and |
Token ID | 290 |
Feature activation | -6.34e+00 |
Pos logit contributions | |
idious | +0.268 |
ocate | +0.254 |
urnal | +0.254 |
onential | +0.251 |
enary | +0.249 |
Neg logit contributions | |
BT | -0.188 |
Dollar | -0.183 |
cour | -0.177 |
FW | -0.175 |
rentals | -0.169 |
Token | David |
Token ID | 3271 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
idious | +6.367 |
urnal | +5.981 |
ocate | +5.963 |
enary | +5.825 |
onential | +5.788 |
Neg logit contributions | |
BT | -4.651 |
Dollar | -4.417 |
cour | -4.371 |
FW | -4.338 |
FB | -4.109 |
Token | Pierce |
Token ID | 23023 |
Feature activation | +5.10e+00 |
Pos logit contributions | |
Dollar | +11.067 |
Stub | +9.949 |
BT | +9.819 |
cour | +9.050 |
FW | +8.952 |
Neg logit contributions | |
idious | -18.887 |
onential | -18.766 |
urnal | -18.342 |
enary | -18.119 |
ocate | -17.697 |
Token |
|
Token ID | 198 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
BT | +3.569 |
Dollar | +3.456 |
cour | +3.373 |
FW | +3.302 |
fav | +3.243 |
Neg logit contributions | |
idious | -5.330 |
urnal | -5.067 |
onential | -5.048 |
ocate | -5.040 |
enary | -4.955 |
Token |
|
Token ID | 198 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
BT | +1.359 |
Dollar | +1.319 |
cour | +1.295 |
FW | +1.264 |
fav | +1.219 |
Neg logit contributions | |
idious | -1.869 |
urnal | -1.766 |
ocate | -1.759 |
onential | -1.754 |
enary | -1.727 |
Token | It |
Token ID | 1026 |
Feature activation | -4.73e+00 |
Pos logit contributions | |
BT | +1.037 |
Dollar | +0.982 |
cour | +0.967 |
FW | +0.960 |
FB | +0.906 |
Neg logit contributions | |
idious | -1.689 |
ocate | -1.604 |
urnal | -1.604 |
onential | -1.594 |
enary | -1.578 |
Token | has |
Token ID | 468 |
Feature activation | -5.73e+00 |
Pos logit contributions | |
idious | +4.798 |
urnal | +4.538 |
ocate | +4.513 |
enary | +4.453 |
onential | +4.422 |
Neg logit contributions | |
BT | -3.480 |
Dollar | -3.399 |
cour | -3.265 |
FW | -3.261 |
FB | -3.121 |
Token | Design |
Token ID | 8495 |
Feature activation | +8.98e+00 |
Pos logit contributions | |
idious | +1.136 |
ocate | +1.076 |
urnal | +1.074 |
onential | +1.060 |
enary | +1.053 |
Neg logit contributions | |
BT | -0.820 |
Dollar | -0.798 |
cour | -0.775 |
FW | -0.764 |
rentals | -0.734 |
Token | ated |
Token ID | 515 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
Dollar | +6.793 |
BT | +6.691 |
cour | +6.466 |
FW | +6.455 |
FB | +6.397 |
Neg logit contributions | |
idious | -8.366 |
onential | -8.001 |
urnal | -7.880 |
ocate | -7.800 |
enary | -7.672 |
Token | Players |
Token ID | 13094 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
Dollar | +5.542 |
BT | +5.269 |
FW | +4.801 |
rentals | +4.676 |
cour | +4.664 |
Neg logit contributions | |
idious | -15.719 |
ocate | -14.861 |
onential | -14.806 |
urnal | -14.698 |
enary | -14.527 |
Token | from |
Token ID | 422 |
Feature activation | +5.35e+00 |
Pos logit contributions | |
BT | +1.454 |
Dollar | +1.418 |
cour | +1.372 |
FW | +1.353 |
rentals | +1.309 |
Neg logit contributions | |
idious | -2.092 |
urnal | -1.981 |
ocate | -1.976 |
onential | -1.956 |
enary | -1.940 |
Token | the |
Token ID | 262 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
BT | +4.049 |
Dollar | +4.042 |
cour | +3.794 |
FW | +3.791 |
rentals | +3.737 |
Neg logit contributions | |
idious | -5.284 |
urnal | -5.008 |
onential | -4.952 |
ocate | -4.911 |
enary | -4.853 |
Token | David |
Token ID | 3271 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
BT | +1.567 |
Dollar | +1.549 |
FW | +1.456 |
cour | +1.455 |
rentals | +1.412 |
Neg logit contributions | |
idious | -2.382 |
urnal | -2.268 |
onential | -2.246 |
ocate | -2.242 |
enary | -2.206 |
Token | Beckham |
Token ID | 37244 |
Feature activation | +5.24e+00 |
Pos logit contributions | |
Dollar | +12.157 |
BT | +11.032 |
FW | +10.672 |
Stub | +10.654 |
cour | +10.300 |
Neg logit contributions | |
idious | -17.751 |
onential | -17.635 |
enary | -16.516 |
urnal | -16.284 |
ocate | -15.991 |
Token | buzz |
Token ID | 14713 |
Feature activation | +8.34e+00 |
Pos logit contributions | |
BT | +3.707 |
Dollar | +3.706 |
cour | +3.528 |
FW | +3.489 |
rentals | +3.397 |
Neg logit contributions | |
idious | -5.415 |
urnal | -5.157 |
ocate | -5.100 |
onential | -5.091 |
enary | -4.980 |
Token | to |
Token ID | 284 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
Dollar | +5.683 |
BT | +5.664 |
cour | +5.513 |
FW | +5.352 |
rentals | +5.113 |
Neg logit contributions | |
idious | -8.564 |
ocate | -8.156 |
onential | -8.113 |
urnal | -8.109 |
enary | -7.945 |
Token | the |
Token ID | 262 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
BT | +2.345 |
Dollar | +2.321 |
cour | +2.214 |
FW | +2.202 |
rentals | +2.149 |
Neg logit contributions | |
idious | -3.339 |
urnal | -3.154 |
onential | -3.112 |
ocate | -3.107 |
enary | -3.068 |
Token | arrival |
Token ID | 10325 |
Feature activation | -6.29e-01 |
Pos logit contributions | |
BT | +0.934 |
Dollar | +0.918 |
cour | +0.875 |
FW | +0.867 |
rentals | +0.840 |
Neg logit contributions | |
idious | -1.461 |
urnal | -1.387 |
ocate | -1.382 |
onential | -1.373 |
enary | -1.357 |
Token | on |
Token ID | 319 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
BT | +1.946 |
Dollar | +1.929 |
cour | +1.847 |
FW | +1.812 |
rentals | +1.789 |
Neg logit contributions | |
idious | -2.711 |
ocate | -2.558 |
urnal | -2.552 |
onential | -2.526 |
enary | -2.502 |
Token | Apple |
Token ID | 4196 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
idious | +0.214 |
ocate | +0.203 |
urnal | +0.203 |
onential | +0.201 |
enary | +0.200 |
Neg logit contributions | |
BT | -0.146 |
Dollar | -0.143 |
cour | -0.137 |
FW | -0.135 |
rentals | -0.131 |
Token | Music |
Token ID | 7849 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
idious | +1.914 |
ocate | +1.832 |
urnal | +1.824 |
onential | +1.813 |
enary | +1.797 |
Neg logit contributions | |
BT | -0.953 |
Dollar | -0.930 |
cour | -0.894 |
FW | -0.879 |
fav | -0.833 |
Token | . |
Token ID | 13 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
idious | +1.649 |
ocate | +1.565 |
urnal | +1.558 |
onential | +1.545 |
enary | +1.530 |
Neg logit contributions | |
BT | -1.230 |
Dollar | -1.199 |
cour | -1.164 |
FW | -1.150 |
fav | -1.103 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
idious | +1.060 |
ocate | +1.003 |
urnal | +1.002 |
onential | +0.991 |
enary | +0.983 |
Neg logit contributions | |
BT | -0.792 |
Dollar | -0.771 |
cour | -0.749 |
FW | -0.739 |
rentals | -0.718 |
Token | David |
Token ID | 11006 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
BT | +0.041 |
Dollar | +0.040 |
cour | +0.039 |
FW | +0.038 |
rentals | +0.036 |
Neg logit contributions | |
idious | -0.067 |
urnal | -0.063 |
ocate | -0.063 |
onential | -0.063 |
enary | -0.062 |
Token | Brooks |
Token ID | 17704 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
Dollar | +12.880 |
BT | +11.955 |
cour | +11.287 |
Stub | +11.177 |
FW | +11.015 |
Neg logit contributions | |
idious | -16.118 |
onential | -15.368 |
enary | -15.115 |
ocate | -15.060 |
urnal | -15.030 |
Token | writes |
Token ID | 6797 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
idious | +3.030 |
ocate | +2.878 |
urnal | +2.856 |
onential | +2.822 |
enary | +2.804 |
Neg logit contributions | |
BT | -2.036 |
Dollar | -1.964 |
cour | -1.914 |
FW | -1.900 |
rentals | -1.813 |
Token | a |
Token ID | 257 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
idious | +2.199 |
urnal | +2.086 |
ocate | +2.082 |
onential | +2.059 |
enary | +2.046 |
Neg logit contributions | |
BT | -1.398 |
Dollar | -1.355 |
cour | -1.314 |
FW | -1.294 |
rentals | -1.243 |
Token | pro |
Token ID | 386 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
idious | +1.108 |
urnal | +1.046 |
ocate | +1.043 |
onential | +1.031 |
enary | +1.024 |
Neg logit contributions | |
BT | -0.876 |
Dollar | -0.852 |
cour | -0.830 |
FW | -0.820 |
rentals | -0.792 |
Token | - |
Token ID | 12 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
BT | +0.652 |
Dollar | +0.632 |
cour | +0.608 |
FW | +0.597 |
fav | +0.571 |
Neg logit contributions | |
idious | -1.281 |
ocate | -1.220 |
urnal | -1.217 |
onential | -1.205 |
enary | -1.202 |
Token | series |
Token ID | 2168 |
Feature activation | -4.10e+00 |
Pos logit contributions | |
BT | +1.220 |
Dollar | +1.207 |
cour | +1.158 |
FW | +1.130 |
fav | +1.106 |
Neg logit contributions | |
idious | -1.811 |
ocate | -1.730 |
urnal | -1.718 |
onential | -1.704 |
enary | -1.688 |
Token | " |
Token ID | 366 |
Feature activation | -9.86e-01 |
Pos logit contributions | |
idious | +4.489 |
urnal | +4.265 |
ocate | +4.228 |
onential | +4.196 |
enary | +4.171 |
Neg logit contributions | |
BT | -2.693 |
Dollar | -2.582 |
cour | -2.519 |
FW | -2.490 |
rentals | -2.400 |
Token | Teen |
Token ID | 45639 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
idious | +1.136 |
urnal | +1.081 |
ocate | +1.081 |
onential | +1.070 |
enary | +1.063 |
Neg logit contributions | |
BT | -0.605 |
Dollar | -0.586 |
cour | -0.564 |
FW | -0.555 |
rentals | -0.532 |
Token | Titans |
Token ID | 18711 |
Feature activation | -7.34e+00 |
Pos logit contributions | |
idious | +2.071 |
urnal | +1.964 |
ocate | +1.960 |
onential | +1.938 |
enary | +1.927 |
Neg logit contributions | |
BT | -1.358 |
Dollar | -1.313 |
cour | -1.276 |
FW | -1.258 |
rentals | -1.213 |
Token | ." |
Token ID | 526 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
idious | +7.090 |
ocate | +6.766 |
urnal | +6.745 |
enary | +6.619 |
onential | +6.603 |
Neg logit contributions | |
BT | -5.475 |
Dollar | -5.144 |
FW | -5.097 |
cour | -5.050 |
rentals | -4.975 |
Token | David |
Token ID | 3271 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
idious | +2.761 |
ocate | +2.616 |
urnal | +2.614 |
onential | +2.577 |
enary | +2.566 |
Neg logit contributions | |
BT | -2.150 |
Dollar | -2.087 |
cour | -2.039 |
FW | -2.011 |
rentals | -1.964 |
Token | took |
Token ID | 1718 |
Feature activation | -4.98e+00 |
Pos logit contributions | |
Dollar | +11.061 |
BT | +10.893 |
fav | +10.156 |
cour | +9.811 |
favors | +9.685 |
Neg logit contributions | |
idious | -17.300 |
onential | -16.320 |
ocate | -16.006 |
urnal | -15.936 |
enary | -15.615 |
Token | some |
Token ID | 617 |
Feature activation | -6.83e+00 |
Pos logit contributions | |
idious | +4.828 |
urnal | +4.570 |
ocate | +4.552 |
onential | +4.493 |
enary | +4.462 |
Neg logit contributions | |
BT | -3.899 |
Dollar | -3.765 |
cour | -3.673 |
FW | -3.655 |
rentals | -3.489 |
Token | time |
Token ID | 640 |
Feature activation | -4.60e+00 |
Pos logit contributions | |
idious | +4.959 |
urnal | +4.613 |
ocate | +4.536 |
enary | +4.467 |
onential | +4.374 |
Neg logit contributions | |
BT | -6.878 |
Dollar | -6.670 |
cour | -6.555 |
FW | -6.501 |
FB | -6.324 |
Token | out |
Token ID | 503 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
idious | +4.635 |
urnal | +4.372 |
ocate | +4.340 |
enary | +4.313 |
onential | +4.278 |
Neg logit contributions | |
BT | -3.439 |
Dollar | -3.374 |
cour | -3.247 |
FW | -3.212 |
rentals | -3.093 |
Token | of |
Token ID | 286 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
BT | +1.924 |
Dollar | +1.870 |
cour | +1.835 |
FW | +1.788 |
rentals | +1.747 |
Neg logit contributions | |
idious | -2.537 |
ocate | -2.414 |
urnal | -2.408 |
onential | -2.401 |
enary | -2.347 |
Token | and |
Token ID | 290 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
idious | +5.939 |
urnal | +5.615 |
ocate | +5.596 |
enary | +5.554 |
onential | +5.481 |
Neg logit contributions | |
BT | -4.713 |
Dollar | -4.605 |
cour | -4.475 |
FW | -4.395 |
rentals | -4.285 |
Token | 30 |
Token ID | 1542 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
idious | +1.612 |
ocate | +1.525 |
urnal | +1.520 |
onential | +1.498 |
enary | +1.498 |
Neg logit contributions | |
BT | -1.191 |
Dollar | -1.155 |
cour | -1.127 |
FW | -1.112 |
rentals | -1.071 |
Token | th |
Token ID | 400 |
Feature activation | -5.34e+00 |
Pos logit contributions | |
idious | +0.472 |
ocate | +0.449 |
urnal | +0.448 |
onential | +0.443 |
enary | +0.441 |
Neg logit contributions | |
BT | -0.294 |
Dollar | -0.287 |
cour | -0.276 |
FW | -0.272 |
rentals | -0.263 |
Token | ! |
Token ID | 0 |
Feature activation | +9.30e-01 |
Pos logit contributions | |
idious | +5.170 |
ocate | +4.870 |
urnal | +4.863 |
enary | +4.811 |
onential | +4.769 |
Neg logit contributions | |
BT | -4.116 |
Dollar | -4.017 |
cour | -3.897 |
FW | -3.845 |
fav | -3.710 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -6.43e-01 |
Pos logit contributions | |
BT | +0.703 |
Dollar | +0.688 |
cour | +0.664 |
FW | +0.656 |
fav | +0.630 |
Neg logit contributions | |
idious | -0.945 |
urnal | -0.893 |
ocate | -0.889 |
onential | -0.883 |
enary | -0.874 |
Token | David |
Token ID | 11006 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
idious | +0.706 |
urnal | +0.670 |
ocate | +0.670 |
onential | +0.663 |
enary | +0.658 |
Neg logit contributions | |
BT | -0.431 |
Dollar | -0.417 |
cour | -0.404 |
FW | -0.399 |
rentals | -0.381 |
Token | Camp |
Token ID | 5425 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
Dollar | +12.676 |
BT | +11.832 |
cour | +11.216 |
Stub | +11.068 |
FW | +10.918 |
Neg logit contributions | |
idious | -15.838 |
onential | -15.085 |
enary | -14.823 |
urnal | -14.779 |
ocate | -14.753 |
Token | os |
Token ID | 418 |
Feature activation | -5.26e+00 |
Pos logit contributions | |
BT | +2.121 |
Dollar | +2.100 |
cour | +2.058 |
FW | +2.019 |
fav | +1.984 |
Neg logit contributions | |
idious | -1.914 |
urnal | -1.788 |
ocate | -1.786 |
onential | -1.785 |
enary | -1.760 |
Token |
|
Token ID | 198 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
idious | +5.504 |
ocate | +5.227 |
urnal | +5.201 |
enary | +5.132 |
onential | +5.105 |
Neg logit contributions | |
BT | -3.654 |
Dollar | -3.540 |
cour | -3.420 |
FW | -3.395 |
rentals | -3.265 |
Token |
|
Token ID | 198 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
idious | +1.954 |
ocate | +1.851 |
urnal | +1.846 |
onential | +1.821 |
enary | +1.814 |
Neg logit contributions | |
BT | -1.620 |
Dollar | -1.596 |
cour | -1.533 |
FW | -1.519 |
rentals | -1.495 |
Token | San |
Token ID | 15017 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
idious | +1.205 |
urnal | +1.144 |
ocate | +1.143 |
onential | +1.132 |
enary | +1.124 |
Neg logit contributions | |
BT | -0.752 |
Dollar | -0.727 |
cour | -0.706 |
FW | -0.695 |
rentals | -0.665 |
Token | Spider |
Token ID | 12648 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
Dollar | +1.835 |
BT | +1.834 |
cour | +1.719 |
FW | +1.699 |
rentals | +1.633 |
Neg logit contributions | |
idious | -3.204 |
urnal | -3.055 |
ocate | -3.044 |
onential | -3.027 |
enary | -2.984 |
Token | House |
Token ID | 2097 |
Feature activation | +8.69e+00 |
Pos logit contributions | |
idious | +0.545 |
ocate | +0.519 |
urnal | +0.519 |
onential | +0.513 |
enary | +0.510 |
Neg logit contributions | |
BT | -0.298 |
Dollar | -0.287 |
cour | -0.278 |
FW | -0.274 |
rentals | -0.263 |
Token | . |
Token ID | 13 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Dollar | +5.832 |
BT | +5.713 |
cour | +5.411 |
FW | +5.325 |
rentals | +5.231 |
Neg logit contributions | |
idious | -9.114 |
urnal | -8.828 |
onential | -8.690 |
ocate | -8.639 |
enary | -8.544 |
Token | � |
Token ID | 447 |
Feature activation | +3.38e+00 |
Pos logit contributions | |
idious | +0.752 |
ocate | +0.710 |
urnal | +0.710 |
onential | +0.700 |
enary | +0.696 |
Neg logit contributions | |
BT | -0.599 |
Dollar | -0.583 |
cour | -0.566 |
FW | -0.560 |
rentals | -0.542 |
Token | � |
Token ID | 251 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
BT | +3.456 |
Dollar | +3.382 |
cour | +3.309 |
FW | +3.277 |
fav | +3.201 |
Neg logit contributions | |
idious | -2.526 |
ocate | -2.335 |
urnal | -2.315 |
onential | -2.281 |
enary | -2.257 |
Token | Mary |
Token ID | 5335 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
BT | +1.707 |
Dollar | +1.681 |
cour | +1.617 |
FW | +1.597 |
rentals | +1.525 |
Neg logit contributions | |
idious | -2.347 |
urnal | -2.223 |
ocate | -2.220 |
onential | -2.211 |
enary | -2.181 |
Token | Pick |
Token ID | 12346 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
Dollar | +13.247 |
BT | +13.039 |
cour | +12.269 |
FW | +11.996 |
Stub | +11.670 |
Neg logit contributions | |
ocate | -14.450 |
onential | -14.427 |
idious | -14.360 |
urnal | -14.314 |
enary | -13.631 |
Token | ford |
Token ID | 3841 |
Feature activation | +4.49e+00 |
Pos logit contributions | |
BT | +2.774 |
Dollar | +2.719 |
cour | +2.662 |
FW | +2.594 |
rentals | +2.531 |
Neg logit contributions | |
idious | -2.949 |
urnal | -2.791 |
onential | -2.770 |
ocate | -2.760 |
enary | -2.706 |
Token | and |
Token ID | 290 |
Feature activation | -4.23e+00 |
Pos logit contributions | |
BT | +2.992 |
Dollar | +2.972 |
cour | +2.813 |
FW | +2.779 |
rentals | +2.672 |
Neg logit contributions | |
idious | -4.832 |
urnal | -4.647 |
ocate | -4.632 |
onential | -4.620 |
enary | -4.549 |
Token | her |
Token ID | 607 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
idious | +4.248 |
ocate | +3.991 |
urnal | +3.987 |
enary | +3.919 |
onential | +3.913 |
Neg logit contributions | |
BT | -3.229 |
Dollar | -3.085 |
cour | -3.023 |
FW | -3.002 |
rentals | -2.878 |
Token | husband |
Token ID | 5229 |
Feature activation | +5.50e+00 |
Pos logit contributions | |
idious | +1.198 |
urnal | +1.130 |
ocate | +1.130 |
onential | +1.116 |
enary | +1.108 |
Neg logit contributions | |
BT | -0.960 |
Dollar | -0.936 |
cour | -0.909 |
FW | -0.898 |
rentals | -0.868 |
Token | : |
Token ID | 25 |
Feature activation | +4.62e+00 |
Pos logit contributions | |
BT | +1.898 |
Dollar | +1.842 |
cour | +1.773 |
FW | +1.736 |
rentals | +1.663 |
Neg logit contributions | |
idious | -3.736 |
urnal | -3.562 |
ocate | -3.539 |
onential | -3.535 |
enary | -3.502 |
Token |
|
Token ID | 198 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
BT | +3.326 |
Dollar | +3.255 |
cour | +3.127 |
FW | +3.081 |
fav | +2.978 |
Neg logit contributions | |
idious | -4.772 |
urnal | -4.528 |
onential | -4.497 |
ocate | -4.477 |
enary | -4.412 |
Token |
|
Token ID | 198 |
Feature activation | +4.12e+00 |
Pos logit contributions | |
BT | +2.231 |
Dollar | +2.146 |
cour | +2.117 |
FW | +2.062 |
fav | +1.972 |
Neg logit contributions | |
idious | -3.245 |
urnal | -3.066 |
onential | -3.046 |
ocate | -3.035 |
enary | -2.990 |
Token | |
Token ID | 9525 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
BT | +2.998 |
cour | +2.802 |
Dollar | +2.783 |
FW | +2.776 |
FB | +2.638 |
Neg logit contributions | |
idious | -4.311 |
urnal | -4.099 |
ocate | -4.079 |
onential | -4.079 |
enary | -4.020 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -8.88e-01 |
Pos logit contributions | |
BT | +1.904 |
Dollar | +1.826 |
cour | +1.786 |
FW | +1.759 |
FB | +1.666 |
Neg logit contributions | |
idious | -2.854 |
urnal | -2.720 |
ocate | -2.701 |
onential | -2.686 |
enary | -2.650 |
Token | David |
Token ID | 11006 |
Feature activation | +1.81e+01 |
Pos logit contributions | |
idious | +0.975 |
urnal | +0.926 |
ocate | +0.925 |
onential | +0.915 |
enary | +0.909 |
Neg logit contributions | |
BT | -0.595 |
Dollar | -0.577 |
cour | -0.558 |
FW | -0.550 |
rentals | -0.527 |
Token | Cameron |
Token ID | 10821 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
Dollar | +12.630 |
BT | +11.781 |
cour | +11.205 |
Stub | +11.002 |
FW | +10.884 |
Neg logit contributions | |
idious | -15.628 |
onential | -14.924 |
urnal | -14.627 |
enary | -14.619 |
ocate | -14.607 |
Token | � |
Token ID | 447 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
idious | +0.412 |
ocate | +0.391 |
urnal | +0.391 |
onential | +0.386 |
enary | +0.384 |
Neg logit contributions | |
BT | -0.268 |
Dollar | -0.260 |
cour | -0.252 |
FW | -0.249 |
rentals | -0.239 |
Token | � |
Token ID | 247 |
Feature activation | +2.94e+00 |
Pos logit contributions | |
BT | +1.138 |
Dollar | +1.116 |
cour | +1.083 |
FW | +1.061 |
fav | +1.025 |
Neg logit contributions | |
idious | -1.717 |
ocate | -1.627 |
urnal | -1.623 |
onential | -1.602 |
enary | -1.583 |
Token | s |
Token ID | 82 |
Feature activation | -5.88e+00 |
Pos logit contributions | |
BT | +2.088 |
Dollar | +2.026 |
cour | +1.963 |
FW | +1.917 |
fav | +1.885 |
Neg logit contributions | |
idious | -3.103 |
urnal | -2.944 |
ocate | -2.934 |
onential | -2.920 |
enary | -2.875 |
Token | plans |
Token ID | 3352 |
Feature activation | +6.47e+00 |
Pos logit contributions | |
idious | +6.098 |
urnal | +5.763 |
ocate | +5.750 |
enary | +5.658 |
onential | +5.656 |
Neg logit contributions | |
BT | -4.131 |
Dollar | -3.922 |
FW | -3.909 |
cour | -3.869 |
rentals | -3.666 |
Token | former |
Token ID | 1966 |
Feature activation | +9.92e-01 |
Pos logit contributions | |
BT | +3.607 |
Dollar | +3.599 |
cour | +3.363 |
FW | +3.324 |
fav | +3.320 |
Neg logit contributions | |
idious | -5.218 |
urnal | -5.001 |
ocate | -4.919 |
onential | -4.914 |
enary | -4.909 |
Token | Ku |
Token ID | 12554 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
BT | +0.761 |
Dollar | +0.748 |
cour | +0.716 |
FW | +0.710 |
rentals | +0.691 |
Neg logit contributions | |
idious | -0.994 |
urnal | -0.938 |
ocate | -0.935 |
onential | -0.928 |
enary | -0.921 |
Token | Klux |
Token ID | 45092 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
BT | +2.611 |
Dollar | +2.571 |
cour | +2.442 |
FW | +2.432 |
fav | +2.341 |
Neg logit contributions | |
idious | -3.158 |
urnal | -2.961 |
ocate | -2.948 |
onential | -2.941 |
enary | -2.913 |
Token | Klan |
Token ID | 31151 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
idious | +3.078 |
ocate | +2.918 |
urnal | +2.893 |
onential | +2.823 |
enary | +2.813 |
Neg logit contributions | |
BT | -2.888 |
Dollar | -2.802 |
cour | -2.770 |
FW | -2.736 |
rentals | -2.647 |
Token | leader |
Token ID | 3554 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
idious | +3.770 |
ocate | +3.586 |
urnal | +3.530 |
enary | +3.459 |
onential | +3.427 |
Neg logit contributions | |
BT | -3.909 |
Dollar | -3.753 |
cour | -3.713 |
FW | -3.707 |
fav | -3.545 |
Token | David |
Token ID | 3271 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
idious | +3.188 |
ocate | +3.003 |
urnal | +2.962 |
enary | +2.899 |
onential | +2.881 |
Neg logit contributions | |
BT | -2.729 |
Dollar | -2.596 |
cour | -2.579 |
FW | -2.571 |
fav | -2.473 |
Token | Duke |
Token ID | 11083 |
Feature activation | +3.14e-01 |
Pos logit contributions | |
Dollar | +3.582 |
BT | +1.770 |
Stub | +1.675 |
Bridge | +1.323 |
dollars | +1.315 |
Neg logit contributions | |
onential | -25.667 |
idious | -25.400 |
enary | -25.229 |
urnal | -24.510 |
chnology | -24.391 |
Token | . |
Token ID | 13 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
BT | +0.227 |
Dollar | +0.222 |
cour | +0.214 |
FW | +0.211 |
rentals | +0.203 |
Neg logit contributions | |
idious | -0.328 |
urnal | -0.311 |
ocate | -0.310 |
onential | -0.308 |
enary | -0.305 |
Token | ( |
Token ID | 357 |
Feature activation | +3.33e+00 |
Pos logit contributions | |
idious | +0.116 |
urnal | +0.109 |
ocate | +0.109 |
onential | +0.108 |
enary | +0.107 |
Neg logit contributions | |
BT | -0.088 |
Dollar | -0.086 |
cour | -0.084 |
FW | -0.083 |
rentals | -0.080 |
Token | Joe |
Token ID | 19585 |
Feature activation | +9.84e+00 |
Pos logit contributions | |
BT | +2.506 |
Dollar | +2.403 |
cour | +2.376 |
FW | +2.305 |
FB | +2.210 |
Neg logit contributions | |
idious | -3.410 |
urnal | -3.229 |
ocate | -3.219 |
onential | -3.199 |
enary | -3.142 |
Token | Bur |
Token ID | 5481 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
BT | +4.589 |
Dollar | +4.585 |
cour | +4.265 |
FW | +4.060 |
Stub | +4.021 |
Neg logit contributions | |
idious | -12.203 |
ocate | -11.672 |
onential | -11.548 |
enary | -11.536 |
urnal | -11.419 |
Token |
|
Token ID | 198 |
Feature activation | +3.09e+00 |
Pos logit contributions | |
BT | +1.755 |
Dollar | +1.703 |
cour | +1.666 |
FW | +1.627 |
fav | +1.569 |
Neg logit contributions | |
idious | -2.475 |
urnal | -2.338 |
onential | -2.322 |
ocate | -2.320 |
enary | -2.282 |
Token | Sleep |
Token ID | 40555 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
BT | +2.022 |
Dollar | +1.880 |
cour | +1.871 |
FW | +1.857 |
FB | +1.772 |
Neg logit contributions | |
idious | -3.488 |
urnal | -3.334 |
ocate | -3.324 |
onential | -3.287 |
enary | -3.261 |
Token | ers |
Token ID | 364 |
Feature activation | +6.50e-01 |
Pos logit contributions | |
BT | +2.540 |
Dollar | +2.491 |
cour | +2.402 |
FW | +2.346 |
rentals | +2.283 |
Neg logit contributions | |
idious | -4.048 |
urnal | -3.842 |
ocate | -3.834 |
onential | -3.797 |
enary | -3.778 |
Token |
|
Token ID | 198 |
Feature activation | +6.37e+00 |
Pos logit contributions | |
BT | +0.455 |
Dollar | +0.443 |
cour | +0.429 |
FW | +0.422 |
rentals | +0.405 |
Neg logit contributions | |
idious | -0.693 |
ocate | -0.657 |
urnal | -0.655 |
onential | -0.647 |
enary | -0.643 |
Token |
|
Token ID | 198 |
Feature activation | +6.20e+00 |
Pos logit contributions | |
BT | +4.217 |
Dollar | +4.044 |
cour | +4.024 |
FW | +3.854 |
FB | +3.710 |
Neg logit contributions | |
idious | -7.027 |
urnal | -6.660 |
onential | -6.646 |
ocate | -6.563 |
enary | -6.461 |
Token | Jay |
Token ID | 30568 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
BT | +4.044 |
cour | +3.712 |
FW | +3.701 |
Dollar | +3.630 |
FB | +3.584 |
Neg logit contributions | |
idious | -6.971 |
urnal | -6.671 |
ocate | -6.646 |
onential | -6.579 |
enary | -6.524 |
Token | Cutler |
Token ID | 37194 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
BT | +5.740 |
Dollar | +5.625 |
FW | +5.129 |
cour | +5.086 |
fav | +4.896 |
Neg logit contributions | |
idious | -22.422 |
urnal | -21.795 |
onential | -21.570 |
ocate | -21.378 |
elfth | -21.284 |
Token | ( |
Token ID | 357 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
BT | +2.496 |
Dollar | +2.427 |
cour | +2.334 |
FW | +2.301 |
fav | +2.236 |
Neg logit contributions | |
idious | -3.893 |
urnal | -3.728 |
ocate | -3.715 |
onential | -3.690 |
enary | -3.645 |
Token | at |
Token ID | 265 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
BT | +0.637 |
Dollar | +0.610 |
cour | +0.600 |
FW | +0.592 |
FB | +0.564 |
Neg logit contributions | |
idious | -0.933 |
urnal | -0.891 |
ocate | -0.888 |
onential | -0.877 |
enary | -0.871 |
Token | MIN |
Token ID | 20625 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
idious | +0.478 |
urnal | +0.456 |
ocate | +0.455 |
onential | +0.450 |
enary | +0.448 |
Neg logit contributions | |
BT | -0.262 |
Dollar | -0.254 |
cour | -0.245 |
FW | -0.241 |
rentals | -0.231 |
Token | ): |
Token ID | 2599 |
Feature activation | +4.78e+00 |
Pos logit contributions | |
BT | +1.210 |
Dollar | +1.169 |
cour | +1.130 |
FW | +1.116 |
rentals | +1.064 |
Neg logit contributions | |
idious | -2.127 |
urnal | -2.031 |
ocate | -2.024 |
onential | -2.000 |
enary | -1.987 |
Token | , |
Token ID | 11 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
idious | +0.450 |
ocate | +0.426 |
urnal | +0.426 |
onential | +0.421 |
enary | +0.418 |
Neg logit contributions | |
BT | -0.290 |
Dollar | -0.282 |
cour | -0.272 |
FW | -0.269 |
rentals | -0.258 |
Token | if |
Token ID | 611 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
BT | +2.421 |
Dollar | +2.395 |
cour | +2.289 |
FW | +2.241 |
fav | +2.190 |
Neg logit contributions | |
idious | -3.580 |
urnal | -3.404 |
ocate | -3.388 |
onential | -3.355 |
enary | -3.332 |
Token | you |
Token ID | 345 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
BT | +0.892 |
Dollar | +0.876 |
cour | +0.853 |
FW | +0.841 |
fav | +0.821 |
Neg logit contributions | |
idious | -0.902 |
urnal | -0.846 |
ocate | -0.844 |
onential | -0.835 |
enary | -0.831 |
Token | will |
Token ID | 481 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
BT | +0.897 |
Dollar | +0.871 |
cour | +0.841 |
FW | +0.829 |
fav | +0.798 |
Neg logit contributions | |
idious | -1.446 |
urnal | -1.373 |
ocate | -1.372 |
onential | -1.358 |
enary | -1.348 |
Token | , |
Token ID | 11 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
BT | +0.411 |
Dollar | +0.400 |
cour | +0.388 |
FW | +0.383 |
rentals | +0.370 |
Neg logit contributions | |
idious | -0.566 |
urnal | -0.536 |
ocate | -0.536 |
onential | -0.530 |
enary | -0.525 |
Token | David |
Token ID | 3271 |
Feature activation | +1.78e+01 |
Pos logit contributions | |
BT | +0.751 |
Dollar | +0.731 |
cour | +0.706 |
FW | +0.694 |
fav | +0.671 |
Neg logit contributions | |
idious | -1.163 |
urnal | -1.105 |
ocate | -1.104 |
onential | -1.092 |
enary | -1.085 |
Token | Wise |
Token ID | 28908 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
Dollar | +10.405 |
BT | +9.825 |
FW | +9.331 |
cour | +9.310 |
fav | +9.153 |
Neg logit contributions | |
idious | -16.658 |
onential | -16.559 |
urnal | -16.370 |
ocate | -16.214 |
enary | -15.608 |
Token | � |
Token ID | 447 |
Feature activation | +7.16e-01 |
Pos logit contributions | |
BT | +0.136 |
Dollar | +0.133 |
cour | +0.129 |
FW | +0.127 |
rentals | +0.123 |
Neg logit contributions | |
idious | -0.169 |
urnal | -0.159 |
ocate | -0.159 |
onential | -0.157 |
enary | -0.156 |
Token | � |
Token ID | 247 |
Feature activation | +6.33e+00 |
Pos logit contributions | |
BT | +0.641 |
Dollar | +0.629 |
cour | +0.614 |
FW | +0.604 |
rentals | +0.588 |
Neg logit contributions | |
idious | -0.625 |
ocate | -0.586 |
urnal | -0.584 |
onential | -0.576 |
enary | -0.569 |
Token | s |
Token ID | 82 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
BT | +2.422 |
Dollar | +2.325 |
cour | +2.248 |
FW | +2.125 |
fav | +2.088 |
Neg logit contributions | |
idious | -8.507 |
urnal | -8.213 |
onential | -8.162 |
ocate | -8.135 |
enary | -8.004 |
Token | � |
Token ID | 564 |
Feature activation | -4.56e+00 |
Pos logit contributions | |
idious | +3.352 |
ocate | +3.157 |
urnal | +3.152 |
enary | +3.113 |
onential | +3.111 |
Neg logit contributions | |
BT | -2.313 |
Dollar | -2.214 |
cour | -2.172 |
FW | -2.155 |
rentals | -2.050 |
Token | in |
Token ID | 287 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
idious | +5.688 |
ocate | +5.311 |
urnal | +5.277 |
onential | +5.205 |
enary | +5.198 |
Neg logit contributions | |
BT | -4.338 |
Dollar | -4.205 |
FW | -4.102 |
cour | -4.088 |
rentals | -3.897 |
Token | the |
Token ID | 262 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
idious | +2.138 |
urnal | +2.017 |
ocate | +2.017 |
onential | +1.992 |
enary | +1.978 |
Neg logit contributions | |
BT | -1.663 |
Dollar | -1.622 |
cour | -1.574 |
FW | -1.557 |
rentals | -1.502 |
Token | Conservative |
Token ID | 11132 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
idious | +1.979 |
ocate | +1.876 |
urnal | +1.874 |
onential | +1.851 |
enary | +1.843 |
Neg logit contributions | |
BT | -1.293 |
Dollar | -1.255 |
cour | -1.222 |
FW | -1.207 |
rentals | -1.154 |
Token | party |
Token ID | 2151 |
Feature activation | -3.81e+00 |
Pos logit contributions | |
idious | +2.571 |
urnal | +2.443 |
ocate | +2.441 |
onential | +2.408 |
enary | +2.396 |
Neg logit contributions | |
BT | -1.685 |
Dollar | -1.634 |
cour | -1.589 |
FW | -1.572 |
rentals | -1.502 |
Token | . |
Token ID | 13 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
idious | +3.849 |
ocate | +3.629 |
urnal | +3.624 |
onential | +3.565 |
enary | +3.549 |
Neg logit contributions | |
BT | -2.850 |
Dollar | -2.754 |
cour | -2.695 |
FW | -2.674 |
rentals | -2.564 |
Token | David |
Token ID | 3271 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
BT | +1.023 |
Dollar | +1.001 |
cour | +0.961 |
FW | +0.946 |
fav | +0.916 |
Neg logit contributions | |
idious | -1.442 |
urnal | -1.367 |
ocate | -1.361 |
onential | -1.347 |
enary | -1.335 |
Token | Cameron |
Token ID | 10821 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
Dollar | +6.981 |
BT | +6.536 |
Stub | +5.629 |
fav | +5.566 |
FW | +5.226 |
Neg logit contributions | |
idious | -20.903 |
onential | -20.125 |
enary | -20.121 |
urnal | -19.862 |
ocate | -19.801 |
Token | believes |
Token ID | 5804 |
Feature activation | +5.32e+00 |
Pos logit contributions | |
BT | +1.158 |
Dollar | +1.132 |
cour | +1.086 |
FW | +1.063 |
fav | +1.053 |
Neg logit contributions | |
idious | -1.775 |
urnal | -1.692 |
ocate | -1.685 |
onential | -1.677 |
enary | -1.658 |
Token | there |
Token ID | 612 |
Feature activation | -9.83e+00 |
Pos logit contributions | |
BT | +3.694 |
Dollar | +3.677 |
cour | +3.461 |
fav | +3.434 |
rentals | +3.390 |
Neg logit contributions | |
idious | -5.499 |
urnal | -5.341 |
ocate | -5.263 |
onential | -5.242 |
enary | -5.173 |
Token | is |
Token ID | 318 |
Feature activation | -7.11e+00 |
Pos logit contributions | |
idious | +9.108 |
ocate | +8.617 |
enary | +8.436 |
onential | +8.385 |
urnal | +8.323 |
Neg logit contributions | |
BT | -7.350 |
Dollar | -7.201 |
cour | -7.066 |
FW | -6.978 |
FB | -6.731 |
Token | significant |
Token ID | 2383 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
idious | +6.773 |
ocate | +6.239 |
enary | +6.156 |
onential | +6.146 |
urnal | +6.112 |
Neg logit contributions | |
BT | -5.625 |
Dollar | -5.367 |
FW | -5.319 |
cour | -5.315 |
FB | -5.093 |
Token | pool |
Token ID | 5933 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
BT | +2.813 |
Dollar | +2.777 |
cour | +2.634 |
FW | +2.596 |
fav | +2.551 |
Neg logit contributions | |
idious | -3.918 |
ocate | -3.740 |
urnal | -3.736 |
onential | -3.698 |
enary | -3.675 |
Token | together |
Token ID | 1978 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
BT | +0.807 |
Dollar | +0.789 |
cour | +0.762 |
FW | +0.752 |
rentals | +0.728 |
Neg logit contributions | |
idious | -1.139 |
urnal | -1.086 |
ocate | -1.081 |
onential | -1.073 |
enary | -1.063 |
Token | ? |
Token ID | 30 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
BT | +2.582 |
Dollar | +2.514 |
cour | +2.434 |
FW | +2.372 |
fav | +2.292 |
Neg logit contributions | |
idious | -4.677 |
ocate | -4.492 |
urnal | -4.487 |
onential | -4.464 |
enary | -4.413 |
Token |
|
Token ID | 198 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
BT | +2.007 |
Dollar | +1.957 |
cour | +1.884 |
FW | +1.860 |
fav | +1.780 |
Neg logit contributions | |
idious | -2.781 |
urnal | -2.636 |
ocate | -2.625 |
onential | -2.607 |
enary | -2.572 |
Token |
|
Token ID | 198 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
BT | +1.213 |
Dollar | +1.178 |
cour | +1.152 |
FW | +1.128 |
fav | +1.085 |
Neg logit contributions | |
idious | -1.658 |
urnal | -1.568 |
ocate | -1.559 |
onential | -1.555 |
enary | -1.533 |
Token | Mike |
Token ID | 16073 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
BT | +1.687 |
Dollar | +1.614 |
cour | +1.599 |
FW | +1.578 |
FB | +1.492 |
Neg logit contributions | |
idious | -2.373 |
urnal | -2.253 |
ocate | -2.239 |
onential | -2.232 |
enary | -2.201 |
Token | Don |
Token ID | 2094 |
Feature activation | +8.81e+00 |
Pos logit contributions | |
Dollar | +6.370 |
cour | +5.159 |
BT | +4.996 |
FW | +4.907 |
Stub | +4.573 |
Neg logit contributions | |
idious | -22.778 |
urnal | -22.656 |
onential | -22.079 |
chnology | -21.120 |
enary | -21.043 |
Token | ais |
Token ID | 15152 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
cour | +5.448 |
BT | +5.398 |
Dollar | +5.122 |
FW | +4.891 |
fav | +4.692 |
Neg logit contributions | |
idious | -9.381 |
onential | -8.996 |
urnal | -8.919 |
ocate | -8.870 |
enary | -8.771 |
Token | : |
Token ID | 25 |
Feature activation | +3.58e-02 |
Pos logit contributions | |
BT | +1.218 |
Dollar | +1.172 |
cour | +1.122 |
FW | +1.087 |
fav | +1.023 |
Neg logit contributions | |
idious | -3.299 |
urnal | -3.158 |
ocate | -3.146 |
onential | -3.134 |
enary | -3.104 |
Token | I |
Token ID | 314 |
Feature activation | +4.76e+00 |
Pos logit contributions | |
BT | +0.026 |
Dollar | +0.025 |
cour | +0.025 |
FW | +0.024 |
rentals | +0.023 |
Neg logit contributions | |
idious | -0.037 |
ocate | -0.035 |
urnal | -0.035 |
onential | -0.035 |
enary | -0.034 |
Token | was |
Token ID | 373 |
Feature activation | -7.50e-02 |
Pos logit contributions | |
BT | +3.310 |
Dollar | +3.195 |
cour | +3.083 |
FW | +3.003 |
fav | +2.970 |
Neg logit contributions | |
idious | -5.101 |
urnal | -4.811 |
onential | -4.783 |
ocate | -4.772 |
enary | -4.705 |
Token | Craig |
Token ID | 13854 |
Feature activation | +8.40e+00 |
Pos logit contributions | |
BT | +3.091 |
Dollar | +3.084 |
cour | +2.938 |
FW | +2.877 |
rentals | +2.855 |
Neg logit contributions | |
idious | -4.344 |
urnal | -4.162 |
ocate | -4.144 |
onential | -4.139 |
enary | -4.089 |
Token | Kim |
Token ID | 6502 |
Feature activation | +9.06e+00 |
Pos logit contributions | |
Dollar | +4.227 |
BT | +3.929 |
cour | +3.526 |
FW | +3.523 |
rentals | +3.496 |
Neg logit contributions | |
idious | -10.359 |
urnal | -9.948 |
onential | -9.834 |
ocate | -9.777 |
enary | -9.752 |
Token | b |
Token ID | 65 |
Feature activation | +4.60e+00 |
Pos logit contributions | |
BT | +2.686 |
Dollar | +2.561 |
cour | +2.519 |
FW | +2.362 |
fav | +2.064 |
Neg logit contributions | |
ocate | -12.809 |
idious | -12.612 |
urnal | -12.256 |
onential | -12.199 |
enary | -12.175 |
Token | rel |
Token ID | 2411 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
Dollar | +3.635 |
BT | +3.630 |
cour | +3.498 |
FW | +3.359 |
rentals | +3.332 |
Neg logit contributions | |
idious | -4.295 |
onential | -4.115 |
urnal | -4.111 |
ocate | -4.050 |
enary | -4.024 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
BT | +2.576 |
Dollar | +2.491 |
cour | +2.431 |
FW | +2.389 |
rentals | +2.314 |
Neg logit contributions | |
idious | -3.886 |
urnal | -3.720 |
ocate | -3.698 |
onential | -3.678 |
enary | -3.620 |
Token | Kim |
Token ID | 6502 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
BT | +1.334 |
Dollar | +1.311 |
cour | +1.252 |
FW | +1.239 |
fav | +1.184 |
Neg logit contributions | |
idious | -1.953 |
urnal | -1.856 |
ocate | -1.844 |
onential | -1.829 |
enary | -1.811 |
Token | b |
Token ID | 65 |
Feature activation | +8.55e+00 |
Pos logit contributions | |
BT | +6.958 |
cour | +6.547 |
Dollar | +5.989 |
FB | +5.487 |
FW | +5.391 |
Neg logit contributions | |
idious | -20.840 |
urnal | -20.290 |
ocate | -20.245 |
onential | -20.132 |
enary | -19.862 |
Token | rel |
Token ID | 2411 |
Feature activation | +9.22e+00 |
Pos logit contributions | |
BT | +6.649 |
cour | +6.424 |
FW | +6.255 |
Dollar | +6.191 |
FB | +5.903 |
Neg logit contributions | |
idious | -7.959 |
onential | -7.638 |
ocate | -7.500 |
urnal | -7.462 |
enary | -7.342 |
Token | is |
Token ID | 318 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
BT | +5.858 |
Dollar | +5.611 |
cour | +5.483 |
FW | +5.385 |
fav | +5.244 |
Neg logit contributions | |
idious | -9.961 |
urnal | -9.547 |
onential | -9.459 |
ocate | -9.332 |
enary | -9.227 |
Token | awesome |
Token ID | 7427 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
BT | +3.557 |
Dollar | +3.526 |
cour | +3.370 |
FW | +3.346 |
rentals | +3.286 |
Neg logit contributions | |
idious | -4.640 |
urnal | -4.429 |
onential | -4.402 |
ocate | -4.387 |
enary | -4.328 |
Token | . |
Token ID | 13 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
idious | +2.977 |
ocate | +2.805 |
urnal | +2.799 |
onential | +2.766 |
enary | +2.759 |
Neg logit contributions | |
BT | -2.112 |
Dollar | -2.061 |
cour | -1.993 |
FW | -1.959 |
rentals | -1.891 |
Token | They |
Token ID | 1119 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
idious | +0.033 |
ocate | +0.032 |
urnal | +0.032 |
onential | +0.031 |
enary | +0.031 |
Neg logit contributions | |
BT | -0.026 |
Dollar | -0.025 |
cour | -0.024 |
FW | -0.024 |
rentals | -0.023 |
Token | also |
Token ID | 635 |
Feature activation | +5.95e+00 |
Pos logit contributions | |
BT | +2.965 |
Dollar | +2.858 |
cour | +2.752 |
FW | +2.679 |
rentals | +2.614 |
Neg logit contributions | |
idious | -5.611 |
urnal | -5.365 |
onential | -5.312 |
ocate | -5.265 |
enary | -5.220 |
Token | could |
Token ID | 714 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
BT | +3.510 |
Dollar | +3.403 |
cour | +3.242 |
FW | +3.155 |
rentals | +3.124 |
Neg logit contributions | |
idious | -6.906 |
urnal | -6.632 |
onential | -6.575 |
ocate | -6.512 |
enary | -6.441 |
Token | rest |
Token ID | 1334 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
idious | +1.234 |
ocate | +1.176 |
urnal | +1.165 |
onential | +1.153 |
enary | +1.149 |
Neg logit contributions | |
BT | -0.844 |
Dollar | -0.820 |
cour | -0.799 |
FW | -0.786 |
fav | -0.753 |
Token | ructure |
Token ID | 5620 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
idious | +2.251 |
ocate | +2.108 |
urnal | +2.071 |
enary | +2.019 |
onential | +2.002 |
Neg logit contributions | |
BT | -3.875 |
Dollar | -3.796 |
cour | -3.724 |
FW | -3.683 |
fav | -3.610 |
Token | Mike |
Token ID | 4995 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
idious | +0.864 |
ocate | +0.818 |
urnal | +0.816 |
onential | +0.808 |
enary | +0.803 |
Neg logit contributions | |
BT | -0.599 |
Dollar | -0.578 |
cour | -0.563 |
FW | -0.555 |
fav | -0.532 |
Token | P |
Token ID | 350 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
Dollar | +9.411 |
BT | +9.086 |
cour | +8.246 |
FW | +8.141 |
Stub | +7.982 |
Neg logit contributions | |
idious | -19.699 |
onential | -18.720 |
ocate | -18.596 |
enary | -18.416 |
elfth | -17.974 |
Token | ounce |
Token ID | 8652 |
Feature activation | +4.77e+00 |
Pos logit contributions | |
BT | +4.402 |
cour | +4.200 |
Dollar | +4.175 |
FW | +4.077 |
rentals | +3.978 |
Neg logit contributions | |
idious | -4.336 |
urnal | -4.082 |
onential | -4.022 |
ocate | -3.912 |
enary | -3.884 |
Token | y |
Token ID | 88 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
BT | +2.327 |
Dollar | +2.249 |
cour | +2.161 |
FW | +2.035 |
rentals | +1.984 |
Neg logit contributions | |
idious | -6.068 |
ocate | -5.880 |
onential | -5.835 |
enary | -5.749 |
urnal | -5.712 |
Token | ($ |
Token ID | 7198 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
BT | +0.833 |
Dollar | +0.811 |
cour | +0.780 |
FW | +0.770 |
rentals | +0.741 |
Neg logit contributions | |
idious | -1.375 |
urnal | -1.309 |
ocate | -1.301 |
onential | -1.293 |
enary | -1.280 |
Token | 8 |
Token ID | 23 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
BT | +1.922 |
Dollar | +1.847 |
cour | +1.829 |
FW | +1.801 |
FB | +1.735 |
Neg logit contributions | |
idious | -2.065 |
urnal | -1.951 |
ocate | -1.922 |
onential | -1.914 |
enary | -1.890 |
Token | o |
Token ID | 78 |
Feature activation | -4.64e-01 |
Pos logit contributions | |
idious | +3.410 |
urnal | +3.248 |
ocate | +3.234 |
onential | +3.207 |
enary | +3.194 |
Neg logit contributions | |
BT | -2.384 |
Dollar | -2.298 |
FW | -2.217 |
cour | -2.212 |
rentals | -2.137 |
Token | Tre |
Token ID | 4700 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
idious | +0.527 |
urnal | +0.501 |
ocate | +0.501 |
onential | +0.496 |
enary | +0.493 |
Neg logit contributions | |
BT | -0.292 |
Dollar | -0.283 |
cour | -0.273 |
FW | -0.268 |
rentals | -0.257 |
Token | u |
Token ID | 84 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
BT | +2.471 |
Dollar | +2.421 |
cour | +2.395 |
FW | +2.285 |
fav | +2.206 |
Neg logit contributions | |
idious | -3.762 |
ocate | -3.554 |
urnal | -3.536 |
onential | -3.527 |
enary | -3.494 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
BT | +1.315 |
Dollar | +1.289 |
cour | +1.258 |
FW | +1.227 |
fav | +1.185 |
Neg logit contributions | |
idious | -1.581 |
ocate | -1.484 |
onential | -1.480 |
urnal | -1.479 |
enary | -1.458 |
Token | an |
Token ID | 281 |
Feature activation | -9.54e+00 |
Pos logit contributions | |
idious | +8.367 |
ocate | +7.819 |
urnal | +7.799 |
enary | +7.676 |
onential | +7.586 |
Neg logit contributions | |
BT | -9.359 |
Dollar | -9.006 |
cour | -8.846 |
FW | -8.832 |
rentals | -8.606 |
Token | astroph |
Token ID | 48782 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
idious | +6.706 |
urnal | +6.251 |
ocate | +6.198 |
onential | +6.043 |
enary | +5.981 |
Neg logit contributions | |
BT | -9.745 |
Dollar | -9.479 |
cour | -9.164 |
FW | -9.152 |
rentals | -8.952 |
Token | ys |
Token ID | 893 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
idious | +11.585 |
ocate | +11.185 |
urnal | +11.133 |
onential | +10.713 |
enary | +10.362 |
Neg logit contributions | |
BT | -20.657 |
Dollar | -20.382 |
fav | -20.096 |
rentals | -19.955 |
FW | -19.937 |
Token | icist |
Token ID | 48187 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
idious | +4.314 |
ocate | +4.055 |
urnal | +3.738 |
onential | +3.443 |
enary | +3.419 |
Neg logit contributions | |
BT | -18.013 |
Dollar | -17.951 |
rentals | -17.504 |
cour | -17.292 |
fav | -17.275 |
Token | at |
Token ID | 379 |
Feature activation | -7.24e+00 |
Pos logit contributions | |
idious | +13.948 |
urnal | +12.974 |
enary | +12.805 |
ocate | +12.479 |
onential | +11.902 |
Neg logit contributions | |
BT | -16.450 |
Dollar | -15.908 |
FW | -15.751 |
cour | -15.453 |
rentals | -15.156 |
Token | the |
Token ID | 262 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
idious | +6.902 |
ocate | +6.617 |
urnal | +6.559 |
onential | +6.432 |
enary | +6.428 |
Neg logit contributions | |
BT | -5.505 |
Dollar | -5.230 |
cour | -5.193 |
FW | -5.180 |
rentals | -5.061 |
Token | University |
Token ID | 2059 |
Feature activation | -5.97e+00 |
Pos logit contributions | |
idious | +5.821 |
ocate | +5.571 |
urnal | +5.556 |
enary | +5.467 |
onential | +5.440 |
Neg logit contributions | |
BT | -4.519 |
Dollar | -4.290 |
cour | -4.242 |
FW | -4.227 |
rentals | -4.094 |
Token | ell |
Token ID | 695 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
BT | +0.752 |
Dollar | +0.739 |
cour | +0.718 |
FW | +0.702 |
fav | +0.682 |
Neg logit contributions | |
idious | -0.820 |
ocate | -0.776 |
urnal | -0.769 |
onential | -0.766 |
enary | -0.755 |
Token | , |
Token ID | 11 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
idious | +3.480 |
urnal | +3.285 |
ocate | +3.284 |
onential | +3.243 |
enary | +3.236 |
Neg logit contributions | |
BT | -2.359 |
Dollar | -2.279 |
cour | -2.212 |
FW | -2.197 |
rentals | -2.127 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
idious | +11.282 |
ocate | +10.721 |
urnal | +10.666 |
onential | +10.537 |
enary | +10.533 |
Neg logit contributions | |
BT | -8.753 |
FW | -8.298 |
Dollar | -8.136 |
cour | -8.129 |
rentals | -7.962 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
idious | +12.768 |
urnal | +11.946 |
ocate | +11.607 |
enary | +11.512 |
onential | +11.432 |
Neg logit contributions | |
BT | -15.764 |
FW | -14.964 |
Dollar | -14.880 |
cour | -14.724 |
rentals | -14.538 |
Token | climate |
Token ID | 4258 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
idious | +9.883 |
ocate | +9.324 |
urnal | +9.299 |
onential | +9.233 |
enary | +9.028 |
Neg logit contributions | |
BT | -10.023 |
FW | -9.626 |
Dollar | -9.570 |
cour | -9.417 |
FB | -9.240 |
Token | sciences |
Token ID | 19838 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
idious | +10.288 |
ocate | +9.765 |
urnal | +9.501 |
onential | +9.495 |
enary | +9.273 |
Neg logit contributions | |
BT | -10.315 |
Dollar | -10.045 |
FW | -9.839 |
cour | -9.644 |
FB | -9.332 |
Token | at |
Token ID | 379 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
idious | +14.908 |
enary | +13.609 |
urnal | +13.604 |
ocate | +13.588 |
onential | +13.441 |
Neg logit contributions | |
BT | -16.094 |
FW | -15.660 |
Dollar | -15.655 |
cour | -15.251 |
fav | -14.872 |
Token | Duke |
Token ID | 11083 |
Feature activation | -9.54e+00 |
Pos logit contributions | |
idious | +11.564 |
ocate | +11.169 |
enary | +10.964 |
urnal | +10.952 |
onential | +10.914 |
Neg logit contributions | |
BT | -6.052 |
FW | -5.638 |
cour | -5.478 |
Dollar | -5.473 |
rentals | -5.416 |
Token | 's |
Token ID | 338 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
idious | +8.506 |
urnal | +8.250 |
ocate | +8.224 |
enary | +8.161 |
onential | +8.086 |
Neg logit contributions | |
BT | -7.506 |
Dollar | -7.307 |
FW | -7.043 |
cour | -7.035 |
rentals | -6.999 |
Token | Nicholas |
Token ID | 20320 |
Feature activation | +2.35e+00 |
Pos logit contributions | |
idious | +10.703 |
ocate | +10.283 |
onential | +10.267 |
urnal | +10.250 |
enary | +10.124 |
Neg logit contributions | |
BT | -6.631 |
FW | -6.234 |
Dollar | -6.130 |
cour | -6.070 |
rentals | -5.984 |
Token | School |
Token ID | 3961 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
BT | +1.491 |
Dollar | +1.450 |
cour | +1.399 |
FW | +1.365 |
fav | +1.306 |
Neg logit contributions | |
idious | -2.674 |
ocate | -2.544 |
urnal | -2.497 |
onential | -2.493 |
enary | -2.470 |
Token | Thomas |
Token ID | 5658 |
Feature activation | +5.55e+00 |
Pos logit contributions | |
idious | +5.204 |
ocate | +4.942 |
urnal | +4.940 |
onential | +4.871 |
enary | +4.848 |
Neg logit contributions | |
BT | -3.304 |
Dollar | -3.139 |
cour | -3.095 |
FW | -3.051 |
rentals | -2.979 |
Token | Se |
Token ID | 1001 |
Feature activation | +3.93e+00 |
Pos logit contributions | |
Dollar | +3.404 |
BT | +3.401 |
cour | +3.181 |
FW | +3.151 |
fav | +3.016 |
Neg logit contributions | |
idious | -6.263 |
urnal | -5.983 |
ocate | -5.963 |
onential | -5.937 |
enary | -5.887 |
Token | iler |
Token ID | 5329 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
BT | +3.258 |
Dollar | +3.160 |
cour | +3.071 |
FW | +3.047 |
FB | +2.907 |
Neg logit contributions | |
idious | -3.561 |
urnal | -3.351 |
ocate | -3.343 |
onential | -3.319 |
enary | -3.261 |
Token | , |
Token ID | 11 |
Feature activation | -8.06e+00 |
Pos logit contributions | |
idious | +2.704 |
ocate | +2.559 |
urnal | +2.556 |
onential | +2.523 |
enary | +2.514 |
Neg logit contributions | |
BT | -1.865 |
Dollar | -1.816 |
cour | -1.761 |
FW | -1.738 |
rentals | -1.679 |
Token | a |
Token ID | 257 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
idious | +7.365 |
ocate | +6.971 |
urnal | +6.914 |
enary | +6.826 |
onential | +6.771 |
Neg logit contributions | |
BT | -6.526 |
Dollar | -6.236 |
cour | -6.160 |
FW | -6.080 |
rentals | -5.984 |
Token | physicist |
Token ID | 33013 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
idious | +4.318 |
ocate | +4.098 |
urnal | +4.064 |
enary | +3.997 |
onential | +3.945 |
Neg logit contributions | |
BT | -4.362 |
Dollar | -4.223 |
cour | -4.169 |
FW | -4.116 |
rentals | -4.017 |
Token | from |
Token ID | 422 |
Feature activation | -5.16e+00 |
Pos logit contributions | |
idious | +15.595 |
enary | +14.312 |
ocate | +14.154 |
urnal | +14.138 |
elfth | +13.332 |
Neg logit contributions | |
BT | -15.728 |
Dollar | -14.930 |
FW | -14.889 |
cour | -14.509 |
FB | -14.449 |
Token | Germany |
Token ID | 4486 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
idious | +5.063 |
ocate | +4.840 |
urnal | +4.787 |
enary | +4.723 |
onential | +4.712 |
Neg logit contributions | |
BT | -3.916 |
Dollar | -3.745 |
cour | -3.682 |
FW | -3.644 |
rentals | -3.547 |
Token | , |
Token ID | 11 |
Feature activation | -3.99e+00 |
Pos logit contributions | |
idious | +5.248 |
ocate | +4.991 |
urnal | +4.970 |
enary | +4.914 |
onential | +4.893 |
Neg logit contributions | |
BT | -3.945 |
Dollar | -3.843 |
cour | -3.750 |
FW | -3.690 |
rentals | -3.587 |
Token | gave |
Token ID | 2921 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
idious | +4.047 |
ocate | +3.833 |
urnal | +3.821 |
onential | +3.763 |
enary | +3.745 |
Neg logit contributions | |
BT | -2.962 |
Dollar | -2.865 |
cour | -2.810 |
FW | -2.771 |
rentals | -2.663 |
Token | the |
Token ID | 262 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
idious | +4.668 |
urnal | +4.413 |
ocate | +4.389 |
onential | +4.340 |
enary | +4.309 |
Neg logit contributions | |
BT | -3.871 |
Dollar | -3.737 |
cour | -3.668 |
FW | -3.633 |
rentals | -3.524 |
Token | it |
Token ID | 340 |
Feature activation | -9.13e-01 |
Pos logit contributions | |
BT | +3.427 |
Dollar | +3.307 |
cour | +3.168 |
FW | +3.072 |
fav | +3.050 |
Neg logit contributions | |
idious | -6.689 |
urnal | -6.425 |
enary | -6.364 |
ocate | -6.349 |
onential | -6.302 |
Token | , |
Token ID | 11 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
idious | +0.928 |
urnal | +0.877 |
ocate | +0.877 |
onential | +0.866 |
enary | +0.860 |
Neg logit contributions | |
BT | -0.686 |
Dollar | -0.669 |
cour | -0.648 |
FW | -0.639 |
rentals | -0.618 |
Token | � |
Token ID | 447 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
idious | +0.914 |
urnal | +0.857 |
ocate | +0.855 |
onential | +0.844 |
enary | +0.839 |
Neg logit contributions | |
BT | -0.877 |
Dollar | -0.860 |
cour | -0.834 |
FW | -0.825 |
rentals | -0.802 |
Token | � |
Token ID | 251 |
Feature activation | +8.99e-02 |
Pos logit contributions | |
BT | +1.983 |
Dollar | +1.947 |
cour | +1.886 |
FW | +1.855 |
fav | +1.795 |
Neg logit contributions | |
idious | -2.734 |
ocate | -2.581 |
urnal | -2.564 |
onential | -2.537 |
enary | -2.518 |
Token | says |
Token ID | 1139 |
Feature activation | -5.77e+00 |
Pos logit contributions | |
BT | +0.068 |
Dollar | +0.067 |
cour | +0.065 |
FW | +0.064 |
fav | +0.061 |
Neg logit contributions | |
idious | -0.091 |
urnal | -0.086 |
ocate | -0.085 |
onential | -0.085 |
enary | -0.084 |
Token | physicist |
Token ID | 33013 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
idious | +5.897 |
ocate | +5.600 |
urnal | +5.555 |
onential | +5.510 |
enary | +5.475 |
Neg logit contributions | |
BT | -4.182 |
Dollar | -4.002 |
cour | -3.928 |
FW | -3.915 |
rentals | -3.744 |
Token | Y |
Token ID | 575 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
idious | +17.186 |
urnal | +16.203 |
ocate | +16.067 |
enary | +15.889 |
onential | +15.502 |
Neg logit contributions | |
BT | -12.929 |
FW | -11.926 |
cour | -11.871 |
Dollar | -11.631 |
FB | -11.606 |
Token | annis |
Token ID | 45017 |
Feature activation | -7.83e-01 |
Pos logit contributions | |
BT | +3.079 |
Dollar | +2.970 |
cour | +2.953 |
FW | +2.921 |
rentals | +2.821 |
Neg logit contributions | |
idious | -2.405 |
ocate | -2.218 |
urnal | -2.212 |
onential | -2.196 |
enary | -2.168 |
Token | Sem |
Token ID | 12449 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
idious | +0.886 |
urnal | +0.842 |
ocate | +0.842 |
onential | +0.833 |
enary | +0.828 |
Neg logit contributions | |
BT | -0.499 |
Dollar | -0.484 |
cour | -0.466 |
FW | -0.459 |
rentals | -0.440 |
Token | ert |
Token ID | 861 |
Feature activation | -5.49e+00 |
Pos logit contributions | |
BT | +2.388 |
Dollar | +2.333 |
cour | +2.294 |
FW | +2.226 |
rentals | +2.155 |
Neg logit contributions | |
idious | -2.767 |
ocate | -2.626 |
urnal | -2.607 |
onential | -2.591 |
enary | -2.560 |
Token | z |
Token ID | 89 |
Feature activation | -6.20e+00 |
Pos logit contributions | |
idious | +5.822 |
urnal | +5.523 |
ocate | +5.490 |
enary | +5.443 |
onential | +5.423 |
Neg logit contributions | |
BT | -3.779 |
Dollar | -3.687 |
cour | -3.539 |
FW | -3.518 |
rentals | -3.405 |
Token | u |
Token ID | 84 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
BT | +2.471 |
Dollar | +2.421 |
cour | +2.395 |
FW | +2.285 |
fav | +2.206 |
Neg logit contributions | |
idious | -3.762 |
ocate | -3.554 |
urnal | -3.536 |
onential | -3.527 |
enary | -3.494 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
BT | +1.315 |
Dollar | +1.289 |
cour | +1.258 |
FW | +1.227 |
fav | +1.185 |
Neg logit contributions | |
idious | -1.581 |
ocate | -1.484 |
onential | -1.480 |
urnal | -1.479 |
enary | -1.458 |
Token | an |
Token ID | 281 |
Feature activation | -9.54e+00 |
Pos logit contributions | |
idious | +8.367 |
ocate | +7.819 |
urnal | +7.799 |
enary | +7.676 |
onential | +7.586 |
Neg logit contributions | |
BT | -9.359 |
Dollar | -9.006 |
cour | -8.846 |
FW | -8.832 |
rentals | -8.606 |
Token | astroph |
Token ID | 48782 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
idious | +6.706 |
urnal | +6.251 |
ocate | +6.198 |
onential | +6.043 |
enary | +5.981 |
Neg logit contributions | |
BT | -9.745 |
Dollar | -9.479 |
cour | -9.164 |
FW | -9.152 |
rentals | -8.952 |
Token | ys |
Token ID | 893 |
Feature activation | -1.34e+01 |
Pos logit contributions | |
idious | +11.585 |
ocate | +11.185 |
urnal | +11.133 |
onential | +10.713 |
enary | +10.362 |
Neg logit contributions | |
BT | -20.657 |
Dollar | -20.382 |
fav | -20.096 |
rentals | -19.955 |
FW | -19.937 |
Token | icist |
Token ID | 48187 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
idious | +4.314 |
ocate | +4.055 |
urnal | +3.738 |
onential | +3.443 |
enary | +3.419 |
Neg logit contributions | |
BT | -18.013 |
Dollar | -17.951 |
rentals | -17.504 |
cour | -17.292 |
fav | -17.275 |
Token | at |
Token ID | 379 |
Feature activation | -7.24e+00 |
Pos logit contributions | |
idious | +13.948 |
urnal | +12.974 |
enary | +12.805 |
ocate | +12.479 |
onential | +11.902 |
Neg logit contributions | |
BT | -16.450 |
Dollar | -15.908 |
FW | -15.751 |
cour | -15.453 |
rentals | -15.156 |
Token | the |
Token ID | 262 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
idious | +6.902 |
ocate | +6.617 |
urnal | +6.559 |
onential | +6.432 |
enary | +6.428 |
Neg logit contributions | |
BT | -5.505 |
Dollar | -5.230 |
cour | -5.193 |
FW | -5.180 |
rentals | -5.061 |
Token | University |
Token ID | 2059 |
Feature activation | -5.97e+00 |
Pos logit contributions | |
idious | +5.821 |
ocate | +5.571 |
urnal | +5.556 |
enary | +5.467 |
onential | +5.440 |
Neg logit contributions | |
BT | -4.519 |
Dollar | -4.290 |
cour | -4.242 |
FW | -4.227 |
rentals | -4.094 |
Token | of |
Token ID | 286 |
Feature activation | -8.29e+00 |
Pos logit contributions | |
idious | +5.146 |
ocate | +4.893 |
urnal | +4.843 |
onential | +4.776 |
enary | +4.776 |
Neg logit contributions | |
BT | -5.181 |
Dollar | -4.987 |
cour | -4.923 |
FW | -4.906 |
rentals | -4.832 |
Token | California |
Token ID | 3442 |
Feature activation | -7.07e+00 |
Pos logit contributions | |
idious | +7.971 |
urnal | +7.617 |
ocate | +7.615 |
enary | +7.532 |
elfth | +7.375 |
Neg logit contributions | |
BT | -5.929 |
cour | -5.585 |
Dollar | -5.565 |
FW | -5.556 |
rentals | -5.466 |
Token | baum |
Token ID | 24738 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
BT | +1.283 |
Dollar | +1.248 |
cour | +1.218 |
FW | +1.187 |
rentals | +1.139 |
Neg logit contributions | |
idious | -1.873 |
urnal | -1.782 |
ocate | -1.777 |
onential | -1.764 |
enary | -1.743 |
Token | , |
Token ID | 11 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
idious | +2.427 |
urnal | +2.300 |
ocate | +2.296 |
onential | +2.266 |
enary | +2.258 |
Neg logit contributions | |
BT | -1.646 |
Dollar | -1.600 |
cour | -1.545 |
FW | -1.529 |
rentals | -1.478 |
Token | a |
Token ID | 257 |
Feature activation | -6.89e+00 |
Pos logit contributions | |
idious | +8.847 |
ocate | +8.221 |
urnal | +8.220 |
enary | +8.129 |
onential | +8.031 |
Neg logit contributions | |
BT | -10.013 |
Dollar | -9.739 |
FW | -9.484 |
cour | -9.470 |
rentals | -9.297 |
Token | cos |
Token ID | 8615 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
idious | +5.896 |
urnal | +5.580 |
ocate | +5.554 |
enary | +5.471 |
onential | +5.369 |
Neg logit contributions | |
BT | -5.844 |
Dollar | -5.724 |
FW | -5.607 |
cour | -5.604 |
rentals | -5.397 |
Token | m |
Token ID | 76 |
Feature activation | -9.36e+00 |
Pos logit contributions | |
idious | +14.865 |
enary | +13.933 |
urnal | +13.730 |
onential | +13.702 |
ocate | +13.432 |
Neg logit contributions | |
Dollar | -12.309 |
BT | -12.137 |
FW | -11.803 |
rentals | -11.566 |
fav | -11.299 |
Token | ologist |
Token ID | 7451 |
Feature activation | -1.94e+01 |
Pos logit contributions | |
idious | +4.859 |
ocate | +4.522 |
urnal | +4.467 |
onential | +4.137 |
enary | +4.132 |
Neg logit contributions | |
BT | -11.290 |
Dollar | -11.198 |
cour | -10.881 |
FW | -10.848 |
rentals | -10.791 |
Token | at |
Token ID | 379 |
Feature activation | -7.19e+00 |
Pos logit contributions | |
idious | +13.771 |
enary | +12.812 |
urnal | +12.656 |
ocate | +12.492 |
onential | +12.052 |
Neg logit contributions | |
BT | -15.586 |
Dollar | -15.216 |
FW | -14.935 |
cour | -14.688 |
rentals | -14.331 |
Token | Carnegie |
Token ID | 33976 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
idious | +6.799 |
ocate | +6.531 |
urnal | +6.434 |
enary | +6.341 |
onential | +6.328 |
Neg logit contributions | |
BT | -5.502 |
Dollar | -5.250 |
FW | -5.197 |
cour | -5.196 |
rentals | -5.056 |
Token | Mellon |
Token ID | 49808 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
idious | +3.534 |
ocate | +3.399 |
urnal | +3.388 |
enary | +3.355 |
onential | +3.351 |
Neg logit contributions | |
BT | -1.389 |
Dollar | -1.322 |
cour | -1.273 |
FW | -1.248 |
fav | -1.189 |
Token | University |
Token ID | 2059 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
idious | +6.486 |
ocate | +6.300 |
enary | +6.187 |
urnal | +6.177 |
onential | +6.113 |
Neg logit contributions | |
BT | -5.777 |
Dollar | -5.622 |
cour | -5.484 |
FW | -5.452 |
rentals | -5.391 |
Token | in |
Token ID | 287 |
Feature activation | -6.15e+00 |
Pos logit contributions | |
idious | +9.445 |
ocate | +9.258 |
urnal | +9.067 |
enary | +9.017 |
onential | +8.981 |
Neg logit contributions | |
BT | -9.137 |
Dollar | -8.994 |
cour | -8.776 |
rentals | -8.654 |
FW | -8.648 |
Token | J |
Token ID | 449 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
Dollar | +3.539 |
BT | +3.514 |
cour | +3.276 |
FW | +3.235 |
fav | +3.060 |
Neg logit contributions | |
idious | -6.691 |
urnal | -6.340 |
ocate | -6.329 |
onential | -6.311 |
enary | -6.223 |
Token | ough |
Token ID | 619 |
Feature activation | +3.20e+00 |
Pos logit contributions | |
BT | +2.933 |
Dollar | +2.867 |
cour | +2.808 |
FW | +2.768 |
FB | +2.674 |
Neg logit contributions | |
idious | -2.772 |
ocate | -2.569 |
onential | -2.557 |
urnal | -2.550 |
enary | -2.526 |
Token | in |
Token ID | 259 |
Feature activation | -6.86e+00 |
Pos logit contributions | |
BT | +2.726 |
Dollar | +2.680 |
cour | +2.640 |
FW | +2.537 |
fav | +2.495 |
Neg logit contributions | |
idious | -2.865 |
onential | -2.681 |
urnal | -2.675 |
ocate | -2.635 |
enary | -2.615 |
Token | , |
Token ID | 11 |
Feature activation | -9.19e+00 |
Pos logit contributions | |
idious | +6.775 |
urnal | +6.369 |
ocate | +6.358 |
enary | +6.254 |
onential | +6.202 |
Neg logit contributions | |
BT | -5.106 |
Dollar | -5.024 |
FW | -4.820 |
cour | -4.776 |
rentals | -4.718 |
Token | a |
Token ID | 257 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
idious | +7.820 |
ocate | +7.330 |
urnal | +7.303 |
enary | +7.177 |
onential | +7.073 |
Neg logit contributions | |
BT | -7.856 |
Dollar | -7.601 |
FW | -7.425 |
cour | -7.303 |
rentals | -7.230 |
Token | glac |
Token ID | 25169 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
idious | +4.343 |
ocate | +4.071 |
urnal | +4.063 |
enary | +3.990 |
onential | +3.886 |
Neg logit contributions | |
BT | -4.749 |
Dollar | -4.625 |
FW | -4.531 |
cour | -4.482 |
FB | -4.381 |
Token | iologist |
Token ID | 31599 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
idious | +10.226 |
ocate | +9.546 |
iate | +9.448 |
urnal | +8.903 |
enary | +8.575 |
Neg logit contributions | |
BT | -20.401 |
Dollar | -19.866 |
FW | -19.271 |
rentals | -19.204 |
fav | -18.925 |
Token | at |
Token ID | 379 |
Feature activation | -5.57e+00 |
Pos logit contributions | |
idious | +13.392 |
enary | +12.338 |
urnal | +12.332 |
ocate | +12.241 |
onential | +11.662 |
Neg logit contributions | |
BT | -14.016 |
Dollar | -13.823 |
FW | -13.443 |
cour | -13.098 |
FB | -12.925 |
Token | the |
Token ID | 262 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
idious | +5.446 |
ocate | +5.199 |
urnal | +5.146 |
enary | +5.083 |
onential | +5.041 |
Neg logit contributions | |
BT | -4.214 |
Dollar | -4.041 |
FW | -3.968 |
cour | -3.950 |
rentals | -3.850 |
Token | University |
Token ID | 2059 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
idious | +4.647 |
ocate | +4.435 |
urnal | +4.405 |
enary | +4.349 |
onential | +4.319 |
Neg logit contributions | |
BT | -3.627 |
Dollar | -3.465 |
FW | -3.396 |
cour | -3.390 |
rentals | -3.284 |
Token | of |
Token ID | 286 |
Feature activation | -8.03e+00 |
Pos logit contributions | |
idious | +4.232 |
ocate | +4.025 |
urnal | +3.956 |
enary | +3.928 |
onential | +3.904 |
Neg logit contributions | |
BT | -4.377 |
Dollar | -4.228 |
cour | -4.151 |
FW | -4.147 |
rentals | -4.100 |
Token | historical |
Token ID | 6754 |
Feature activation | +5.94e-01 |
Pos logit contributions | |
BT | +0.193 |
Dollar | +0.189 |
cour | +0.183 |
FW | +0.180 |
fav | +0.175 |
Neg logit contributions | |
idious | -0.244 |
ocate | -0.231 |
urnal | -0.231 |
onential | -0.229 |
enary | -0.226 |
Token | horror |
Token ID | 9961 |
Feature activation | -4.90e+00 |
Pos logit contributions | |
BT | +0.465 |
Dollar | +0.455 |
cour | +0.439 |
FW | +0.432 |
fav | +0.424 |
Neg logit contributions | |
idious | -0.581 |
urnal | -0.552 |
ocate | -0.552 |
onential | -0.548 |
enary | -0.541 |
Token | novel |
Token ID | 5337 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
idious | +4.654 |
urnal | +4.358 |
ocate | +4.358 |
enary | +4.268 |
onential | +4.263 |
Neg logit contributions | |
BT | -3.977 |
Dollar | -3.859 |
FW | -3.738 |
cour | -3.737 |
rentals | -3.594 |
Token | about |
Token ID | 546 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
idious | +1.660 |
urnal | +1.571 |
ocate | +1.570 |
onential | +1.552 |
enary | +1.542 |
Neg logit contributions | |
BT | -1.175 |
Dollar | -1.143 |
cour | -1.107 |
FW | -1.094 |
rentals | -1.055 |
Token | a |
Token ID | 257 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
BT | +0.632 |
Dollar | +0.624 |
cour | +0.604 |
FW | +0.593 |
rentals | +0.580 |
Neg logit contributions | |
idious | -0.727 |
ocate | -0.686 |
urnal | -0.686 |
onential | -0.680 |
enary | -0.673 |
Token | perf |
Token ID | 23035 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
idious | +1.173 |
urnal | +1.106 |
ocate | +1.103 |
onential | +1.087 |
enary | +1.081 |
Neg logit contributions | |
BT | -0.972 |
Dollar | -0.945 |
cour | -0.920 |
FW | -0.911 |
rentals | -0.879 |
Token | umer |
Token ID | 6975 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
idious | +14.354 |
ocate | +11.933 |
urnal | +11.711 |
onential | +11.195 |
enary | +11.164 |
Neg logit contributions | |
BT | -17.894 |
Dollar | -17.632 |
rentals | -16.894 |
cour | -16.822 |
FB | -16.661 |
Token | 's |
Token ID | 338 |
Feature activation | -3.80e+00 |
Pos logit contributions | |
idious | +9.944 |
ocate | +9.268 |
urnal | +9.098 |
enary | +9.072 |
onential | +8.843 |
Neg logit contributions | |
BT | -7.994 |
Dollar | -7.551 |
FW | -7.538 |
cour | -7.467 |
FB | -7.123 |
Token | apprentice |
Token ID | 39252 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
idious | +3.924 |
ocate | +3.692 |
urnal | +3.691 |
onential | +3.620 |
enary | +3.610 |
Neg logit contributions | |
BT | -2.807 |
Dollar | -2.694 |
cour | -2.620 |
FW | -2.608 |
FB | -2.484 |
Token | born |
Token ID | 4642 |
Feature activation | +1.93e-02 |
Pos logit contributions | |
idious | +5.154 |
ocate | +4.811 |
urnal | +4.793 |
enary | +4.732 |
onential | +4.700 |
Neg logit contributions | |
BT | -3.878 |
Dollar | -3.710 |
cour | -3.648 |
FW | -3.645 |
fav | -3.447 |
Token | with |
Token ID | 351 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
BT | +0.015 |
Dollar | +0.015 |
cour | +0.015 |
FW | +0.014 |
rentals | +0.014 |
Neg logit contributions | |
idious | -0.019 |
urnal | -0.018 |
ocate | -0.018 |
onential | -0.018 |
enary | -0.017 |
Token | arch |
Token ID | 998 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
BT | +4.330 |
Dollar | +4.255 |
FW | +4.132 |
cour | +4.131 |
FB | +3.977 |
Neg logit contributions | |
idious | -3.698 |
urnal | -3.414 |
ocate | -3.411 |
onential | -3.376 |
enary | -3.348 |
Token | , |
Token ID | 11 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
idious | +0.024 |
urnal | +0.022 |
ocate | +0.022 |
onential | +0.022 |
enary | +0.022 |
Neg logit contributions | |
BT | -0.020 |
Dollar | -0.019 |
cour | -0.019 |
FW | -0.018 |
fav | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | -5.89e+00 |
Pos logit contributions | |
idious | +7.667 |
urnal | +7.087 |
ocate | +7.086 |
onential | +6.965 |
enary | +6.953 |
Neg logit contributions | |
BT | -7.988 |
Dollar | -7.624 |
FW | -7.556 |
cour | -7.512 |
rentals | -7.301 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
idious | +4.590 |
ocate | +4.299 |
urnal | +4.287 |
enary | +4.206 |
onential | +4.166 |
Neg logit contributions | |
BT | -5.496 |
Dollar | -5.371 |
FW | -5.301 |
cour | -5.291 |
rentals | -5.111 |
Token | of |
Token ID | 286 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
idious | +12.333 |
urnal | +11.523 |
ocate | +11.439 |
enary | +11.342 |
onential | +11.240 |
Neg logit contributions | |
BT | -14.618 |
Dollar | -14.116 |
FW | -13.873 |
cour | -13.805 |
rentals | -13.537 |
Token | psychology |
Token ID | 15119 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
idious | +7.819 |
urnal | +7.419 |
onential | +7.281 |
ocate | +7.280 |
enary | +7.148 |
Neg logit contributions | |
BT | -9.611 |
Dollar | -9.504 |
FW | -9.286 |
cour | -9.233 |
FB | -8.981 |
Token | at |
Token ID | 379 |
Feature activation | -8.59e+00 |
Pos logit contributions | |
idious | +13.847 |
urnal | +12.824 |
enary | +12.404 |
ocate | +12.353 |
onential | +12.282 |
Neg logit contributions | |
BT | -15.044 |
Dollar | -14.761 |
FW | -14.555 |
cour | -13.959 |
AH | -13.791 |
Token | Washington |
Token ID | 2669 |
Feature activation | +4.67e+00 |
Pos logit contributions | |
idious | +8.246 |
ocate | +7.941 |
urnal | +7.809 |
enary | +7.710 |
onential | +7.695 |
Neg logit contributions | |
BT | -6.294 |
Dollar | -5.899 |
FW | -5.899 |
cour | -5.883 |
rentals | -5.715 |
Token | University |
Token ID | 2059 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
Dollar | +3.088 |
BT | +3.075 |
cour | +2.920 |
FW | +2.835 |
fav | +2.762 |
Neg logit contributions | |
idious | -5.080 |
urnal | -4.807 |
ocate | -4.735 |
onential | -4.732 |
enary | -4.653 |
Token | in |
Token ID | 287 |
Feature activation | -4.63e+00 |
Pos logit contributions | |
idious | +5.388 |
ocate | +5.167 |
urnal | +5.087 |
onential | +5.057 |
enary | +5.013 |
Neg logit contributions | |
BT | -4.958 |
Dollar | -4.840 |
cour | -4.719 |
FW | -4.679 |
rentals | -4.515 |
Token | St |
Token ID | 520 |
Feature activation | -7.52e+00 |
Pos logit contributions | |
idious | +5.079 |
urnal | +4.883 |
ocate | +4.878 |
onential | +4.830 |
enary | +4.801 |
Neg logit contributions | |
BT | -2.955 |
Dollar | -2.839 |
FW | -2.815 |
cour | -2.789 |
fav | -2.660 |
Token | . |
Token ID | 13 |
Feature activation | +4.54e+00 |
Pos logit contributions | |
BT | +0.151 |
Dollar | +0.147 |
cour | +0.143 |
FW | +0.143 |
rentals | +0.138 |
Neg logit contributions | |
idious | -0.146 |
urnal | -0.136 |
ocate | -0.136 |
onential | -0.135 |
enary | -0.134 |
Token | Sh |
Token ID | 911 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
Dollar | +2.743 |
BT | +2.742 |
cour | +2.559 |
FW | +2.533 |
fav | +2.385 |
Neg logit contributions | |
idious | -5.246 |
urnal | -4.973 |
ocate | -4.970 |
onential | -4.918 |
enary | -4.881 |
Token | ind |
Token ID | 521 |
Feature activation | +8.95e-01 |
Pos logit contributions | |
BT | +0.416 |
Dollar | +0.406 |
cour | +0.401 |
FW | +0.393 |
rentals | +0.381 |
Neg logit contributions | |
idious | -0.375 |
urnal | -0.349 |
ocate | -0.349 |
onential | -0.345 |
enary | -0.340 |
Token | ell |
Token ID | 695 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
BT | +0.752 |
Dollar | +0.739 |
cour | +0.718 |
FW | +0.702 |
fav | +0.682 |
Neg logit contributions | |
idious | -0.820 |
ocate | -0.776 |
urnal | -0.769 |
onential | -0.766 |
enary | -0.755 |
Token | , |
Token ID | 11 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
idious | +3.480 |
urnal | +3.285 |
ocate | +3.284 |
onential | +3.243 |
enary | +3.236 |
Neg logit contributions | |
BT | -2.359 |
Dollar | -2.279 |
cour | -2.212 |
FW | -2.197 |
rentals | -2.127 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
idious | +11.282 |
ocate | +10.721 |
urnal | +10.666 |
onential | +10.537 |
enary | +10.533 |
Neg logit contributions | |
BT | -8.753 |
FW | -8.298 |
Dollar | -8.136 |
cour | -8.129 |
rentals | -7.962 |
Token | of |
Token ID | 286 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
idious | +12.768 |
urnal | +11.946 |
ocate | +11.607 |
enary | +11.512 |
onential | +11.432 |
Neg logit contributions | |
BT | -15.764 |
FW | -14.964 |
Dollar | -14.880 |
cour | -14.724 |
rentals | -14.538 |
Token | climate |
Token ID | 4258 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
idious | +9.883 |
ocate | +9.324 |
urnal | +9.299 |
onential | +9.233 |
enary | +9.028 |
Neg logit contributions | |
BT | -10.023 |
FW | -9.626 |
Dollar | -9.570 |
cour | -9.417 |
FB | -9.240 |
Token | sciences |
Token ID | 19838 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
idious | +10.288 |
ocate | +9.765 |
urnal | +9.501 |
onential | +9.495 |
enary | +9.273 |
Neg logit contributions | |
BT | -10.315 |
Dollar | -10.045 |
FW | -9.839 |
cour | -9.644 |
FB | -9.332 |
Token | at |
Token ID | 379 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
idious | +14.908 |
enary | +13.609 |
urnal | +13.604 |
ocate | +13.588 |
onential | +13.441 |
Neg logit contributions | |
BT | -16.094 |
FW | -15.660 |
Dollar | -15.655 |
cour | -15.251 |
fav | -14.872 |
Token | Duke |
Token ID | 11083 |
Feature activation | -9.54e+00 |
Pos logit contributions | |
idious | +11.564 |
ocate | +11.169 |
enary | +10.964 |
urnal | +10.952 |
onential | +10.914 |
Neg logit contributions | |
BT | -6.052 |
FW | -5.638 |
cour | -5.478 |
Dollar | -5.473 |
rentals | -5.416 |
Token | Mon |
Token ID | 2892 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
BT | +1.687 |
Dollar | +1.668 |
cour | +1.574 |
FW | +1.549 |
fav | +1.477 |
Neg logit contributions | |
idious | -3.241 |
ocate | -3.085 |
urnal | -3.079 |
onential | -3.066 |
enary | -3.030 |
Token | nat |
Token ID | 32353 |
Feature activation | -3.09e+00 |
Pos logit contributions | |
idious | +0.155 |
ocate | +0.146 |
urnal | +0.146 |
onential | +0.145 |
enary | +0.143 |
Neg logit contributions | |
BT | -0.114 |
Dollar | -0.112 |
cour | -0.109 |
FW | -0.106 |
rentals | -0.103 |
Token | , |
Token ID | 11 |
Feature activation | -8.94e+00 |
Pos logit contributions | |
idious | +3.180 |
urnal | +3.013 |
ocate | +3.009 |
onential | +2.969 |
enary | +2.952 |
Neg logit contributions | |
BT | -2.278 |
Dollar | -2.217 |
cour | -2.143 |
FW | -2.125 |
rentals | -2.058 |
Token | a |
Token ID | 257 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
idious | +7.922 |
ocate | +7.474 |
urnal | +7.469 |
onential | +7.324 |
enary | +7.242 |
Neg logit contributions | |
BT | -7.390 |
Dollar | -7.059 |
FW | -6.936 |
cour | -6.911 |
rentals | -6.743 |
Token | soc |
Token ID | 1307 |
Feature activation | -1.45e+01 |
Pos logit contributions | |
idious | +5.017 |
urnal | +4.752 |
ocate | +4.751 |
enary | +4.633 |
onential | +4.608 |
Neg logit contributions | |
BT | -5.088 |
Dollar | -4.936 |
cour | -4.867 |
FW | -4.827 |
rentals | -4.707 |
Token | iologist |
Token ID | 31599 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
idious | +10.665 |
ocate | +10.238 |
urnal | +10.226 |
enary | +9.803 |
onential | +9.692 |
Neg logit contributions | |
BT | -12.887 |
Dollar | -12.762 |
FW | -12.356 |
rentals | -12.255 |
cour | -12.095 |
Token | and |
Token ID | 290 |
Feature activation | -9.22e+00 |
Pos logit contributions | |
idious | +13.778 |
urnal | +12.657 |
enary | +12.541 |
ocate | +12.491 |
onential | +12.079 |
Neg logit contributions | |
BT | -14.455 |
Dollar | -14.054 |
FW | -13.753 |
rentals | -13.425 |
cour | -13.421 |
Token | dem |
Token ID | 1357 |
Feature activation | -6.80e+00 |
Pos logit contributions | |
idious | +7.681 |
ocate | +7.350 |
urnal | +7.271 |
onential | +7.122 |
enary | +7.050 |
Neg logit contributions | |
BT | -7.974 |
Dollar | -7.603 |
FW | -7.540 |
cour | -7.471 |
rentals | -7.232 |
Token | ographer |
Token ID | 18539 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
idious | +3.848 |
ocate | +3.604 |
urnal | +3.577 |
enary | +3.510 |
onential | +3.509 |
Neg logit contributions | |
BT | -7.942 |
Dollar | -7.853 |
FW | -7.617 |
cour | -7.596 |
rentals | -7.511 |
Token | at |
Token ID | 379 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
idious | +11.107 |
urnal | +10.286 |
ocate | +10.253 |
enary | +10.179 |
onential | +9.876 |
Neg logit contributions | |
BT | -9.978 |
Dollar | -9.737 |
FW | -9.491 |
cour | -9.293 |
rentals | -9.177 |
Token | Pennsylvania |
Token ID | 9589 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
idious | +5.002 |
ocate | +4.797 |
urnal | +4.730 |
onential | +4.681 |
enary | +4.670 |
Neg logit contributions | |
BT | -3.806 |
Dollar | -3.651 |
cour | -3.575 |
FW | -3.564 |
rentals | -3.451 |
Token | , |
Token ID | 11 |
Feature activation | -7.25e+00 |
Pos logit contributions | |
idious | +4.402 |
ocate | +4.150 |
urnal | +4.138 |
onential | +4.072 |
enary | +4.071 |
Neg logit contributions | |
BT | -3.042 |
Dollar | -2.911 |
cour | -2.874 |
FW | -2.836 |
rentals | -2.706 |
Token | a |
Token ID | 257 |
Feature activation | -4.79e+00 |
Pos logit contributions | |
idious | +6.676 |
ocate | +6.277 |
urnal | +6.257 |
enary | +6.108 |
onential | +6.100 |
Neg logit contributions | |
BT | -5.959 |
Dollar | -5.630 |
cour | -5.561 |
FW | -5.511 |
FB | -5.327 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
idious | +4.218 |
ocate | +3.976 |
urnal | +3.971 |
enary | +3.877 |
onential | +3.824 |
Neg logit contributions | |
BT | -4.145 |
Dollar | -3.950 |
cour | -3.919 |
FW | -3.873 |
FB | -3.773 |
Token | of |
Token ID | 286 |
Feature activation | -1.05e+01 |
Pos logit contributions | |
idious | +12.287 |
urnal | +11.453 |
ocate | +11.355 |
enary | +11.170 |
onential | +10.999 |
Neg logit contributions | |
BT | -14.357 |
Dollar | -13.655 |
FW | -13.391 |
cour | -13.363 |
FB | -13.090 |
Token | biological |
Token ID | 10685 |
Feature activation | -9.76e+00 |
Pos logit contributions | |
idious | +8.438 |
urnal | +8.030 |
ocate | +7.937 |
enary | +7.684 |
onential | +7.656 |
Neg logit contributions | |
BT | -9.204 |
Dollar | -8.743 |
cour | -8.520 |
FW | -8.494 |
FB | -8.369 |
Token | science |
Token ID | 3783 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
idious | +7.483 |
ocate | +6.953 |
urnal | +6.933 |
enary | +6.863 |
onential | +6.772 |
Neg logit contributions | |
BT | -9.291 |
Dollar | -8.982 |
cour | -8.787 |
FW | -8.728 |
FB | -8.525 |
Token | at |
Token ID | 379 |
Feature activation | -9.33e+00 |
Pos logit contributions | |
idious | +13.693 |
ocate | +12.442 |
enary | +12.372 |
urnal | +12.349 |
onential | +12.198 |
Neg logit contributions | |
BT | -14.579 |
Dollar | -13.945 |
FW | -13.741 |
cour | -13.558 |
AH | -13.206 |
Token | Florida |
Token ID | 4744 |
Feature activation | -8.53e+00 |
Pos logit contributions | |
idious | +9.067 |
ocate | +8.720 |
urnal | +8.572 |
enary | +8.501 |
onential | +8.467 |
Neg logit contributions | |
BT | -6.651 |
cour | -6.178 |
Dollar | -6.145 |
FW | -6.145 |
rentals | -5.995 |
Token | State |
Token ID | 1812 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
idious | +7.671 |
enary | +7.252 |
urnal | +7.235 |
ocate | +7.181 |
onential | +7.085 |
Neg logit contributions | |
BT | -6.904 |
Dollar | -6.461 |
cour | -6.406 |
FW | -6.342 |
rentals | -6.308 |
Token | University |
Token ID | 2059 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
idious | +3.463 |
ocate | +3.280 |
urnal | +3.257 |
onential | +3.226 |
enary | +3.224 |
Neg logit contributions | |
BT | -2.803 |
Dollar | -2.702 |
cour | -2.632 |
FW | -2.600 |
rentals | -2.561 |
Token | , |
Token ID | 11 |
Feature activation | -6.75e+00 |
Pos logit contributions | |
idious | +9.382 |
ocate | +8.922 |
urnal | +8.873 |
enary | +8.835 |
onential | +8.820 |
Neg logit contributions | |
BT | -8.101 |
Dollar | -7.768 |
cour | -7.666 |
FW | -7.516 |
rentals | -7.447 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
BT | +1.808 |
Dollar | +1.772 |
cour | +1.713 |
FW | +1.682 |
fav | +1.640 |
Neg logit contributions | |
idious | -2.389 |
urnal | -2.269 |
ocate | -2.263 |
onential | -2.252 |
enary | -2.218 |
Token | a |
Token ID | 257 |
Feature activation | -2.19e+00 |
Pos logit contributions | |
idious | +3.268 |
ocate | +3.078 |
urnal | +3.075 |
onential | +3.030 |
enary | +3.018 |
Neg logit contributions | |
BT | -2.671 |
Dollar | -2.599 |
cour | -2.529 |
FW | -2.503 |
rentals | -2.424 |
Token | doctoral |
Token ID | 40995 |
Feature activation | -8.18e+00 |
Pos logit contributions | |
idious | +2.060 |
ocate | +1.938 |
urnal | +1.935 |
enary | +1.900 |
onential | +1.900 |
Neg logit contributions | |
BT | -1.799 |
Dollar | -1.753 |
cour | -1.713 |
FW | -1.696 |
rentals | -1.643 |
Token | candidate |
Token ID | 4540 |
Feature activation | -9.37e+00 |
Pos logit contributions | |
idious | +6.171 |
ocate | +5.890 |
urnal | +5.752 |
enary | +5.721 |
onential | +5.668 |
Neg logit contributions | |
BT | -7.812 |
Dollar | -7.675 |
cour | -7.549 |
FW | -7.451 |
rentals | -7.257 |
Token | in |
Token ID | 287 |
Feature activation | -5.23e+00 |
Pos logit contributions | |
idious | +8.377 |
ocate | +7.834 |
urnal | +7.791 |
enary | +7.745 |
onential | +7.652 |
Neg logit contributions | |
BT | -7.582 |
Dollar | -7.406 |
FW | -7.218 |
cour | -7.215 |
rentals | -6.998 |
Token | lingu |
Token ID | 20280 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
idious | +4.966 |
ocate | +4.676 |
urnal | +4.654 |
onential | +4.593 |
enary | +4.582 |
Neg logit contributions | |
BT | -4.148 |
Dollar | -4.018 |
cour | -3.935 |
FW | -3.914 |
rentals | -3.765 |
Token | istics |
Token ID | 3969 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
idious | +9.108 |
ocate | +8.619 |
urnal | +8.047 |
enary | +8.045 |
onential | +7.919 |
Neg logit contributions | |
Dollar | -19.366 |
BT | -19.131 |
cour | -18.299 |
FW | -18.228 |
fav | -18.176 |
Token | at |
Token ID | 379 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
idious | +11.920 |
ocate | +10.996 |
enary | +10.890 |
urnal | +10.863 |
onential | +10.633 |
Neg logit contributions | |
BT | -11.032 |
Dollar | -10.856 |
FW | -10.659 |
cour | -10.454 |
FB | -10.284 |
Token | Penn |
Token ID | 6595 |
Feature activation | -9.98e+00 |
Pos logit contributions | |
idious | +6.991 |
ocate | +6.748 |
urnal | +6.621 |
enary | +6.578 |
onential | +6.531 |
Neg logit contributions | |
BT | -4.923 |
Dollar | -4.654 |
cour | -4.616 |
FW | -4.600 |
rentals | -4.486 |
Token | , |
Token ID | 11 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
idious | +9.273 |
enary | +8.900 |
ocate | +8.830 |
urnal | +8.748 |
onential | +8.604 |
Neg logit contributions | |
BT | -7.402 |
Dollar | -7.348 |
cour | -7.012 |
FW | -6.991 |
rentals | -6.917 |
Token | notes |
Token ID | 4710 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
idious | +4.440 |
ocate | +4.206 |
urnal | +4.194 |
onential | +4.118 |
enary | +4.111 |
Neg logit contributions | |
BT | -3.075 |
Dollar | -2.982 |
cour | -2.918 |
FW | -2.893 |
rentals | -2.770 |
Token | chio |
Token ID | 40900 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
idious | +2.537 |
urnal | +2.398 |
ocate | +2.396 |
onential | +2.365 |
enary | +2.355 |
Neg logit contributions | |
BT | -1.844 |
Dollar | -1.789 |
cour | -1.733 |
FW | -1.713 |
rentals | -1.661 |
Token | , |
Token ID | 11 |
Feature activation | -8.74e+00 |
Pos logit contributions | |
idious | +3.569 |
urnal | +3.381 |
ocate | +3.354 |
onential | +3.318 |
enary | +3.305 |
Neg logit contributions | |
BT | -2.494 |
Dollar | -2.398 |
cour | -2.339 |
FW | -2.328 |
rentals | -2.235 |
Token | a |
Token ID | 257 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
idious | +7.241 |
urnal | +6.690 |
ocate | +6.686 |
enary | +6.517 |
onential | +6.515 |
Neg logit contributions | |
BT | -7.910 |
Dollar | -7.495 |
cour | -7.387 |
FW | -7.343 |
rentals | -7.133 |
Token | pale |
Token ID | 14005 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
idious | +5.683 |
ocate | +5.340 |
urnal | +5.321 |
enary | +5.197 |
onential | +5.089 |
Neg logit contributions | |
BT | -5.696 |
Dollar | -5.407 |
cour | -5.341 |
FW | -5.332 |
FB | -5.217 |
Token | ont |
Token ID | 756 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
idious | +7.906 |
ocate | +7.762 |
urnal | +7.623 |
enary | +7.450 |
onential | +7.106 |
Neg logit contributions | |
BT | -11.782 |
Dollar | -11.527 |
FW | -11.281 |
rentals | -10.964 |
cour | -10.948 |
Token | ologist |
Token ID | 7451 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
idious | +5.039 |
ocate | +4.693 |
urnal | +4.603 |
enary | +4.352 |
onential | +4.166 |
Neg logit contributions | |
BT | -14.735 |
Dollar | -14.538 |
FW | -13.987 |
rentals | -13.946 |
cour | -13.755 |
Token | at |
Token ID | 379 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
idious | +13.551 |
enary | +12.463 |
urnal | +12.429 |
ocate | +12.248 |
onential | +11.744 |
Neg logit contributions | |
BT | -14.575 |
Dollar | -13.930 |
FW | -13.744 |
cour | -13.479 |
FB | -13.398 |
Token | Montana |
Token ID | 18311 |
Feature activation | -4.48e+00 |
Pos logit contributions | |
idious | +5.927 |
ocate | +5.682 |
urnal | +5.606 |
enary | +5.523 |
onential | +5.491 |
Neg logit contributions | |
BT | -4.628 |
Dollar | -4.373 |
cour | -4.318 |
FW | -4.285 |
rentals | -4.170 |
Token | State |
Token ID | 1812 |
Feature activation | -8.92e-01 |
Pos logit contributions | |
idious | +4.408 |
ocate | +4.183 |
urnal | +4.165 |
onential | +4.116 |
enary | +4.114 |
Neg logit contributions | |
BT | -3.452 |
Dollar | -3.324 |
cour | -3.252 |
FW | -3.196 |
rentals | -3.116 |
Token | University |
Token ID | 2059 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
idious | +0.910 |
urnal | +0.861 |
ocate | +0.859 |
onential | +0.850 |
enary | +0.843 |
Neg logit contributions | |
BT | -0.666 |
Dollar | -0.651 |
cour | -0.630 |
FW | -0.622 |
rentals | -0.599 |
Token | not |
Token ID | 407 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
idious | +9.086 |
ocate | +8.693 |
urnal | +8.632 |
enary | +8.621 |
onential | +8.465 |
Neg logit contributions | |
BT | -8.079 |
Dollar | -7.811 |
cour | -7.702 |
FW | -7.570 |
rentals | -7.476 |
Token | Al |
Token ID | 978 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
idious | +6.209 |
urnal | +5.911 |
ocate | +5.874 |
enary | +5.771 |
onential | +5.745 |
Neg logit contributions | |
BT | -4.082 |
Dollar | -3.890 |
cour | -3.823 |
FW | -3.767 |
rentals | -3.664 |
Token | Az |
Token ID | 7578 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
BT | +1.744 |
Dollar | +1.698 |
cour | +1.643 |
FW | +1.600 |
fav | +1.522 |
Neg logit contributions | |
idious | -2.929 |
ocate | -2.779 |
urnal | -2.766 |
onential | -2.749 |
enary | -2.727 |
Token | m |
Token ID | 76 |
Feature activation | -6.98e+00 |
Pos logit contributions | |
idious | +2.035 |
urnal | +1.929 |
ocate | +1.914 |
onential | +1.893 |
enary | +1.886 |
Neg logit contributions | |
BT | -1.551 |
Dollar | -1.514 |
cour | -1.459 |
FW | -1.449 |
rentals | -1.408 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
idious | +6.731 |
urnal | +6.452 |
ocate | +6.399 |
enary | +6.318 |
onential | +6.268 |
Neg logit contributions | |
BT | -5.300 |
Dollar | -5.173 |
cour | -4.985 |
FW | -4.971 |
rentals | -4.844 |
Token | a |
Token ID | 257 |
Feature activation | -4.88e+00 |
Pos logit contributions | |
idious | +8.204 |
urnal | +7.733 |
ocate | +7.717 |
enary | +7.625 |
onential | +7.409 |
Neg logit contributions | |
BT | -8.764 |
Dollar | -8.474 |
cour | -8.282 |
FW | -8.181 |
rentals | -8.019 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
idious | +4.479 |
urnal | +4.241 |
ocate | +4.230 |
enary | +4.171 |
onential | +4.099 |
Neg logit contributions | |
BT | -3.977 |
Dollar | -3.867 |
cour | -3.778 |
FW | -3.776 |
rentals | -3.647 |
Token | of |
Token ID | 286 |
Feature activation | -1.04e+01 |
Pos logit contributions | |
idious | +13.486 |
urnal | +12.582 |
ocate | +12.404 |
enary | +12.387 |
onential | +11.927 |
Neg logit contributions | |
BT | -14.277 |
Dollar | -13.942 |
FW | -13.493 |
cour | -13.249 |
rentals | -13.221 |
Token | Middle |
Token ID | 6046 |
Feature activation | -5.30e+00 |
Pos logit contributions | |
idious | +9.238 |
urnal | +8.914 |
ocate | +8.823 |
enary | +8.734 |
onential | +8.726 |
Neg logit contributions | |
BT | -8.038 |
Dollar | -7.725 |
FW | -7.625 |
cour | -7.452 |
rentals | -7.294 |
Token | East |
Token ID | 3687 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
idious | +5.171 |
urnal | +4.957 |
ocate | +4.931 |
enary | +4.895 |
onential | +4.879 |
Neg logit contributions | |
BT | -4.011 |
Dollar | -3.855 |
FW | -3.789 |
cour | -3.751 |
rentals | -3.672 |
Token | history |
Token ID | 2106 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
idious | +7.838 |
urnal | +7.485 |
onential | +7.449 |
ocate | +7.433 |
enary | +7.404 |
Neg logit contributions | |
BT | -6.661 |
Dollar | -6.433 |
FW | -6.318 |
cour | -6.225 |
rentals | -5.987 |
Token | at |
Token ID | 379 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
idious | +9.771 |
ocate | +8.989 |
urnal | +8.954 |
enary | +8.926 |
onential | +8.828 |
Neg logit contributions | |
BT | -9.020 |
Dollar | -8.986 |
FW | -8.628 |
cour | -8.467 |
rentals | -8.278 |
Token | , |
Token ID | 11 |
Feature activation | -9.46e+00 |
Pos logit contributions | |
idious | +1.629 |
ocate | +1.540 |
urnal | +1.540 |
onential | +1.518 |
enary | +1.512 |
Neg logit contributions | |
BT | -1.146 |
Dollar | -1.117 |
cour | -1.081 |
FW | -1.069 |
rentals | -1.032 |
Token | a |
Token ID | 257 |
Feature activation | -6.99e+00 |
Pos logit contributions | |
idious | +8.353 |
ocate | +7.898 |
urnal | +7.809 |
enary | +7.698 |
onential | +7.650 |
Neg logit contributions | |
BT | -7.716 |
Dollar | -7.430 |
cour | -7.298 |
FW | -7.281 |
rentals | -7.091 |
Token | University |
Token ID | 2059 |
Feature activation | -2.80e+00 |
Pos logit contributions | |
idious | +6.136 |
ocate | +5.776 |
urnal | +5.765 |
enary | +5.661 |
onential | +5.569 |
Neg logit contributions | |
BT | -5.839 |
Dollar | -5.660 |
cour | -5.578 |
FW | -5.562 |
rentals | -5.378 |
Token | of |
Token ID | 286 |
Feature activation | -7.46e+00 |
Pos logit contributions | |
idious | +2.581 |
ocate | +2.433 |
urnal | +2.429 |
onential | +2.397 |
enary | +2.378 |
Neg logit contributions | |
BT | -2.349 |
Dollar | -2.289 |
cour | -2.238 |
FW | -2.210 |
rentals | -2.149 |
Token | Edinburgh |
Token ID | 23475 |
Feature activation | -6.94e+00 |
Pos logit contributions | |
idious | +6.476 |
ocate | +6.210 |
urnal | +6.139 |
enary | +6.133 |
onential | +5.970 |
Neg logit contributions | |
BT | -6.134 |
Dollar | -5.911 |
cour | -5.780 |
FW | -5.769 |
rentals | -5.705 |
Token | lingu |
Token ID | 20280 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
idious | +5.615 |
ocate | +5.313 |
urnal | +5.278 |
enary | +5.162 |
onential | +5.122 |
Neg logit contributions | |
BT | -6.305 |
Dollar | -6.187 |
cour | -6.091 |
FW | -6.051 |
rentals | -5.898 |
Token | ist |
Token ID | 396 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
idious | +9.243 |
ocate | +9.140 |
enary | +8.059 |
urnal | +7.983 |
onential | +7.699 |
Neg logit contributions | |
Dollar | -18.923 |
BT | -18.736 |
rentals | -17.929 |
FW | -17.891 |
cour | -17.711 |
Token | who |
Token ID | 508 |
Feature activation | -6.95e+00 |
Pos logit contributions | |
idious | +11.816 |
ocate | +11.034 |
enary | +10.950 |
urnal | +10.922 |
onential | +10.534 |
Neg logit contributions | |
BT | -9.931 |
Dollar | -9.912 |
FW | -9.580 |
cour | -9.461 |
rentals | -9.355 |
Token | co |
Token ID | 763 |
Feature activation | -3.57e+00 |
Pos logit contributions | |
idious | +6.970 |
ocate | +6.722 |
urnal | +6.670 |
enary | +6.577 |
onential | +6.514 |
Neg logit contributions | |
BT | -4.890 |
Dollar | -4.780 |
FW | -4.621 |
cour | -4.601 |
rentals | -4.444 |
Token | - |
Token ID | 12 |
Feature activation | -7.86e+00 |
Pos logit contributions | |
idious | +3.805 |
urnal | +3.616 |
ocate | +3.596 |
onential | +3.560 |
enary | +3.553 |
Neg logit contributions | |
BT | -2.469 |
Dollar | -2.410 |
cour | -2.317 |
FW | -2.309 |
rentals | -2.232 |
Token | authored |
Token ID | 39351 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
idious | +6.098 |
urnal | +5.680 |
ocate | +5.654 |
enary | +5.577 |
onential | +5.492 |
Neg logit contributions | |
Dollar | -7.434 |
BT | -7.392 |
FW | -7.072 |
rentals | -7.069 |
cour | -6.908 |
Token | finally |
Token ID | 3443 |
Feature activation | +6.71e-01 |
Pos logit contributions | |
BT | +4.919 |
Dollar | +4.858 |
cour | +4.687 |
FW | +4.566 |
fav | +4.544 |
Neg logit contributions | |
idious | -6.675 |
urnal | -6.465 |
ocate | -6.406 |
onential | -6.340 |
enary | -6.291 |
Token | Pl |
Token ID | 1345 |
Feature activation | -3.19e+00 |
Pos logit contributions | |
BT | +0.493 |
Dollar | +0.481 |
cour | +0.465 |
FW | +0.458 |
rentals | +0.443 |
Neg logit contributions | |
idious | -0.692 |
urnal | -0.656 |
ocate | -0.656 |
onential | -0.649 |
enary | -0.644 |
Token | ath |
Token ID | 776 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
idious | +3.101 |
ocate | +2.925 |
urnal | +2.909 |
enary | +2.891 |
onential | +2.879 |
Neg logit contributions | |
BT | -2.513 |
Dollar | -2.472 |
cour | -2.381 |
FW | -2.371 |
rentals | -2.325 |
Token | is |
Token ID | 318 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
idious | +3.605 |
ocate | +3.403 |
urnal | +3.397 |
enary | +3.347 |
onential | +3.339 |
Neg logit contributions | |
BT | -2.410 |
Dollar | -2.353 |
cour | -2.273 |
FW | -2.251 |
rentals | -2.170 |
Token | a |
Token ID | 257 |
Feature activation | -7.46e-01 |
Pos logit contributions | |
idious | +0.414 |
urnal | +0.391 |
ocate | +0.391 |
onential | +0.386 |
enary | +0.383 |
Neg logit contributions | |
BT | -0.308 |
Dollar | -0.300 |
cour | -0.290 |
FW | -0.287 |
rentals | -0.277 |
Token | poet |
Token ID | 21810 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
idious | +0.677 |
ocate | +0.635 |
urnal | +0.635 |
onential | +0.625 |
enary | +0.621 |
Neg logit contributions | |
BT | -0.641 |
Dollar | -0.627 |
cour | -0.610 |
FW | -0.604 |
rentals | -0.586 |
Token | for |
Token ID | 329 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
idious | +16.137 |
urnal | +14.446 |
ocate | +14.326 |
enary | +14.219 |
onential | +13.945 |
Neg logit contributions | |
BT | -11.630 |
Dollar | -11.382 |
FW | -10.850 |
cour | -10.719 |
rentals | -10.522 |
Token | whom |
Token ID | 4150 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
idious | +2.086 |
ocate | +1.968 |
urnal | +1.965 |
onential | +1.942 |
enary | +1.928 |
Neg logit contributions | |
BT | -1.606 |
Dollar | -1.564 |
cour | -1.514 |
FW | -1.500 |
rentals | -1.447 |
Token | the |
Token ID | 262 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
idious | +1.221 |
ocate | +1.152 |
urnal | +1.151 |
onential | +1.138 |
enary | +1.129 |
Neg logit contributions | |
BT | -0.924 |
Dollar | -0.899 |
cour | -0.871 |
FW | -0.861 |
rentals | -0.829 |
Token | world |
Token ID | 995 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
BT | +0.188 |
Dollar | +0.184 |
cour | +0.179 |
FW | +0.176 |
rentals | +0.171 |
Neg logit contributions | |
idious | -0.235 |
urnal | -0.222 |
ocate | -0.222 |
onential | -0.220 |
enary | -0.218 |
Token | was |
Token ID | 373 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
BT | +2.123 |
Dollar | +2.066 |
cour | +2.007 |
FW | +1.963 |
fav | +1.932 |
Neg logit contributions | |
idious | -3.301 |
ocate | -3.152 |
urnal | -3.148 |
onential | -3.128 |
enary | -3.080 |
Token | on |
Token ID | 319 |
Feature activation | -2.16e+00 |
Pos logit contributions | |
idious | +2.475 |
urnal | +2.333 |
ocate | +2.330 |
onential | +2.298 |
enary | +2.286 |
Neg logit contributions | |
BT | -2.028 |
Dollar | -1.978 |
cour | -1.915 |
FW | -1.905 |
rentals | -1.836 |
Token | 18 |
Token ID | 1248 |
Feature activation | +2.63e+00 |
Pos logit contributions | |
idious | +2.139 |
urnal | +2.017 |
ocate | +2.011 |
onential | +1.983 |
enary | +1.975 |
Neg logit contributions | |
BT | -1.674 |
Dollar | -1.624 |
cour | -1.580 |
FW | -1.574 |
rentals | -1.509 |
Token | October |
Token ID | 3267 |
Feature activation | -8.33e+00 |
Pos logit contributions | |
BT | +1.838 |
Dollar | +1.798 |
cour | +1.735 |
FW | +1.687 |
rentals | +1.634 |
Neg logit contributions | |
idious | -2.826 |
ocate | -2.669 |
urnal | -2.667 |
onential | -2.644 |
enary | -2.619 |
Token | , |
Token ID | 11 |
Feature activation | -7.33e+00 |
Pos logit contributions | |
idious | +7.694 |
urnal | +7.276 |
ocate | +7.182 |
enary | +7.149 |
onential | +7.031 |
Neg logit contributions | |
BT | -6.461 |
Dollar | -6.278 |
FW | -6.153 |
cour | -6.143 |
rentals | -5.924 |
Token | when |
Token ID | 618 |
Feature activation | -7.64e+00 |
Pos logit contributions | |
idious | +6.777 |
urnal | +6.418 |
ocate | +6.332 |
enary | +6.255 |
onential | +6.222 |
Neg logit contributions | |
BT | -5.822 |
Dollar | -5.604 |
FW | -5.564 |
cour | -5.473 |
FB | -5.304 |
Token | astronomers |
Token ID | 33162 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
idious | +7.404 |
urnal | +6.999 |
ocate | +6.976 |
onential | +6.813 |
enary | +6.779 |
Neg logit contributions | |
BT | -5.758 |
Dollar | -5.521 |
FW | -5.439 |
cour | -5.429 |
rentals | -5.183 |
Token | launched |
Token ID | 5611 |
Feature activation | -4.34e+00 |
Pos logit contributions | |
idious | +15.616 |
ocate | +14.488 |
urnal | +14.459 |
enary | +14.265 |
elfth | +13.823 |
Neg logit contributions | |
BT | -11.406 |
cour | -11.248 |
Dollar | -10.883 |
FW | -10.812 |
FB | -10.525 |
Token | the |
Token ID | 262 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
idious | +4.157 |
urnal | +3.914 |
ocate | +3.893 |
onential | +3.841 |
enary | +3.816 |
Neg logit contributions | |
BT | -3.463 |
Dollar | -3.374 |
cour | -3.305 |
FW | -3.265 |
rentals | -3.142 |
Token | third |
Token ID | 2368 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
idious | +3.508 |
urnal | +3.320 |
ocate | +3.312 |
onential | +3.264 |
enary | +3.249 |
Neg logit contributions | |
BT | -2.553 |
Dollar | -2.478 |
cour | -2.432 |
FW | -2.394 |
rentals | -2.310 |
Token | Grav |
Token ID | 32599 |
Feature activation | -8.34e+00 |
Pos logit contributions | |
idious | +5.167 |
urnal | +4.900 |
ocate | +4.844 |
onential | +4.796 |
enary | +4.781 |
Neg logit contributions | |
BT | -3.991 |
Dollar | -3.867 |
cour | -3.809 |
FW | -3.737 |
rentals | -3.642 |
Token | itational |
Token ID | 22181 |
Feature activation | -5.00e+00 |
Pos logit contributions | |
idious | +5.193 |
ocate | +4.853 |
urnal | +4.718 |
onential | +4.587 |
enary | +4.530 |
Neg logit contributions | |
Dollar | -9.029 |
BT | -9.002 |
cour | -8.818 |
FW | -8.698 |
rentals | -8.629 |
Token | M |
Token ID | 44 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
idious | +5.824 |
ocate | +5.558 |
urnal | +5.511 |
enary | +5.448 |
onential | +5.440 |
Neg logit contributions | |
Dollar | -3.902 |
BT | -3.864 |
rentals | -3.690 |
cour | -3.665 |
fav | -3.638 |
Token | ord |
Token ID | 585 |
Feature activation | +4.74e+00 |
Pos logit contributions | |
BT | +0.031 |
Dollar | +0.031 |
cour | +0.030 |
FW | +0.029 |
rentals | +0.029 |
Neg logit contributions | |
idious | -0.031 |
ocate | -0.030 |
urnal | -0.030 |
onential | -0.029 |
enary | -0.029 |
Token | ica |
Token ID | 3970 |
Feature activation | +2.92e+00 |
Pos logit contributions | |
BT | +4.452 |
Dollar | +4.379 |
cour | +4.347 |
FW | +4.224 |
fav | +4.205 |
Neg logit contributions | |
idious | -3.724 |
onential | -3.459 |
urnal | -3.442 |
ocate | -3.336 |
enary | -3.251 |
Token | is |
Token ID | 318 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
BT | +2.012 |
Dollar | +1.958 |
cour | +1.886 |
FW | +1.856 |
fav | +1.795 |
Neg logit contributions | |
idious | -3.147 |
urnal | -2.993 |
ocate | -2.984 |
onential | -2.963 |
enary | -2.935 |
Token | the |
Token ID | 262 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
BT | +0.951 |
Dollar | +0.932 |
cour | +0.903 |
FW | +0.892 |
rentals | +0.864 |
Neg logit contributions | |
idious | -1.161 |
urnal | -1.097 |
ocate | -1.095 |
onential | -1.083 |
enary | -1.076 |
Token | fastest |
Token ID | 14162 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
idious | +2.569 |
ocate | +2.428 |
urnal | +2.413 |
onential | +2.379 |
enary | +2.372 |
Neg logit contributions | |
BT | -2.121 |
Dollar | -2.055 |
cour | -2.012 |
FW | -1.988 |
rentals | -1.918 |
Token | back |
Token ID | 736 |
Feature activation | -8.27e+00 |
Pos logit contributions | |
idious | +16.036 |
ocate | +14.246 |
onential | +13.906 |
enary | +13.898 |
urnal | +13.878 |
Neg logit contributions | |
BT | -12.089 |
cour | -11.311 |
FW | -11.258 |
Dollar | -10.856 |
rentals | -10.732 |
Token | we |
Token ID | 356 |
Feature activation | -8.23e-01 |
Pos logit contributions | |
idious | +7.442 |
ocate | +7.043 |
urnal | +6.936 |
enary | +6.891 |
onential | +6.849 |
Neg logit contributions | |
BT | -6.737 |
Dollar | -6.561 |
FW | -6.312 |
cour | -6.250 |
rentals | -6.202 |
Token | � |
Token ID | 447 |
Feature activation | -8.50e-01 |
Pos logit contributions | |
idious | +0.906 |
ocate | +0.863 |
urnal | +0.861 |
onential | +0.851 |
enary | +0.847 |
Neg logit contributions | |
BT | -0.545 |
Dollar | -0.531 |
cour | -0.511 |
FW | -0.504 |
rentals | -0.484 |
Token | � |
Token ID | 247 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
idious | +0.733 |
urnal | +0.687 |
ocate | +0.685 |
onential | +0.676 |
enary | +0.671 |
Neg logit contributions | |
BT | -0.766 |
Dollar | -0.750 |
cour | -0.730 |
FW | -0.724 |
rentals | -0.703 |
Token | ve |
Token ID | 303 |
Feature activation | -5.32e+00 |
Pos logit contributions | |
BT | +1.247 |
Dollar | +1.214 |
cour | +1.185 |
FW | +1.164 |
rentals | +1.124 |
Neg logit contributions | |
idious | -1.607 |
urnal | -1.526 |
ocate | -1.512 |
onential | -1.508 |
enary | -1.485 |
Token | ger |
Token ID | 1362 |
Feature activation | -5.58e+00 |
Pos logit contributions | |
BT | +1.728 |
Dollar | +1.690 |
cour | +1.646 |
FW | +1.603 |
rentals | +1.551 |
Neg logit contributions | |
idious | -2.522 |
urnal | -2.382 |
ocate | -2.370 |
onential | -2.368 |
enary | -2.323 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
idious | +5.607 |
ocate | +5.293 |
urnal | +5.280 |
enary | +5.203 |
onential | +5.163 |
Neg logit contributions | |
BT | -4.113 |
Dollar | -3.997 |
FW | -3.850 |
cour | -3.834 |
rentals | -3.740 |
Token | a |
Token ID | 257 |
Feature activation | -6.61e+00 |
Pos logit contributions | |
idious | +9.214 |
ocate | +8.790 |
urnal | +8.632 |
enary | +8.479 |
onential | +8.403 |
Neg logit contributions | |
BT | -9.327 |
Dollar | -8.868 |
FW | -8.743 |
cour | -8.673 |
FB | -8.469 |
Token | UCS |
Token ID | 49553 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
idious | +6.041 |
ocate | +5.789 |
urnal | +5.736 |
enary | +5.574 |
onential | +5.522 |
Neg logit contributions | |
BT | -5.283 |
Dollar | -5.062 |
FW | -5.008 |
cour | -4.939 |
FB | -4.842 |
Token | F |
Token ID | 37 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
idious | +9.088 |
urnal | +8.804 |
enary | +8.673 |
ocate | +8.665 |
onential | +8.661 |
Neg logit contributions | |
Dollar | -3.749 |
BT | -3.740 |
cour | -3.578 |
rentals | -3.440 |
fav | -3.387 |
Token | professor |
Token ID | 6240 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
idious | +10.247 |
ocate | +9.900 |
urnal | +9.814 |
enary | +9.523 |
onential | +9.518 |
Neg logit contributions | |
BT | -9.159 |
Dollar | -8.839 |
cour | -8.759 |
FW | -8.699 |
rentals | -8.515 |
Token | who |
Token ID | 508 |
Feature activation | -6.43e+00 |
Pos logit contributions | |
idious | +13.701 |
ocate | +12.793 |
urnal | +12.659 |
enary | +12.560 |
onential | +12.275 |
Neg logit contributions | |
BT | -13.718 |
Dollar | -13.209 |
rentals | -12.812 |
FW | -12.809 |
cour | -12.802 |
Token | for |
Token ID | 329 |
Feature activation | -3.54e+00 |
Pos logit contributions | |
idious | +6.484 |
ocate | +6.263 |
urnal | +6.187 |
enary | +6.119 |
onential | +6.090 |
Neg logit contributions | |
BT | -4.531 |
Dollar | -4.435 |
FW | -4.283 |
cour | -4.216 |
rentals | -4.107 |
Token | many |
Token ID | 867 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
idious | +4.042 |
ocate | +3.866 |
urnal | +3.850 |
onential | +3.817 |
enary | +3.810 |
Neg logit contributions | |
BT | -2.172 |
Dollar | -2.090 |
FW | -2.003 |
cour | -1.996 |
rentals | -1.903 |
Token | years |
Token ID | 812 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
idious | +1.426 |
ocate | +1.366 |
urnal | +1.364 |
onential | +1.349 |
enary | +1.344 |
Neg logit contributions | |
BT | -0.548 |
Dollar | -0.524 |
cour | -0.497 |
FW | -0.492 |
rentals | -0.459 |
Token | has |
Token ID | 468 |
Feature activation | -5.43e+00 |
Pos logit contributions | |
idious | +2.221 |
ocate | +2.109 |
urnal | +2.104 |
onential | +2.076 |
enary | +2.073 |
Neg logit contributions | |
BT | -1.433 |
Dollar | -1.396 |
cour | -1.341 |
FW | -1.337 |
rentals | -1.277 |
Token | film |
Token ID | 2646 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
idious | +0.178 |
urnal | +0.168 |
ocate | +0.168 |
onential | +0.166 |
enary | +0.164 |
Neg logit contributions | |
BT | -0.139 |
Dollar | -0.136 |
cour | -0.131 |
FW | -0.129 |
rentals | -0.126 |
Token | . |
Token ID | 13 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
idious | +0.495 |
urnal | +0.469 |
ocate | +0.468 |
onential | +0.463 |
enary | +0.460 |
Neg logit contributions | |
BT | -0.353 |
Dollar | -0.344 |
cour | -0.333 |
FW | -0.328 |
rentals | -0.317 |
Token | But |
Token ID | 887 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
idious | +3.216 |
ocate | +3.062 |
urnal | +3.045 |
enary | +3.009 |
onential | +3.002 |
Neg logit contributions | |
BT | -2.462 |
Dollar | -2.383 |
cour | -2.326 |
FW | -2.310 |
rentals | -2.261 |
Token | after |
Token ID | 706 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
BT | +4.511 |
Dollar | +4.487 |
cour | +4.295 |
FW | +4.162 |
fav | +4.106 |
Neg logit contributions | |
idious | -6.407 |
urnal | -6.120 |
onential | -6.095 |
ocate | -6.062 |
enary | -5.964 |
Token | his |
Token ID | 465 |
Feature activation | -2.56e+00 |
Pos logit contributions | |
BT | +0.081 |
Dollar | +0.078 |
cour | +0.076 |
FW | +0.075 |
rentals | +0.072 |
Neg logit contributions | |
idious | -0.110 |
urnal | -0.104 |
ocate | -0.104 |
onential | -0.103 |
enary | -0.102 |
Token | schedule |
Token ID | 7269 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
idious | +2.682 |
urnal | +2.538 |
ocate | +2.534 |
onential | +2.495 |
enary | +2.494 |
Neg logit contributions | |
BT | -1.838 |
Dollar | -1.774 |
cour | -1.726 |
FW | -1.709 |
rentals | -1.632 |
Token | wouldn |
Token ID | 3636 |
Feature activation | +9.72e+00 |
Pos logit contributions | |
BT | +7.129 |
Dollar | +6.813 |
fav | +6.690 |
rentals | +6.687 |
cour | +6.468 |
Neg logit contributions | |
idious | -12.027 |
ocate | -11.848 |
onential | -11.664 |
urnal | -11.581 |
elfth | -11.479 |
Token | � |
Token ID | 447 |
Feature activation | -7.50e-01 |
Pos logit contributions | |
BT | +7.139 |
cour | +6.881 |
Dollar | +6.692 |
FW | +6.531 |
FB | +6.379 |
Neg logit contributions | |
idious | -9.733 |
onential | -9.130 |
urnal | -9.077 |
ocate | -8.835 |
enary | -8.687 |
Token | � |
Token ID | 247 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
idious | +0.663 |
urnal | +0.626 |
ocate | +0.621 |
onential | +0.615 |
enary | +0.611 |
Neg logit contributions | |
BT | -0.656 |
Dollar | -0.643 |
cour | -0.625 |
FW | -0.619 |
rentals | -0.602 |
Token | t |
Token ID | 83 |
Feature activation | -5.79e-01 |
Pos logit contributions | |
BT | +1.693 |
Dollar | +1.642 |
cour | +1.583 |
FW | +1.547 |
fav | +1.469 |
Neg logit contributions | |
idious | -3.554 |
urnal | -3.393 |
ocate | -3.366 |
onential | -3.360 |
enary | -3.312 |
Token | allow |
Token ID | 1249 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
idious | +0.610 |
urnal | +0.579 |
ocate | +0.579 |
onential | +0.571 |
enary | +0.568 |
Neg logit contributions | |
BT | -0.411 |
Dollar | -0.401 |
cour | -0.388 |
FW | -0.382 |
rentals | -0.368 |
Token | writer |
Token ID | 16002 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
BT | +1.141 |
Dollar | +1.121 |
cour | +1.103 |
FW | +1.083 |
fav | +1.065 |
Neg logit contributions | |
idious | -0.828 |
urnal | -0.773 |
ocate | -0.757 |
onential | -0.755 |
enary | -0.740 |
Token | � |
Token ID | 447 |
Feature activation | +3.83e+00 |
Pos logit contributions | |
idious | +2.073 |
ocate | +1.954 |
urnal | +1.943 |
enary | +1.915 |
onential | +1.915 |
Neg logit contributions | |
BT | -1.760 |
Dollar | -1.706 |
cour | -1.668 |
FW | -1.653 |
rentals | -1.589 |
Token | � |
Token ID | 247 |
Feature activation | +4.58e+00 |
Pos logit contributions | |
BT | +2.958 |
Dollar | +2.900 |
cour | +2.804 |
FW | +2.780 |
fav | +2.683 |
Neg logit contributions | |
idious | -3.773 |
ocate | -3.580 |
urnal | -3.557 |
onential | -3.513 |
enary | -3.477 |
Token | s |
Token ID | 82 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
BT | +3.395 |
Dollar | +3.348 |
cour | +3.236 |
FW | +3.188 |
fav | +3.072 |
Neg logit contributions | |
idious | -4.564 |
urnal | -4.374 |
onential | -4.335 |
ocate | -4.304 |
enary | -4.221 |
Token | financial |
Token ID | 3176 |
Feature activation | +1.25e+01 |
Pos logit contributions | |
idious | +1.923 |
ocate | +1.821 |
urnal | +1.814 |
onential | +1.787 |
enary | +1.783 |
Neg logit contributions | |
BT | -1.260 |
Dollar | -1.206 |
cour | -1.173 |
FW | -1.165 |
rentals | -1.105 |
Token | history |
Token ID | 2106 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
Dollar | +7.744 |
cour | +7.597 |
fav | +7.558 |
BT | +7.526 |
rentals | +7.258 |
Neg logit contributions | |
idious | -12.773 |
urnal | -12.544 |
onential | -12.304 |
enary | -12.184 |
ocate | -12.173 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
BT | +6.732 |
Dollar | +6.610 |
cour | +6.443 |
FW | +6.168 |
fav | +6.094 |
Neg logit contributions | |
idious | -11.818 |
urnal | -11.529 |
onential | -11.453 |
ocate | -11.400 |
enary | -11.136 |
Token |
|
Token ID | 198 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
idious | +1.287 |
ocate | +1.219 |
urnal | +1.215 |
onential | +1.198 |
enary | +1.193 |
Neg logit contributions | |
BT | -1.030 |
Dollar | -1.002 |
cour | -0.975 |
FW | -0.963 |
rentals | -0.936 |
Token |
|
Token ID | 198 |
Feature activation | +9.20e-02 |
Pos logit contributions | |
idious | +0.028 |
ocate | +0.026 |
urnal | +0.026 |
onential | +0.026 |
enary | +0.026 |
Neg logit contributions | |
BT | -0.022 |
Dollar | -0.022 |
cour | -0.021 |
FW | -0.021 |
rentals | -0.020 |
Token | � |
Token ID | 447 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
BT | +0.064 |
Dollar | +0.062 |
cour | +0.061 |
FW | +0.060 |
rentals | +0.057 |
Neg logit contributions | |
idious | -0.099 |
urnal | -0.093 |
ocate | -0.093 |
onential | -0.092 |
enary | -0.092 |
Token | � |
Token ID | 250 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
BT | +1.963 |
Dollar | +1.923 |
cour | +1.866 |
FW | +1.840 |
rentals | +1.781 |
Neg logit contributions | |
idious | -2.465 |
ocate | -2.322 |
urnal | -2.319 |
onential | -2.286 |
enary | -2.271 |
Token | what |
Token ID | 644 |
Feature activation | -8.35e+00 |
Pos logit contributions | |
BT | +3.869 |
Dollar | +3.869 |
cour | +3.682 |
FW | +3.651 |
rentals | +3.591 |
Neg logit contributions | |
idious | -5.246 |
urnal | -5.069 |
onential | -5.024 |
ocate | -4.991 |
enary | -4.974 |
Token | crystal |
Token ID | 15121 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
idious | +7.658 |
ocate | +7.130 |
urnal | +7.099 |
onential | +6.947 |
enary | +6.903 |
Neg logit contributions | |
BT | -6.773 |
cour | -6.323 |
Dollar | -6.302 |
FW | -6.233 |
FB | -6.012 |
Token | meth |
Token ID | 11248 |
Feature activation | -8.24e+00 |
Pos logit contributions | |
idious | +2.640 |
ocate | +2.491 |
urnal | +2.479 |
onential | +2.439 |
enary | +2.434 |
Neg logit contributions | |
BT | -2.419 |
Dollar | -2.358 |
cour | -2.297 |
FW | -2.268 |
rentals | -2.204 |
Token | does |
Token ID | 857 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
idious | +8.461 |
ocate | +7.976 |
urnal | +7.876 |
enary | +7.860 |
onential | +7.762 |
Neg logit contributions | |
BT | -5.738 |
Dollar | -5.460 |
cour | -5.308 |
FW | -5.286 |
FB | -4.995 |
Token | -- |
Token ID | 438 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
BT | +0.102 |
Dollar | +0.100 |
cour | +0.096 |
FW | +0.095 |
fav | +0.093 |
Neg logit contributions | |
idious | -0.149 |
urnal | -0.141 |
ocate | -0.141 |
onential | -0.140 |
enary | -0.138 |
Token | Mike |
Token ID | 16073 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
BT | +0.864 |
Dollar | +0.840 |
cour | +0.818 |
FW | +0.806 |
rentals | +0.775 |
Neg logit contributions | |
idious | -1.110 |
urnal | -1.051 |
ocate | -1.048 |
onential | -1.036 |
enary | -1.029 |
Token | taught |
Token ID | 7817 |
Feature activation | -5.22e+00 |
Pos logit contributions | |
Dollar | +8.333 |
BT | +8.090 |
FW | +7.420 |
fav | +7.369 |
rentals | +7.320 |
Neg logit contributions | |
idious | -13.354 |
ocate | -13.006 |
onential | -12.984 |
urnal | -12.981 |
enary | -12.862 |
Token | me |
Token ID | 502 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
idious | +4.470 |
ocate | +4.159 |
urnal | +4.149 |
onential | +4.095 |
enary | +4.043 |
Neg logit contributions | |
BT | -4.695 |
Dollar | -4.549 |
cour | -4.484 |
FW | -4.439 |
fav | -4.265 |
Token | this |
Token ID | 428 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
idious | +2.339 |
ocate | +2.215 |
urnal | +2.209 |
onential | +2.188 |
enary | +2.171 |
Neg logit contributions | |
BT | -1.588 |
Dollar | -1.537 |
cour | -1.497 |
FW | -1.475 |
rentals | -1.415 |
Token | -- |
Token ID | 438 |
Feature activation | +9.59e-01 |
Pos logit contributions | |
idious | +4.154 |
ocate | +3.891 |
urnal | +3.890 |
onential | +3.864 |
enary | +3.831 |
Neg logit contributions | |
BT | -3.027 |
Dollar | -2.927 |
cour | -2.879 |
FW | -2.828 |
rentals | -2.716 |
Token | cry |
Token ID | 20470 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
BT | +0.781 |
Dollar | +0.760 |
cour | +0.744 |
FW | +0.731 |
fav | +0.704 |
Neg logit contributions | |
idious | -0.916 |
urnal | -0.865 |
ocate | -0.862 |
onential | -0.852 |
enary | -0.846 |
Token | that |
Token ID | 326 |
Feature activation | +7.81e-01 |
Pos logit contributions | |
BT | +1.572 |
Dollar | +1.545 |
cour | +1.482 |
FW | +1.464 |
fav | +1.420 |
Neg logit contributions | |
idious | -2.118 |
ocate | -2.012 |
urnal | -2.005 |
onential | -1.996 |
enary | -1.977 |
Token | vets |
Token ID | 45024 |
Feature activation | -3.66e+00 |
Pos logit contributions | |
BT | +0.614 |
Dollar | +0.600 |
cour | +0.581 |
FW | +0.574 |
rentals | +0.556 |
Neg logit contributions | |
idious | -0.765 |
ocate | -0.723 |
urnal | -0.723 |
onential | -0.715 |
enary | -0.709 |
Token | ' |
Token ID | 6 |
Feature activation | +6.63e-02 |
Pos logit contributions | |
idious | +3.959 |
ocate | +3.753 |
urnal | +3.707 |
enary | +3.644 |
onential | +3.642 |
Neg logit contributions | |
BT | -2.470 |
Dollar | -2.374 |
cour | -2.318 |
FW | -2.284 |
rentals | -2.192 |
Token | bills |
Token ID | 9024 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
BT | +0.043 |
Dollar | +0.042 |
cour | +0.040 |
FW | +0.039 |
rentals | +0.038 |
Neg logit contributions | |
idious | -0.074 |
urnal | -0.071 |
ocate | -0.071 |
onential | -0.070 |
enary | -0.069 |
Token | would |
Token ID | 561 |
Feature activation | +9.51e+00 |
Pos logit contributions | |
BT | +8.388 |
Dollar | +8.263 |
cour | +7.825 |
fav | +7.685 |
rentals | +7.539 |
Neg logit contributions | |
idious | -15.441 |
urnal | -15.307 |
onential | -15.284 |
ocate | -14.857 |
enary | -14.724 |
Token | be |
Token ID | 307 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
Dollar | +5.673 |
BT | +5.665 |
cour | +5.321 |
fav | +5.307 |
rentals | +5.182 |
Neg logit contributions | |
idious | -10.360 |
urnal | -10.023 |
onential | -9.777 |
ocate | -9.574 |
enary | -9.538 |
Token | too |
Token ID | 1165 |
Feature activation | +8.78e+00 |
Pos logit contributions | |
Dollar | +7.076 |
BT | +7.027 |
cour | +6.628 |
rentals | +6.471 |
fav | +6.457 |
Neg logit contributions | |
idious | -11.798 |
onential | -11.572 |
urnal | -11.551 |
ocate | -11.356 |
enary | -11.215 |
Token | expensive |
Token ID | 5789 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
BT | +5.150 |
Dollar | +5.054 |
fav | +4.824 |
cour | +4.748 |
rentals | +4.639 |
Neg logit contributions | |
idious | -9.720 |
onential | -9.563 |
ocate | -9.546 |
urnal | -9.473 |
enary | -9.301 |
Token | , |
Token ID | 11 |
Feature activation | +3.43e+00 |
Pos logit contributions | |
BT | +3.697 |
Dollar | +3.687 |
cour | +3.485 |
fav | +3.416 |
FW | +3.412 |
Neg logit contributions | |
idious | -6.091 |
urnal | -5.928 |
onential | -5.923 |
ocate | -5.920 |
enary | -5.801 |
Token | took |
Token ID | 1718 |
Feature activation | -2.78e+00 |
Pos logit contributions | |
BT | +2.413 |
Dollar | +2.363 |
cour | +2.263 |
FW | +2.211 |
fav | +2.209 |
Neg logit contributions | |
idious | -3.606 |
urnal | -3.444 |
ocate | -3.432 |
onential | -3.430 |
enary | -3.375 |
Token | Bart |
Token ID | 13167 |
Feature activation | -4.89e+00 |
Pos logit contributions | |
idious | +2.748 |
urnal | +2.588 |
ocate | +2.581 |
onential | +2.548 |
enary | +2.530 |
Neg logit contributions | |
BT | -2.170 |
Dollar | -2.104 |
cour | -2.048 |
FW | -2.032 |
rentals | -1.954 |
Token | disturbed |
Token ID | 24069 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
BT | +0.178 |
Dollar | +0.173 |
cour | +0.168 |
FW | +0.165 |
fav | +0.159 |
Neg logit contributions | |
idious | -0.277 |
urnal | -0.263 |
ocate | -0.263 |
onential | -0.261 |
enary | -0.258 |
Token | ground |
Token ID | 2323 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
idious | +3.771 |
ocate | +3.565 |
urnal | +3.560 |
onential | +3.500 |
enary | +3.489 |
Neg logit contributions | |
BT | -2.804 |
Dollar | -2.730 |
cour | -2.644 |
FW | -2.610 |
rentals | -2.509 |
Token | , |
Token ID | 11 |
Feature activation | +3.18e+00 |
Pos logit contributions | |
BT | +0.724 |
Dollar | +0.702 |
cour | +0.685 |
FW | +0.675 |
fav | +0.649 |
Neg logit contributions | |
idious | -1.065 |
urnal | -1.012 |
ocate | -1.007 |
onential | -1.003 |
enary | -0.991 |
Token | but |
Token ID | 475 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
BT | +2.273 |
Dollar | +2.218 |
cour | +2.149 |
FW | +2.113 |
fav | +2.056 |
Neg logit contributions | |
idious | -3.319 |
urnal | -3.152 |
ocate | -3.134 |
onential | -3.110 |
enary | -3.106 |
Token | in |
Token ID | 287 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
BT | +4.577 |
Dollar | +4.485 |
cour | +4.341 |
FW | +4.235 |
fav | +4.231 |
Neg logit contributions | |
idious | -6.724 |
urnal | -6.448 |
enary | -6.369 |
onential | -6.361 |
ocate | -6.346 |
Token | reality |
Token ID | 3950 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
BT | +0.804 |
Dollar | +0.786 |
cour | +0.758 |
FW | +0.745 |
rentals | +0.728 |
Neg logit contributions | |
idious | -1.053 |
urnal | -0.997 |
ocate | -0.994 |
onential | -0.986 |
enary | -0.984 |
Token | will |
Token ID | 481 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
BT | +6.942 |
Dollar | +6.679 |
cour | +6.571 |
fav | +6.550 |
FW | +6.379 |
Neg logit contributions | |
idious | -11.620 |
enary | -11.244 |
urnal | -11.205 |
onential | -11.185 |
ocate | -10.997 |
Token | be |
Token ID | 307 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
BT | +1.327 |
Dollar | +1.279 |
cour | +1.247 |
FW | +1.226 |
fav | +1.206 |
Neg logit contributions | |
idious | -1.976 |
urnal | -1.876 |
ocate | -1.864 |
onential | -1.857 |
enary | -1.844 |
Token | a |
Token ID | 257 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
BT | +1.110 |
Dollar | +1.083 |
cour | +1.052 |
FW | +1.033 |
fav | +1.007 |
Neg logit contributions | |
idious | -1.479 |
urnal | -1.404 |
ocate | -1.401 |
onential | -1.387 |
enary | -1.382 |
Token | dense |
Token ID | 15715 |
Feature activation | -3.92e+00 |
Pos logit contributions | |
BT | +1.087 |
Dollar | +1.060 |
cour | +1.024 |
FW | +1.011 |
fav | +0.981 |
Neg logit contributions | |
idious | -1.489 |
urnal | -1.409 |
ocate | -1.408 |
onential | -1.393 |
enary | -1.385 |
Token | mix |
Token ID | 5022 |
Feature activation | -3.14e+00 |
Pos logit contributions | |
idious | +4.019 |
ocate | +3.782 |
urnal | +3.775 |
onential | +3.736 |
enary | +3.697 |
Neg logit contributions | |
BT | -2.885 |
Dollar | -2.805 |
cour | -2.737 |
FW | -2.693 |
rentals | -2.587 |
Token | . |
Token ID | 13 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
idious | +4.371 |
ocate | +4.119 |
urnal | +4.118 |
enary | +4.053 |
onential | +4.037 |
Neg logit contributions | |
BT | -3.401 |
Dollar | -3.322 |
cour | -3.201 |
FW | -3.176 |
rentals | -3.082 |
Token |
|
Token ID | 198 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
BT | +0.325 |
Dollar | +0.317 |
cour | +0.308 |
FW | +0.304 |
rentals | +0.293 |
Neg logit contributions | |
idious | -0.419 |
urnal | -0.396 |
ocate | -0.396 |
onential | -0.391 |
enary | -0.388 |
Token |
|
Token ID | 198 |
Feature activation | -9.90e-01 |
Pos logit contributions | |
idious | +1.791 |
ocate | +1.696 |
urnal | +1.685 |
enary | +1.657 |
onential | +1.656 |
Neg logit contributions | |
BT | -1.569 |
Dollar | -1.537 |
cour | -1.484 |
FW | -1.474 |
rentals | -1.451 |
Token | The |
Token ID | 464 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
idious | +1.043 |
urnal | +0.989 |
ocate | +0.989 |
onential | +0.976 |
enary | +0.971 |
Neg logit contributions | |
BT | -0.700 |
Dollar | -0.686 |
cour | -0.659 |
FW | -0.650 |
rentals | -0.631 |
Token | rulings |
Token ID | 31532 |
Feature activation | +2.98e+00 |
Pos logit contributions | |
BT | +1.045 |
Dollar | +1.023 |
cour | +0.990 |
FW | +0.970 |
rentals | +0.945 |
Neg logit contributions | |
idious | -1.495 |
urnal | -1.416 |
ocate | -1.415 |
onential | -1.404 |
enary | -1.385 |
Token | are |
Token ID | 389 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
BT | +2.066 |
Dollar | +2.028 |
cour | +1.967 |
FW | +1.928 |
fav | +1.885 |
Neg logit contributions | |
idious | -3.165 |
urnal | -2.999 |
ocate | -2.990 |
onential | -2.986 |
enary | -2.937 |
Token | , |
Token ID | 11 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
BT | +1.863 |
Dollar | +1.836 |
cour | +1.781 |
FW | +1.746 |
fav | +1.707 |
Neg logit contributions | |
idious | -2.433 |
ocate | -2.306 |
urnal | -2.300 |
onential | -2.284 |
enary | -2.262 |
Token | however |
Token ID | 2158 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
idious | +1.538 |
urnal | +1.456 |
ocate | +1.456 |
onential | +1.439 |
enary | +1.429 |
Neg logit contributions | |
BT | -1.089 |
Dollar | -1.061 |
cour | -1.027 |
FW | -1.013 |
rentals | -0.978 |
Token | , |
Token ID | 11 |
Feature activation | -5.06e-01 |
Pos logit contributions | |
BT | +2.605 |
Dollar | +2.557 |
cour | +2.498 |
FW | +2.399 |
fav | +2.355 |
Neg logit contributions | |
idious | -4.575 |
urnal | -4.380 |
ocate | -4.370 |
onential | -4.358 |
enary | -4.307 |
Token | unlikely |
Token ID | 7485 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
idious | +0.514 |
urnal | +0.485 |
ocate | +0.484 |
onential | +0.478 |
enary | +0.476 |
Neg logit contributions | |
BT | -0.382 |
Dollar | -0.370 |
cour | -0.358 |
FW | -0.355 |
rentals | -0.341 |
Token | to |
Token ID | 284 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
idious | +0.554 |
urnal | +0.523 |
ocate | +0.522 |
onential | +0.516 |
enary | +0.513 |
Neg logit contributions | |
BT | -0.463 |
Dollar | -0.452 |
cour | -0.438 |
FW | -0.433 |
rentals | -0.419 |
Token | or |
Token ID | 393 |
Feature activation | +8.66e-01 |
Pos logit contributions | |
BT | +3.262 |
Dollar | +3.176 |
cour | +3.101 |
FW | +3.020 |
fav | +2.938 |
Neg logit contributions | |
idious | -5.028 |
urnal | -4.822 |
ocate | -4.805 |
onential | -4.798 |
enary | -4.706 |
Token | hesitate |
Token ID | 22898 |
Feature activation | -2.63e+00 |
Pos logit contributions | |
BT | +0.629 |
Dollar | +0.613 |
cour | +0.594 |
FW | +0.586 |
rentals | +0.566 |
Neg logit contributions | |
idious | -0.899 |
urnal | -0.852 |
ocate | -0.850 |
onential | -0.842 |
enary | -0.836 |
Token | to |
Token ID | 284 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
idious | +2.535 |
ocate | +2.383 |
urnal | +2.378 |
onential | +2.344 |
enary | +2.334 |
Neg logit contributions | |
BT | -2.117 |
Dollar | -2.069 |
cour | -2.000 |
FW | -1.984 |
rentals | -1.913 |
Token | issue |
Token ID | 2071 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
BT | +1.464 |
Dollar | +1.433 |
cour | +1.382 |
FW | +1.353 |
fav | +1.334 |
Neg logit contributions | |
idious | -2.115 |
urnal | -2.027 |
onential | -2.013 |
ocate | -1.998 |
enary | -1.975 |
Token | rulings |
Token ID | 31532 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
BT | +1.033 |
Dollar | +1.010 |
cour | +0.979 |
FW | +0.961 |
rentals | +0.933 |
Neg logit contributions | |
idious | -1.495 |
urnal | -1.418 |
ocate | -1.416 |
onential | -1.408 |
enary | -1.391 |
Token | that |
Token ID | 326 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
BT | +0.787 |
Dollar | +0.769 |
cour | +0.747 |
FW | +0.730 |
fav | +0.707 |
Neg logit contributions | |
idious | -1.263 |
ocate | -1.206 |
urnal | -1.205 |
onential | -1.197 |
enary | -1.183 |
Token | may |
Token ID | 743 |
Feature activation | +3.02e+00 |
Pos logit contributions | |
BT | +0.767 |
Dollar | +0.746 |
cour | +0.720 |
FW | +0.710 |
rentals | +0.683 |
Neg logit contributions | |
idious | -1.239 |
ocate | -1.176 |
urnal | -1.176 |
onential | -1.163 |
enary | -1.155 |
Token | make |
Token ID | 787 |
Feature activation | -3.30e+00 |
Pos logit contributions | |
BT | +2.064 |
Dollar | +2.009 |
cour | +1.940 |
FW | +1.908 |
fav | +1.898 |
Neg logit contributions | |
idious | -3.230 |
urnal | -3.083 |
onential | -3.055 |
ocate | -3.047 |
enary | -3.008 |
Token | them |
Token ID | 606 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
idious | +3.314 |
urnal | +3.106 |
ocate | +3.106 |
onential | +3.045 |
enary | +3.021 |
Neg logit contributions | |
BT | -2.518 |
Dollar | -2.418 |
FW | -2.354 |
cour | -2.344 |
FB | -2.226 |
Token | targets |
Token ID | 6670 |
Feature activation | +2.03e+00 |
Pos logit contributions | |
idious | +2.096 |
ocate | +1.997 |
urnal | +1.975 |
onential | +1.946 |
enary | +1.946 |
Neg logit contributions | |
BT | -1.362 |
Dollar | -1.322 |
cour | -1.269 |
FW | -1.258 |
FB | -1.201 |
Token | in |
Token ID | 287 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
BT | +1.420 |
Dollar | +1.370 |
cour | +1.342 |
FW | +1.324 |
fav | +1.279 |
Neg logit contributions | |
idious | -2.132 |
urnal | -2.043 |
ocate | -2.035 |
onential | -2.031 |
enary | -1.997 |
Token | And |
Token ID | 1870 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
BT | +0.316 |
Dollar | +0.299 |
cour | +0.295 |
FW | +0.293 |
FB | +0.274 |
Neg logit contributions | |
idious | -0.512 |
urnal | -0.486 |
ocate | -0.486 |
onential | -0.481 |
enary | -0.478 |
Token | ers |
Token ID | 364 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
BT | +1.850 |
Dollar | +1.789 |
cour | +1.743 |
FW | +1.735 |
rentals | +1.664 |
Neg logit contributions | |
idious | -2.637 |
ocate | -2.505 |
urnal | -2.502 |
onential | -2.475 |
enary | -2.447 |
Token | , |
Token ID | 11 |
Feature activation | -3.22e+00 |
Pos logit contributions | |
idious | +0.603 |
urnal | +0.571 |
ocate | +0.571 |
onential | +0.564 |
enary | +0.561 |
Neg logit contributions | |
BT | -0.388 |
Dollar | -0.378 |
cour | -0.365 |
FW | -0.360 |
rentals | -0.346 |
Token | knowing |
Token ID | 6970 |
Feature activation | +7.60e+00 |
Pos logit contributions | |
idious | +3.314 |
urnal | +3.119 |
ocate | +3.118 |
onential | +3.074 |
enary | +3.054 |
Neg logit contributions | |
BT | -2.357 |
Dollar | -2.288 |
cour | -2.219 |
FW | -2.193 |
rentals | -2.115 |
Token | full |
Token ID | 1336 |
Feature activation | +4.77e+00 |
Pos logit contributions | |
BT | +4.906 |
Dollar | +4.869 |
FW | +4.607 |
cour | +4.598 |
fav | +4.584 |
Neg logit contributions | |
idious | -7.989 |
urnal | -7.876 |
ocate | -7.712 |
onential | -7.677 |
enary | -7.674 |
Token | well |
Token ID | 880 |
Feature activation | +4.66e+00 |
Pos logit contributions | |
BT | +2.747 |
cour | +2.563 |
Dollar | +2.563 |
FW | +2.475 |
fav | +2.444 |
Neg logit contributions | |
idious | -5.571 |
urnal | -5.407 |
onential | -5.396 |
ocate | -5.388 |
enary | -5.247 |
Token | that |
Token ID | 326 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
BT | +2.797 |
Dollar | +2.742 |
FW | +2.585 |
cour | +2.584 |
fav | +2.504 |
Neg logit contributions | |
idious | -5.315 |
urnal | -5.147 |
ocate | -5.105 |
onential | -5.064 |
enary | -5.049 |
Token | I |
Token ID | 314 |
Feature activation | +7.31e+00 |
Pos logit contributions | |
BT | +2.853 |
Dollar | +2.823 |
cour | +2.693 |
FW | +2.681 |
rentals | +2.625 |
Neg logit contributions | |
idious | -3.833 |
urnal | -3.681 |
ocate | -3.645 |
enary | -3.605 |
onential | -3.601 |
Token | intend |
Token ID | 14765 |
Feature activation | +4.63e+00 |
Pos logit contributions | |
BT | +4.299 |
Dollar | +4.091 |
cour | +3.917 |
fav | +3.894 |
FW | +3.805 |
Neg logit contributions | |
idious | -8.413 |
urnal | -8.053 |
onential | -8.026 |
ocate | -7.950 |
enary | -7.835 |
Token | to |
Token ID | 284 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
BT | +3.369 |
Dollar | +3.291 |
cour | +3.170 |
FW | +3.149 |
rentals | +3.068 |
Neg logit contributions | |
idious | -4.727 |
urnal | -4.502 |
ocate | -4.471 |
enary | -4.378 |
onential | -4.376 |
Token | leave |
Token ID | 2666 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
BT | +2.099 |
Dollar | +2.057 |
cour | +1.964 |
FW | +1.933 |
fav | +1.898 |
Neg logit contributions | |
idious | -3.270 |
urnal | -3.130 |
ocate | -3.107 |
onential | -3.082 |
enary | -3.060 |
Token | � |
Token ID | 251 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
idious | +0.369 |
urnal | +0.344 |
ocate | +0.343 |
onential | +0.338 |
enary | +0.335 |
Neg logit contributions | |
BT | -0.460 |
Dollar | -0.452 |
cour | -0.441 |
FW | -0.437 |
rentals | -0.426 |
Token | Hundreds |
Token ID | 32636 |
Feature activation | -7.89e-01 |
Pos logit contributions | |
BT | +0.975 |
Dollar | +0.951 |
cour | +0.918 |
FW | +0.906 |
fav | +0.870 |
Neg logit contributions | |
idious | -1.313 |
urnal | -1.238 |
ocate | -1.237 |
onential | -1.227 |
enary | -1.209 |
Token | streamed |
Token ID | 35377 |
Feature activation | +3.07e+00 |
Pos logit contributions | |
idious | +0.792 |
urnal | +0.748 |
ocate | +0.748 |
onential | +0.739 |
enary | +0.733 |
Neg logit contributions | |
BT | -0.602 |
Dollar | -0.587 |
cour | -0.569 |
FW | -0.562 |
rentals | -0.543 |
Token | down |
Token ID | 866 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
BT | +2.366 |
Dollar | +2.333 |
cour | +2.251 |
FW | +2.211 |
rentals | +2.176 |
Neg logit contributions | |
idious | -3.035 |
ocate | -2.858 |
urnal | -2.856 |
onential | -2.854 |
enary | -2.791 |
Token | the |
Token ID | 262 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
BT | +2.930 |
Dollar | +2.914 |
cour | +2.812 |
FW | +2.775 |
rentals | +2.638 |
Neg logit contributions | |
idious | -4.227 |
urnal | -3.974 |
ocate | -3.954 |
onential | -3.947 |
enary | -3.859 |
Token | a |
Token ID | 257 |
Feature activation | +6.84e+00 |
Pos logit contributions | |
BT | +0.754 |
Dollar | +0.739 |
cour | +0.714 |
FW | +0.703 |
rentals | +0.680 |
Neg logit contributions | |
idious | -1.052 |
urnal | -0.995 |
ocate | -0.993 |
onential | -0.986 |
enary | -0.970 |
Token | is |
Token ID | 271 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
BT | +5.190 |
Dollar | +5.028 |
cour | +4.963 |
FW | +4.900 |
FB | +4.694 |
Neg logit contributions | |
idious | -6.679 |
onential | -6.286 |
ocate | -6.231 |
urnal | -6.156 |
ortun | -5.903 |
Token | les |
Token ID | 829 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
idious | +2.401 |
ocate | +2.252 |
urnal | +2.249 |
onential | +2.221 |
enary | +2.199 |
Neg logit contributions | |
BT | -2.419 |
Dollar | -2.363 |
cour | -2.305 |
FW | -2.279 |
rentals | -2.217 |
Token | for |
Token ID | 329 |
Feature activation | +5.07e+00 |
Pos logit contributions | |
BT | +0.795 |
Dollar | +0.776 |
cour | +0.756 |
FW | +0.742 |
rentals | +0.718 |
Neg logit contributions | |
idious | -1.111 |
ocate | -1.058 |
urnal | -1.055 |
onential | -1.049 |
enary | -1.032 |
Token | the |
Token ID | 262 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
BT | +3.677 |
Dollar | +3.655 |
cour | +3.471 |
FW | +3.427 |
fav | +3.385 |
Neg logit contributions | |
idious | -5.187 |
urnal | -4.908 |
onential | -4.889 |
ocate | -4.865 |
enary | -4.759 |
Token | altar |
Token ID | 18890 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
BT | +1.407 |
Dollar | +1.386 |
cour | +1.330 |
FW | +1.314 |
rentals | +1.281 |
Neg logit contributions | |
idious | -1.819 |
urnal | -1.714 |
ocate | -1.708 |
onential | -1.700 |
enary | -1.665 |
Token | patron |
Token ID | 19686 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
idious | +1.201 |
ocate | +1.137 |
urnal | +1.136 |
onential | +1.122 |
enary | +1.115 |
Neg logit contributions | |
BT | -0.880 |
Dollar | -0.858 |
cour | -0.831 |
FW | -0.820 |
rentals | -0.792 |
Token | ize |
Token ID | 1096 |
Feature activation | +6.42e+00 |
Pos logit contributions | |
BT | +1.817 |
Dollar | +1.772 |
cour | +1.699 |
FW | +1.681 |
fav | +1.618 |
Neg logit contributions | |
idious | -3.020 |
urnal | -2.871 |
onential | -2.860 |
ocate | -2.819 |
enary | -2.813 |
Token | the |
Token ID | 262 |
Feature activation | +4.48e+00 |
Pos logit contributions | |
Dollar | +4.947 |
BT | +4.906 |
cour | +4.653 |
rentals | +4.588 |
fav | +4.585 |
Neg logit contributions | |
idious | -6.032 |
urnal | -5.771 |
onential | -5.764 |
ocate | -5.701 |
enary | -5.682 |
Token | child |
Token ID | 1200 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
BT | +3.448 |
Dollar | +3.443 |
cour | +3.266 |
FW | +3.209 |
fav | +3.149 |
Neg logit contributions | |
idious | -4.350 |
urnal | -4.155 |
onential | -4.130 |
ocate | -4.115 |
enary | -4.056 |
Token | and |
Token ID | 290 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
BT | +0.130 |
Dollar | +0.127 |
cour | +0.124 |
FW | +0.121 |
rentals | +0.118 |
Neg logit contributions | |
idious | -0.172 |
urnal | -0.163 |
ocate | -0.163 |
onential | -0.161 |
enary | -0.159 |
Token | say |
Token ID | 910 |
Feature activation | +8.13e+00 |
Pos logit contributions | |
BT | +2.480 |
Dollar | +2.451 |
cour | +2.344 |
FW | +2.312 |
fav | +2.272 |
Neg logit contributions | |
idious | -3.493 |
urnal | -3.327 |
onential | -3.289 |
ocate | -3.288 |
enary | -3.251 |
Token | there |
Token ID | 612 |
Feature activation | -8.13e+00 |
Pos logit contributions | |
BT | +5.006 |
Dollar | +4.926 |
fav | +4.589 |
cour | +4.577 |
FW | +4.570 |
Neg logit contributions | |
idious | -8.864 |
urnal | -8.538 |
onential | -8.536 |
ocate | -8.487 |
enary | -8.354 |
Token | � |
Token ID | 447 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
idious | +7.683 |
ocate | +7.355 |
urnal | +7.184 |
enary | +7.133 |
onential | +7.127 |
Neg logit contributions | |
BT | -6.158 |
Dollar | -5.944 |
cour | -5.825 |
FW | -5.744 |
FB | -5.544 |
Token | � |
Token ID | 247 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
idious | +0.847 |
urnal | +0.795 |
ocate | +0.789 |
onential | +0.782 |
enary | +0.776 |
Neg logit contributions | |
BT | -0.931 |
Dollar | -0.910 |
cour | -0.886 |
FW | -0.881 |
rentals | -0.855 |
Token | s |
Token ID | 82 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
BT | +0.574 |
Dollar | +0.552 |
cour | +0.525 |
FW | +0.515 |
rentals | +0.485 |
Neg logit contributions | |
idious | -1.535 |
urnal | -1.470 |
ocate | -1.470 |
onential | -1.459 |
enary | -1.446 |
Token | a |
Token ID | 257 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
idious | +9.758 |
ocate | +9.152 |
urnal | +9.043 |
enary | +8.962 |
onential | +8.881 |
Neg logit contributions | |
BT | -7.125 |
cour | -6.729 |
Dollar | -6.719 |
FW | -6.667 |
FB | -6.328 |
Token | that |
Token ID | 326 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
idious | +1.721 |
ocate | +1.622 |
urnal | +1.621 |
onential | +1.609 |
enary | +1.598 |
Neg logit contributions | |
BT | -1.250 |
Dollar | -1.219 |
cour | -1.178 |
FW | -1.161 |
rentals | -1.123 |
Token | usually |
Token ID | 3221 |
Feature activation | +4.78e+00 |
Pos logit contributions | |
BT | +1.787 |
Dollar | +1.747 |
cour | +1.681 |
FW | +1.653 |
fav | +1.613 |
Neg logit contributions | |
idious | -2.814 |
ocate | -2.674 |
urnal | -2.674 |
onential | -2.640 |
enary | -2.622 |
Token | signals |
Token ID | 10425 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
BT | +3.188 |
Dollar | +3.123 |
cour | +3.045 |
fav | +2.995 |
FW | +2.950 |
Neg logit contributions | |
idious | -5.135 |
ocate | -4.916 |
urnal | -4.894 |
onential | -4.849 |
enary | -4.795 |
Token | the |
Token ID | 262 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
BT | +3.202 |
Dollar | +3.164 |
cour | +3.059 |
FW | +2.998 |
rentals | +2.983 |
Neg logit contributions | |
idious | -4.092 |
urnal | -3.902 |
ocate | -3.875 |
onential | -3.824 |
enary | -3.788 |
Token | end |
Token ID | 886 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
BT | +0.545 |
Dollar | +0.533 |
cour | +0.518 |
FW | +0.513 |
rentals | +0.499 |
Neg logit contributions | |
idious | -0.574 |
urnal | -0.540 |
ocate | -0.539 |
onential | -0.533 |
enary | -0.528 |
Token | of |
Token ID | 286 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
idious | +2.151 |
ocate | +2.021 |
urnal | +2.019 |
onential | +1.992 |
enary | +1.980 |
Neg logit contributions | |
BT | -1.921 |
Dollar | -1.886 |
cour | -1.831 |
FW | -1.808 |
rentals | -1.748 |
Token | an |
Token ID | 281 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
idious | +1.625 |
ocate | +1.532 |
urnal | +1.529 |
onential | +1.513 |
enary | +1.501 |
Neg logit contributions | |
BT | -1.339 |
Dollar | -1.303 |
cour | -1.264 |
FW | -1.253 |
fav | -1.201 |
Token | elite |
Token ID | 9085 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
idious | +3.851 |
urnal | +3.628 |
ocate | +3.621 |
onential | +3.585 |
enary | +3.539 |
Neg logit contributions | |
BT | -3.129 |
Dollar | -3.033 |
cour | -2.926 |
FW | -2.900 |
rentals | -2.789 |
Token | career |
Token ID | 3451 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
idious | +2.914 |
ocate | +2.757 |
urnal | +2.751 |
onential | +2.709 |
enary | +2.704 |
Neg logit contributions | |
BT | -2.224 |
Dollar | -2.159 |
cour | -2.099 |
FW | -2.072 |
fav | -1.989 |
Token | not |
Token ID | 407 |
Feature activation | +3.83e+00 |
Pos logit contributions | |
BT | +4.025 |
Dollar | +3.928 |
cour | +3.890 |
fav | +3.754 |
FW | +3.753 |
Neg logit contributions | |
idious | -6.791 |
urnal | -6.537 |
ocate | -6.481 |
onential | -6.436 |
elfth | -6.319 |
Token | the |
Token ID | 262 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
BT | +2.704 |
Dollar | +2.625 |
cour | +2.594 |
FW | +2.507 |
fav | +2.484 |
Neg logit contributions | |
idious | -3.982 |
ocate | -3.812 |
urnal | -3.796 |
onential | -3.772 |
enary | -3.729 |
Token | on |
Token ID | 319 |
Feature activation | +7.31e-01 |
Pos logit contributions | |
idious | +2.071 |
ocate | +1.957 |
urnal | +1.953 |
onential | +1.933 |
enary | +1.921 |
Neg logit contributions | |
BT | -1.500 |
Dollar | -1.461 |
cour | -1.415 |
FW | -1.396 |
rentals | -1.346 |
Token | substit |
Token ID | 21436 |
Feature activation | -7.39e+00 |
Pos logit contributions | |
BT | +0.560 |
Dollar | +0.547 |
cour | +0.529 |
FW | +0.522 |
fav | +0.509 |
Neg logit contributions | |
idious | -0.727 |
urnal | -0.692 |
ocate | -0.689 |
onential | -0.682 |
enary | -0.675 |
Token | utions |
Token ID | 3508 |
Feature activation | -4.71e+00 |
Pos logit contributions | |
idious | +5.673 |
ocate | +5.281 |
urnal | +5.226 |
enary | +5.183 |
onential | +5.108 |
Neg logit contributions | |
BT | -7.130 |
Dollar | -7.103 |
FW | -6.816 |
cour | -6.774 |
FB | -6.606 |
Token | quickly |
Token ID | 2952 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
idious | +4.738 |
ocate | +4.428 |
urnal | +4.423 |
enary | +4.351 |
onential | +4.339 |
Neg logit contributions | |
BT | -3.544 |
Dollar | -3.465 |
cour | -3.338 |
FW | -3.314 |
rentals | -3.172 |
Token | enough |
Token ID | 1576 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
idious | +2.344 |
urnal | +2.200 |
ocate | +2.200 |
onential | +2.169 |
enary | +2.157 |
Neg logit contributions | |
BT | -1.991 |
Dollar | -1.947 |
cour | -1.889 |
FW | -1.867 |
rentals | -1.809 |
Token | . |
Token ID | 13 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
idious | +1.579 |
urnal | +1.494 |
ocate | +1.494 |
onential | +1.476 |
enary | +1.465 |
Neg logit contributions | |
BT | -1.152 |
Dollar | -1.123 |
cour | -1.088 |
FW | -1.074 |
rentals | -1.037 |
Token | And |
Token ID | 843 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
idious | +1.996 |
ocate | +1.885 |
urnal | +1.882 |
onential | +1.859 |
enary | +1.849 |
Neg logit contributions | |
BT | -1.532 |
Dollar | -1.490 |
cour | -1.450 |
FW | -1.431 |
rentals | -1.395 |
Token | although |
Token ID | 3584 |
Feature activation | -7.51e-02 |
Pos logit contributions | |
BT | +1.717 |
Dollar | +1.682 |
cour | +1.629 |
FW | +1.600 |
fav | +1.554 |
Neg logit contributions | |
idious | -2.341 |
urnal | -2.234 |
ocate | -2.229 |
onential | -2.214 |
enary | -2.189 |
Token | he |
Token ID | 339 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
idious | +0.074 |
urnal | +0.070 |
ocate | +0.070 |
onential | +0.069 |
enary | +0.068 |
Neg logit contributions | |
BT | -0.059 |
Dollar | -0.058 |
cour | -0.056 |
FW | -0.055 |
rentals | -0.053 |
Token | resists |
Token ID | 47786 |
Feature activation | -4.31e+00 |
Pos logit contributions | |
idious | +3.264 |
ocate | +3.094 |
urnal | +3.072 |
enary | +3.038 |
onential | +3.026 |
Neg logit contributions | |
BT | -1.980 |
Dollar | -1.919 |
cour | -1.861 |
FW | -1.843 |
FB | -1.748 |
Token | endorsing |
Token ID | 38379 |
Feature activation | -3.98e-01 |
Pos logit contributions | |
idious | +4.470 |
ocate | +4.213 |
urnal | +4.159 |
onential | +4.127 |
enary | +4.114 |
Neg logit contributions | |
BT | -3.141 |
Dollar | -3.028 |
cour | -2.941 |
FW | -2.924 |
rentals | -2.763 |
Token | A |
Token ID | 317 |
Feature activation | +8.07e+00 |
Pos logit contributions | |
BT | +1.967 |
Dollar | +1.897 |
cour | +1.847 |
FW | +1.827 |
fav | +1.759 |
Neg logit contributions | |
idious | -2.554 |
urnal | -2.425 |
ocate | -2.407 |
onential | -2.389 |
enary | -2.367 |
Token | du |
Token ID | 646 |
Feature activation | -7.95e-01 |
Pos logit contributions | |
BT | +5.508 |
Dollar | +5.366 |
cour | +5.180 |
FW | +4.979 |
fav | +4.950 |
Neg logit contributions | |
idious | -8.345 |
ocate | -7.885 |
urnal | -7.883 |
onential | -7.843 |
enary | -7.775 |
Token | says |
Token ID | 1139 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
idious | +0.813 |
ocate | +0.771 |
urnal | +0.769 |
onential | +0.759 |
enary | +0.755 |
Neg logit contributions | |
BT | -0.586 |
Dollar | -0.573 |
cour | -0.554 |
FW | -0.548 |
rentals | -0.528 |
Token | . |
Token ID | 13 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
idious | +1.358 |
ocate | +1.285 |
urnal | +1.281 |
onential | +1.265 |
enary | +1.259 |
Neg logit contributions | |
BT | -0.983 |
Dollar | -0.958 |
cour | -0.931 |
FW | -0.917 |
rentals | -0.884 |
Token | � |
Token ID | 564 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
idious | +2.787 |
ocate | +2.652 |
urnal | +2.636 |
onential | +2.609 |
enary | +2.602 |
Neg logit contributions | |
BT | -1.904 |
Dollar | -1.875 |
cour | -1.812 |
FW | -1.775 |
rentals | -1.749 |
Token | � |
Token ID | 250 |
Feature activation | -3.33e+00 |
Pos logit contributions | |
idious | +2.047 |
urnal | +1.940 |
ocate | +1.926 |
onential | +1.912 |
enary | +1.899 |
Neg logit contributions | |
BT | -1.925 |
Dollar | -1.874 |
cour | -1.827 |
FW | -1.812 |
rentals | -1.752 |
Token | Ben |
Token ID | 11696 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
idious | +3.558 |
ocate | +3.386 |
urnal | +3.368 |
onential | +3.328 |
enary | +3.316 |
Neg logit contributions | |
BT | -2.239 |
Dollar | -2.221 |
cour | -2.125 |
FW | -2.082 |
rentals | -2.053 |
Token | f |
Token ID | 69 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
BT | +6.816 |
Dollar | +6.663 |
cour | +6.539 |
FW | +6.471 |
fav | +6.174 |
Neg logit contributions | |
idious | -12.496 |
onential | -11.841 |
urnal | -11.771 |
enary | -11.611 |
ocate | -11.448 |
Token | ica |
Token ID | 3970 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
idious | +0.344 |
urnal | +0.317 |
ocate | +0.316 |
onential | +0.312 |
enary | +0.308 |
Neg logit contributions | |
BT | -0.498 |
Dollar | -0.489 |
cour | -0.479 |
FW | -0.474 |
rentals | -0.462 |
Token | is |
Token ID | 318 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
BT | +2.767 |
Dollar | +2.694 |
cour | +2.573 |
FW | +2.554 |
fav | +2.471 |
Neg logit contributions | |
idious | -4.525 |
urnal | -4.304 |
onential | -4.272 |
ocate | -4.261 |
enary | -4.208 |
Token | my |
Token ID | 616 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
BT | +2.879 |
Dollar | +2.839 |
cour | +2.710 |
FW | +2.693 |
fav | +2.608 |
Neg logit contributions | |
idious | -3.842 |
urnal | -3.660 |
ocate | -3.634 |
onential | -3.633 |
enary | -3.594 |
Token | -- |
Token ID | 1377 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
BT | +1.066 |
Dollar | +1.039 |
cour | +0.999 |
FW | +0.986 |
rentals | +0.954 |
Neg logit contributions | |
idious | -1.734 |
ocate | -1.652 |
urnal | -1.650 |
onential | -1.633 |
enary | -1.620 |
Token | which |
Token ID | 543 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
BT | +2.519 |
Dollar | +2.473 |
cour | +2.391 |
FW | +2.355 |
fav | +2.298 |
Neg logit contributions | |
idious | -3.682 |
urnal | -3.516 |
ocate | -3.504 |
onential | -3.464 |
enary | -3.438 |
Token | she |
Token ID | 673 |
Feature activation | -4.56e-02 |
Pos logit contributions | |
BT | +1.014 |
Dollar | +0.992 |
cour | +0.959 |
FW | +0.945 |
fav | +0.920 |
Neg logit contributions | |
idious | -1.396 |
urnal | -1.320 |
ocate | -1.320 |
onential | -1.306 |
enary | -1.295 |
Token | describes |
Token ID | 8477 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
idious | +0.048 |
ocate | +0.046 |
urnal | +0.046 |
onential | +0.045 |
enary | +0.045 |
Neg logit contributions | |
BT | -0.032 |
Dollar | -0.031 |
cour | -0.030 |
FW | -0.030 |
rentals | -0.029 |
Token | as |
Token ID | 355 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
BT | +2.076 |
Dollar | +2.026 |
cour | +1.936 |
FW | +1.899 |
fav | +1.834 |
Neg logit contributions | |
idious | -4.119 |
ocate | -3.934 |
urnal | -3.924 |
onential | -3.895 |
enary | -3.851 |
Token | " |
Token ID | 366 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
BT | +1.622 |
Dollar | +1.590 |
cour | +1.534 |
FW | +1.512 |
fav | +1.464 |
Neg logit contributions | |
idious | -2.429 |
ocate | -2.309 |
urnal | -2.305 |
onential | -2.281 |
enary | -2.267 |
Token | sweet |
Token ID | 34751 |
Feature activation | -8.80e+00 |
Pos logit contributions | |
idious | +1.117 |
urnal | +1.055 |
ocate | +1.054 |
onential | +1.041 |
enary | +1.034 |
Neg logit contributions | |
BT | -0.848 |
Dollar | -0.829 |
cour | -0.801 |
FW | -0.792 |
rentals | -0.767 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
idious | +8.307 |
ocate | +7.659 |
urnal | +7.612 |
onential | +7.533 |
enary | +7.523 |
Neg logit contributions | |
BT | -6.794 |
Dollar | -6.717 |
cour | -6.430 |
FW | -6.356 |
FB | -6.215 |
Token | Southern |
Token ID | 8050 |
Feature activation | -4.91e+00 |
Pos logit contributions | |
idious | +1.548 |
urnal | +1.461 |
ocate | +1.459 |
onential | +1.441 |
enary | +1.431 |
Neg logit contributions | |
BT | -1.111 |
Dollar | -1.080 |
cour | -1.043 |
FW | -1.036 |
rentals | -0.995 |
Token | " |
Token ID | 1 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
idious | +4.808 |
urnal | +4.520 |
ocate | +4.504 |
onential | +4.450 |
enary | +4.417 |
Neg logit contributions | |
BT | -3.739 |
Dollar | -3.631 |
cour | -3.542 |
FW | -3.491 |
rentals | -3.384 |
Token | -- |
Token ID | 1377 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
idious | +3.233 |
urnal | +3.049 |
ocate | +3.046 |
onential | +3.012 |
enary | +2.992 |
Neg logit contributions | |
BT | -2.484 |
Dollar | -2.400 |
cour | -2.337 |
FW | -2.314 |
rentals | -2.221 |
Token | compliment |
Token ID | 19370 |
Feature activation | +5.45e-01 |
Pos logit contributions | |
BT | +2.782 |
Dollar | +2.714 |
cour | +2.622 |
FW | +2.602 |
fav | +2.502 |
Neg logit contributions | |
idious | -3.691 |
urnal | -3.478 |
onential | -3.470 |
ocate | -3.447 |
enary | -3.400 |
Token | ed |
Token ID | 276 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
BT | +0.293 |
Dollar | +0.283 |
cour | +0.270 |
FW | +0.265 |
rentals | +0.252 |
Neg logit contributions | |
idious | -0.670 |
urnal | -0.640 |
ocate | -0.640 |
onential | -0.634 |
enary | -0.629 |
Token | Sheriff |
Token ID | 12874 |
Feature activation | -6.51e+00 |
Pos logit contributions | |
idious | +0.442 |
urnal | +0.418 |
ocate | +0.418 |
onential | +0.413 |
enary | +0.410 |
Neg logit contributions | |
BT | -0.305 |
Dollar | -0.297 |
cour | -0.287 |
FW | -0.284 |
rentals | -0.273 |
Token | � |
Token ID | 447 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
idious | +6.850 |
ocate | +6.518 |
urnal | +6.442 |
enary | +6.343 |
onential | +6.328 |
Neg logit contributions | |
BT | -4.420 |
Dollar | -4.239 |
cour | -4.121 |
FW | -4.087 |
rentals | -4.006 |
Token | � |
Token ID | 247 |
Feature activation | +7.09e+00 |
Pos logit contributions | |
idious | +1.097 |
urnal | +1.026 |
ocate | +1.025 |
onential | +1.011 |
enary | +1.003 |
Neg logit contributions | |
BT | -1.184 |
Dollar | -1.159 |
cour | -1.129 |
FW | -1.119 |
rentals | -1.088 |
Token | s |
Token ID | 82 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
BT | +2.578 |
cour | +2.450 |
Dollar | +2.445 |
FW | +2.249 |
FB | +2.046 |
Neg logit contributions | |
idious | -9.673 |
urnal | -9.304 |
onential | -9.300 |
ocate | -9.264 |
enary | -9.083 |
Token | deputies |
Token ID | 21861 |
Feature activation | -6.21e+00 |
Pos logit contributions | |
idious | +6.053 |
ocate | +5.713 |
urnal | +5.674 |
enary | +5.605 |
onential | +5.605 |
Neg logit contributions | |
BT | -4.265 |
Dollar | -4.067 |
cour | -3.987 |
FW | -3.932 |
rentals | -3.836 |
Token | and |
Token ID | 290 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
idious | +6.339 |
urnal | +5.949 |
ocate | +5.906 |
enary | +5.850 |
onential | +5.787 |
Neg logit contributions | |
BT | -4.420 |
Dollar | -4.296 |
cour | -4.190 |
FW | -4.090 |
rentals | -4.004 |
Token | HB |
Token ID | 25997 |
Feature activation | +3.34e+00 |
Pos logit contributions | |
idious | +1.035 |
urnal | +0.978 |
ocate | +0.977 |
onential | +0.967 |
enary | +0.959 |
Neg logit contributions | |
BT | -0.770 |
Dollar | -0.752 |
cour | -0.728 |
FW | -0.719 |
rentals | -0.694 |
Token | PD |
Token ID | 5760 |
Feature activation | -5.28e+00 |
Pos logit contributions | |
BT | +1.192 |
Dollar | +1.066 |
cour | +1.022 |
FW | +1.021 |
FB | +0.918 |
Neg logit contributions | |
idious | -4.763 |
urnal | -4.574 |
ocate | -4.552 |
onential | -4.547 |
enary | -4.501 |
Token | officers |
Token ID | 3790 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
idious | +4.916 |
ocate | +4.667 |
urnal | +4.642 |
enary | +4.590 |
onential | +4.563 |
Neg logit contributions | |
BT | -4.279 |
Dollar | -4.165 |
cour | -4.042 |
FW | -3.988 |
rentals | -3.884 |
Token | . |
Token ID | 13 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
idious | +0.382 |
urnal | +0.362 |
ocate | +0.361 |
onential | +0.357 |
enary | +0.355 |
Neg logit contributions | |
BT | -0.269 |
Dollar | -0.262 |
cour | -0.254 |
FW | -0.250 |
rentals | -0.241 |
Token | On |
Token ID | 1550 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
idious | +0.462 |
urnal | +0.438 |
ocate | +0.437 |
onential | +0.432 |
enary | +0.429 |
Neg logit contributions | |
BT | -0.328 |
Dollar | -0.320 |
cour | -0.309 |
FW | -0.305 |
rentals | -0.294 |
Token | February |
Token ID | 3945 |
Feature activation | -4.84e+00 |
Pos logit contributions | |
idious | +0.221 |
urnal | +0.209 |
ocate | +0.209 |
onential | +0.207 |
enary | +0.206 |
Neg logit contributions | |
BT | -0.156 |
Dollar | -0.153 |
cour | -0.147 |
FW | -0.145 |
rentals | -0.140 |
Token | 2 |
Token ID | 362 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
idious | +4.244 |
ocate | +4.014 |
urnal | +4.009 |
enary | +3.953 |
onential | +3.883 |
Neg logit contributions | |
BT | -4.106 |
Dollar | -3.955 |
cour | -3.891 |
FW | -3.858 |
rentals | -3.799 |
Token | , |
Token ID | 11 |
Feature activation | -6.90e+00 |
Pos logit contributions | |
BT | +0.927 |
Dollar | +0.902 |
cour | +0.868 |
FW | +0.855 |
rentals | +0.819 |
Neg logit contributions | |
idious | -1.545 |
urnal | -1.469 |
ocate | -1.468 |
onential | -1.455 |
enary | -1.441 |
Token | as |
Token ID | 355 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
idious | +5.826 |
urnal | +5.399 |
ocate | +5.398 |
enary | +5.288 |
onential | +5.278 |
Neg logit contributions | |
BT | -6.205 |
Dollar | -5.919 |
FW | -5.880 |
cour | -5.867 |
fav | -5.666 |
Token | Ranger |
Token ID | 21888 |
Feature activation | -7.21e+00 |
Pos logit contributions | |
idious | +12.128 |
urnal | +11.418 |
ocate | +11.372 |
enary | +11.217 |
onential | +10.930 |
Neg logit contributions | |
BT | -8.988 |
cour | -8.364 |
FW | -8.296 |
Dollar | -8.168 |
fav | -8.035 |
Token | 6 |
Token ID | 718 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
idious | +6.058 |
ocate | +5.804 |
enary | +5.659 |
urnal | +5.621 |
onential | +5.538 |
Neg logit contributions | |
BT | -6.283 |
Dollar | -6.084 |
cour | -6.043 |
FW | -5.988 |
fav | -5.709 |
Token | passed |
Token ID | 3804 |
Feature activation | -3.51e-01 |
Pos logit contributions | |
idious | +1.814 |
ocate | +1.717 |
urnal | +1.715 |
onential | +1.689 |
enary | +1.683 |
Neg logit contributions | |
BT | -1.337 |
Dollar | -1.306 |
cour | -1.268 |
FW | -1.251 |
rentals | -1.205 |
Token | the |
Token ID | 262 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
idious | +0.353 |
ocate | +0.333 |
urnal | +0.333 |
onential | +0.329 |
enary | +0.327 |
Neg logit contributions | |
BT | -0.267 |
Dollar | -0.260 |
cour | -0.252 |
FW | -0.249 |
rentals | -0.240 |
Token | 2 |
Token ID | 362 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
idious | +1.712 |
urnal | +1.618 |
ocate | +1.618 |
onential | +1.594 |
enary | +1.590 |
Neg logit contributions | |
BT | -1.200 |
Dollar | -1.158 |
cour | -1.131 |
FW | -1.116 |
rentals | -1.071 |
Token | quite |
Token ID | 2407 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
idious | +6.597 |
urnal | +6.134 |
ocate | +6.092 |
onential | +6.005 |
enary | +5.947 |
Neg logit contributions | |
BT | -5.602 |
Dollar | -5.342 |
FW | -5.300 |
cour | -5.209 |
FB | -4.992 |
Token | a |
Token ID | 257 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
idious | +2.310 |
urnal | +2.147 |
ocate | +2.139 |
onential | +2.106 |
enary | +2.096 |
Neg logit contributions | |
BT | -2.178 |
Dollar | -2.122 |
cour | -2.056 |
FW | -2.049 |
rentals | -1.969 |
Token | different |
Token ID | 1180 |
Feature activation | -5.58e+00 |
Pos logit contributions | |
BT | +1.090 |
Dollar | +1.069 |
cour | +1.036 |
FW | +1.016 |
fav | +0.987 |
Neg logit contributions | |
idious | -1.513 |
ocate | -1.440 |
urnal | -1.436 |
onential | -1.422 |
enary | -1.408 |
Token | figure |
Token ID | 3785 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
idious | +5.458 |
urnal | +5.083 |
ocate | +5.043 |
onential | +4.965 |
enary | +4.941 |
Neg logit contributions | |
BT | -4.348 |
Dollar | -4.131 |
cour | -4.073 |
FW | -4.071 |
rentals | -3.872 |
Token | from |
Token ID | 422 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
idious | +0.291 |
urnal | +0.277 |
ocate | +0.277 |
onential | +0.274 |
enary | +0.271 |
Neg logit contributions | |
BT | -0.205 |
Dollar | -0.200 |
cour | -0.194 |
FW | -0.190 |
fav | -0.185 |
Token | what |
Token ID | 644 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
idious | +2.910 |
urnal | +2.743 |
ocate | +2.741 |
onential | +2.700 |
enary | +2.683 |
Neg logit contributions | |
BT | -2.225 |
Dollar | -2.155 |
cour | -2.098 |
FW | -2.073 |
rentals | -2.002 |
Token | he |
Token ID | 339 |
Feature activation | -5.50e+00 |
Pos logit contributions | |
idious | +9.824 |
urnal | +9.051 |
ocate | +9.012 |
onential | +8.725 |
enary | +8.723 |
Neg logit contributions | |
BT | -9.042 |
FW | -8.489 |
Dollar | -8.472 |
cour | -8.462 |
FB | -8.028 |
Token | intends |
Token ID | 19582 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
idious | +5.793 |
urnal | +5.433 |
ocate | +5.425 |
enary | +5.306 |
onential | +5.292 |
Neg logit contributions | |
BT | -3.834 |
Dollar | -3.716 |
FW | -3.607 |
cour | -3.585 |
FB | -3.400 |
Token | . |
Token ID | 13 |
Feature activation | -4.87e+00 |
Pos logit contributions | |
idious | +1.219 |
ocate | +1.155 |
urnal | +1.154 |
onential | +1.141 |
enary | +1.132 |
Neg logit contributions | |
BT | -0.899 |
Dollar | -0.877 |
cour | -0.850 |
FW | -0.839 |
rentals | -0.811 |
Token | � |
Token ID | 447 |
Feature activation | +2.07e+00 |
Pos logit contributions | |
idious | +4.720 |
ocate | +4.453 |
urnal | +4.445 |
onential | +4.392 |
enary | +4.378 |
Neg logit contributions | |
BT | -3.679 |
Dollar | -3.584 |
cour | -3.491 |
rentals | -3.446 |
FW | -3.437 |
Token | � |
Token ID | 251 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
BT | +1.605 |
Dollar | +1.556 |
cour | +1.528 |
FW | +1.498 |
fav | +1.448 |
Neg logit contributions | |
idious | -2.057 |
ocate | -1.947 |
urnal | -1.921 |
onential | -1.918 |
enary | -1.889 |
Token | . |
Token ID | 13 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
idious | +10.028 |
ocate | +9.625 |
urnal | +9.438 |
enary | +9.335 |
onential | +9.278 |
Neg logit contributions | |
BT | -8.412 |
Dollar | -8.082 |
FW | -7.927 |
cour | -7.877 |
FB | -7.543 |
Token |
|
Token ID | 198 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
idious | +2.781 |
ocate | +2.638 |
urnal | +2.630 |
onential | +2.607 |
enary | +2.588 |
Neg logit contributions | |
BT | -2.139 |
Dollar | -2.075 |
cour | -2.027 |
FW | -2.000 |
rentals | -1.962 |
Token |
|
Token ID | 198 |
Feature activation | -6.86e-01 |
Pos logit contributions | |
idious | +1.139 |
ocate | +1.078 |
urnal | +1.075 |
onential | +1.059 |
enary | +1.055 |
Neg logit contributions | |
BT | -0.950 |
Dollar | -0.933 |
cour | -0.899 |
FW | -0.891 |
rentals | -0.874 |
Token | The |
Token ID | 464 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
idious | +0.740 |
urnal | +0.702 |
ocate | +0.702 |
onential | +0.694 |
enary | +0.690 |
Neg logit contributions | |
BT | -0.474 |
Dollar | -0.459 |
cour | -0.445 |
FW | -0.439 |
rentals | -0.420 |
Token | only |
Token ID | 691 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
BT | +1.259 |
Dollar | +1.242 |
cour | +1.188 |
FW | +1.174 |
rentals | +1.144 |
Neg logit contributions | |
idious | -1.594 |
urnal | -1.506 |
ocate | -1.499 |
onential | -1.483 |
enary | -1.469 |
Token | economist |
Token ID | 17646 |
Feature activation | -1.30e+01 |
Pos logit contributions | |
idious | +2.331 |
ocate | +2.199 |
urnal | +2.190 |
onential | +2.161 |
enary | +2.150 |
Neg logit contributions | |
BT | -1.957 |
Dollar | -1.896 |
cour | -1.857 |
FW | -1.837 |
rentals | -1.764 |
Token | to |
Token ID | 284 |
Feature activation | -3.83e-01 |
Pos logit contributions | |
idious | +11.702 |
ocate | +10.894 |
enary | +10.728 |
urnal | +10.721 |
onential | +10.527 |
Neg logit contributions | |
BT | -9.577 |
Dollar | -8.959 |
FW | -8.897 |
cour | -8.886 |
rentals | -8.496 |
Token | say |
Token ID | 910 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
idious | +0.428 |
urnal | +0.407 |
ocate | +0.406 |
onential | +0.402 |
enary | +0.399 |
Neg logit contributions | |
BT | -0.250 |
Dollar | -0.243 |
cour | -0.234 |
FW | -0.230 |
fav | -0.222 |
Token | the |
Token ID | 262 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
BT | +2.850 |
Dollar | +2.817 |
cour | +2.649 |
FW | +2.619 |
fav | +2.595 |
Neg logit contributions | |
idious | -4.359 |
urnal | -4.164 |
ocate | -4.158 |
onential | -4.109 |
enary | -4.067 |
Token | bill |
Token ID | 2855 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
BT | +1.112 |
Dollar | +1.091 |
cour | +1.046 |
FW | +1.035 |
rentals | +1.006 |
Neg logit contributions | |
idious | -1.459 |
urnal | -1.382 |
ocate | -1.378 |
onential | -1.361 |
enary | -1.351 |
Token | would |
Token ID | 561 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
BT | +3.577 |
Dollar | +3.488 |
cour | +3.321 |
fav | +3.308 |
FW | +3.273 |
Neg logit contributions | |
idious | -6.348 |
urnal | -6.122 |
ocate | -6.091 |
onential | -6.078 |
enary | -5.932 |
Token | the |
Token ID | 262 |
Feature activation | -3.91e+00 |
Pos logit contributions | |
BT | +2.839 |
Dollar | +2.821 |
cour | +2.713 |
FW | +2.656 |
fav | +2.631 |
Neg logit contributions | |
idious | -3.766 |
ocate | -3.580 |
urnal | -3.569 |
onential | -3.560 |
enary | -3.530 |
Token | greatest |
Token ID | 6000 |
Feature activation | -9.51e+00 |
Pos logit contributions | |
idious | +3.514 |
ocate | +3.313 |
urnal | +3.294 |
enary | +3.227 |
onential | +3.214 |
Neg logit contributions | |
BT | -3.364 |
Dollar | -3.233 |
cour | -3.189 |
FW | -3.154 |
rentals | -3.037 |
Token | Spanish |
Token ID | 7897 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
idious | +8.971 |
ocate | +8.469 |
urnal | +8.334 |
enary | +8.243 |
onential | +8.097 |
Neg logit contributions | |
BT | -7.270 |
FW | -6.797 |
cour | -6.792 |
Dollar | -6.733 |
FB | -6.456 |
Token | - |
Token ID | 12 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
idious | +4.260 |
ocate | +4.018 |
urnal | +4.016 |
enary | +3.944 |
onential | +3.936 |
Neg logit contributions | |
BT | -3.488 |
Dollar | -3.391 |
cour | -3.308 |
FW | -3.292 |
rentals | -3.171 |
Token | language |
Token ID | 16129 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
idious | +2.480 |
urnal | +2.329 |
ocate | +2.328 |
onential | +2.293 |
enary | +2.285 |
Neg logit contributions | |
BT | -2.251 |
Dollar | -2.216 |
cour | -2.140 |
FW | -2.122 |
rentals | -2.072 |
Token | writer |
Token ID | 6260 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
idious | +3.531 |
ocate | +3.293 |
urnal | +3.274 |
onential | +3.203 |
enary | +3.194 |
Neg logit contributions | |
BT | -3.830 |
Dollar | -3.723 |
cour | -3.652 |
FW | -3.637 |
rentals | -3.500 |
Token | of |
Token ID | 286 |
Feature activation | -6.61e+00 |
Pos logit contributions | |
idious | +9.898 |
ocate | +9.446 |
urnal | +9.300 |
enary | +9.212 |
onential | +9.035 |
Neg logit contributions | |
BT | -9.372 |
Dollar | -9.125 |
cour | -8.915 |
FW | -8.843 |
rentals | -8.698 |
Token | the |
Token ID | 262 |
Feature activation | -4.45e+00 |
Pos logit contributions | |
idious | +5.770 |
ocate | +5.471 |
urnal | +5.408 |
onential | +5.373 |
enary | +5.353 |
Neg logit contributions | |
BT | -5.635 |
Dollar | -5.480 |
FW | -5.367 |
cour | -5.361 |
FB | -5.146 |
Token | 20 |
Token ID | 1160 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
idious | +3.985 |
ocate | +3.743 |
urnal | +3.741 |
onential | +3.689 |
enary | +3.667 |
Neg logit contributions | |
BT | -3.834 |
Dollar | -3.745 |
cour | -3.656 |
FW | -3.617 |
rentals | -3.506 |
Token | th |
Token ID | 400 |
Feature activation | -9.75e+00 |
Pos logit contributions | |
idious | +0.449 |
urnal | +0.426 |
ocate | +0.426 |
onential | +0.421 |
enary | +0.418 |
Neg logit contributions | |
BT | -0.271 |
Dollar | -0.263 |
cour | -0.254 |
FW | -0.250 |
rentals | -0.240 |
Token | century |
Token ID | 4289 |
Feature activation | -4.86e+00 |
Pos logit contributions | |
idious | +7.731 |
urnal | +7.354 |
enary | +7.287 |
onential | +7.268 |
ocate | +7.145 |
Neg logit contributions | |
BT | -8.551 |
Dollar | -8.282 |
cour | -8.148 |
FW | -8.064 |
rentals | -7.983 |
Token | . |
Token ID | 13 |
Feature activation | -2.10e+00 |
Pos logit contributions | |
idious | +0.559 |
urnal | +0.529 |
ocate | +0.529 |
onential | +0.523 |
enary | +0.519 |
Neg logit contributions | |
BT | -0.395 |
Dollar | -0.385 |
cour | -0.373 |
FW | -0.368 |
rentals | -0.356 |
Token |
|
Token ID | 198 |
Feature activation | +9.32e-01 |
Pos logit contributions | |
idious | +2.046 |
ocate | +1.936 |
urnal | +1.932 |
onential | +1.906 |
enary | +1.896 |
Neg logit contributions | |
BT | -1.644 |
Dollar | -1.595 |
cour | -1.557 |
FW | -1.536 |
rentals | -1.502 |
Token |
|
Token ID | 198 |
Feature activation | +4.83e-01 |
Pos logit contributions | |
BT | +0.713 |
Dollar | +0.694 |
cour | +0.676 |
FW | +0.665 |
fav | +0.641 |
Neg logit contributions | |
idious | -0.938 |
urnal | -0.885 |
ocate | -0.883 |
onential | -0.876 |
enary | -0.867 |
Token | I |
Token ID | 40 |
Feature activation | +4.02e+00 |
Pos logit contributions | |
BT | +0.334 |
Dollar | +0.320 |
cour | +0.313 |
FW | +0.310 |
FB | +0.293 |
Neg logit contributions | |
idious | -0.523 |
urnal | -0.497 |
ocate | -0.496 |
onential | -0.492 |
enary | -0.488 |
Token | can |
Token ID | 460 |
Feature activation | -7.39e+00 |
Pos logit contributions | |
BT | +2.640 |
Dollar | +2.502 |
cour | +2.411 |
FW | +2.371 |
fav | +2.291 |
Neg logit contributions | |
idious | -4.484 |
urnal | -4.241 |
ocate | -4.228 |
onential | -4.212 |
enary | -4.172 |
Token | 't |
Token ID | 470 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
idious | +6.661 |
ocate | +6.363 |
enary | +6.201 |
urnal | +6.129 |
onential | +6.109 |
Neg logit contributions | |
BT | -5.997 |
Dollar | -5.924 |
cour | -5.797 |
FW | -5.637 |
FB | -5.474 |
Token | pretend |
Token ID | 16614 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
idious | +10.998 |
ocate | +10.497 |
enary | +10.227 |
urnal | +10.014 |
onential | +10.001 |
Neg logit contributions | |
BT | -8.762 |
cour | -8.529 |
Dollar | -8.489 |
FW | -8.038 |
FB | -7.902 |
Token | to |
Token ID | 284 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
BT | +0.125 |
Dollar | +0.122 |
cour | +0.118 |
FW | +0.117 |
rentals | +0.113 |
Neg logit contributions | |
idious | -0.170 |
urnal | -0.161 |
ocate | -0.161 |
onential | -0.159 |
enary | -0.158 |
Token | know |
Token ID | 760 |
Feature activation | +4.12e-01 |
Pos logit contributions | |
BT | +2.302 |
Dollar | +2.242 |
FW | +2.142 |
cour | +2.127 |
fav | +2.089 |
Neg logit contributions | |
idious | -3.890 |
urnal | -3.724 |
onential | -3.682 |
ocate | -3.668 |
enary | -3.619 |
Token | what |
Token ID | 644 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
BT | +0.291 |
Dollar | +0.285 |
cour | +0.274 |
FW | +0.271 |
fav | +0.262 |
Neg logit contributions | |
idious | -0.436 |
urnal | -0.415 |
ocate | -0.414 |
onential | -0.409 |
enary | -0.406 |
Token | was |
Token ID | 373 |
Feature activation | -3.33e+00 |
Pos logit contributions | |
idious | +5.490 |
ocate | +5.130 |
urnal | +5.084 |
onential | +5.024 |
enary | +5.008 |
Neg logit contributions | |
BT | -3.920 |
Dollar | -3.730 |
cour | -3.687 |
FW | -3.634 |
FB | -3.433 |