Token | percent |
Token ID | 1411 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
percent | +20.343 |
percentages | +20.313 |
percentage | +19.354 |
percentile | +18.110 |
percent | +17.933 |
Neg logit contributions | |
civilisation | -21.759 |
Construction | -20.551 |
paradise | -20.103 |
Building | -20.076 |
issance | -20.009 |
Token | said |
Token ID | 531 |
Feature activation | +1.29e+01 |
Pos logit contributions | |
percentages | +26.507 |
disapprove | +26.100 |
unfavorable | +25.918 |
percent | +25.778 |
vs | +25.592 |
Neg logit contributions | |
civilisation | -20.662 |
issance | -18.607 |
Construction | -18.290 |
paradise | -18.225 |
ufact | -18.157 |
Token | she |
Token ID | 673 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
percentages | +13.719 |
percentage | +12.681 |
percentile | +12.610 |
unfavorable | +12.507 |
inaccur | +12.316 |
Neg logit contributions | |
civilisation | -9.300 |
Construction | -8.955 |
Located | -8.453 |
ufact | -8.417 |
issance | -8.395 |
Token | was |
Token ID | 373 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
percentages | +13.827 |
percentile | +12.957 |
inaccur | +12.855 |
percentage | +12.756 |
unfavorable | +12.666 |
Neg logit contributions | |
civilisation | -8.987 |
Construction | -8.749 |
paradise | -8.062 |
ufact | -7.976 |
Building | -7.963 |
Token | not |
Token ID | 407 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
percentages | +23.558 |
unfavorable | +23.191 |
inaccurate | +22.887 |
inaccur | +22.722 |
incorrect | +22.474 |
Neg logit contributions | |
ufact | -19.812 |
civilisation | -19.272 |
Construction | -19.002 |
issance | -18.700 |
Located | -17.691 |
Token | , |
Token ID | 11 |
Feature activation | +5.77e+01 |
Pos logit contributions | |
percentages | +15.541 |
percentage | +14.193 |
unfavorable | +14.146 |
inaccur | +13.995 |
percentile | +13.881 |
Neg logit contributions | |
civilisation | -16.200 |
Construction | -16.081 |
ufact | -15.946 |
issance | -15.472 |
Located | -14.964 |
Token | whereas |
Token ID | 9472 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
percentages | +33.500 |
vs | +32.961 |
percentage | +32.048 |
fewer | +31.958 |
49 | +31.225 |
Neg logit contributions | |
civilisation | -22.209 |
issance | -21.546 |
ufact | -20.542 |
Construction | -20.266 |
paradise | -19.193 |
Token | only |
Token ID | 691 |
Feature activation | +4.91e+01 |
Pos logit contributions | |
percentages | +23.202 |
fewer | +21.494 |
percentage | +21.135 |
unfavorable | +20.783 |
percent | +20.449 |
Neg logit contributions | |
civilisation | -20.872 |
ufact | -19.557 |
Construction | -19.556 |
issance | -19.227 |
Built | -18.880 |
Token | 34 |
Token ID | 4974 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
percentages | +29.140 |
percentage | +27.674 |
49 | +27.589 |
fewer | +27.519 |
47 | +27.218 |
Neg logit contributions | |
ufact | -26.397 |
issance | -25.185 |
civilisation | -24.319 |
Construction | -23.774 |
exting | -23.382 |
Token | percent |
Token ID | 1411 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
percent | +25.594 |
percentages | +23.741 |
percentage | +23.041 |
percentile | +22.069 |
percent | +21.918 |
Neg logit contributions | |
civilisation | -25.394 |
Construction | -23.509 |
Building | -23.487 |
issance | -22.917 |
Laun | -22.881 |
Token | she |
Token ID | 673 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
percentages | +25.767 |
disapprove | +25.089 |
percent | +24.925 |
percentage | +24.776 |
unfavorable | +24.491 |
Neg logit contributions | |
civilisation | -21.313 |
Construction | -19.679 |
Located | -19.627 |
Building | -19.125 |
ufact | -18.875 |
Token | they |
Token ID | 484 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
percentages | +9.959 |
percentage | +9.076 |
percentile | +9.056 |
unfavorable | +8.920 |
fewer | +8.751 |
Neg logit contributions | |
civilisation | -8.675 |
Construction | -8.438 |
Located | -8.055 |
Built | -7.992 |
paradise | -7.888 |
Token | would |
Token ID | 561 |
Feature activation | +3.32e+01 |
Pos logit contributions | |
percentages | +16.263 |
disapprove | +15.811 |
percentage | +15.509 |
unfavorable | +15.225 |
percentile | +14.963 |
Neg logit contributions | |
civilisation | -18.090 |
Construction | -17.726 |
Building | -16.959 |
ufact | -16.849 |
Located | -16.753 |
Token | vote |
Token ID | 3015 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
disapprove | +22.003 |
percentages | +20.577 |
percentage | +20.528 |
criticize | +20.504 |
hate | +20.100 |
Neg logit contributions | |
ufact | -24.144 |
Construction | -23.928 |
civilisation | -23.365 |
Building | -23.136 |
Located | -22.645 |
Token | for |
Token ID | 329 |
Feature activation | +3.16e+01 |
Pos logit contributions | |
percentages | +12.023 |
percentage | +10.714 |
unfavorable | +10.690 |
percentile | +10.477 |
fewer | +10.456 |
Neg logit contributions | |
civilisation | -17.580 |
Construction | -16.923 |
Located | -16.373 |
Built | -16.353 |
paradise | -16.295 |
Token | Obama |
Token ID | 2486 |
Feature activation | +3.10e+01 |
Pos logit contributions | |
percentages | +20.926 |
percentage | +19.616 |
fewer | +19.526 |
unfavorable | +19.515 |
vs | +19.374 |
Neg logit contributions | |
civilisation | -21.443 |
Construction | -21.299 |
Located | -20.837 |
Built | -20.319 |
issance | -20.065 |
Token | , |
Token ID | 11 |
Feature activation | +5.67e+01 |
Pos logit contributions | |
vs | +21.920 |
percentages | +21.769 |
fewer | +20.474 |
percentage | +20.452 |
percent | +19.939 |
Neg logit contributions | |
civilisation | -21.301 |
Construction | -20.794 |
Located | -20.298 |
Built | -20.133 |
Building | -19.602 |
Token | while |
Token ID | 981 |
Feature activation | +4.05e+01 |
Pos logit contributions | |
percentages | +31.988 |
vs | +31.359 |
fewer | +30.772 |
percentage | +30.256 |
49 | +29.700 |
Neg logit contributions | |
issance | -24.383 |
civilisation | -23.691 |
Construction | -23.605 |
Built | -23.383 |
�� | -23.126 |
Token | 44 |
Token ID | 5846 |
Feature activation | +3.43e+01 |
Pos logit contributions | |
percentages | +26.881 |
fewer | +25.640 |
49 | +24.712 |
percentage | +24.442 |
47 | +24.350 |
Neg logit contributions | |
ufact | -24.466 |
issance | -23.624 |
Built | -23.427 |
civilisation | -23.415 |
Construction | -22.904 |
Token | percent |
Token ID | 1411 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
percent | +23.145 |
percentages | +21.433 |
percentage | +20.767 |
percentile | +20.200 |
percent | +19.072 |
Neg logit contributions | |
civilisation | -28.028 |
ufact | -27.148 |
arrang | -26.473 |
Construction | -25.884 |
Building | -25.344 |
Token | would |
Token ID | 561 |
Feature activation | +3.30e+01 |
Pos logit contributions | |
percentages | +24.715 |
percentage | +23.658 |
percent | +23.548 |
disapprove | +23.543 |
unfavorable | +23.481 |
Neg logit contributions | |
civilisation | -21.638 |
Construction | -20.505 |
Located | -20.464 |
Building | -20.006 |
Built | -19.926 |
Token | vote |
Token ID | 3015 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
disapprove | +22.079 |
percentages | +21.061 |
criticize | +20.823 |
percentage | +20.675 |
unfavorable | +20.506 |
Neg logit contributions | |
ufact | -23.441 |
Construction | -23.240 |
civilisation | -22.942 |
Building | -22.596 |
Built | -22.556 |
Token | and |
Token ID | 290 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
percentages | +23.017 |
percentage | +22.160 |
percentile | +21.975 |
vs | +21.045 |
(> | +20.946 |
Neg logit contributions | |
civilisation | -17.997 |
Construction | -17.822 |
paradise | -16.372 |
Built | -16.325 |
ufact | -16.237 |
Token | obesity |
Token ID | 13825 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
percentages | +18.687 |
percentage | +17.483 |
percentile | +17.431 |
unfavorable | +16.840 |
percent | +16.194 |
Neg logit contributions | |
Construction | -17.022 |
issance | -16.788 |
civilisation | -16.658 |
ufact | -16.542 |
Built | -16.025 |
Token | combined |
Token ID | 5929 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
percentages | +25.060 |
percentile | +23.590 |
percentage | +23.238 |
vs | +22.142 |
percent | +21.765 |
Neg logit contributions | |
civilisation | -17.043 |
Construction | -16.908 |
ufact | -15.879 |
Built | -15.757 |
issance | -15.655 |
Token | ( |
Token ID | 357 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
percentages | +18.872 |
percentile | +17.697 |
percentage | +17.471 |
vs | +16.620 |
average | +16.202 |
Neg logit contributions | |
civilisation | -16.175 |
Construction | -16.151 |
Built | -15.293 |
ufact | -15.234 |
paradise | -15.095 |
Token | B |
Token ID | 33 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
percentages | +23.546 |
percent | +22.338 |
percentage | +22.075 |
percentile | +21.864 |
percent | +21.047 |
Neg logit contributions | |
civilisation | -19.788 |
paradise | -18.341 |
ufact | -17.641 |
rebuilt | -16.924 |
issance | -16.900 |
Token | MI |
Token ID | 8895 |
Feature activation | +5.42e+01 |
Pos logit contributions | |
percentages | +8.228 |
percentile | +7.448 |
percentage | +7.174 |
vs | +7.053 |
percent | +6.696 |
Neg logit contributions | |
civilisation | -20.220 |
paradise | -19.287 |
Construction | -19.057 |
ufact | -18.840 |
rebuilt | -18.170 |
Token | ≥ |
Token ID | 26870 |
Feature activation | +3.83e+01 |
Pos logit contributions | |
≥ | +33.946 |
percentages | +33.612 |
percentile | +32.610 |
percentage | +32.091 |
vs | +32.064 |
Neg logit contributions | |
civilisation | -18.572 |
issance | -18.572 |
Construction | -18.251 |
ufact | -18.037 |
paradise | -17.791 |
Token | 25 |
Token ID | 1495 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
percentages | +22.755 |
percentile | +22.121 |
≥ | +22.063 |
vs | +21.902 |
percentage | +21.491 |
Neg logit contributions | |
civilisation | -24.409 |
ufact | -23.758 |
arrang | -22.755 |
paradise | -22.713 |
issance | -22.330 |
Token | kg |
Token ID | 14211 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
percentages | +15.337 |
percentile | +14.689 |
percentage | +14.299 |
percent | +13.862 |
vs | +13.649 |
Neg logit contributions | |
civilisation | -15.566 |
Construction | -15.227 |
paradise | -14.640 |
Built | -14.400 |
issance | -14.344 |
Token | / |
Token ID | 14 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
percentages | +15.069 |
percentile | +14.642 |
vs | +14.209 |
percentage | +13.930 |
fewer | +13.617 |
Neg logit contributions | |
Construction | -19.657 |
civilisation | -19.518 |
issance | -18.511 |
paradise | -18.417 |
Built | -18.382 |
Token | m |
Token ID | 76 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
percentages | +9.727 |
percentile | +9.319 |
percentage | +8.934 |
vs | +8.712 |
percent | +8.607 |
Neg logit contributions | |
civilisation | -13.912 |
Construction | -13.220 |
paradise | -12.867 |
ufact | -12.694 |
issance | -12.356 |
Token | such |
Token ID | 884 |
Feature activation | +5.58e+00 |
Pos logit contributions | |
percentages | +12.756 |
percentile | +11.695 |
percentage | +11.525 |
fewer | +11.209 |
unfavorable | +11.149 |
Neg logit contributions | |
Construction | -15.142 |
civilisation | -14.553 |
Built | -13.941 |
ufact | -13.911 |
Building | -13.772 |
Token | socially |
Token ID | 18118 |
Feature activation | +7.33e+00 |
Pos logit contributions | |
percentages | +4.458 |
percentile | +4.084 |
percentage | +3.933 |
unfavorable | +3.769 |
inaccur | +3.765 |
Neg logit contributions | |
civilisation | -5.912 |
Construction | -5.815 |
paradise | -5.594 |
Built | -5.514 |
Located | -5.448 |
Token | ( |
Token ID | 357 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
percentages | +5.684 |
percentile | +5.204 |
percentage | +5.016 |
unfavorable | +4.840 |
inaccur | +4.812 |
Neg logit contributions | |
civilisation | -7.822 |
Construction | -7.578 |
paradise | -7.341 |
Built | -7.192 |
ufact | -7.134 |
Token | including |
Token ID | 8201 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
percentages | +8.505 |
percentile | +7.574 |
percentage | +7.520 |
inaccur | +7.285 |
percent | +7.218 |
Neg logit contributions | |
civilisation | -12.115 |
paradise | -11.381 |
Construction | -11.349 |
ufact | -11.030 |
rebuilt | -10.919 |
Token | the |
Token ID | 262 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
percentages | +9.558 |
percentile | +8.761 |
percentage | +8.606 |
unfavorable | +8.423 |
inaccur | +8.377 |
Neg logit contributions | |
civilisation | -9.103 |
Construction | -8.947 |
paradise | -8.478 |
Built | -8.458 |
Located | -8.410 |
Token | use |
Token ID | 779 |
Feature activation | +5.37e+01 |
Pos logit contributions | |
percentages | +9.167 |
percentage | +8.289 |
percentile | +8.255 |
inaccur | +7.979 |
unfavorable | +7.888 |
Neg logit contributions | |
civilisation | -14.001 |
Construction | -13.726 |
paradise | -13.256 |
Built | -13.073 |
Located | -13.010 |
Token | of |
Token ID | 286 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
of | +26.674 |
vs | +22.394 |
fewer | +22.298 |
percent | +21.882 |
OF | +21.841 |
Neg logit contributions | |
exting | -37.537 |
arrang | -36.162 |
neighb | -34.336 |
ufact | -34.326 |
mosqu | -34.224 |
Token | female |
Token ID | 4048 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
percentages | +15.096 |
percentile | +13.878 |
percentage | +13.814 |
incorrect | +13.126 |
fewer | +13.119 |
Neg logit contributions | |
Construction | -18.148 |
civilisation | -17.349 |
Built | -17.006 |
Building | -16.855 |
Located | -16.691 |
Token | pronouns |
Token ID | 43947 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
percentages | +8.051 |
percentile | +6.949 |
percentage | +6.640 |
offenses | +6.252 |
fewer | +6.236 |
Neg logit contributions | |
civilisation | -17.011 |
Construction | -16.743 |
ufact | -16.321 |
paradise | -16.040 |
Built | -15.987 |
Token | like |
Token ID | 588 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
percentages | +7.629 |
vs | +6.859 |
percentile | +6.728 |
hate | +6.521 |
percentage | +6.470 |
Neg logit contributions | |
Construction | -22.759 |
ufact | -22.618 |
civilisation | -22.614 |
arrang | -21.719 |
Built | -21.427 |
Token | " |
Token ID | 366 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
percentages | +10.888 |
percentile | +10.062 |
percentage | +9.883 |
vs | +9.493 |
fewer | +9.277 |
Neg logit contributions | |
civilisation | -16.590 |
Construction | -16.241 |
ufact | -16.200 |
Built | -15.496 |
arrang | -15.241 |
Token | a |
Token ID | 257 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
percentages | +26.339 |
fewer | +24.674 |
percentage | +24.239 |
unfavorable | +24.044 |
hate | +24.043 |
Neg logit contributions | |
civilisation | -15.828 |
Construction | -15.796 |
issance | -15.185 |
ufact | -15.157 |
Located | -14.699 |
Token | transgender |
Token ID | 10637 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
percentages | +11.753 |
percentile | +11.005 |
percentage | +10.952 |
unfavorable | +10.450 |
fewer | +10.295 |
Neg logit contributions | |
civilisation | -9.640 |
Construction | -9.452 |
paradise | -8.973 |
ufact | -8.902 |
Built | -8.858 |
Token | person |
Token ID | 1048 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
percentages | +12.577 |
percentage | +11.682 |
percentile | +11.658 |
unfavorable | +11.279 |
fewer | +10.926 |
Neg logit contributions | |
civilisation | -14.058 |
Construction | -13.912 |
paradise | -13.355 |
ufact | -13.302 |
Built | -13.269 |
Token | . |
Token ID | 13 |
Feature activation | +3.37e+01 |
Pos logit contributions | |
percentages | +15.384 |
percentile | +14.283 |
percentage | +14.223 |
vs | +13.929 |
fewer | +13.869 |
Neg logit contributions | |
civilisation | -15.959 |
Construction | -15.254 |
ufact | -14.628 |
Built | -14.558 |
paradise | -14.490 |
Token | How |
Token ID | 1374 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
percentages | +24.356 |
vs | +23.325 |
fewer | +23.299 |
percentage | +23.252 |
percent | +23.173 |
Neg logit contributions | |
civilisation | -21.542 |
arrang | -20.126 |
ufact | -19.136 |
paradise | -18.788 |
issance | -18.517 |
Token | many |
Token ID | 867 |
Feature activation | +5.33e+01 |
Pos logit contributions | |
percentages | +11.381 |
percentage | +10.341 |
percentile | +10.326 |
unfavorable | +10.058 |
fewer | +9.898 |
Neg logit contributions | |
civilisation | -10.978 |
Construction | -10.724 |
ufact | -10.173 |
Built | -10.104 |
paradise | -10.063 |
Token | Rachel |
Token ID | 15984 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
percentages | +35.763 |
percentage | +34.173 |
fewer | +33.951 |
percent | +33.580 |
hate | +32.711 |
Neg logit contributions | |
ufact | -21.071 |
issance | -18.645 |
Located | -18.488 |
Built | -18.268 |
Construction | -18.239 |
Token | Do |
Token ID | 2141 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
percentages | +11.963 |
percentile | +11.142 |
percentage | +11.038 |
unfavorable | +10.748 |
inaccur | +10.670 |
Neg logit contributions | |
civilisation | -9.078 |
Construction | -8.718 |
paradise | -8.286 |
ufact | -8.070 |
Located | -8.038 |
Token | lez |
Token ID | 36858 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
percentages | +1.016 |
percentile | +0.949 |
percentage | +0.914 |
pts | +0.890 |
unfavorable | +0.889 |
Neg logit contributions | |
civilisation | -0.894 |
Construction | -0.859 |
paradise | -0.832 |
Built | -0.801 |
Located | -0.794 |
Token | als |
Token ID | 874 |
Feature activation | +3.29e+01 |
Pos logit contributions | |
percentages | +3.643 |
percentile | +3.430 |
percentage | +3.316 |
pts | +3.252 |
unfavorable | +3.243 |
Neg logit contributions | |
civilisation | -2.512 |
Construction | -2.390 |
paradise | -2.296 |
Built | -2.209 |
Located | -2.180 |
Token | do |
Token ID | 466 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
percentages | +25.963 |
hate | +24.523 |
percentage | +24.438 |
tweets | +24.319 |
vs | +24.297 |
Neg logit contributions | |
Construction | -18.369 |
ufact | -17.842 |
civilisation | -17.596 |
Building | -16.706 |
Located | -16.620 |
Token | 37 |
Token ID | 5214 |
Feature activation | +3.20e+01 |
Pos logit contributions | |
percentages | +28.084 |
percentage | +26.404 |
fewer | +25.690 |
percentile | +24.926 |
vs | +24.882 |
Neg logit contributions | |
civilisation | -17.217 |
ufact | -16.843 |
issance | -16.639 |
Construction | -16.629 |
Built | -16.571 |
Token | % |
Token ID | 4 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
percentages | +24.328 |
percent | +23.856 |
percentage | +23.826 |
percentile | +22.669 |
% | +22.474 |
Neg logit contributions | |
civilisation | -19.314 |
ufact | -17.995 |
paradise | -17.913 |
Construction | -17.811 |
Built | -17.799 |
Token | were |
Token ID | 547 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
percentages | +16.220 |
percentage | +14.712 |
percentile | +14.676 |
percent | +14.288 |
unfavorable | +14.143 |
Neg logit contributions | |
civilisation | -16.110 |
Construction | -15.457 |
issance | -14.945 |
Built | -14.897 |
paradise | -14.855 |
Token | manual |
Token ID | 10107 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
percentages | +14.754 |
percentage | +13.580 |
percentile | +13.471 |
unfavorable | +13.075 |
fewer | +12.989 |
Neg logit contributions | |
civilisation | -12.665 |
Construction | -12.144 |
paradise | -11.829 |
issance | -11.734 |
Built | -11.711 |
Token | workers |
Token ID | 3259 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
percentages | +3.798 |
percentile | +3.550 |
percentage | +3.456 |
unfavorable | +3.348 |
pts | +3.337 |
Neg logit contributions | |
civilisation | -2.803 |
Construction | -2.685 |
paradise | -2.587 |
Built | -2.477 |
Located | -2.469 |
Token | , |
Token ID | 11 |
Feature activation | +5.21e+01 |
Pos logit contributions | |
percentages | +18.589 |
vs | +17.264 |
percentage | +17.112 |
percentile | +16.993 |
fewer | +16.508 |
Neg logit contributions | |
civilisation | -18.061 |
Construction | -16.966 |
issance | -16.485 |
ufact | -16.212 |
Built | -16.201 |
Token | over |
Token ID | 625 |
Feature activation | +3.78e+01 |
Pos logit contributions | |
percentages | +31.361 |
fewer | +29.980 |
percentage | +29.461 |
vs | +29.062 |
49 | +28.811 |
Neg logit contributions | |
issance | -21.818 |
ufact | -21.644 |
civilisation | -21.424 |
Construction | -21.193 |
Built | -20.833 |
Token | 10 |
Token ID | 838 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
percentages | +26.810 |
percentage | +24.916 |
fewer | +24.409 |
percentile | +24.145 |
0 | +23.810 |
Neg logit contributions | |
ufact | -20.381 |
Construction | -20.152 |
civilisation | -19.917 |
issance | -19.788 |
Built | -19.744 |
Token | % |
Token ID | 4 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
percentages | +21.818 |
percentage | +21.327 |
percent | +20.564 |
percentile | +19.871 |
% | +19.521 |
Neg logit contributions | |
civilisation | -19.437 |
ufact | -19.114 |
Construction | -19.059 |
Built | -18.746 |
paradise | -18.599 |
Token | were |
Token ID | 547 |
Feature activation | +8.04e+00 |
Pos logit contributions | |
percentages | +13.489 |
percentile | +12.367 |
percentage | +12.206 |
fewer | +11.860 |
unfavorable | +11.749 |
Neg logit contributions | |
civilisation | -12.551 |
Construction | -12.171 |
paradise | -11.702 |
Built | -11.674 |
issance | -11.646 |
Token | farmers |
Token ID | 9818 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
percentages | +8.161 |
percentile | +7.568 |
percentage | +7.458 |
unfavorable | +7.179 |
fewer | +7.163 |
Neg logit contributions | |
civilisation | -6.601 |
Construction | -6.328 |
paradise | -6.149 |
Built | -6.046 |
Located | -5.975 |
Token | � |
Token ID | 447 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
percentages | +8.423 |
percentile | +7.734 |
percentage | +7.581 |
vs | +7.284 |
pts | +7.229 |
Neg logit contributions | |
civilisation | -10.151 |
Construction | -9.455 |
paradise | -9.320 |
ufact | -9.000 |
Built | -8.922 |
Token | � |
Token ID | 251 |
Feature activation | +3.31e+00 |
Pos logit contributions | |
Construction | +5.167 |
civilisation | +5.110 |
paradise | +4.960 |
Located | +4.582 |
Built | +4.578 |
Neg logit contributions | |
percentages | -12.627 |
percentile | -11.888 |
inaccur | -11.597 |
percentage | -11.545 |
unfavorable | -11.464 |
Token |
|
Token ID | 198 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
percentages | +3.159 |
percentile | +2.927 |
percentage | +2.843 |
pts | +2.755 |
unfavorable | +2.736 |
Neg logit contributions | |
civilisation | -3.073 |
Construction | -2.931 |
paradise | -2.851 |
Built | -2.736 |
ufact | -2.719 |
Token |
|
Token ID | 198 |
Feature activation | -9.90e-01 |
Pos logit contributions | |
Construction | +1.744 |
civilisation | +1.708 |
paradise | +1.639 |
Built | +1.622 |
Located | +1.618 |
Neg logit contributions | |
percentages | -2.285 |
percentile | -2.107 |
percentage | -2.025 |
disapprove | -2.023 |
unfavorable | -2.019 |
Token | These |
Token ID | 4711 |
Feature activation | +3.17e+01 |
Pos logit contributions | |
Construction | +0.772 |
civilisation | +0.769 |
paradise | +0.720 |
Built | +0.715 |
Located | +0.710 |
Neg logit contributions | |
percentages | -1.081 |
percentile | -1.015 |
percentage | -0.977 |
unfavorable | -0.956 |
offenses | -0.949 |
Token | kinds |
Token ID | 6982 |
Feature activation | +5.19e+01 |
Pos logit contributions | |
percentages | +26.485 |
tweets | +24.717 |
inaccur | +24.351 |
percentage | +24.136 |
offenses | +23.868 |
Neg logit contributions | |
Construction | -17.822 |
civilisation | -17.325 |
ufact | -16.952 |
Located | -16.573 |
Built | -16.220 |
Token | of |
Token ID | 286 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
of | +27.858 |
percentages | +25.765 |
fewer | +24.652 |
percent | +24.576 |
percentage | +24.266 |
Neg logit contributions | |
ufact | -30.252 |
arrang | -28.812 |
exting | -28.662 |
neighb | -27.190 |
civilisation | -27.048 |
Token | comparisons |
Token ID | 17909 |
Feature activation | +2.48e+01 |
Pos logit contributions | |
percentages | +24.602 |
inaccur | +22.756 |
tweets | +22.739 |
offenses | +22.262 |
percentage | +22.083 |
Neg logit contributions | |
Construction | -17.062 |
ufact | -16.368 |
civilisation | -16.324 |
Located | -16.171 |
issance | -16.037 |
Token | make |
Token ID | 787 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
percentages | +21.275 |
inaccur | +19.951 |
percentage | +19.828 |
vs | +19.678 |
percentile | +19.647 |
Neg logit contributions | |
Construction | -16.228 |
civilisation | -16.012 |
Located | -15.278 |
ufact | -15.202 |
Built | -14.591 |
Token | transgender |
Token ID | 10637 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
percentages | +11.404 |
percentile | +10.451 |
percentage | +10.398 |
fewer | +10.237 |
unfavorable | +10.202 |
Neg logit contributions | |
civilisation | -8.558 |
Construction | -8.480 |
Located | -7.915 |
paradise | -7.894 |
ufact | -7.792 |
Token | people |
Token ID | 661 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
percentages | +15.480 |
percentage | +13.914 |
percentile | +13.766 |
inaccur | +13.709 |
vs | +13.651 |
Neg logit contributions | |
Construction | -13.625 |
civilisation | -13.479 |
Located | -12.893 |
Built | -12.761 |
ufact | -12.515 |
Token | ." |
Token ID | 526 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
percentages | +15.033 |
percentage | +13.727 |
percentile | +13.724 |
vs | +13.541 |
unfavorable | +13.477 |
Neg logit contributions | |
civilisation | -12.886 |
Construction | -12.486 |
paradise | -11.741 |
ufact | -11.725 |
Located | -11.450 |
Token | It |
Token ID | 632 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
percentages | +18.399 |
percentage | +17.183 |
pts | +17.171 |
percentile | +17.153 |
vs | +16.885 |
Neg logit contributions | |
civilisation | -14.019 |
paradise | -12.319 |
ufact | -12.264 |
Construction | -12.161 |
rebuilt | -11.742 |
Token | shows |
Token ID | 2523 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
percentages | +17.033 |
percentile | +15.804 |
percentage | +15.482 |
inaccur | +15.314 |
fewer | +14.920 |
Neg logit contributions | |
civilisation | -16.263 |
Construction | -16.071 |
Built | -15.175 |
Building | -15.068 |
Located | -14.881 |
Token | that |
Token ID | 326 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
percentages | +19.054 |
fewer | +17.255 |
percentage | +17.025 |
unfavorable | +16.654 |
percentile | +16.615 |
Neg logit contributions | |
civilisation | -17.039 |
Construction | -16.790 |
ufact | -16.270 |
Built | -16.058 |
Located | -15.889 |
Token | about |
Token ID | 546 |
Feature activation | +4.90e+01 |
Pos logit contributions | |
percentages | +28.861 |
fewer | +27.037 |
percentage | +26.890 |
unfavorable | +25.823 |
average | +25.385 |
Neg logit contributions | |
ufact | -19.274 |
Construction | -19.257 |
Built | -18.752 |
civilisation | -18.687 |
Located | -18.358 |
Token | half |
Token ID | 2063 |
Feature activation | +5.18e+01 |
Pos logit contributions | |
percentages | +30.690 |
percentage | +28.947 |
fewer | +28.809 |
average | +27.838 |
percentile | +27.562 |
Neg logit contributions | |
ufact | -23.808 |
issance | -22.848 |
Construction | -22.689 |
Built | -22.559 |
Located | -22.491 |
Token | the |
Token ID | 262 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
percentages | +31.021 |
disapprove | +30.697 |
percent | +30.487 |
percentage | +29.980 |
of | +29.919 |
Neg logit contributions | |
civilisation | -21.715 |
Located | -21.127 |
ufact | -20.916 |
issance | -20.600 |
Construction | -20.504 |
Token | country |
Token ID | 1499 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
percentages | +25.902 |
percentage | +24.450 |
average | +22.957 |
respondents | +22.957 |
unfavorable | +22.874 |
Neg logit contributions | |
Construction | -18.519 |
ufact | -18.044 |
civilisation | -17.841 |
Built | -17.515 |
Located | -17.058 |
Token | doesn |
Token ID | 1595 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
percentages | +18.680 |
percentile | +17.039 |
percentage | +16.968 |
disapprove | +16.949 |
inaccur | +16.694 |
Neg logit contributions | |
civilisation | -18.750 |
Construction | -18.630 |
ufact | -17.693 |
Built | -17.542 |
Located | -17.511 |
Token | 't |
Token ID | 470 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
percentages | +7.721 |
percentile | +7.443 |
percent | +7.146 |
vs | +7.054 |
percentage | +7.050 |
Neg logit contributions | |
civilisation | -23.468 |
arrang | -23.381 |
ufact | -22.776 |
neighb | -22.204 |
exting | -22.041 |
Token | know |
Token ID | 760 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
percentages | +16.423 |
percentage | +15.795 |
percentile | +15.761 |
disapprove | +15.638 |
statistically | +15.559 |
Neg logit contributions | |
ufact | -22.412 |
Construction | -22.294 |
civilisation | -21.962 |
Building | -21.021 |
issance | -20.735 |
Token | 2016 |
Token ID | 1584 |
Feature activation | +3.28e+01 |
Pos logit contributions | |
percentages | +22.346 |
percentage | +21.139 |
vs | +20.815 |
fewer | +20.761 |
percentile | +20.420 |
Neg logit contributions | |
civilisation | -17.927 |
ufact | -16.784 |
Construction | -16.520 |
issance | -16.247 |
Built | -15.943 |
Token | there |
Token ID | 612 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
percentages | +26.117 |
fewer | +25.531 |
percentage | +24.846 |
percent | +23.944 |
vs | +23.924 |
Neg logit contributions | |
civilisation | -17.532 |
ufact | -16.998 |
Construction | -16.282 |
Built | -15.557 |
issance | -15.552 |
Token | were |
Token ID | 547 |
Feature activation | +4.63e+01 |
Pos logit contributions | |
percentages | +16.817 |
percentage | +15.552 |
percentile | +15.310 |
fewer | +15.117 |
inaccur | +15.047 |
Neg logit contributions | |
civilisation | -14.753 |
Construction | -13.667 |
paradise | -13.321 |
Building | -13.115 |
ufact | -13.068 |
Token | already |
Token ID | 1541 |
Feature activation | +3.93e+01 |
Pos logit contributions | |
fewer | +31.465 |
percentages | +30.710 |
percentage | +29.057 |
inaccur | +29.004 |
offenses | +28.858 |
Neg logit contributions | |
civilisation | -18.942 |
ufact | -18.341 |
issance | -17.507 |
Construction | -17.256 |
Building | -17.089 |
Token | 2 |
Token ID | 362 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
fewer | +28.389 |
percentages | +28.222 |
offenses | +26.594 |
percentage | +26.384 |
inaccur | +26.337 |
Neg logit contributions | |
ufact | -18.637 |
civilisation | -18.418 |
Construction | -17.659 |
issance | -17.357 |
Building | -16.895 |
Token | , |
Token ID | 11 |
Feature activation | +5.12e+01 |
Pos logit contributions | |
percentages | +23.519 |
percent | +23.009 |
percentage | +22.847 |
fewer | +22.667 |
offenses | +22.618 |
Neg logit contributions | |
civilisation | -17.037 |
ufact | -16.580 |
Construction | -16.017 |
paradise | -15.183 |
Building | -15.145 |
Token | 378 |
Token ID | 30695 |
Feature activation | +3.49e+01 |
Pos logit contributions | |
538 | +27.585 |
9 | +27.427 |
percentile | +26.973 |
percentages | +26.963 |
89 | +26.862 |
Neg logit contributions | |
civilisation | -20.777 |
paradise | -19.052 |
ufact | -18.840 |
Construction | -18.610 |
arrang | -17.779 |
Token | cases |
Token ID | 2663 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
percentages | +27.185 |
fewer | +27.036 |
indict | +26.617 |
offenses | +26.546 |
hate | +26.020 |
Neg logit contributions | |
ufact | -17.617 |
civilisation | -16.928 |
Construction | -15.910 |
paradise | -15.567 |
issance | -14.669 |
Token | that |
Token ID | 326 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
percentages | +15.117 |
unfavorable | +14.279 |
percentile | +14.204 |
percentage | +14.088 |
inaccur | +14.029 |
Neg logit contributions | |
civilisation | -11.140 |
Construction | -10.828 |
paradise | -10.134 |
Building | -10.128 |
issance | -10.118 |
Token | haven |
Token ID | 4398 |
Feature activation | +9.76e+00 |
Pos logit contributions | |
percentages | +8.820 |
percentile | +8.213 |
percentage | +8.130 |
unfavorable | +7.896 |
inaccur | +7.879 |
Neg logit contributions | |
civilisation | -7.091 |
Construction | -6.793 |
paradise | -6.528 |
Built | -6.345 |
Located | -6.313 |
Token | � |
Token ID | 447 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
percentages | +7.709 |
percentile | +7.178 |
percentage | +6.987 |
percent | +6.671 |
fewer | +6.626 |
Neg logit contributions | |
civilisation | -10.255 |
paradise | -9.428 |
Construction | -9.355 |
ufact | -9.121 |
arrang | -8.899 |
Token | ful |
Token ID | 913 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
percentages | +11.930 |
percentile | +11.302 |
percentage | +11.034 |
vs | +10.740 |
pts | +10.686 |
Neg logit contributions | |
civilisation | -10.860 |
Construction | -10.299 |
paradise | -9.768 |
ufact | -9.649 |
Located | -9.496 |
Token | ' |
Token ID | 6 |
Feature activation | +3.88e+01 |
Pos logit contributions | |
percentages | +15.601 |
percentile | +15.052 |
percentage | +14.511 |
vs | +14.170 |
unfavorable | +14.090 |
Neg logit contributions | |
civilisation | -14.718 |
Construction | -13.806 |
paradise | -13.542 |
ufact | -13.186 |
Built | -13.002 |
Token | 2 |
Token ID | 362 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
percentile | +28.756 |
percentage | +28.054 |
percentages | +28.008 |
average | +27.379 |
unfavorable | +26.992 |
Neg logit contributions | |
Construction | -17.598 |
ufact | -17.543 |
civilisation | -17.222 |
Located | -16.632 |
Built | -16.591 |
Token | . |
Token ID | 13 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
percentages | +13.857 |
percentile | +13.492 |
percentage | +13.087 |
percent | +12.787 |
unfavorable | +12.606 |
Neg logit contributions | |
civilisation | -13.992 |
Construction | -13.554 |
ufact | -13.072 |
Built | -12.910 |
paradise | -12.816 |
Token | 4 |
Token ID | 19 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
percentages | +16.074 |
percentile | +15.706 |
pts | +15.130 |
percentage | +15.080 |
vs | +14.751 |
Neg logit contributions | |
civilisation | -20.567 |
Construction | -18.947 |
ufact | -18.740 |
paradise | -18.566 |
arrang | -17.934 |
Token | out |
Token ID | 503 |
Feature activation | +5.10e+01 |
Pos logit contributions | |
percentile | +21.074 |
percentages | +20.479 |
percentage | +19.999 |
unfavorable | +19.756 |
percent | +19.631 |
Neg logit contributions | |
civilisation | -18.497 |
Construction | -18.349 |
ufact | -17.505 |
Built | -17.163 |
Building | -16.928 |
Token | of |
Token ID | 286 |
Feature activation | +2.47e+01 |
Pos logit contributions | |
of | +26.794 |
percentile | +23.881 |
vs | +23.665 |
fewer | +23.209 |
percent | +23.097 |
Neg logit contributions | |
exting | -32.393 |
arrang | -31.745 |
ufact | -31.000 |
mosqu | -30.659 |
entreprene | -29.944 |
Token | 10 |
Token ID | 838 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
percentages | +16.678 |
percentile | +15.806 |
percentage | +15.519 |
unfavorable | +14.497 |
fewer | +14.467 |
Neg logit contributions | |
civilisation | -20.181 |
ufact | -20.180 |
Construction | -20.122 |
issance | -19.995 |
Built | -19.503 |
Token | , |
Token ID | 11 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
percentages | +16.807 |
percentile | +16.542 |
percentage | +15.960 |
unfavorable | +15.729 |
percent | +15.337 |
Neg logit contributions | |
civilisation | -16.174 |
Construction | -15.798 |
ufact | -15.230 |
Built | -14.976 |
issance | -14.815 |
Token | stating |
Token ID | 12316 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
percentages | +23.611 |
percentile | +22.637 |
unfavorable | +22.551 |
inaccur | +22.491 |
percentage | +22.314 |
Neg logit contributions | |
Construction | -18.572 |
civilisation | -18.321 |
Built | -17.693 |
ufact | -17.313 |
issance | -17.108 |
Token | " |
Token ID | 366 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
civilisation | +3.847 |
Construction | +3.709 |
paradise | +3.614 |
Built | +3.433 |
Located | +3.407 |
Neg logit contributions | |
percentages | -4.206 |
percentile | -3.920 |
percentage | -3.755 |
pts | -3.659 |
unfavorable | -3.643 |
Token | at |
Token ID | 379 |
Feature activation | +3.16e+01 |
Pos logit contributions | |
fewer | +28.422 |
percentages | +27.575 |
vs | +26.281 |
percentage | +26.244 |
percentile | +25.811 |
Neg logit contributions | |
civilisation | -22.166 |
Construction | -22.056 |
ufact | -21.849 |
ingen | -20.974 |
Built | -20.923 |
Token | least |
Token ID | 1551 |
Feature activation | +4.25e+01 |
Pos logit contributions | |
percentages | +18.978 |
fewer | +18.258 |
percentile | +17.713 |
percentage | +17.386 |
average | +17.327 |
Neg logit contributions | |
Construction | -24.902 |
civilisation | -24.326 |
ufact | -24.114 |
Building | -23.482 |
Located | -23.476 |
Token | 20 |
Token ID | 1160 |
Feature activation | +4.17e+01 |
Pos logit contributions | |
percentages | +26.322 |
percentile | +25.160 |
percentage | +25.122 |
fewer | +25.083 |
average | +24.706 |
Neg logit contributions | |
ufact | -23.673 |
Construction | -23.614 |
civilisation | -22.871 |
Located | -22.501 |
Built | -22.239 |
Token | Fantasy |
Token ID | 10982 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
percentages | +25.490 |
pts | +25.435 |
percentile | +25.310 |
percentage | +25.220 |
percent | +24.694 |
Neg logit contributions | |
ufact | -24.391 |
Construction | -23.911 |
civilisation | -23.735 |
Located | -22.939 |
Built | -22.886 |
Token | points |
Token ID | 2173 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
percentages | +15.243 |
percentage | +13.953 |
pts | +13.551 |
percentile | +13.453 |
percent | +12.944 |
Neg logit contributions | |
ufact | -27.095 |
civilisation | -26.066 |
Construction | -25.968 |
arrang | -24.612 |
Located | -24.517 |
Token | , |
Token ID | 11 |
Feature activation | +5.07e+01 |
Pos logit contributions | |
percentages | +24.072 |
vs | +23.660 |
fewer | +23.107 |
percentage | +22.933 |
percentile | +22.225 |
Neg logit contributions | |
Construction | -22.061 |
civilisation | -21.060 |
Located | -20.670 |
Built | -20.456 |
Building | -20.416 |
Token | but |
Token ID | 475 |
Feature activation | +2.48e+01 |
Pos logit contributions | |
percentages | +30.816 |
fewer | +30.591 |
vs | +29.857 |
percentage | +29.770 |
average | +29.325 |
Neg logit contributions | |
Construction | -21.995 |
civilisation | -21.256 |
ufact | -21.033 |
issance | -20.949 |
Located | -20.089 |
Token | Ryan |
Token ID | 6047 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
percentages | +21.033 |
offenses | +19.733 |
fewer | +19.487 |
percentage | +19.305 |
percentile | +19.075 |
Neg logit contributions | |
Construction | -16.552 |
ufact | -16.542 |
civilisation | -16.469 |
Located | -16.173 |
Built | -15.875 |
Token | hasn |
Token ID | 5818 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
percentages | +13.385 |
percentile | +12.449 |
percentage | +12.171 |
offenses | +12.072 |
vs | +12.007 |
Neg logit contributions | |
civilisation | -11.583 |
Construction | -11.192 |
Built | -10.475 |
Located | -10.474 |
Building | -10.395 |
Token | 't |
Token ID | 470 |
Feature activation | +1.42e+01 |
Pos logit contributions | |
percentages | +6.758 |
percentile | +6.295 |
percentage | +5.979 |
vs | +5.805 |
fewer | +5.784 |
Neg logit contributions | |
civilisation | -15.031 |
arrang | -14.100 |
ufact | -14.040 |
Construction | -13.852 |
paradise | -13.793 |
Token | scored |
Token ID | 7781 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
percentages | +13.431 |
percentile | +12.861 |
percentage | +12.537 |
fewer | +12.243 |
average | +12.064 |
Neg logit contributions | |
civilisation | -11.517 |
Construction | -11.420 |
ufact | -10.380 |
Building | -10.371 |
Located | -10.342 |
Token | , |
Token ID | 11 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
percentages | +1.700 |
percentile | +1.568 |
percentage | +1.506 |
unfavorable | +1.456 |
pts | +1.453 |
Neg logit contributions | |
civilisation | -1.946 |
Construction | -1.880 |
paradise | -1.827 |
Built | -1.764 |
Located | -1.756 |
Token | also |
Token ID | 635 |
Feature activation | +2.13e+01 |
Pos logit contributions | |
percentages | +17.766 |
percentage | +16.802 |
percentile | +16.631 |
inaccur | +16.308 |
criticize | +16.081 |
Neg logit contributions | |
civilisation | -13.442 |
Construction | -13.015 |
Located | -12.363 |
paradise | -12.252 |
Built | -12.142 |
Token | found |
Token ID | 1043 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
percentages | +19.093 |
percentage | +18.057 |
percentile | +17.848 |
inaccur | +17.743 |
criticize | +17.720 |
Neg logit contributions | |
civilisation | -15.033 |
Construction | -14.792 |
Located | -13.748 |
ufact | -13.654 |
Built | -13.627 |
Token | that |
Token ID | 326 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
percentages | +21.669 |
percentage | +19.892 |
percentile | +19.694 |
fewer | +19.613 |
inaccur | +19.425 |
Neg logit contributions | |
civilisation | -15.707 |
Construction | -15.491 |
ufact | -15.068 |
Built | -14.923 |
Located | -14.561 |
Token | 49 |
Token ID | 5125 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
percentages | +28.322 |
percentage | +26.471 |
fewer | +26.255 |
percentile | +25.756 |
average | +25.212 |
Neg logit contributions | |
Construction | -15.528 |
Built | -15.445 |
ufact | -15.260 |
civilisation | -15.022 |
Located | -14.401 |
Token | % |
Token ID | 4 |
Feature activation | +5.07e+01 |
Pos logit contributions | |
percent | +28.013 |
percentages | +27.663 |
percentage | +26.533 |
percentile | +25.918 |
% | +24.687 |
Neg logit contributions | |
civilisation | -17.774 |
Construction | -17.626 |
Built | -17.606 |
ufact | -17.363 |
Building | -16.709 |
Token | of |
Token ID | 286 |
Feature activation | +3.35e+01 |
Pos logit contributions | |
percentages | +32.399 |
percent | +31.870 |
fewer | +31.677 |
percentage | +31.022 |
percentile | +30.974 |
Neg logit contributions | |
issance | -19.371 |
civilisation | -19.229 |
ufact | -19.112 |
Construction | -19.090 |
Building | -18.984 |
Token | respondents |
Token ID | 14502 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
percentages | +27.809 |
percentage | +26.287 |
percentile | +25.776 |
fewer | +25.661 |
percent | +25.339 |
Neg logit contributions | |
ufact | -16.188 |
Built | -16.167 |
Construction | -16.145 |
civilisation | -15.594 |
Located | -15.185 |
Token | to |
Token ID | 284 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
percentages | +23.769 |
disapprove | +22.725 |
percentage | +22.651 |
inaccur | +22.328 |
unfavorable | +22.116 |
Neg logit contributions | |
Construction | -18.289 |
civilisation | -18.082 |
Building | -17.406 |
Built | -17.367 |
ufact | -17.338 |
Token | the |
Token ID | 262 |
Feature activation | +1.46e+01 |
Pos logit contributions | |
percentages | +18.071 |
percentile | +16.869 |
percentage | +16.587 |
unfavorable | +16.200 |
fewer | +16.181 |
Neg logit contributions | |
civilisation | -14.137 |
Construction | -13.940 |
ufact | -13.407 |
Located | -13.141 |
Built | -13.084 |
Token | Lok |
Token ID | 36861 |
Feature activation | +8.92e-01 |
Pos logit contributions | |
percentages | +13.889 |
percentile | +12.892 |
percentage | +12.862 |
unfavorable | +12.249 |
fewer | +12.076 |
Neg logit contributions | |
civilisation | -11.337 |
Construction | -11.275 |
ufact | -10.863 |
paradise | -10.652 |
Built | -10.621 |
Token | they |
Token ID | 484 |
Feature activation | +2.37e+01 |
Pos logit contributions | |
percentages | +24.329 |
fewer | +23.042 |
percentage | +22.572 |
vs | +22.058 |
unfavorable | +21.990 |
Neg logit contributions | |
Construction | -20.020 |
Located | -19.822 |
civilisation | -19.727 |
Built | -19.484 |
ufact | -19.012 |
Token | would |
Token ID | 561 |
Feature activation | +3.19e+01 |
Pos logit contributions | |
percentages | +18.310 |
disapprove | +17.921 |
percentage | +17.385 |
unfavorable | +17.256 |
percentile | +16.851 |
Neg logit contributions | |
civilisation | -18.750 |
Construction | -18.337 |
Located | -17.636 |
Building | -17.500 |
ufact | -17.369 |
Token | vote |
Token ID | 3015 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
disapprove | +22.562 |
percentages | +21.346 |
criticize | +21.226 |
percentage | +21.092 |
hate | +20.631 |
Neg logit contributions | |
ufact | -23.337 |
Construction | -22.921 |
civilisation | -22.411 |
Building | -22.110 |
Located | -21.884 |
Token | for |
Token ID | 329 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
percentages | +11.047 |
percentage | +9.784 |
percentile | +9.695 |
unfavorable | +9.685 |
fewer | +9.668 |
Neg logit contributions | |
civilisation | -14.296 |
Construction | -13.894 |
Built | -13.318 |
Located | -13.315 |
paradise | -13.178 |
Token | Obama |
Token ID | 2486 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
percentages | +21.056 |
fewer | +19.839 |
percentage | +19.552 |
unfavorable | +19.402 |
vs | +19.173 |
Neg logit contributions | |
Construction | -20.627 |
civilisation | -20.330 |
Located | -20.170 |
Built | -19.493 |
ufact | -19.247 |
Token | , |
Token ID | 11 |
Feature activation | +5.04e+01 |
Pos logit contributions | |
percentages | +17.082 |
vs | +16.467 |
fewer | +15.729 |
percentage | +15.712 |
percentile | +15.612 |
Neg logit contributions | |
civilisation | -18.735 |
Construction | -18.060 |
Located | -17.679 |
Built | -17.640 |
Building | -17.100 |
Token | while |
Token ID | 981 |
Feature activation | +3.69e+01 |
Pos logit contributions | |
percentages | +31.287 |
vs | +30.148 |
percentage | +29.580 |
fewer | +28.897 |
49 | +28.656 |
Neg logit contributions | |
issance | -23.227 |
civilisation | -22.706 |
Construction | -22.585 |
ufact | -22.434 |
Built | -22.220 |
Token | 46 |
Token ID | 6337 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
percentages | +26.338 |
fewer | +24.153 |
percentage | +23.975 |
unfavorable | +23.278 |
49 | +23.132 |
Neg logit contributions | |
civilisation | -23.001 |
ufact | -22.749 |
Built | -22.351 |
issance | -22.332 |
Construction | -21.928 |
Token | percent |
Token ID | 1411 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
percent | +22.259 |
percentages | +20.837 |
percentage | +20.217 |
percentile | +19.513 |
fewer | +18.507 |
Neg logit contributions | |
civilisation | -26.838 |
ufact | -25.593 |
arrang | -24.943 |
Construction | -24.907 |
Building | -24.384 |
Token | in |
Token ID | 287 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
percentages | +24.626 |
disapprove | +24.152 |
unfavorable | +23.852 |
percentage | +23.671 |
percent | +23.519 |
Neg logit contributions | |
civilisation | -21.604 |
Construction | -20.709 |
Located | -20.573 |
Building | -20.149 |
Built | -19.957 |
Token | Florida |
Token ID | 4744 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
percentages | +18.509 |
percentage | +16.983 |
unfavorable | +16.452 |
percentile | +16.142 |
fewer | +16.113 |
Neg logit contributions | |
Construction | -19.597 |
civilisation | -19.458 |
issance | -18.714 |
ufact | -18.503 |
Built | -18.457 |
Token | yards |
Token ID | 5695 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
percentages | +13.294 |
percentage | +12.155 |
percentile | +12.152 |
offenses | +11.651 |
fewer | +11.583 |
Neg logit contributions | |
civilisation | -16.953 |
Construction | -16.744 |
ufact | -15.982 |
paradise | -15.741 |
Built | -15.612 |
Token | ( |
Token ID | 357 |
Feature activation | +3.28e+01 |
Pos logit contributions | |
percentages | +15.311 |
vs | +14.232 |
percentage | +14.231 |
percentile | +14.036 |
fewer | +13.874 |
Neg logit contributions | |
civilisation | -17.239 |
Construction | -16.304 |
issance | -15.814 |
ufact | -15.478 |
Building | -15.350 |
Token | Fort |
Token ID | 21926 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
percent | +25.346 |
percentages | +25.087 |
vs | +23.993 |
percentage | +23.965 |
percentile | +23.720 |
Neg logit contributions | |
civilisation | -18.661 |
ufact | -15.881 |
paradise | -15.771 |
rebuilt | -14.575 |
Construction | -14.303 |
Token | e |
Token ID | 68 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
percentages | +2.806 |
percentile | +2.609 |
percentage | +2.521 |
pts | +2.424 |
unfavorable | +2.424 |
Neg logit contributions | |
civilisation | -2.838 |
Construction | -2.722 |
paradise | -2.648 |
Built | -2.547 |
Located | -2.536 |
Token | finished |
Token ID | 5201 |
Feature activation | +2.60e+01 |
Pos logit contributions | |
percentages | +24.373 |
percentile | +23.022 |
percentage | +22.982 |
vs | +22.694 |
average | +22.566 |
Neg logit contributions | |
civilisation | -15.617 |
Construction | -13.771 |
ufact | -13.313 |
paradise | -13.000 |
Located | -12.848 |
Token | with |
Token ID | 351 |
Feature activation | +4.92e+01 |
Pos logit contributions | |
percentages | +21.013 |
percentage | +19.966 |
percentile | +19.226 |
vs | +19.207 |
fewer | +19.125 |
Neg logit contributions | |
civilisation | -17.992 |
Construction | -17.378 |
ufact | -17.150 |
issance | -16.572 |
Building | -16.115 |
Token | 1 |
Token ID | 352 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
percentages | +31.079 |
fewer | +30.982 |
percentage | +29.452 |
8 | +29.047 |
9 | +29.033 |
Neg logit contributions | |
ufact | -20.496 |
Construction | -20.356 |
civilisation | -19.613 |
Building | -18.388 |
Located | -18.256 |
Token | , |
Token ID | 11 |
Feature activation | +4.29e+01 |
Pos logit contributions | |
percentile | +12.901 |
percentage | +12.760 |
percent | +12.644 |
percentages | +12.536 |
fewer | +12.457 |
Neg logit contributions | |
civilisation | -24.657 |
ufact | -24.370 |
Construction | -23.311 |
Located | -22.366 |
Building | -22.361 |
Token | 07 |
Token ID | 2998 |
Feature activation | +1.45e+01 |
Pos logit contributions | |
538 | +24.607 |
9 | +24.432 |
percentile | +24.065 |
percentages | +23.994 |
vs | +23.798 |
Neg logit contributions | |
civilisation | -22.600 |
arrang | -20.038 |
ufact | -20.013 |
paradise | -19.965 |
Construction | -19.079 |
Token | 6 |
Token ID | 21 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
percentages | +5.718 |
percentile | +4.907 |
percentage | +4.752 |
percent | +4.414 |
fewer | +4.409 |
Neg logit contributions | |
civilisation | -19.818 |
Construction | -19.169 |
paradise | -18.887 |
ufact | -18.682 |
Located | -18.391 |
Token | ); |
Token ID | 1776 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
fewer | +26.338 |
vs | +25.674 |
percentages | +25.601 |
percentile | +25.212 |
average | +24.954 |
Neg logit contributions | |
ufact | -19.657 |
civilisation | -19.501 |
Construction | -18.585 |
Building | -17.624 |
Located | -17.158 |
Token | she |
Token ID | 673 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
percentages | +13.719 |
percentage | +12.681 |
percentile | +12.610 |
unfavorable | +12.507 |
inaccur | +12.316 |
Neg logit contributions | |
civilisation | -9.300 |
Construction | -8.955 |
Located | -8.453 |
ufact | -8.417 |
issance | -8.395 |
Token | was |
Token ID | 373 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
percentages | +13.827 |
percentile | +12.957 |
inaccur | +12.855 |
percentage | +12.756 |
unfavorable | +12.666 |
Neg logit contributions | |
civilisation | -8.987 |
Construction | -8.749 |
paradise | -8.062 |
ufact | -7.976 |
Building | -7.963 |
Token | not |
Token ID | 407 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
percentages | +23.558 |
unfavorable | +23.191 |
inaccurate | +22.887 |
inaccur | +22.722 |
incorrect | +22.474 |
Neg logit contributions | |
ufact | -19.812 |
civilisation | -19.272 |
Construction | -19.002 |
issance | -18.700 |
Located | -17.691 |
Token | , |
Token ID | 11 |
Feature activation | +5.77e+01 |
Pos logit contributions | |
percentages | +15.541 |
percentage | +14.193 |
unfavorable | +14.146 |
inaccur | +13.995 |
percentile | +13.881 |
Neg logit contributions | |
civilisation | -16.200 |
Construction | -16.081 |
ufact | -15.946 |
issance | -15.472 |
Located | -14.964 |
Token | whereas |
Token ID | 9472 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
percentages | +33.500 |
vs | +32.961 |
percentage | +32.048 |
fewer | +31.958 |
49 | +31.225 |
Neg logit contributions | |
civilisation | -22.209 |
issance | -21.546 |
ufact | -20.542 |
Construction | -20.266 |
paradise | -19.193 |
Token | only |
Token ID | 691 |
Feature activation | +4.91e+01 |
Pos logit contributions | |
percentages | +23.202 |
fewer | +21.494 |
percentage | +21.135 |
unfavorable | +20.783 |
percent | +20.449 |
Neg logit contributions | |
civilisation | -20.872 |
ufact | -19.557 |
Construction | -19.556 |
issance | -19.227 |
Built | -18.880 |
Token | 34 |
Token ID | 4974 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
percentages | +29.140 |
percentage | +27.674 |
49 | +27.589 |
fewer | +27.519 |
47 | +27.218 |
Neg logit contributions | |
ufact | -26.397 |
issance | -25.185 |
civilisation | -24.319 |
Construction | -23.774 |
exting | -23.382 |
Token | percent |
Token ID | 1411 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
percent | +25.594 |
percentages | +23.741 |
percentage | +23.041 |
percentile | +22.069 |
percent | +21.918 |
Neg logit contributions | |
civilisation | -25.394 |
Construction | -23.509 |
Building | -23.487 |
issance | -22.917 |
Laun | -22.881 |
Token | she |
Token ID | 673 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
percentages | +25.767 |
disapprove | +25.089 |
percent | +24.925 |
percentage | +24.776 |
unfavorable | +24.491 |
Neg logit contributions | |
civilisation | -21.313 |
Construction | -19.679 |
Located | -19.627 |
Building | -19.125 |
ufact | -18.875 |
Token | was |
Token ID | 373 |
Feature activation | +2.29e+01 |
Pos logit contributions | |
percentages | +6.875 |
percentile | +6.497 |
percentage | +6.335 |
inaccur | +6.229 |
unfavorable | +6.215 |
Neg logit contributions | |
civilisation | -3.719 |
Construction | -3.562 |
paradise | -3.312 |
Located | -3.187 |
Built | -3.168 |
Token | . |
Token ID | 13 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
percentages | +18.508 |
unfavorable | +17.613 |
inaccur | +16.993 |
percentage | +16.977 |
inaccurate | +16.932 |
Neg logit contributions | |
civilisation | -17.356 |
ufact | -16.911 |
Construction | -16.669 |
issance | -16.352 |
paradise | -15.815 |
Token | are |
Token ID | 389 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
percentages | +12.271 |
percentile | +11.277 |
percentage | +11.006 |
percent | +10.919 |
vs | +10.633 |
Neg logit contributions | |
Construction | -18.421 |
civilisation | -18.081 |
ufact | -17.575 |
paradise | -17.426 |
Located | -17.279 |
Token | ." |
Token ID | 526 |
Feature activation | +1.93e+01 |
Pos logit contributions | |
percentages | +15.033 |
percentage | +13.727 |
percentile | +13.724 |
vs | +13.541 |
unfavorable | +13.477 |
Neg logit contributions | |
civilisation | -12.886 |
Construction | -12.486 |
paradise | -11.741 |
ufact | -11.725 |
Located | -11.450 |
Token | It |
Token ID | 632 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
percentages | +18.399 |
percentage | +17.183 |
pts | +17.171 |
percentile | +17.153 |
vs | +16.885 |
Neg logit contributions | |
civilisation | -14.019 |
paradise | -12.319 |
ufact | -12.264 |
Construction | -12.161 |
rebuilt | -11.742 |
Token | shows |
Token ID | 2523 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
percentages | +17.033 |
percentile | +15.804 |
percentage | +15.482 |
inaccur | +15.314 |
fewer | +14.920 |
Neg logit contributions | |
civilisation | -16.263 |
Construction | -16.071 |
Built | -15.175 |
Building | -15.068 |
Located | -14.881 |
Token | that |
Token ID | 326 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
percentages | +19.054 |
fewer | +17.255 |
percentage | +17.025 |
unfavorable | +16.654 |
percentile | +16.615 |
Neg logit contributions | |
civilisation | -17.039 |
Construction | -16.790 |
ufact | -16.270 |
Built | -16.058 |
Located | -15.889 |
Token | about |
Token ID | 546 |
Feature activation | +4.90e+01 |
Pos logit contributions | |
percentages | +28.861 |
fewer | +27.037 |
percentage | +26.890 |
unfavorable | +25.823 |
average | +25.385 |
Neg logit contributions | |
ufact | -19.274 |
Construction | -19.257 |
Built | -18.752 |
civilisation | -18.687 |
Located | -18.358 |
Token | half |
Token ID | 2063 |
Feature activation | +5.18e+01 |
Pos logit contributions | |
percentages | +30.690 |
percentage | +28.947 |
fewer | +28.809 |
average | +27.838 |
percentile | +27.562 |
Neg logit contributions | |
ufact | -23.808 |
issance | -22.848 |
Construction | -22.689 |
Built | -22.559 |
Located | -22.491 |
Token | the |
Token ID | 262 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
percentages | +31.021 |
disapprove | +30.697 |
percent | +30.487 |
percentage | +29.980 |
of | +29.919 |
Neg logit contributions | |
civilisation | -21.715 |
Located | -21.127 |
ufact | -20.916 |
issance | -20.600 |
Construction | -20.504 |
Token | country |
Token ID | 1499 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
percentages | +25.902 |
percentage | +24.450 |
average | +22.957 |
respondents | +22.957 |
unfavorable | +22.874 |
Neg logit contributions | |
Construction | -18.519 |
ufact | -18.044 |
civilisation | -17.841 |
Built | -17.515 |
Located | -17.058 |
Token | doesn |
Token ID | 1595 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
percentages | +18.680 |
percentile | +17.039 |
percentage | +16.968 |
disapprove | +16.949 |
inaccur | +16.694 |
Neg logit contributions | |
civilisation | -18.750 |
Construction | -18.630 |
ufact | -17.693 |
Built | -17.542 |
Located | -17.511 |
Token | 't |
Token ID | 470 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
percentages | +7.721 |
percentile | +7.443 |
percent | +7.146 |
vs | +7.054 |
percentage | +7.050 |
Neg logit contributions | |
civilisation | -23.468 |
arrang | -23.381 |
ufact | -22.776 |
neighb | -22.204 |
exting | -22.041 |
Token | reg |
Token ID | 2301 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
percentages | +8.909 |
percentile | +7.987 |
percentage | +7.729 |
regress | +7.531 |
percent | +7.529 |
Neg logit contributions | |
civilisation | -10.980 |
paradise | -10.239 |
Construction | -10.117 |
ufact | -9.723 |
Built | -9.712 |
Token | ression |
Token ID | 2234 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
percentages | +3.718 |
percentile | +3.476 |
percentage | +3.365 |
unfavorable | +3.262 |
pts | +3.261 |
Neg logit contributions | |
civilisation | -2.988 |
Construction | -2.848 |
paradise | -2.772 |
Built | -2.646 |
Located | -2.628 |
Token | if |
Token ID | 611 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
percentages | +11.283 |
percentile | +10.204 |
percentage | +10.033 |
regress | +9.640 |
vs | +9.531 |
Neg logit contributions | |
civilisation | -12.570 |
Construction | -11.832 |
paradise | -11.578 |
Located | -11.428 |
Built | -11.365 |
Token | a |
Token ID | 257 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
percentages | +17.271 |
percentile | +15.846 |
percentage | +15.815 |
fewer | +15.485 |
unfavorable | +15.237 |
Neg logit contributions | |
civilisation | -13.489 |
Construction | -13.152 |
ufact | -12.596 |
paradise | -12.435 |
Built | -12.291 |
Token | sufficient |
Token ID | 6751 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
percentages | +9.203 |
percentile | +8.734 |
percentage | +8.566 |
statistically | +8.049 |
fewer | +7.997 |
Neg logit contributions | |
civilisation | -9.658 |
Construction | -9.508 |
paradise | -9.046 |
ufact | -8.978 |
Built | -8.969 |
Token | number |
Token ID | 1271 |
Feature activation | +4.88e+01 |
Pos logit contributions | |
percentages | +19.698 |
percentage | +19.157 |
percentile | +17.988 |
percent | +17.449 |
unfavorable | +17.080 |
Neg logit contributions | |
Construction | -15.916 |
civilisation | -15.414 |
Built | -15.139 |
ufact | -15.010 |
issance | -14.984 |
Token | of |
Token ID | 286 |
Feature activation | +3.51e+01 |
Pos logit contributions | |
percentages | +31.058 |
of | +28.906 |
percentage | +28.768 |
fewer | +28.403 |
percent | +28.387 |
Neg logit contributions | |
civilisation | -21.848 |
Construction | -21.098 |
ufact | -21.010 |
issance | -20.861 |
paradise | -20.615 |
Token | studies |
Token ID | 3640 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
percentages | +28.342 |
percentage | +26.517 |
percentile | +26.077 |
fewer | +25.694 |
percent | +25.632 |
Neg logit contributions | |
Construction | -18.171 |
civilisation | -17.735 |
ufact | -17.418 |
Built | -17.217 |
Building | -16.713 |
Token | are |
Token ID | 389 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
percentages | +14.688 |
percentile | +13.737 |
percentage | +13.657 |
vs | +13.234 |
inaccur | +13.168 |
Neg logit contributions | |
civilisation | -13.196 |
Construction | -12.713 |
Located | -11.946 |
paradise | -11.908 |
Built | -11.825 |
Token | found |
Token ID | 1043 |
Feature activation | +9.79e+00 |
Pos logit contributions | |
percentages | +0.490 |
percentile | +0.456 |
percentage | +0.439 |
pts | +0.426 |
unfavorable | +0.424 |
Neg logit contributions | |
civilisation | -0.464 |
Construction | -0.447 |
paradise | -0.434 |
Built | -0.417 |
Located | -0.414 |
Token | ( |
Token ID | 357 |
Feature activation | +2.22e+01 |
Pos logit contributions | |
percentages | +9.547 |
percentile | +8.834 |
percentage | +8.708 |
unfavorable | +8.571 |
inaccur | +8.436 |
Neg logit contributions | |
civilisation | -8.379 |
Construction | -7.920 |
paradise | -7.710 |
Built | -7.525 |
ufact | -7.481 |
Token | has |
Token ID | 468 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
percentages | +14.660 |
percentile | +13.391 |
percentage | +13.355 |
vs | +13.179 |
fewer | +13.002 |
Neg logit contributions | |
civilisation | -12.876 |
Construction | -12.355 |
paradise | -11.937 |
ufact | -11.743 |
Building | -11.560 |
Token | a |
Token ID | 257 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
percentages | +17.432 |
percentage | +16.032 |
fewer | +15.903 |
percentile | +15.765 |
unfavorable | +15.399 |
Neg logit contributions | |
civilisation | -14.324 |
Construction | -14.239 |
paradise | -13.229 |
Located | -13.123 |
Building | -13.067 |
Token | debt |
Token ID | 5057 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
percentages | +19.293 |
percentage | +18.791 |
percentile | +18.002 |
percent | +17.577 |
unfavorable | +17.184 |
Neg logit contributions | |
Construction | -14.701 |
civilisation | -13.995 |
issance | -13.577 |
ufact | -13.572 |
Built | -13.382 |
Token | to |
Token ID | 284 |
Feature activation | +7.61e+00 |
Pos logit contributions | |
percentages | +13.071 |
percentage | +12.314 |
percentile | +12.122 |
percent | +11.535 |
unfavorable | +11.322 |
Neg logit contributions | |
civilisation | -11.203 |
Construction | -11.094 |
paradise | -10.392 |
issance | -10.120 |
ufact | -10.102 |
Token | GDP |
Token ID | 12396 |
Feature activation | +3.24e+01 |
Pos logit contributions | |
percentages | +6.035 |
percentile | +5.475 |
percentage | +5.409 |
pts | +5.022 |
percent | +5.020 |
Neg logit contributions | |
civilisation | -7.925 |
Construction | -7.790 |
paradise | -7.560 |
Located | -7.385 |
Built | -7.374 |
Token | ratio |
Token ID | 8064 |
Feature activation | +4.86e+01 |
Pos logit contributions | |
percentages | +22.615 |
percentage | +22.327 |
percentile | +21.081 |
average | +20.775 |
percent | +20.358 |
Neg logit contributions | |
Construction | -21.146 |
civilisation | -20.057 |
ufact | -19.798 |
issance | -19.639 |
Built | -19.434 |
Token | of |
Token ID | 286 |
Feature activation | +4.56e+01 |
Pos logit contributions | |
percentages | +30.346 |
fewer | +29.292 |
percentage | +29.228 |
of | +29.061 |
average | +28.011 |
Neg logit contributions | |
Construction | -20.886 |
civilisation | -20.765 |
issance | -20.739 |
eworld | -19.291 |
ufact | -19.180 |
Token | only |
Token ID | 691 |
Feature activation | +4.35e+01 |
Pos logit contributions | |
percentages | +28.835 |
fewer | +27.857 |
percentage | +27.337 |
49 | +26.992 |
0 | +26.888 |
Neg logit contributions | |
ufact | -22.313 |
civilisation | -21.358 |
issance | -21.267 |
Construction | -20.623 |
Building | -19.471 |
Token | 2 |
Token ID | 362 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
percentages | +27.754 |
percentage | +26.413 |
fewer | +26.211 |
0 | +26.158 |
49 | +25.969 |
Neg logit contributions | |
ufact | -23.460 |
issance | -22.641 |
civilisation | -22.090 |
Construction | -21.851 |
Building | -20.473 |
Token | . |
Token ID | 13 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
percentages | +22.300 |
percentage | +21.853 |
percent | +20.871 |
percentile | +20.809 |
pts | +19.910 |
Neg logit contributions | |
civilisation | -18.744 |
Construction | -18.599 |
Built | -17.918 |
Building | -17.794 |
paradise | -17.701 |
Token | 8 |
Token ID | 23 |
Feature activation | +3.62e+01 |
Pos logit contributions | |
percentages | +16.541 |
percentile | +15.915 |
percentage | +15.649 |
pts | +15.604 |
vs | +15.532 |
Neg logit contributions | |
civilisation | -20.670 |
paradise | -18.695 |
ufact | -18.678 |
arrang | -18.473 |
Construction | -18.284 |
Token | OA |
Token ID | 23621 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
percentages | +7.893 |
percentile | +7.079 |
percentage | +6.953 |
offenses | +6.506 |
fewer | +6.405 |
Neg logit contributions | |
civilisation | -11.688 |
Construction | -11.223 |
ufact | -10.963 |
paradise | -10.957 |
issance | -10.654 |
Token | ( |
Token ID | 357 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
percentages | +23.150 |
percentage | +22.038 |
percentile | +21.871 |
vs | +20.729 |
percent | +20.700 |
Neg logit contributions | |
civilisation | -18.663 |
Construction | -17.501 |
Located | -16.484 |
paradise | -16.341 |
issance | -16.189 |
Token | value |
Token ID | 8367 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
percent | +23.013 |
percentages | +22.961 |
percentage | +22.055 |
percentile | +21.753 |
percent | +21.153 |
Neg logit contributions | |
civilisation | -17.012 |
ufact | -15.159 |
paradise | -15.012 |
rebuilt | -13.733 |
Construction | -13.498 |
Token | per |
Token ID | 583 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
percentages | +24.477 |
percentage | +23.468 |
percentile | +23.352 |
vs | +22.900 |
fewer | +22.229 |
Neg logit contributions | |
civilisation | -16.049 |
Construction | -15.843 |
ufact | -15.088 |
paradise | -14.418 |
issance | -14.380 |
Token | play |
Token ID | 711 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
percentages | +15.660 |
percentile | +15.383 |
percentage | +15.172 |
fewer | +14.464 |
percent | +14.359 |
Neg logit contributions | |
Construction | -13.322 |
civilisation | -13.111 |
ufact | -12.911 |
Built | -12.340 |
Building | -12.088 |
Token | ), |
Token ID | 828 |
Feature activation | +4.84e+01 |
Pos logit contributions | |
percentage | +23.712 |
percentages | +23.585 |
percentile | +23.049 |
vs | +22.825 |
fewer | +22.541 |
Neg logit contributions | |
civilisation | -17.740 |
Construction | -17.306 |
ufact | -16.629 |
issance | -16.445 |
paradise | -16.232 |
Token | and |
Token ID | 290 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
percentages | +30.703 |
percentage | +30.365 |
percentile | +29.402 |
average | +28.834 |
percent | +28.832 |
Neg logit contributions | |
civilisation | -20.941 |
Construction | -20.721 |
ufact | -19.258 |
issance | -18.645 |
Building | -18.358 |
Token | fourth |
Token ID | 5544 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
percentages | +23.710 |
percentage | +22.658 |
percentile | +22.083 |
fewer | +21.793 |
percent | +21.528 |
Neg logit contributions | |
civilisation | -17.557 |
Construction | -17.406 |
ufact | -16.642 |
Building | -16.102 |
issance | -15.664 |
Token | in |
Token ID | 287 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
percentages | +15.396 |
percentile | +15.046 |
percentage | +14.446 |
vs | +13.877 |
percent | +13.869 |
Neg logit contributions | |
civilisation | -19.408 |
Construction | -19.094 |
ufact | -18.130 |
Building | -17.939 |
Built | -17.792 |
Token | running |
Token ID | 2491 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
percentages | +22.635 |
percentage | +21.697 |
percentile | +21.249 |
average | +20.589 |
percent | +20.532 |
Neg logit contributions | |
Construction | -16.283 |
civilisation | -16.169 |
ufact | -15.608 |
Built | -14.998 |
Located | -14.979 |
Token | back |
Token ID | 736 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
percentages | +15.270 |
percentage | +14.253 |
percentile | +14.150 |
offenses | +13.261 |
vs | +13.173 |
Neg logit contributions | |
Construction | -13.400 |
civilisation | -13.183 |
ufact | -12.635 |
Located | -12.316 |
paradise | -12.100 |
Token | is |
Token ID | 318 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
civilisation | +8.767 |
rebuilt | +8.540 |
paradise | +8.523 |
Construction | +8.055 |
Built | +7.979 |
Neg logit contributions | |
percentages | -15.541 |
percentile | -15.294 |
inacc | -14.653 |
disapprove | -14.605 |
pts | -14.602 |
Token | . |
Token ID | 13 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
civilisation | +0.382 |
Construction | +0.367 |
paradise | +0.357 |
Built | +0.339 |
Located | +0.337 |
Neg logit contributions | |
percentages | -0.477 |
percentile | -0.448 |
percentage | -0.430 |
pts | -0.422 |
unfavorable | -0.418 |
Token | Twenty |
Token ID | 22381 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
percentages | +18.250 |
vs | +16.985 |
percentage | +16.806 |
percent | +16.563 |
fewer | +16.451 |
Neg logit contributions | |
civilisation | -20.733 |
paradise | -18.359 |
arrang | -17.847 |
rebuilt | -17.832 |
ufact | -17.527 |
Token | - |
Token ID | 12 |
Feature activation | +3.23e+01 |
Pos logit contributions | |
percentages | +23.453 |
percent | +23.045 |
percentage | +22.345 |
percentile | +21.216 |
fewer | +20.714 |
Neg logit contributions | |
civilisation | -22.355 |
Construction | -20.879 |
issance | -20.577 |
Built | -20.286 |
ufact | -19.637 |
Token | seven |
Token ID | 26548 |
Feature activation | +3.73e+01 |
Pos logit contributions | |
percent | +20.784 |
percentages | +20.637 |
percent | +19.198 |
percentage | +19.003 |
percentile | +18.783 |
Neg logit contributions | |
civilisation | -24.896 |
ufact | -22.001 |
issance | -21.190 |
Construction | -20.951 |
paradise | -20.889 |
Token | percent |
Token ID | 1411 |
Feature activation | +4.80e+01 |
Pos logit contributions | |
percent | +26.214 |
percentages | +25.231 |
percentage | +24.448 |
percentile | +22.931 |
percent | +21.807 |
Neg logit contributions | |
civilisation | -25.927 |
Construction | -24.904 |
ufact | -24.651 |
Built | -24.549 |
issance | -24.294 |
Token | in |
Token ID | 287 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
disapprove | +29.881 |
percentages | +29.141 |
percent | +28.835 |
of | +28.368 |
percentage | +28.361 |
Neg logit contributions | |
civilisation | -22.410 |
Located | -21.401 |
Construction | -21.183 |
ufact | -21.119 |
Built | -20.999 |
Token | Ohio |
Token ID | 6835 |
Feature activation | +4.51e+01 |
Pos logit contributions | |
percentages | +21.976 |
percentage | +20.374 |
fewer | +19.650 |
percent | +19.339 |
unfavorable | +19.316 |
Neg logit contributions | |
civilisation | -20.304 |
Construction | -20.296 |
issance | -19.919 |
ufact | -19.833 |
Built | -19.278 |
Token | and |
Token ID | 290 |
Feature activation | +4.35e+01 |
Pos logit contributions | |
disapprove | +28.776 |
percentages | +27.619 |
vs | +27.511 |
hate | +27.094 |
percentage | +26.822 |
Neg logit contributions | |
civilisation | -21.931 |
Construction | -20.619 |
ufact | -20.600 |
issance | -20.436 |
Located | -20.417 |
Token | 32 |
Token ID | 3933 |
Feature activation | +4.38e+01 |
Pos logit contributions | |
percentages | +28.216 |
fewer | +27.480 |
49 | +26.684 |
percentage | +26.339 |
47 | +26.132 |
Neg logit contributions | |
ufact | -23.199 |
issance | -21.726 |
Construction | -21.267 |
civilisation | -21.211 |
Built | -21.206 |
Token | percent |
Token ID | 1411 |
Feature activation | +3.76e+01 |
Pos logit contributions | |
percent | +27.670 |
percentages | +25.635 |
percentage | +25.176 |
percentile | +23.573 |
fewer | +22.205 |
Neg logit contributions | |
ufact | -31.685 |
civilisation | -31.008 |
exting | -30.375 |
arrang | -29.470 |
Nitrome | -29.220 |
Token | future |
Token ID | 2003 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
civilisation | +19.379 |
Construction | +18.850 |
paradise | +18.465 |
rebuilt | +17.929 |
Built | +17.720 |
Neg logit contributions | |
percentages | -9.236 |
percentile | -8.346 |
unfavorable | -7.778 |
pts | -7.651 |
percentage | -7.510 |
Token | stores |
Token ID | 7000 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
civilisation | +21.348 |
paradise | +20.629 |
Construction | +20.129 |
rebuilt | +19.542 |
refurb | +19.539 |
Neg logit contributions | |
percentages | -12.592 |
percentile | -11.811 |
unfavorable | -11.202 |
pts | -11.190 |
disapprove | -11.087 |
Token | . |
Token ID | 13 |
Feature activation | -4.19e+01 |
Pos logit contributions | |
civilisation | +25.854 |
paradise | +25.115 |
Construction | +25.084 |
rebuilt | +24.508 |
transformed | +23.823 |
Neg logit contributions | |
percentages | -17.778 |
percentile | -16.728 |
pts | -15.739 |
inacc | -15.187 |
unfavorable | -14.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Construction | +24.624 |
Located | +23.218 |
Built | +22.789 |
Building | +22.703 |
Located | +22.458 |
Neg logit contributions | |
percentages | -24.802 |
unfavorable | -23.415 |
regress | -23.166 |
inaccur | -22.888 |
inconsist | -22.884 |
Token |
|
Token ID | 198 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
Construction | +6.516 |
Built | +6.040 |
Located | +6.033 |
Building | +5.878 |
paradise | +5.819 |
Neg logit contributions | |
percentages | -12.604 |
disapprove | -11.912 |
unfavorable | -11.456 |
percentile | -11.434 |
injure | -11.336 |
Token | " |
Token ID | 1 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
Construction | +18.786 |
Built | +17.106 |
Building | +16.891 |
Located | +16.728 |
Laun | +16.011 |
Neg logit contributions | |
percentages | -21.385 |
percentile | -19.544 |
unfavorable | -19.174 |
disapprove | -18.940 |
percentage | -18.861 |
Token | Opening |
Token ID | 43093 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
Construction | +29.975 |
Building | +28.373 |
Located | +27.991 |
Built | +27.826 |
Laun | +26.914 |
Neg logit contributions | |
percentages | -27.376 |
disapprove | -26.393 |
unfavorable | -25.417 |
percentile | -25.095 |
regress | -25.030 |
Token | our |
Token ID | 674 |
Feature activation | -2.63e+01 |
Pos logit contributions | |
civilisation | +19.257 |
Construction | +18.526 |
paradise | +18.356 |
Harbour | +17.561 |
transformed | +17.089 |
Neg logit contributions | |
percentages | -11.223 |
percentile | -10.545 |
unfavorable | -9.965 |
pts | -9.660 |
percent | -9.472 |
Token | Aberdeen |
Token ID | 44985 |
Feature activation | -4.04e+01 |
Pos logit contributions | |
civilisation | +22.946 |
paradise | +22.714 |
bustling | +21.252 |
Construction | +21.168 |
Harbour | +21.142 |
Neg logit contributions | |
percentages | -14.167 |
percentile | -13.413 |
criticize | -12.525 |
unfavorable | -12.516 |
pts | -12.475 |
Token | garden |
Token ID | 11376 |
Feature activation | -3.08e+01 |
Pos logit contributions | |
paradise | +28.547 |
civilisation | +27.753 |
gardens | +27.177 |
Construction | +26.800 |
building | +26.282 |
Neg logit contributions | |
percentages | -17.293 |
unfavorable | -16.327 |
percentile | -15.881 |
offenses | -15.419 |
regress | -15.307 |
Token | centre |
Token ID | 7372 |
Feature activation | -3.64e+01 |
Pos logit contributions | |
civilisation | +24.388 |
paradise | +24.139 |
transformed | +21.446 |
refurb | +21.340 |
Construction | +21.320 |
Neg logit contributions | |
percentages | -16.740 |
percentile | -15.935 |
unfavorable | -15.739 |
Percent | -15.025 |
percent | -14.891 |
Token | new |
Token ID | 649 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
civilisation | +24.460 |
paradise | +24.164 |
bustling | +22.997 |
Construction | +22.962 |
building | +22.760 |
Neg logit contributions | |
percentages | -16.356 |
percentile | -14.991 |
unfavorable | -14.340 |
criticize | -14.206 |
offenses | -14.105 |
Token | store |
Token ID | 3650 |
Feature activation | -4.03e+01 |
Pos logit contributions | |
civilisation | +27.550 |
paradise | +27.214 |
building | +25.667 |
Construction | +25.031 |
bustling | +24.954 |
Neg logit contributions | |
percentages | -16.933 |
unfavorable | -15.234 |
percentile | -15.071 |
criticize | -14.946 |
pts | -14.926 |
Token | . |
Token ID | 13 |
Feature activation | -4.00e+01 |
Pos logit contributions | |
civilisation | +27.242 |
paradise | +27.028 |
Construction | +25.710 |
rebuilt | +25.452 |
building | +25.432 |
Neg logit contributions | |
percentages | -18.854 |
percentile | -17.215 |
unfavorable | -16.479 |
pts | -16.407 |
disapprove | -16.102 |
Token |
|
Token ID | 198 |
Feature activation | -8.42e+00 |
Pos logit contributions | |
Construction | +25.042 |
Located | +24.049 |
Located | +23.626 |
Built | +23.565 |
Building | +23.506 |
Neg logit contributions | |
percentages | -22.705 |
regress | -21.976 |
unfavorable | -21.416 |
inaccur | -21.273 |
inconsist | -21.035 |
Token |
|
Token ID | 198 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
Construction | +5.488 |
Built | +5.095 |
Located | +5.091 |
civilisation | +5.006 |
paradise | +4.996 |
Neg logit contributions | |
percentages | -9.614 |
disapprove | -8.945 |
percentile | -8.738 |
unfavorable | -8.676 |
offenses | -8.572 |
Token | " |
Token ID | 1 |
Feature activation | -4.51e+01 |
Pos logit contributions | |
Construction | +16.455 |
Built | +15.025 |
Building | +14.809 |
Located | +14.717 |
Laun | +14.000 |
Neg logit contributions | |
percentages | -19.897 |
percentile | -18.311 |
unfavorable | -17.757 |
percentage | -17.610 |
disapprove | -17.500 |
Token | I |
Token ID | 40 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
Construction | +28.807 |
Building | +27.369 |
Located | +27.285 |
Built | +27.027 |
Laun | +25.579 |
Neg logit contributions | |
percentages | -26.685 |
disapprove | -25.726 |
percentile | -24.884 |
unfavorable | -24.846 |
regress | -24.635 |
Token | know |
Token ID | 760 |
Feature activation | -2.79e+01 |
Pos logit contributions | |
civilisation | +13.964 |
rebuilt | +13.507 |
paradise | +13.300 |
Construction | +12.928 |
realised | +12.749 |
Neg logit contributions | |
percentages | -11.342 |
percentile | -10.253 |
pts | -9.843 |
unfavorable | -9.840 |
offenses | -9.741 |
Token | our |
Token ID | 674 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
civilisation | +24.057 |
paradise | +22.811 |
Construction | +22.496 |
Harbour | +21.929 |
rebuilt | +21.521 |
Neg logit contributions | |
percentages | -14.393 |
percentile | -13.321 |
partName | -12.847 |
unfavorable | -12.615 |
offenses | -12.547 |
Token | customers |
Token ID | 4297 |
Feature activation | +8.78e+00 |
Pos logit contributions | |
civilisation | +22.096 |
paradise | +21.283 |
Construction | +20.110 |
countryside | +20.038 |
bustling | +19.992 |
Neg logit contributions | |
percentages | -12.720 |
percentile | -12.021 |
pts | -11.390 |
percent | -11.316 |
injure | -11.234 |
Token | in |
Token ID | 287 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
percentages | +7.293 |
percentile | +6.675 |
percentage | +6.563 |
disapprove | +6.224 |
fewer | +6.209 |
Neg logit contributions | |
civilisation | -8.671 |
Construction | -8.565 |
Located | -8.100 |
Built | -8.086 |
paradise | -8.036 |
Token | " |
Token ID | 1 |
Feature activation | -3.72e+01 |
Pos logit contributions | |
Construction | +14.694 |
Building | +13.511 |
Built | +13.509 |
Located | +13.205 |
Laun | +12.825 |
Neg logit contributions | |
percentages | -19.638 |
percentile | -18.326 |
disapprove | -17.857 |
unfavorable | -17.833 |
percentage | -17.585 |
Token | The |
Token ID | 464 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
Construction | +24.812 |
Building | +24.689 |
Laun | +23.616 |
Built | +23.572 |
Located | +23.492 |
Neg logit contributions | |
percentages | -23.936 |
disapprove | -23.429 |
percentile | -22.587 |
injure | -22.499 |
unfavorable | -22.071 |
Token | Trust |
Token ID | 9870 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
civilisation | +16.439 |
Construction | +15.889 |
paradise | +15.686 |
rebuilt | +15.487 |
Building | +15.323 |
Neg logit contributions | |
percentages | -10.909 |
percentile | -10.561 |
disapprove | -9.749 |
injure | -9.556 |
offenses | -9.543 |
Token | is |
Token ID | 318 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
civilisation | +19.630 |
rebuilt | +18.348 |
Construction | +18.282 |
envis | +18.168 |
paradise | +18.047 |
Neg logit contributions | |
percentages | -15.351 |
percentile | -14.372 |
pts | -13.635 |
unfavorable | -13.616 |
inacc | -13.499 |
Token | therefore |
Token ID | 4361 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
civilisation | +16.718 |
Construction | +15.787 |
paradise | +15.761 |
rebuilt | +15.705 |
revital | +15.248 |
Neg logit contributions | |
percentages | -13.981 |
percentile | -13.359 |
pts | -12.762 |
disapprove | -12.424 |
injure | -12.364 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.50e+01 |
Pos logit contributions | |
civilisation | +18.368 |
rebuilt | +17.705 |
building | +17.497 |
envis | +17.443 |
revital | +17.407 |
Neg logit contributions | |
percentages | -15.432 |
percentile | -15.020 |
pts | -14.481 |
inacc | -14.040 |
injure | -13.916 |
Token | to |
Token ID | 284 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
civilisation | +26.297 |
Construction | +25.228 |
revital | +25.195 |
paradise | +25.134 |
building | +25.115 |
Neg logit contributions | |
percentile | -20.360 |
percentages | -19.568 |
offenses | -18.427 |
unfavorable | -18.088 |
disapprove | -17.956 |
Token | play |
Token ID | 711 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
revital | +20.030 |
refurb | +19.951 |
civilisation | +19.880 |
envis | +19.516 |
paradise | +19.319 |
Neg logit contributions | |
percentages | -17.840 |
inacc | -16.641 |
percentile | -16.570 |
unfavorable | -16.192 |
pts | -15.952 |
Token | an |
Token ID | 281 |
Feature activation | -7.36e+00 |
Pos logit contributions | |
civilisation | +12.898 |
paradise | +11.943 |
Construction | +11.943 |
rebuilt | +11.109 |
Located | +10.923 |
Neg logit contributions | |
percentages | -12.938 |
percentile | -12.843 |
pts | -12.134 |
disapprove | -11.873 |
offenses | -11.783 |
Token | active |
Token ID | 4075 |
Feature activation | -8.17e+00 |
Pos logit contributions | |
civilisation | +6.251 |
Construction | +6.007 |
paradise | +5.749 |
rebuilt | +5.533 |
Built | +5.479 |
Neg logit contributions | |
percentages | -6.894 |
percentile | -6.578 |
pts | -6.303 |
percentage | -6.178 |
offenses | -6.159 |
Token | part |
Token ID | 636 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
civilisation | +6.255 |
Construction | +5.827 |
paradise | +5.661 |
rebuilt | +5.250 |
Building | +5.162 |
Neg logit contributions | |
percentages | -8.421 |
percentile | -7.875 |
offenses | -7.681 |
pts | -7.659 |
inaccur | -7.471 |
Token | 40 |
Token ID | 2319 |
Feature activation | +3.00e+00 |
Pos logit contributions | |
percentages | +5.319 |
percentile | +4.737 |
percentage | +4.638 |
fewer | +4.450 |
offenses | +4.328 |
Neg logit contributions | |
civilisation | -8.762 |
Construction | -8.617 |
paradise | -8.356 |
Located | -8.237 |
Built | -8.215 |
Token | years |
Token ID | 812 |
Feature activation | -9.76e+00 |
Pos logit contributions | |
percentages | +2.018 |
percentile | +1.813 |
percentage | +1.723 |
unfavorable | +1.638 |
pts | +1.636 |
Neg logit contributions | |
civilisation | -3.626 |
Construction | -3.524 |
paradise | -3.445 |
Built | -3.347 |
Located | -3.336 |
Token | , |
Token ID | 11 |
Feature activation | -5.50e+00 |
Pos logit contributions | |
civilisation | +8.285 |
Construction | +7.998 |
paradise | +7.703 |
rebuilt | +7.450 |
Built | +7.309 |
Neg logit contributions | |
percentages | -9.232 |
percentile | -8.616 |
percentage | -8.141 |
unfavorable | -8.038 |
pts | -7.951 |
Token | said |
Token ID | 531 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
civilisation | +4.513 |
Construction | +4.242 |
paradise | +4.185 |
rebuilt | +3.997 |
Built | +3.879 |
Neg logit contributions | |
percentages | -5.660 |
percentile | -5.356 |
percentage | -5.067 |
unfavorable | -4.996 |
pts | -4.961 |
Token | : |
Token ID | 25 |
Feature activation | -5.25e+00 |
Pos logit contributions | |
civilisation | +26.277 |
Construction | +25.607 |
paradise | +25.492 |
renovation | +23.936 |
refurb | +23.716 |
Neg logit contributions | |
percentages | -15.614 |
percentile | -14.726 |
partName | -14.129 |
percent | -13.797 |
criticize | -13.586 |
Token | " |
Token ID | 366 |
Feature activation | -4.50e+01 |
Pos logit contributions | |
Construction | +4.207 |
civilisation | +4.137 |
paradise | +3.969 |
Built | +3.894 |
Located | +3.891 |
Neg logit contributions | |
percentages | -5.380 |
percentile | -4.958 |
unfavorable | -4.796 |
disapprove | -4.790 |
offenses | -4.769 |
Token | I |
Token ID | 40 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
Construction | +29.275 |
Building | +27.930 |
Located | +27.823 |
Built | +27.619 |
Laun | +25.973 |
Neg logit contributions | |
percentages | -25.190 |
percentile | -23.528 |
disapprove | -23.391 |
unfavorable | -23.009 |
indict | -22.718 |
Token | 'm |
Token ID | 1101 |
Feature activation | -6.53e+00 |
Pos logit contributions | |
civilisation | +11.545 |
paradise | +10.987 |
rebuilt | +10.921 |
Construction | +10.848 |
Built | +10.400 |
Neg logit contributions | |
percentages | -10.235 |
percentile | -9.292 |
pts | -8.916 |
unfavorable | -8.860 |
offenses | -8.856 |
Token | so |
Token ID | 523 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
civilisation | +5.295 |
Construction | +5.004 |
paradise | +4.998 |
rebuilt | +4.678 |
Built | +4.572 |
Neg logit contributions | |
percentages | -6.669 |
percentile | -6.297 |
percentage | -6.004 |
pts | -5.932 |
offenses | -5.909 |
Token | proud |
Token ID | 6613 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
civilisation | +12.344 |
Construction | +11.628 |
paradise | +11.600 |
rebuilt | +11.147 |
transformed | +10.891 |
Neg logit contributions | |
percentages | -16.093 |
percentile | -15.394 |
offenses | -14.547 |
inacc | -14.488 |
pts | -14.243 |
Token | to |
Token ID | 284 |
Feature activation | -2.84e+01 |
Pos logit contributions | |
civilisation | +21.045 |
Construction | +20.589 |
paradise | +20.043 |
Built | +19.387 |
Harbour | +19.182 |
Neg logit contributions | |
percentages | -9.770 |
percentile | -8.755 |
unfavorable | -8.112 |
offenses | -7.987 |
disapprove | -7.944 |
Token | have |
Token ID | 423 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
civilisation | +16.091 |
rebuilt | +15.789 |
Construction | +15.618 |
paradise | +15.460 |
Built | +15.157 |
Neg logit contributions | |
percentages | -13.158 |
percentile | -12.621 |
unfavorable | -11.259 |
offenses | -11.242 |
inacc | -11.198 |
Token | now |
Token ID | 783 |
Feature activation | -3.42e+01 |
Pos logit contributions | |
rebuilt | +21.837 |
civilisation | +21.737 |
paradise | +21.107 |
transformed | +20.816 |
Construction | +20.255 |
Neg logit contributions | |
percentages | -15.559 |
percentile | -15.266 |
disapprove | -14.305 |
percent | -14.093 |
Percent | -13.638 |
Token | returned |
Token ID | 4504 |
Feature activation | -2.98e+01 |
Pos logit contributions | |
rebuilt | +24.462 |
transformed | +23.617 |
civilisation | +23.048 |
paradise | +22.845 |
realised | +22.715 |
Neg logit contributions | |
percentile | -18.564 |
percentages | -18.173 |
inacc | -16.952 |
disapprove | -16.906 |
percent | -16.394 |
Token | to |
Token ID | 284 |
Feature activation | -2.79e+01 |
Pos logit contributions | |
civilisation | +21.959 |
paradise | +21.346 |
rebuilt | +19.751 |
Construction | +19.567 |
bustling | +19.311 |
Neg logit contributions | |
percentile | -18.492 |
percentages | -18.491 |
disapprove | -16.490 |
inacc | -16.222 |
percent | -16.092 |
Token | Ireland |
Token ID | 7517 |
Feature activation | -3.02e+01 |
Pos logit contributions | |
civilisation | +22.731 |
paradise | +22.070 |
bustling | +20.204 |
rebuilt | +20.115 |
revital | +19.949 |
Neg logit contributions | |
percentile | -16.600 |
percentages | -16.544 |
pts | -14.463 |
percent | -14.371 |
unfavorable | -14.298 |
Token | and |
Token ID | 290 |
Feature activation | -4.49e+01 |
Pos logit contributions | |
civilisation | +22.068 |
paradise | +21.855 |
rebuilt | +21.448 |
Construction | +21.407 |
revital | +20.636 |
Neg logit contributions | |
percentages | -17.612 |
percentile | -17.348 |
inacc | -15.763 |
disapprove | -15.520 |
pts | -15.243 |
Token | set |
Token ID | 900 |
Feature activation | -1.48e+01 |
Pos logit contributions | |
rebuilt | +29.690 |
civilisation | +29.033 |
transformed | +28.068 |
paradise | +27.752 |
refurb | +27.555 |
Neg logit contributions | |
percentile | -18.274 |
percentages | -18.008 |
inacc | -16.304 |
percent | -16.110 |
unfavorable | -15.689 |
Token | up |
Token ID | 510 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
civilisation | +13.154 |
Construction | +12.394 |
paradise | +12.382 |
Built | +11.767 |
rebuilt | +11.493 |
Neg logit contributions | |
percentages | -11.626 |
percentile | -11.514 |
disapprove | -10.325 |
unfavorable | -10.215 |
percentage | -10.145 |
Token | Black |
Token ID | 2619 |
Feature activation | -1.41e+01 |
Pos logit contributions | |
civilisation | +18.819 |
paradise | +18.357 |
Construction | +17.775 |
Located | +17.330 |
Harbour | +17.240 |
Neg logit contributions | |
percentages | -15.142 |
percentile | -14.958 |
unfavorable | -13.837 |
disapprove | -13.716 |
percent | -13.178 |
Token | Donkey |
Token ID | 43823 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
civilisation | +8.653 |
Construction | +7.991 |
paradise | +7.797 |
Harbour | +7.694 |
Located | +7.498 |
Neg logit contributions | |
percentages | -15.079 |
percentile | -14.347 |
pts | -13.899 |
percentage | -13.730 |
unfavorable | -13.712 |
Token | brewery |
Token ID | 22120 |
Feature activation | -2.87e+01 |
Pos logit contributions | |
paradise | +25.801 |
Construction | +25.635 |
civilisation | +25.450 |
Located | +24.744 |
rebuilt | +24.490 |
Neg logit contributions | |
percentile | -17.171 |
percentages | -16.815 |
unfavorable | -15.308 |
pts | -14.968 |
inacc | -14.871 |
Token | UK |
Token ID | 3482 |
Feature activation | -3.25e+01 |
Pos logit contributions | |
civilisation | +21.718 |
countryside | +20.597 |
paradise | +20.524 |
bustling | +19.980 |
revital | +19.692 |
Neg logit contributions | |
percentages | -16.740 |
percentile | -15.476 |
pts | -15.002 |
unfavorable | -14.872 |
disapprove | -14.791 |
Token | and |
Token ID | 290 |
Feature activation | -3.88e+01 |
Pos logit contributions | |
civilisation | +25.026 |
Construction | +24.196 |
paradise | +23.598 |
rebuilt | +22.886 |
Located | +22.736 |
Neg logit contributions | |
percentages | -18.394 |
percentile | -16.051 |
inacc | -15.625 |
pts | -15.527 |
disapprove | -15.180 |
Token | the |
Token ID | 262 |
Feature activation | -3.25e+01 |
Pos logit contributions | |
civilisation | +28.824 |
paradise | +26.283 |
revital | +25.767 |
transformed | +25.750 |
countryside | +25.423 |
Neg logit contributions | |
percentages | -17.463 |
percentile | -16.412 |
percent | -16.035 |
unfavorable | -15.269 |
inacc | -15.224 |
Token | benchmark |
Token ID | 18335 |
Feature activation | -3.70e+01 |
Pos logit contributions | |
civilisation | +26.841 |
countryside | +25.657 |
paradise | +25.528 |
Construction | +25.141 |
revital | +24.860 |
Neg logit contributions | |
percentages | -14.495 |
percentile | -13.755 |
pts | -13.397 |
criticize | -13.150 |
injure | -13.041 |
Token | from |
Token ID | 422 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
civilisation | +29.904 |
Construction | +28.297 |
paradise | +28.247 |
building | +27.387 |
redevelopment | +26.771 |
Neg logit contributions | |
percentages | -14.462 |
percentile | -13.328 |
unfavorable | -13.064 |
disapprove | -12.943 |
partName | -12.918 |
Token | which |
Token ID | 543 |
Feature activation | -4.47e+01 |
Pos logit contributions | |
civilisation | +23.321 |
paradise | +21.567 |
Construction | +21.517 |
Harbour | +20.331 |
architecture | +20.123 |
Neg logit contributions | |
percentages | -16.679 |
percentile | -15.750 |
unfavorable | -14.739 |
partName | -14.397 |
pts | -14.255 |
Token | we |
Token ID | 356 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
civilisation | +32.856 |
paradise | +29.672 |
Construction | +29.031 |
gardens | +28.895 |
building | +28.576 |
Neg logit contributions | |
percentages | -16.088 |
percentile | -15.364 |
partName | -14.884 |
percent | -14.646 |
pts | -14.534 |
Token | will |
Token ID | 481 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
civilisation | +12.210 |
rebuilt | +11.673 |
paradise | +11.409 |
Construction | +11.366 |
Built | +10.964 |
Neg logit contributions | |
percentages | -8.896 |
percentile | -8.170 |
inacc | -7.966 |
unfavorable | -7.916 |
pts | -7.796 |
Token | launch |
Token ID | 4219 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
civilisation | +17.922 |
paradise | +17.234 |
rebuilt | +16.980 |
revital | +16.571 |
refurb | +16.517 |
Neg logit contributions | |
percentages | -14.498 |
inacc | -13.556 |
Percent | -12.956 |
unfavorable | -12.896 |
percentile | -12.820 |
Token | all |
Token ID | 477 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
civilisation | +28.790 |
Construction | +27.764 |
paradise | +27.731 |
gardens | +26.247 |
Harbour | +26.147 |
Neg logit contributions | |
percentages | -16.648 |
percentile | -15.277 |
partName | -14.884 |
unfavorable | -14.659 |
inacc | -14.601 |
Token | future |
Token ID | 2003 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
civilisation | +19.379 |
Construction | +18.850 |
paradise | +18.465 |
rebuilt | +17.929 |
Built | +17.720 |
Neg logit contributions | |
percentages | -9.236 |
percentile | -8.346 |
unfavorable | -7.778 |
pts | -7.651 |
percentage | -7.510 |
Token | � |
Token ID | 447 |
Feature activation | -9.26e+00 |
Pos logit contributions | |
civilisation | +6.824 |
Construction | +6.671 |
paradise | +6.544 |
Built | +6.370 |
Located | +6.350 |
Neg logit contributions | |
percentages | -5.464 |
percentile | -5.039 |
percentage | -4.713 |
pts | -4.680 |
unfavorable | -4.633 |
Token | � |
Token ID | 251 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
civilisation | +5.429 |
Construction | +5.351 |
paradise | +5.191 |
Built | +4.960 |
rebuilt | +4.866 |
Neg logit contributions | |
percentages | -10.852 |
percentile | -10.112 |
percentage | -9.857 |
unfavorable | -9.784 |
inaccur | -9.774 |
Token | which |
Token ID | 543 |
Feature activation | -3.60e+01 |
Pos logit contributions | |
Construction | +15.475 |
civilisation | +15.427 |
paradise | +15.172 |
Located | +14.961 |
Built | +14.887 |
Neg logit contributions | |
percentages | -11.036 |
percentile | -10.188 |
percentage | -9.372 |
pts | -9.320 |
unfavorable | -9.196 |
Token | the |
Token ID | 262 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
rebuilt | +26.004 |
transformed | +25.825 |
civilisation | +25.617 |
Construction | +25.486 |
paradise | +25.138 |
Neg logit contributions | |
percentages | -16.478 |
percentile | -15.669 |
inacc | -14.361 |
pts | -14.172 |
unfavorable | -14.052 |
Token | book |
Token ID | 1492 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
civilisation | +12.725 |
Construction | +12.156 |
paradise | +12.067 |
rebuilt | +11.602 |
Built | +11.453 |
Neg logit contributions | |
percentages | -10.367 |
percentile | -9.711 |
pts | -9.013 |
percentage | -8.791 |
offenses | -8.650 |
Token | said |
Token ID | 531 |
Feature activation | -4.38e+01 |
Pos logit contributions | |
civilisation | +2.502 |
Construction | +2.414 |
paradise | +2.363 |
Built | +2.268 |
rebuilt | +2.253 |
Neg logit contributions | |
percentages | -2.196 |
percentile | -2.030 |
percentage | -1.945 |
pts | -1.882 |
unfavorable | -1.879 |
Token | was |
Token ID | 373 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
transformed | +28.404 |
rebuilt | +28.244 |
Construction | +28.135 |
paradise | +27.761 |
revital | +27.748 |
Neg logit contributions | |
percentages | -17.292 |
percentile | -16.554 |
inacc | -15.791 |
pts | -14.941 |
disapprove | -14.333 |
Token | later |
Token ID | 1568 |
Feature activation | -3.27e+01 |
Pos logit contributions | |
paradise | +19.328 |
civilisation | +19.254 |
Construction | +19.006 |
rebuilt | +18.949 |
Built | +18.856 |
Neg logit contributions | |
percentages | -13.280 |
percentile | -12.093 |
pts | -11.062 |
percentage | -11.046 |
inacc | -10.934 |
Token | called |
Token ID | 1444 |
Feature activation | -1.62e+01 |
Pos logit contributions | |
rebuilt | +25.866 |
transformed | +24.778 |
refurb | +24.539 |
renovated | +24.345 |
revital | +23.598 |
Neg logit contributions | |
percentages | -17.106 |
percentile | -16.724 |
inacc | -14.812 |
pts | -14.295 |
disapprove | -14.295 |
Token | the |
Token ID | 262 |
Feature activation | -1.79e+01 |
Pos logit contributions | |
civilisation | +14.921 |
Construction | +14.604 |
paradise | +14.571 |
Located | +13.918 |
Harbour | +13.747 |
Neg logit contributions | |
percentages | -11.634 |
percentile | -10.569 |
percentage | -9.943 |
pts | -9.891 |
inacc | -9.822 |
Token | Stephen |
Token ID | 7970 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
civilisation | +16.666 |
paradise | +16.379 |
Construction | +16.188 |
Located | +15.482 |
rebuilt | +15.467 |
Neg logit contributions | |
percentages | -12.117 |
percentile | -10.906 |
inacc | -10.258 |
pts | -10.234 |
unfavorable | -10.227 |
Token | D |
Token ID | 360 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
civilisation | +20.909 |
Construction | +19.446 |
paradise | +19.352 |
Harbour | +18.916 |
bustling | +18.103 |
Neg logit contributions | |
percentages | -15.537 |
percentile | -14.419 |
unfavorable | -13.669 |
regress | -13.229 |
pts | -13.195 |
Token | obbies |
Token ID | 41372 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
Construction | +8.252 |
civilisation | +8.099 |
Built | +7.698 |
paradise | +7.688 |
Located | +7.582 |
Neg logit contributions | |
percentages | -10.924 |
percentile | -10.323 |
percentage | -9.918 |
unfavorable | -9.837 |
inaccur | -9.708 |
Token | , |
Token ID | 11 |
Feature activation | -7.92e+00 |
Pos logit contributions | |
civilisation | +19.126 |
Construction | +18.820 |
paradise | +18.525 |
Built | +17.615 |
Harbour | +17.276 |
Neg logit contributions | |
percentages | -15.294 |
percentile | -14.093 |
unfavorable | -13.601 |
regress | -12.948 |
offenses | -12.782 |
Token | said |
Token ID | 531 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
civilisation | +6.339 |
Construction | +5.988 |
paradise | +5.866 |
rebuilt | +5.568 |
Built | +5.464 |
Neg logit contributions | |
percentages | -8.083 |
percentile | -7.715 |
percentage | -7.225 |
unfavorable | -7.186 |
offenses | -7.130 |
Token | : |
Token ID | 25 |
Feature activation | -6.68e+00 |
Pos logit contributions | |
civilisation | +24.234 |
Construction | +23.659 |
paradise | +23.241 |
refurb | +21.646 |
renovation | +21.592 |
Neg logit contributions | |
percentages | -15.974 |
percentile | -15.056 |
criticize | -13.900 |
percent | -13.863 |
partName | -13.811 |
Token | " |
Token ID | 366 |
Feature activation | -4.37e+01 |
Pos logit contributions | |
Construction | +5.309 |
civilisation | +5.235 |
paradise | +4.975 |
Built | +4.896 |
Located | +4.872 |
Neg logit contributions | |
percentages | -6.794 |
percentile | -6.316 |
unfavorable | -6.130 |
disapprove | -6.046 |
offenses | -6.045 |
Token | The |
Token ID | 464 |
Feature activation | -2.86e+01 |
Pos logit contributions | |
Construction | +28.326 |
Located | +27.069 |
Building | +27.031 |
Built | +26.758 |
Laun | +25.458 |
Neg logit contributions | |
percentages | -25.899 |
percentile | -24.355 |
disapprove | -24.145 |
unfavorable | -23.909 |
indict | -23.215 |
Token | Aberdeen |
Token ID | 44985 |
Feature activation | -3.47e+01 |
Pos logit contributions | |
civilisation | +24.805 |
paradise | +23.896 |
Construction | +23.630 |
renovation | +23.018 |
revital | +22.898 |
Neg logit contributions | |
percentages | -13.962 |
percentile | -13.220 |
pts | -12.810 |
criticize | -12.419 |
injure | -12.234 |
Token | store |
Token ID | 3650 |
Feature activation | -3.62e+01 |
Pos logit contributions | |
civilisation | +26.848 |
Construction | +26.159 |
paradise | +26.045 |
Harbour | +25.342 |
countryside | +25.134 |
Neg logit contributions | |
percentages | -16.724 |
unfavorable | -15.261 |
percentile | -14.932 |
regress | -14.887 |
pts | -14.863 |
Token | is |
Token ID | 318 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
civilisation | +27.880 |
transformed | +26.302 |
paradise | +26.261 |
revital | +25.819 |
rebuilt | +25.529 |
Neg logit contributions | |
percentages | -16.553 |
percentile | -15.393 |
unfavorable | -15.358 |
disapprove | -15.095 |
pts | -14.981 |
Token | a |
Token ID | 257 |
Feature activation | -3.44e+01 |
Pos logit contributions | |
civilisation | +18.719 |
paradise | +18.691 |
rebuilt | +17.821 |
transformed | +17.529 |
Construction | +17.271 |
Neg logit contributions | |
percentages | -14.394 |
percentile | -12.892 |
disapprove | -12.649 |
pts | -12.610 |
percent | -12.344 |
Token | in |
Token ID | 287 |
Feature activation | -3.90e+01 |
Pos logit contributions | |
civilisation | +14.329 |
Construction | +13.805 |
paradise | +13.156 |
rebuilt | +12.829 |
Building | +12.736 |
Neg logit contributions | |
percentages | -12.772 |
percentile | -12.023 |
offenses | -11.215 |
pts | -11.093 |
percentage | -11.003 |
Token | the |
Token ID | 262 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
civilisation | +27.052 |
revital | +26.628 |
building | +26.554 |
refurb | +26.113 |
organising | +26.017 |
Neg logit contributions | |
percentile | -17.635 |
percentages | -17.366 |
percent | -15.762 |
pts | -15.693 |
disapprove | -15.487 |
Token | new |
Token ID | 649 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
civilisation | +26.589 |
revital | +26.256 |
refurb | +25.828 |
rebuilt | +25.724 |
Construction | +25.724 |
Neg logit contributions | |
percentages | -16.533 |
percentile | -16.299 |
injure | -14.919 |
disapprove | -14.722 |
criticize | -14.278 |
Token | Fans |
Token ID | 24964 |
Feature activation | -5.83e+00 |
Pos logit contributions | |
civilisation | +18.892 |
paradise | +17.794 |
Construction | +17.775 |
Building | +17.336 |
Harbour | +17.218 |
Neg logit contributions | |
percentages | -15.025 |
percentile | -14.668 |
disapprove | -13.531 |
injure | -13.430 |
unfavorable | -13.330 |
Token | ' |
Token ID | 6 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
civilisation | +4.669 |
Construction | +4.610 |
paradise | +4.466 |
Built | +4.278 |
Building | +4.256 |
Neg logit contributions | |
percentages | -5.995 |
percentile | -5.589 |
unfavorable | -5.367 |
percentage | -5.310 |
disapprove | -5.269 |
Token | Forum |
Token ID | 14867 |
Feature activation | -4.36e+01 |
Pos logit contributions | |
civilisation | +8.812 |
paradise | +8.258 |
Construction | +8.188 |
Building | +7.747 |
Harbour | +7.560 |
Neg logit contributions | |
percentages | -18.337 |
percentile | -17.511 |
unfavorable | -16.820 |
disapprove | -16.640 |
injure | -16.605 |
Token | . |
Token ID | 13 |
Feature activation | -2.91e+01 |
Pos logit contributions | |
civilisation | +28.681 |
Construction | +27.109 |
refurb | +26.462 |
building | +26.286 |
rebuilt | +26.267 |
Neg logit contributions | |
percentages | -18.721 |
percentile | -17.403 |
percent | -16.877 |
disapprove | -16.756 |
unfavorable | -16.690 |
Token | It |
Token ID | 632 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
Construction | +20.615 |
Building | +19.998 |
Built | +19.559 |
Located | +19.534 |
Harbour | +19.239 |
Neg logit contributions | |
percentages | -18.973 |
disapprove | -18.027 |
percentile | -18.011 |
regress | -17.994 |
injure | -17.790 |
Token | is |
Token ID | 318 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
civilisation | +17.208 |
rebuilt | +16.281 |
revital | +16.199 |
envis | +16.012 |
paradise | +15.832 |
Neg logit contributions | |
percentages | -17.195 |
percentile | -16.111 |
unfavorable | -15.766 |
disapprove | -15.592 |
Percent | -15.518 |
Token | seen |
Token ID | 1775 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
civilisation | +18.015 |
paradise | +17.409 |
rebuilt | +16.850 |
Construction | +16.683 |
envis | +16.537 |
Neg logit contributions | |
percentages | -13.335 |
percentile | -12.511 |
pts | -12.150 |
disapprove | -11.939 |
percent | -11.824 |
Token | as |
Token ID | 355 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
civilisation | +12.347 |
Construction | +11.404 |
paradise | +11.374 |
rebuilt | +10.776 |
revital | +10.692 |
Neg logit contributions | |
percentages | -12.560 |
percentile | -11.863 |
pts | -11.192 |
disapprove | -11.089 |
percentage | -11.074 |
Token | ienne |
Token ID | 37938 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
civilisation | +7.649 |
Construction | +7.186 |
paradise | +7.056 |
issance | +6.798 |
Built | +6.790 |
Neg logit contributions | |
percentages | -10.145 |
percentile | -9.371 |
unfavorable | -9.075 |
percentage | -8.977 |
pts | -8.892 |
Token | describes |
Token ID | 8477 |
Feature activation | -6.63e+00 |
Pos logit contributions | |
civilisation | +0.754 |
Construction | +0.727 |
paradise | +0.708 |
Built | +0.681 |
Located | +0.675 |
Neg logit contributions | |
percentages | -0.694 |
percentile | -0.643 |
percentage | -0.616 |
unfavorable | -0.598 |
pts | -0.596 |
Token | the |
Token ID | 262 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
civilisation | +6.135 |
paradise | +5.729 |
Construction | +5.722 |
Built | +5.364 |
Located | +5.286 |
Neg logit contributions | |
percentages | -6.028 |
percentile | -5.671 |
percentage | -5.360 |
unfavorable | -5.297 |
pts | -5.208 |
Token | ideological |
Token ID | 15735 |
Feature activation | -7.06e+00 |
Pos logit contributions | |
civilisation | +16.100 |
paradise | +14.888 |
Construction | +14.708 |
rebuilt | +14.009 |
revital | +13.848 |
Neg logit contributions | |
percentages | -10.224 |
percentile | -9.620 |
pts | -8.901 |
unfavorable | -8.649 |
disapprove | -8.641 |
Token | context |
Token ID | 4732 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
civilisation | +7.195 |
paradise | +6.779 |
Construction | +6.705 |
rebuilt | +6.300 |
Built | +6.254 |
Neg logit contributions | |
percentages | -5.774 |
percentile | -5.373 |
percentage | -5.027 |
pts | -5.002 |
unfavorable | -4.966 |
Token | that |
Token ID | 326 |
Feature activation | -4.29e+01 |
Pos logit contributions | |
civilisation | +14.612 |
Construction | +14.067 |
paradise | +13.742 |
Built | +13.380 |
rebuilt | +13.332 |
Neg logit contributions | |
percentages | -5.995 |
percentile | -5.436 |
percentage | -4.838 |
pts | -4.583 |
offenses | -4.517 |
Token | gave |
Token ID | 2921 |
Feature activation | -2.80e+01 |
Pos logit contributions | |
civilisation | +31.500 |
transformed | +30.184 |
rebuilt | +28.377 |
paradise | +27.868 |
revital | +27.715 |
Neg logit contributions | |
percentages | -15.321 |
percentile | -14.555 |
percent | -13.995 |
pts | -13.258 |
injure | -12.572 |
Token | birth |
Token ID | 4082 |
Feature activation | -2.00e+01 |
Pos logit contributions | |
civilisation | +24.842 |
paradise | +22.062 |
Construction | +21.216 |
transformed | +20.688 |
Built | +20.552 |
Neg logit contributions | |
percentages | -15.230 |
percentile | -13.982 |
percent | -13.350 |
offenses | -12.462 |
pts | -12.380 |
Token | to |
Token ID | 284 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
civilisation | +16.882 |
Construction | +15.727 |
paradise | +15.577 |
issance | +14.668 |
Located | +14.612 |
Neg logit contributions | |
percentages | -14.209 |
percentile | -13.298 |
percentage | -12.419 |
unfavorable | -12.177 |
inacc | -12.076 |
Token | this |
Token ID | 428 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
civilisation | +10.639 |
paradise | +9.731 |
Construction | +9.453 |
Built | +8.989 |
rebuilt | +8.987 |
Neg logit contributions | |
percentages | -9.672 |
percentile | -9.127 |
unfavorable | -8.516 |
percentage | -8.488 |
pts | -8.426 |
Token | field |
Token ID | 2214 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
civilisation | +15.489 |
paradise | +14.373 |
Construction | +13.690 |
rebuilt | +13.540 |
revital | +13.290 |
Neg logit contributions | |
percentages | -11.106 |
percentile | -10.140 |
pts | -9.580 |
offenses | -9.409 |
percent | -9.341 |
Token | Museum |
Token ID | 9594 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
civilisation | +20.041 |
Construction | +18.417 |
paradise | +17.989 |
Harbour | +17.886 |
rebuilt | +17.531 |
Neg logit contributions | |
percentages | -13.593 |
percentile | -12.465 |
unfavorable | -11.607 |
pts | -11.483 |
percentage | -11.227 |
Token | in |
Token ID | 287 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
civilisation | +14.966 |
Construction | +14.390 |
paradise | +13.937 |
Built | +13.751 |
rebuilt | +13.637 |
Neg logit contributions | |
percentages | -7.312 |
percentile | -6.922 |
pts | -5.957 |
unfavorable | -5.928 |
percentage | -5.876 |
Token | northern |
Token ID | 7840 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
civilisation | +20.115 |
paradise | +18.723 |
rebuilt | +18.597 |
Construction | +18.378 |
Harbour | +18.098 |
Neg logit contributions | |
percentages | -15.099 |
percentile | -14.632 |
disapprove | -13.342 |
pts | -13.267 |
inaccur | -13.197 |
Token | Siber |
Token ID | 28394 |
Feature activation | -9.12e+00 |
Pos logit contributions | |
civilisation | +14.243 |
paradise | +12.734 |
rebuilt | +11.980 |
Construction | +11.968 |
countryside | +11.921 |
Neg logit contributions | |
percentages | -18.219 |
percentile | -17.573 |
percent | -16.432 |
pts | -16.402 |
disapprove | -16.351 |
Token | a |
Token ID | 64 |
Feature activation | -2.33e+01 |
Pos logit contributions | |
civilisation | +7.548 |
Construction | +7.076 |
paradise | +6.916 |
Built | +6.816 |
rebuilt | +6.677 |
Neg logit contributions | |
percentages | -8.986 |
percentile | -8.369 |
percentage | -8.017 |
unfavorable | -7.941 |
pts | -7.913 |
Token | and |
Token ID | 290 |
Feature activation | -4.28e+01 |
Pos logit contributions | |
civilisation | +20.956 |
paradise | +19.357 |
countryside | +19.164 |
Construction | +19.156 |
Harbour | +18.955 |
Neg logit contributions | |
percentages | -14.863 |
percentile | -14.112 |
unfavorable | -12.751 |
inacc | -12.421 |
pts | -12.401 |
Token | named |
Token ID | 3706 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
civilisation | +31.033 |
rebuilt | +30.166 |
Harbour | +29.089 |
transformed | +28.792 |
paradise | +28.408 |
Neg logit contributions | |
percentages | -16.555 |
percentile | -16.116 |
inacc | -14.889 |
pts | -14.636 |
percent | -14.351 |
Token | Ly |
Token ID | 9334 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
civilisation | +10.525 |
paradise | +9.909 |
Construction | +9.744 |
Built | +9.248 |
Harbour | +9.234 |
Neg logit contributions | |
percentages | -9.637 |
percentile | -9.060 |
percentage | -8.467 |
unfavorable | -8.313 |
offenses | -8.302 |
Token | uba |
Token ID | 22013 |
Feature activation | -1.51e+01 |
Pos logit contributions | |
civilisation | +4.214 |
Construction | +4.086 |
paradise | +3.870 |
Built | +3.805 |
Located | +3.733 |
Neg logit contributions | |
percentages | -5.258 |
percentile | -4.939 |
percentage | -4.695 |
unfavorable | -4.641 |
inaccur | -4.639 |
Token | , |
Token ID | 11 |
Feature activation | -9.38e+00 |
Pos logit contributions | |
civilisation | +15.131 |
Construction | +14.309 |
paradise | +14.141 |
Harbour | +13.696 |
issance | +13.574 |
Neg logit contributions | |
percentages | -10.369 |
percentile | -9.695 |
unfavorable | -8.833 |
inacc | -8.782 |
inaccur | -8.753 |
Token | after |
Token ID | 706 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
civilisation | +9.883 |
Construction | +9.339 |
paradise | +9.277 |
rebuilt | +8.986 |
Built | +8.979 |
Neg logit contributions | |
percentages | -6.918 |
percentile | -6.508 |
percentage | -5.953 |
pts | -5.918 |
offenses | -5.832 |
Token | on |
Token ID | 319 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
civilisation | +21.829 |
paradise | +21.167 |
rebuilt | +20.763 |
refurb | +20.122 |
transformed | +20.042 |
Neg logit contributions | |
percentages | -16.726 |
percentile | -16.439 |
Percent | -15.433 |
pts | -15.265 |
percent | -15.030 |
Token | site |
Token ID | 2524 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
civilisation | +24.286 |
paradise | +22.704 |
Construction | +22.118 |
refurb | +21.706 |
Harbour | +21.680 |
Neg logit contributions | |
percentages | -15.738 |
percentile | -15.731 |
percent | -13.940 |
Percent | -13.899 |
unfavorable | -13.342 |
Token | until |
Token ID | 1566 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
civilisation | +20.335 |
paradise | +18.972 |
Construction | +18.361 |
rebuilt | +18.317 |
refurb | +17.776 |
Neg logit contributions | |
percentages | -16.048 |
percentile | -15.652 |
pts | -14.816 |
percent | -14.666 |
Percent | -14.426 |
Token | the |
Token ID | 262 |
Feature activation | -2.82e+01 |
Pos logit contributions | |
civilisation | +30.365 |
redevelopment | +29.185 |
Construction | +28.647 |
refurb | +28.535 |
rebuilt | +28.414 |
Neg logit contributions | |
percentile | -16.829 |
percentages | -16.525 |
percent | -14.904 |
omit | -14.777 |
pts | -14.732 |
Token | area |
Token ID | 1989 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
civilisation | +22.974 |
Construction | +21.583 |
countryside | +21.581 |
paradise | +21.446 |
redevelopment | +21.304 |
Neg logit contributions | |
percentages | -15.202 |
percentile | -15.090 |
pts | -13.707 |
percent | -13.202 |
unfavorable | -13.099 |
Token | is |
Token ID | 318 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
civilisation | +26.651 |
revital | +24.544 |
transformed | +23.975 |
paradise | +23.779 |
redevelopment | +23.749 |
Neg logit contributions | |
percentages | -17.498 |
percentile | -17.082 |
percent | -16.411 |
omit | -16.306 |
pts | -16.067 |
Token | developed |
Token ID | 4166 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
civilisation | +26.904 |
transformed | +25.359 |
rebuilt | +25.119 |
revital | +24.895 |
redevelop | +24.182 |
Neg logit contributions | |
percentages | -21.100 |
percentile | -19.654 |
inacc | -19.625 |
omit | -19.011 |
percent | -18.989 |
Token | . |
Token ID | 13 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
civilisation | +22.845 |
paradise | +21.054 |
Construction | +20.862 |
rebuilt | +20.493 |
Harbour | +19.723 |
Neg logit contributions | |
percentages | -15.253 |
pts | -14.244 |
percentile | -14.185 |
inacc | -13.536 |
percent | -13.032 |
Token | The |
Token ID | 383 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
Construction | +17.381 |
Harbour | +15.908 |
civilisation | +15.665 |
Building | +15.663 |
Built | +15.505 |
Neg logit contributions | |
percentages | -18.038 |
percentile | -17.229 |
regress | -17.005 |
unfavorable | -16.547 |
inaccur | -16.478 |
Token | cost |
Token ID | 1575 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
civilisation | +18.498 |
Construction | +17.926 |
paradise | +17.508 |
refurb | +17.038 |
rebuilt | +17.015 |
Neg logit contributions | |
percentages | -10.131 |
percentile | -10.077 |
pts | -9.079 |
unfavorable | -8.972 |
criticize | -8.775 |
Token | of |
Token ID | 286 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
percentages | +8.358 |
percentile | +7.623 |
percentage | +7.531 |
inaccur | +7.027 |
vs | +7.000 |
Neg logit contributions | |
civilisation | -9.861 |
Construction | -9.604 |
paradise | -9.439 |
ufact | -9.188 |
Built | -9.187 |
Token | ied |
Token ID | 798 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
civilisation | +5.638 |
rebuilt | +5.420 |
paradise | +5.374 |
Built | +5.335 |
Construction | +5.243 |
Neg logit contributions | |
percentages | -12.065 |
percentile | -11.208 |
inacc | -10.952 |
unfavorable | -10.947 |
offenses | -10.918 |
Token | and |
Token ID | 290 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
civilisation | +11.946 |
paradise | +11.378 |
Construction | +11.152 |
rebuilt | +11.028 |
refurb | +10.573 |
Neg logit contributions | |
percentages | -8.440 |
percentile | -7.853 |
percentage | -7.237 |
inacc | -7.212 |
pts | -7.186 |
Token | remain |
Token ID | 3520 |
Feature activation | -2.93e+01 |
Pos logit contributions | |
civilisation | +27.834 |
rebuilt | +27.059 |
refurb | +26.316 |
paradise | +25.729 |
transformed | +25.725 |
Neg logit contributions | |
percentile | -14.424 |
percentages | -14.333 |
percent | -13.164 |
pts | -12.989 |
Percent | -12.873 |
Token | on |
Token ID | 319 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
civilisation | +21.829 |
paradise | +21.167 |
rebuilt | +20.763 |
refurb | +20.122 |
transformed | +20.042 |
Neg logit contributions | |
percentages | -16.726 |
percentile | -16.439 |
Percent | -15.433 |
pts | -15.265 |
percent | -15.030 |
Token | site |
Token ID | 2524 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
civilisation | +24.286 |
paradise | +22.704 |
Construction | +22.118 |
refurb | +21.706 |
Harbour | +21.680 |
Neg logit contributions | |
percentages | -15.738 |
percentile | -15.731 |
percent | -13.940 |
Percent | -13.899 |
unfavorable | -13.342 |
Token | until |
Token ID | 1566 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
civilisation | +20.335 |
paradise | +18.972 |
Construction | +18.361 |
rebuilt | +18.317 |
refurb | +17.776 |
Neg logit contributions | |
percentages | -16.048 |
percentile | -15.652 |
pts | -14.816 |
percent | -14.666 |
Percent | -14.426 |
Token | the |
Token ID | 262 |
Feature activation | -2.82e+01 |
Pos logit contributions | |
civilisation | +30.365 |
redevelopment | +29.185 |
Construction | +28.647 |
refurb | +28.535 |
rebuilt | +28.414 |
Neg logit contributions | |
percentile | -16.829 |
percentages | -16.525 |
percent | -14.904 |
omit | -14.777 |
pts | -14.732 |
Token | area |
Token ID | 1989 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
civilisation | +22.974 |
Construction | +21.583 |
countryside | +21.581 |
paradise | +21.446 |
redevelopment | +21.304 |
Neg logit contributions | |
percentages | -15.202 |
percentile | -15.090 |
pts | -13.707 |
percent | -13.202 |
unfavorable | -13.099 |
Token | is |
Token ID | 318 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
civilisation | +26.651 |
revital | +24.544 |
transformed | +23.975 |
paradise | +23.779 |
redevelopment | +23.749 |
Neg logit contributions | |
percentages | -17.498 |
percentile | -17.082 |
percent | -16.411 |
omit | -16.306 |
pts | -16.067 |
Token | developed |
Token ID | 4166 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
civilisation | +26.904 |
transformed | +25.359 |
rebuilt | +25.119 |
revital | +24.895 |
redevelop | +24.182 |
Neg logit contributions | |
percentages | -21.100 |
percentile | -19.654 |
inacc | -19.625 |
omit | -19.011 |
percent | -18.989 |
Token | . |
Token ID | 13 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
civilisation | +22.845 |
paradise | +21.054 |
Construction | +20.862 |
rebuilt | +20.493 |
Harbour | +19.723 |
Neg logit contributions | |
percentages | -15.253 |
pts | -14.244 |
percentile | -14.185 |
inacc | -13.536 |
percent | -13.032 |
Token | proud |
Token ID | 6613 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
civilisation | +12.344 |
Construction | +11.628 |
paradise | +11.600 |
rebuilt | +11.147 |
transformed | +10.891 |
Neg logit contributions | |
percentages | -16.093 |
percentile | -15.394 |
offenses | -14.547 |
inacc | -14.488 |
pts | -14.243 |
Token | to |
Token ID | 284 |
Feature activation | -2.84e+01 |
Pos logit contributions | |
civilisation | +21.045 |
Construction | +20.589 |
paradise | +20.043 |
Built | +19.387 |
Harbour | +19.182 |
Neg logit contributions | |
percentages | -9.770 |
percentile | -8.755 |
unfavorable | -8.112 |
offenses | -7.987 |
disapprove | -7.944 |
Token | be |
Token ID | 307 |
Feature activation | -3.15e+01 |
Pos logit contributions | |
civilisation | +20.053 |
refurb | +19.927 |
revital | +19.912 |
paradise | +19.623 |
rebuilt | +19.337 |
Neg logit contributions | |
percentages | -18.675 |
inacc | -16.943 |
percentile | -16.770 |
unfavorable | -16.567 |
offenses | -16.238 |
Token | able |
Token ID | 1498 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
civilisation | +22.934 |
building | +22.238 |
Construction | +22.224 |
rebuilt | +21.884 |
refurb | +21.526 |
Neg logit contributions | |
percentages | -18.260 |
percentile | -17.785 |
pts | -16.566 |
regress | -16.296 |
percent | -16.233 |
Token | to |
Token ID | 284 |
Feature activation | -2.94e+01 |
Pos logit contributions | |
civilisation | +16.011 |
paradise | +15.487 |
rebuilt | +15.243 |
refurb | +14.989 |
revital | +14.671 |
Neg logit contributions | |
percentages | -20.307 |
percentile | -18.473 |
inacc | -18.166 |
Percent | -18.145 |
offenses | -18.056 |
Token | help |
Token ID | 1037 |
Feature activation | -4.22e+01 |
Pos logit contributions | |
refurb | +21.350 |
revital | +21.159 |
civilisation | +20.768 |
paradise | +20.663 |
rebuilt | +20.308 |
Neg logit contributions | |
percentages | -17.971 |
inacc | -16.780 |
percentile | -16.017 |
offenses | -15.975 |
unfavorable | -15.966 |
Token | open |
Token ID | 1280 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
civilisation | +29.159 |
revital | +28.434 |
refurb | +27.397 |
Construction | +26.944 |
rejuven | +26.883 |
Neg logit contributions | |
percentages | -18.730 |
percentile | -16.973 |
unfavorable | -16.736 |
inacc | -16.425 |
offenses | -16.116 |
Token | the |
Token ID | 262 |
Feature activation | -3.06e+01 |
Pos logit contributions | |
civilisation | +19.335 |
paradise | +18.769 |
Construction | +18.261 |
Harbour | +17.658 |
Built | +17.282 |
Neg logit contributions | |
percentages | -15.252 |
percentile | -14.170 |
unfavorable | -13.362 |
percentage | -13.170 |
inacc | -13.029 |
Token | new |
Token ID | 649 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
civilisation | +24.460 |
paradise | +24.164 |
bustling | +22.997 |
Construction | +22.962 |
building | +22.760 |
Neg logit contributions | |
percentages | -16.356 |
percentile | -14.991 |
unfavorable | -14.340 |
criticize | -14.206 |
offenses | -14.105 |
Token | store |
Token ID | 3650 |
Feature activation | -4.03e+01 |
Pos logit contributions | |
civilisation | +27.550 |
paradise | +27.214 |
building | +25.667 |
Construction | +25.031 |
bustling | +24.954 |
Neg logit contributions | |
percentages | -16.933 |
unfavorable | -15.234 |
percentile | -15.071 |
criticize | -14.946 |
pts | -14.926 |
Token | . |
Token ID | 13 |
Feature activation | -4.00e+01 |
Pos logit contributions | |
civilisation | +27.242 |
paradise | +27.028 |
Construction | +25.710 |
rebuilt | +25.452 |
building | +25.432 |
Neg logit contributions | |
percentages | -18.854 |
percentile | -17.215 |
unfavorable | -16.479 |
pts | -16.407 |
disapprove | -16.102 |
Token | will |
Token ID | 481 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
civilisation | +12.210 |
rebuilt | +11.673 |
paradise | +11.409 |
Construction | +11.366 |
Built | +10.964 |
Neg logit contributions | |
percentages | -8.896 |
percentile | -8.170 |
inacc | -7.966 |
unfavorable | -7.916 |
pts | -7.796 |
Token | launch |
Token ID | 4219 |
Feature activation | -3.92e+01 |
Pos logit contributions | |
civilisation | +17.922 |
paradise | +17.234 |
rebuilt | +16.980 |
revital | +16.571 |
refurb | +16.517 |
Neg logit contributions | |
percentages | -14.498 |
inacc | -13.556 |
Percent | -12.956 |
unfavorable | -12.896 |
percentile | -12.820 |
Token | all |
Token ID | 477 |
Feature activation | -1.76e+01 |
Pos logit contributions | |
civilisation | +28.790 |
Construction | +27.764 |
paradise | +27.731 |
gardens | +26.247 |
Harbour | +26.147 |
Neg logit contributions | |
percentages | -16.648 |
percentile | -15.277 |
partName | -14.884 |
unfavorable | -14.659 |
inacc | -14.601 |
Token | future |
Token ID | 2003 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
civilisation | +19.379 |
Construction | +18.850 |
paradise | +18.465 |
rebuilt | +17.929 |
Built | +17.720 |
Neg logit contributions | |
percentages | -9.236 |
percentile | -8.346 |
unfavorable | -7.778 |
pts | -7.651 |
percentage | -7.510 |
Token | stores |
Token ID | 7000 |
Feature activation | -3.58e+01 |
Pos logit contributions | |
civilisation | +21.348 |
paradise | +20.629 |
Construction | +20.129 |
rebuilt | +19.542 |
refurb | +19.539 |
Neg logit contributions | |
percentages | -12.592 |
percentile | -11.811 |
unfavorable | -11.202 |
pts | -11.190 |
disapprove | -11.087 |
Token | . |
Token ID | 13 |
Feature activation | -4.19e+01 |
Pos logit contributions | |
civilisation | +25.854 |
paradise | +25.115 |
Construction | +25.084 |
rebuilt | +24.508 |
transformed | +23.823 |
Neg logit contributions | |
percentages | -17.778 |
percentile | -16.728 |
pts | -15.739 |
inacc | -15.187 |
unfavorable | -14.979 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Construction | +24.624 |
Located | +23.218 |
Built | +22.789 |
Building | +22.703 |
Located | +22.458 |
Neg logit contributions | |
percentages | -24.802 |
unfavorable | -23.415 |
regress | -23.166 |
inaccur | -22.888 |
inconsist | -22.884 |
Token |
|
Token ID | 198 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
Construction | +6.516 |
Built | +6.040 |
Located | +6.033 |
Building | +5.878 |
paradise | +5.819 |
Neg logit contributions | |
percentages | -12.604 |
disapprove | -11.912 |
unfavorable | -11.456 |
percentile | -11.434 |
injure | -11.336 |
Token | " |
Token ID | 1 |
Feature activation | -4.78e+01 |
Pos logit contributions | |
Construction | +18.786 |
Built | +17.106 |
Building | +16.891 |
Located | +16.728 |
Laun | +16.011 |
Neg logit contributions | |
percentages | -21.385 |
percentile | -19.544 |
unfavorable | -19.174 |
disapprove | -18.940 |
percentage | -18.861 |
Token | Opening |
Token ID | 43093 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
Construction | +29.975 |
Building | +28.373 |
Located | +27.991 |
Built | +27.826 |
Laun | +26.914 |
Neg logit contributions | |
percentages | -27.376 |
disapprove | -26.393 |
unfavorable | -25.417 |
percentile | -25.095 |
regress | -25.030 |
Token | our |
Token ID | 674 |
Feature activation | -2.63e+01 |
Pos logit contributions | |
civilisation | +19.257 |
Construction | +18.526 |
paradise | +18.356 |
Harbour | +17.561 |
transformed | +17.089 |
Neg logit contributions | |
percentages | -11.223 |
percentile | -10.545 |
unfavorable | -9.965 |
pts | -9.660 |
percent | -9.472 |
Token | 6 |
Token ID | 21 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
percentages | +4.730 |
percentile | +4.162 |
percentage | +3.906 |
pts | +3.684 |
vs | +3.474 |
Neg logit contributions | |
civilisation | -17.385 |
Construction | -16.688 |
paradise | -16.480 |
ufact | -16.362 |
rebuilt | -15.890 |
Token | m |
Token ID | 76 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
civilisation | +3.645 |
Construction | +3.511 |
paradise | +3.454 |
Built | +3.348 |
Located | +3.313 |
Neg logit contributions | |
percentages | -2.584 |
percentile | -2.350 |
percentage | -2.193 |
unfavorable | -2.179 |
pts | -2.157 |
Token | garden |
Token ID | 11376 |
Feature activation | -2.52e+01 |
Pos logit contributions | |
civilisation | +23.709 |
paradise | +23.143 |
Construction | +22.236 |
refurb | +22.118 |
renovation | +22.090 |
Neg logit contributions | |
percentages | -14.696 |
percentile | -13.113 |
pts | -12.342 |
offenses | -12.029 |
unfavorable | -11.993 |
Token | centre |
Token ID | 7372 |
Feature activation | -3.76e+01 |
Pos logit contributions | |
paradise | +23.576 |
civilisation | +23.501 |
renovation | +21.773 |
refurb | +21.449 |
Construction | +21.394 |
Neg logit contributions | |
percentages | -14.124 |
percentile | -12.669 |
pts | -12.230 |
unfavorable | -12.041 |
Percent | -11.763 |
Token | has |
Token ID | 468 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
civilisation | +27.230 |
paradise | +26.867 |
Construction | +25.866 |
refurb | +25.711 |
transformed | +25.697 |
Neg logit contributions | |
percentages | -17.812 |
percentile | -16.953 |
pts | -15.837 |
unfavorable | -15.664 |
partName | -15.298 |
Token | been |
Token ID | 587 |
Feature activation | -4.18e+01 |
Pos logit contributions | |
transformed | +24.215 |
civilisation | +23.856 |
rebuilt | +23.319 |
revital | +23.119 |
paradise | +23.053 |
Neg logit contributions | |
percentages | -18.111 |
percentile | -16.882 |
Percent | -16.421 |
disapprove | -16.194 |
pts | -16.080 |
Token | officially |
Token ID | 8720 |
Feature activation | -3.99e+01 |
Pos logit contributions | |
rebuilt | +26.772 |
transformed | +26.408 |
erected | +26.164 |
refurb | +26.131 |
civilisation | +25.234 |
Neg logit contributions | |
percentages | -21.091 |
percentile | -20.344 |
pts | -18.772 |
Percent | -18.482 |
offenses | -18.448 |
Token | opened |
Token ID | 4721 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
refurb | +25.016 |
rebuilt | +24.874 |
transformed | +24.862 |
erected | +24.257 |
civilisation | +24.005 |
Neg logit contributions | |
percentages | -22.005 |
percentile | -21.742 |
pts | -19.342 |
inacc | -18.947 |
Percent | -18.904 |
Token | in |
Token ID | 287 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
civilisation | +20.261 |
paradise | +20.105 |
Construction | +19.679 |
refurb | +18.962 |
rebuilt | +18.915 |
Neg logit contributions | |
percentages | -17.242 |
percentile | -16.297 |
pts | -15.346 |
unfavorable | -15.175 |
inacc | -14.843 |
Token | Aberdeen |
Token ID | 44985 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
civilisation | +20.718 |
paradise | +20.136 |
Harbour | +19.070 |
rebuilt | +19.010 |
Construction | +18.847 |
Neg logit contributions | |
percentages | -14.382 |
percentile | -13.776 |
unfavorable | -12.752 |
pts | -12.663 |
disapprove | -12.558 |
Token | , |
Token ID | 11 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
civilisation | +21.855 |
Construction | +21.323 |
Harbour | +21.068 |
paradise | +20.737 |
countryside | +20.183 |
Neg logit contributions | |
percentages | -16.252 |
percentile | -14.606 |
unfavorable | -14.127 |
regress | -13.841 |
pts | -13.759 |
Token | be |
Token ID | 307 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
civilisation | +6.643 |
paradise | +6.143 |
Construction | +5.983 |
rebuilt | +5.817 |
Built | +5.680 |
Neg logit contributions | |
percentages | -6.474 |
percentile | -5.983 |
unfavorable | -5.765 |
pts | -5.722 |
offenses | -5.642 |
Token | heard |
Token ID | 2982 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
civilisation | +8.538 |
rebuilt | +7.745 |
paradise | +7.570 |
Construction | +7.556 |
transformed | +7.466 |
Neg logit contributions | |
percentages | -13.070 |
percentile | -12.324 |
pts | -11.871 |
unfavorable | -11.848 |
disapprove | -11.846 |
Token | . |
Token ID | 13 |
Feature activation | -3.50e+01 |
Pos logit contributions | |
civilisation | +12.025 |
Construction | +11.142 |
paradise | +11.132 |
rebuilt | +10.616 |
revital | +10.397 |
Neg logit contributions | |
percentages | -11.319 |
percentile | -10.381 |
pts | -10.013 |
percentage | -9.834 |
unfavorable | -9.701 |
Token |
|
Token ID | 198 |
Feature activation | -7.72e+00 |
Pos logit contributions | |
Construction | +21.495 |
Building | +21.192 |
Located | +20.446 |
Built | +20.427 |
Laun | +20.396 |
Neg logit contributions | |
percentages | -22.815 |
disapprove | -21.910 |
injure | -21.887 |
regress | -21.760 |
percentile | -21.549 |
Token |
|
Token ID | 198 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
Construction | +5.208 |
Located | +4.830 |
Built | +4.827 |
civilisation | +4.802 |
Building | +4.724 |
Neg logit contributions | |
percentages | -8.754 |
disapprove | -8.109 |
percentile | -7.970 |
unfavorable | -7.880 |
offenses | -7.777 |
Token | " |
Token ID | 1 |
Feature activation | -4.18e+01 |
Pos logit contributions | |
Construction | +16.262 |
Building | +15.082 |
Built | +14.951 |
Located | +14.660 |
Laun | +14.333 |
Neg logit contributions | |
percentages | -20.818 |
percentile | -19.468 |
disapprove | -19.064 |
unfavorable | -18.858 |
percentage | -18.613 |
Token | We |
Token ID | 1135 |
Feature activation | -8.49e+00 |
Pos logit contributions | |
Building | +26.179 |
Construction | +26.122 |
Laun | +25.135 |
Built | +24.715 |
Located | +24.571 |
Neg logit contributions | |
percentages | -26.155 |
disapprove | -26.029 |
injure | -25.123 |
percentile | -25.053 |
unfavorable | -24.197 |
Token | welcome |
Token ID | 7062 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
civilisation | +8.766 |
rebuilt | +8.303 |
Construction | +8.267 |
paradise | +8.263 |
revital | +7.837 |
Neg logit contributions | |
percentages | -6.515 |
percentile | -5.866 |
pts | -5.526 |
unfavorable | -5.493 |
offenses | -5.434 |
Token | the |
Token ID | 262 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
civilisation | +21.371 |
paradise | +20.336 |
rebuilt | +20.139 |
revital | +20.070 |
Construction | +20.014 |
Neg logit contributions | |
percentile | -15.655 |
percentages | -15.051 |
injure | -13.725 |
percent | -13.566 |
pts | -13.464 |
Token | initiative |
Token ID | 10219 |
Feature activation | -2.69e+01 |
Pos logit contributions | |
civilisation | +23.228 |
revital | +23.024 |
rebuilt | +22.897 |
refurb | +22.580 |
Construction | +22.429 |
Neg logit contributions | |
percentages | -15.693 |
percentile | -15.570 |
injure | -14.807 |
disapprove | -14.342 |
criticize | -13.991 |
Token | by |
Token ID | 416 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
civilisation | +23.539 |
rebuilt | +22.623 |
envis | +22.593 |
paradise | +22.350 |
revital | +22.337 |
Neg logit contributions | |
percentages | -13.446 |
percentile | -12.972 |
injure | -12.422 |
inacc | -11.863 |
disapprove | -11.756 |
Token | it |
Token ID | 340 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
civilisation | +27.214 |
Construction | +25.538 |
revital | +25.458 |
paradise | +25.146 |
building | +25.099 |
Neg logit contributions | |
percentile | -17.060 |
percentages | -16.357 |
percent | -15.551 |
injure | -14.883 |
offenses | -14.663 |
Token | is |
Token ID | 318 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
civilisation | +18.794 |
revital | +17.676 |
paradise | +16.874 |
transformed | +16.782 |
rebuilt | +16.643 |
Neg logit contributions | |
percentages | -17.276 |
percentile | -16.574 |
disapprove | -16.245 |
percent | -16.203 |
Percent | -16.125 |
Token | the |
Token ID | 262 |
Feature activation | -2.63e+01 |
Pos logit contributions | |
civilisation | +20.028 |
paradise | +19.133 |
Construction | +19.001 |
transformed | +18.788 |
rebuilt | +18.713 |
Neg logit contributions | |
percentages | -13.627 |
percentile | -12.753 |
disapprove | -12.427 |
pts | -12.298 |
percent | -11.795 |
Token | first |
Token ID | 717 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
civilisation | +21.087 |
paradise | +20.366 |
Construction | +19.576 |
rebuilt | +19.218 |
revital | +19.019 |
Neg logit contributions | |
percentages | -16.218 |
percentile | -15.282 |
disapprove | -14.807 |
percent | -14.367 |
offenses | -14.176 |
Token | step |
Token ID | 2239 |
Feature activation | -3.33e+01 |
Pos logit contributions | |
civilisation | +21.703 |
paradise | +20.217 |
Construction | +19.798 |
rebuilt | +19.722 |
Building | +19.590 |
Neg logit contributions | |
percentages | -11.583 |
percentile | -10.220 |
offenses | -10.004 |
disapprove | -9.810 |
unfavorable | -9.719 |
Token | towards |
Token ID | 3371 |
Feature activation | -4.18e+01 |
Pos logit contributions | |
civilisation | +25.855 |
paradise | +23.282 |
Construction | +23.093 |
Harbour | +22.411 |
paved | +22.268 |
Neg logit contributions | |
percentages | -17.173 |
percentile | -16.649 |
disapprove | -15.251 |
injure | -15.019 |
criticize | -14.621 |
Token | Newcastle |
Token ID | 22410 |
Feature activation | -2.82e+01 |
Pos logit contributions | |
civilisation | +30.014 |
building | +28.937 |
revital | +28.783 |
paradise | +27.745 |
refurb | +27.620 |
Neg logit contributions | |
percentages | -15.980 |
percentile | -15.781 |
disapprove | -15.068 |
percent | -14.958 |
pts | -14.504 |
Token | United |
Token ID | 1578 |
Feature activation | -3.21e+01 |
Pos logit contributions | |
civilisation | +22.926 |
paradise | +21.315 |
revital | +21.188 |
Construction | +21.072 |
Building | +20.543 |
Neg logit contributions | |
percentages | -16.410 |
percentile | -15.688 |
pts | -14.251 |
unfavorable | -13.995 |
percent | -13.918 |
Token | developing |
Token ID | 5922 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
civilisation | +24.800 |
revital | +23.529 |
building | +22.830 |
paradise | +22.606 |
Construction | +22.604 |
Neg logit contributions | |
percentages | -16.881 |
percentile | -16.245 |
percent | -15.076 |
disapprove | -14.933 |
pts | -14.802 |
Token | a |
Token ID | 257 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
civilisation | +14.536 |
paradise | +13.240 |
Construction | +13.113 |
rebuilt | +12.734 |
Harbour | +12.698 |
Neg logit contributions | |
percentages | -12.121 |
percentile | -11.536 |
pts | -10.955 |
percent | -10.891 |
offenses | -10.881 |
Token | meaningful |
Token ID | 11570 |
Feature activation | -1.50e+01 |
Pos logit contributions | |
civilisation | +23.644 |
paradise | +21.836 |
rebuilt | +21.575 |
Harbour | +21.097 |
revital | +21.079 |
Neg logit contributions | |
percentages | -14.777 |
offenses | -13.759 |
percentile | -13.428 |
inacc | -13.085 |
pts | -12.960 |
Token | ie |
Token ID | 494 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
civilisation | +11.888 |
Construction | +11.852 |
Harbour | +11.211 |
ufact | +11.007 |
paradise | +10.918 |
Neg logit contributions | |
percentages | -12.160 |
percentile | -11.134 |
unfavorable | -11.117 |
percentage | -10.577 |
offenses | -10.555 |
Token | , |
Token ID | 11 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
civilisation | +15.720 |
Construction | +15.347 |
paradise | +14.562 |
Harbour | +14.509 |
Built | +14.381 |
Neg logit contributions | |
percentages | -11.961 |
percentile | -10.833 |
unfavorable | -10.505 |
offenses | -10.159 |
percentage | -9.948 |
Token | the |
Token ID | 262 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
civilisation | +4.171 |
Construction | +3.993 |
paradise | +3.865 |
Built | +3.757 |
Located | +3.706 |
Neg logit contributions | |
percentages | -4.012 |
percentile | -3.744 |
percentage | -3.532 |
pts | -3.493 |
unfavorable | -3.484 |
Token | French |
Token ID | 4141 |
Feature activation | -1.95e+01 |
Pos logit contributions | |
civilisation | +19.389 |
paradise | +18.138 |
Construction | +18.116 |
rebuilt | +17.684 |
Harbour | +17.395 |
Neg logit contributions | |
percentages | -12.426 |
percentile | -11.228 |
offenses | -10.885 |
unfavorable | -10.660 |
disapprove | -10.412 |
Token | company |
Token ID | 1664 |
Feature activation | -3.27e+01 |
Pos logit contributions | |
civilisation | +18.156 |
Construction | +17.357 |
paradise | +16.569 |
rebuilt | +16.018 |
Built | +15.745 |
Neg logit contributions | |
percentages | -13.275 |
percentile | -11.798 |
offenses | -11.329 |
unfavorable | -11.308 |
disapprove | -11.074 |
Token | which |
Token ID | 543 |
Feature activation | -4.16e+01 |
Pos logit contributions | |
civilisation | +24.960 |
building | +24.109 |
rebuilt | +23.858 |
Construction | +23.810 |
refurb | +23.764 |
Neg logit contributions | |
percentages | -17.224 |
percentile | -15.762 |
pts | -14.857 |
regress | -14.520 |
offenses | -14.495 |
Token | is |
Token ID | 318 |
Feature activation | -3.13e+01 |
Pos logit contributions | |
refurb | +28.036 |
rebuilt | +28.023 |
civilisation | +27.784 |
transformed | +26.816 |
revital | +25.796 |
Neg logit contributions | |
percentages | -17.327 |
percentile | -16.370 |
pts | -16.044 |
unfavorable | -15.856 |
inacc | -15.847 |
Token | the |
Token ID | 262 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
civilisation | +24.884 |
Construction | +24.310 |
building | +24.168 |
refurb | +23.915 |
rebuilt | +23.524 |
Neg logit contributions | |
percentages | -15.828 |
percentile | -14.709 |
pts | -13.889 |
offenses | -13.863 |
inacc | -13.497 |
Token | majority |
Token ID | 3741 |
Feature activation | -6.03e+00 |
Pos logit contributions | |
civilisation | +22.202 |
paradise | +20.604 |
Construction | +20.390 |
refurb | +19.836 |
rebuilt | +19.738 |
Neg logit contributions | |
percentages | -13.439 |
percentile | -12.358 |
unfavorable | -11.992 |
offenses | -11.988 |
disapprove | -11.535 |
Token | owner |
Token ID | 4870 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
civilisation | +4.472 |
Construction | +4.214 |
paradise | +3.989 |
Built | +3.824 |
rebuilt | +3.754 |
Neg logit contributions | |
percentages | -6.648 |
percentile | -6.279 |
percentage | -5.985 |
inaccur | -5.979 |
offenses | -5.950 |
Token | of |
Token ID | 286 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
percentages | +6.819 |
percentile | +6.040 |
percentage | +5.958 |
vs | +5.517 |
pts | +5.504 |
Neg logit contributions | |
civilisation | -11.914 |
Construction | -11.546 |
paradise | -11.280 |
Located | -11.025 |
issance | -10.952 |
Token | M |
Token ID | 337 |
Feature activation | -9.85e+00 |
Pos logit contributions | |
civilisation | +18.663 |
paradise | +18.123 |
Construction | +16.970 |
rebuilt | +16.764 |
Harbour | +16.650 |
Neg logit contributions | |
percentages | -12.611 |
percentile | -11.750 |
pts | -11.257 |
disapprove | -10.832 |
unfavorable | -10.487 |
Token | oom |
Token ID | 4207 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
civilisation | +5.144 |
Construction | +4.911 |
paradise | +4.764 |
Located | +4.488 |
Built | +4.374 |
Neg logit contributions | |
percentages | -12.466 |
percentile | -11.588 |
percentage | -11.255 |
pts | -11.204 |
unfavorable | -11.124 |
Token | in |
Token ID | 259 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
civilisation | +6.630 |
paradise | +6.438 |
Construction | +6.358 |
Located | +6.002 |
Built | +5.988 |
Neg logit contributions | |
percentages | -11.237 |
percentile | -10.503 |
unfavorable | -10.113 |
percentage | -10.001 |
offenses | -9.994 |
Token | theme |
Token ID | 7505 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
civilisation | +24.765 |
paradise | +24.733 |
Construction | +23.634 |
Harbour | +22.338 |
Built | +22.255 |
Neg logit contributions | |
percentages | -14.723 |
percentile | -13.404 |
pts | -12.697 |
unfavorable | -12.640 |
disapprove | -12.312 |
Token | park |
Token ID | 3952 |
Feature activation | -3.53e+01 |
Pos logit contributions | |
civilisation | +18.629 |
paradise | +18.451 |
Construction | +16.853 |
rebuilt | +16.812 |
Located | +16.602 |
Neg logit contributions | |
percentages | -17.290 |
percentile | -16.077 |
pts | -15.741 |
disapprove | -14.944 |
inacc | -14.938 |
Token | is |
Token ID | 318 |
Feature activation | -4.13e+01 |
Pos logit contributions | |
civilisation | +26.579 |
paradise | +26.574 |
Construction | +25.629 |
transformed | +24.871 |
rebuilt | +24.770 |
Neg logit contributions | |
percentages | -16.566 |
percentile | -16.350 |
pts | -14.970 |
disapprove | -14.466 |
percent | -14.149 |
Token | set |
Token ID | 900 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
civilisation | +27.194 |
Construction | +27.031 |
paradise | +26.568 |
rebuilt | +26.349 |
bustling | +26.261 |
Neg logit contributions | |
percentile | -18.918 |
percentages | -18.805 |
inacc | -16.398 |
disapprove | -16.181 |
utterstock | -16.140 |
Token | to |
Token ID | 284 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
civilisation | +18.728 |
Construction | +18.725 |
paradise | +17.928 |
Built | +17.423 |
Located | +16.999 |
Neg logit contributions | |
percentages | -15.115 |
percentile | -14.438 |
disapprove | -13.087 |
inacc | -13.027 |
unfavorable | -12.946 |
Token | open |
Token ID | 1280 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
civilisation | +22.212 |
paradise | +21.650 |
refurb | +21.070 |
revital | +21.020 |
Construction | +20.818 |
Neg logit contributions | |
percentages | -20.818 |
percentile | -20.137 |
inacc | -17.958 |
percent | -17.854 |
Percent | -17.596 |
Token | in |
Token ID | 287 |
Feature activation | -1.65e+01 |
Pos logit contributions | |
paradise | +20.488 |
civilisation | +20.442 |
Construction | +20.217 |
rebuilt | +18.999 |
Harbour | +18.871 |
Neg logit contributions | |
percentages | -16.487 |
percentile | -15.692 |
inacc | -13.973 |
pts | -13.945 |
percentage | -13.797 |
Token | 2019 |
Token ID | 13130 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
civilisation | +15.528 |
paradise | +15.106 |
Construction | +14.351 |
Harbour | +14.076 |
rebuilt | +14.044 |
Neg logit contributions | |
percentages | -11.718 |
percentile | -11.116 |
disapprove | -10.315 |
unfavorable | -10.125 |
pts | -10.102 |
Token | or |
Token ID | 393 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
percentages | +20.078 |
percentile | +18.762 |
percentage | +18.664 |
vs | +18.511 |
inaccur | +17.932 |
Neg logit contributions | |
Construction | -16.277 |
civilisation | -15.993 |
Built | -14.955 |
Located | -14.912 |
ufact | -14.878 |
Token | does |
Token ID | 857 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
percentages | +12.919 |
percentage | +11.772 |
percentile | +11.699 |
fewer | +11.193 |
unfavorable | +11.160 |
Neg logit contributions | |
civilisation | -12.982 |
Construction | -12.879 |
ufact | -12.311 |
Built | -12.220 |
Located | -12.194 |
Token | anyone |
Token ID | 2687 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
percentages | +2.768 |
percentile | +2.590 |
percentage | +2.517 |
unfavorable | +2.441 |
pts | +2.437 |
Neg logit contributions | |
civilisation | -2.050 |
Construction | -1.982 |
paradise | -1.893 |
Built | -1.829 |
Located | -1.820 |
Token | else |
Token ID | 2073 |
Feature activation | +2.82e+01 |
Pos logit contributions | |
percentages | +19.931 |
percentile | +19.000 |
percentage | +18.909 |
hate | +18.733 |
inaccur | +18.652 |
Neg logit contributions | |
Construction | -17.926 |
civilisation | -17.046 |
ufact | -16.971 |
Located | -16.718 |
Built | -16.371 |
Token | out |
Token ID | 503 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
percentages | +22.263 |
hate | +21.747 |
percentile | +21.538 |
disapprove | +21.517 |
inaccur | +21.391 |
Neg logit contributions | |
Construction | -18.522 |
ufact | -17.246 |
civilisation | -17.158 |
Located | -16.778 |
Built | -16.751 |
Token | there |
Token ID | 612 |
Feature activation | +3.38e+01 |
Pos logit contributions | |
percentages | +17.694 |
percentile | +16.433 |
percentage | +16.172 |
vs | +15.970 |
hate | +15.816 |
Neg logit contributions | |
civilisation | -16.975 |
Construction | -16.781 |
ufact | -16.200 |
Located | -15.652 |
Built | -15.529 |
Token | think |
Token ID | 892 |
Feature activation | +8.30e+00 |
Pos logit contributions | |
percentages | +25.227 |
hate | +25.136 |
inaccur | +24.285 |
disapprove | +24.283 |
percentile | +24.210 |
Neg logit contributions | |
Construction | -19.428 |
ufact | -18.444 |
civilisation | -17.913 |
Located | -17.607 |
Built | -17.491 |
Token | this |
Token ID | 428 |
Feature activation | +7.21e+00 |
Pos logit contributions | |
percentages | +8.699 |
percentile | +8.049 |
percentage | +7.887 |
inaccur | +7.630 |
unfavorable | +7.617 |
Neg logit contributions | |
civilisation | -6.504 |
Construction | -6.468 |
paradise | -5.998 |
Built | -5.984 |
Located | -5.920 |
Token | could |
Token ID | 714 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
percentages | +7.151 |
percentile | +6.647 |
percentage | +6.543 |
unfavorable | +6.295 |
inaccur | +6.246 |
Neg logit contributions | |
civilisation | -6.116 |
Construction | -6.082 |
paradise | -5.665 |
Built | -5.646 |
ufact | -5.583 |
Token | be |
Token ID | 307 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
percentages | +16.190 |
percentile | +15.457 |
percentage | +15.279 |
inaccur | +15.153 |
injure | +14.672 |
Neg logit contributions | |
Construction | -14.859 |
civilisation | -14.512 |
ufact | -13.778 |
Built | -13.644 |
Building | -13.455 |
Token | turn |
Token ID | 1210 |
Feature activation | +1.22e+01 |
Pos logit contributions | |
percentages | +12.626 |
percentile | +11.677 |
percentage | +11.577 |
inaccur | +11.428 |
unfavorable | +11.276 |
Neg logit contributions | |
Construction | -10.641 |
civilisation | -10.611 |
Located | -9.854 |
Built | -9.621 |
Building | -9.581 |
Token | Political |
Token ID | 14611 |
Feature activation | -3.16e+00 |
Pos logit contributions | |
civilisation | +0.212 |
Construction | +0.204 |
paradise | +0.198 |
Built | +0.190 |
Located | +0.188 |
Neg logit contributions | |
percentages | -0.249 |
percentile | -0.232 |
percentage | -0.223 |
pts | -0.219 |
unfavorable | -0.217 |
Token | Victory |
Token ID | 21203 |
Feature activation | -5.09e+00 |
Pos logit contributions | |
civilisation | +2.736 |
Construction | +2.654 |
paradise | +2.568 |
Built | +2.456 |
Located | +2.449 |
Neg logit contributions | |
percentages | -3.154 |
percentile | -2.947 |
percentage | -2.815 |
pts | -2.762 |
unfavorable | -2.756 |
Token | Fund |
Token ID | 7557 |
Feature activation | -6.54e+00 |
Pos logit contributions | |
civilisation | +3.396 |
Construction | +3.285 |
paradise | +3.211 |
Built | +3.011 |
Building | +3.003 |
Neg logit contributions | |
percentages | -5.880 |
percentile | -5.635 |
unfavorable | -5.344 |
percentage | -5.330 |
offenses | -5.307 |
Token | mailed |
Token ID | 37789 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
civilisation | +5.992 |
Construction | +5.837 |
paradise | +5.682 |
rebuilt | +5.535 |
Built | +5.511 |
Neg logit contributions | |
percentages | -5.865 |
percentile | -5.468 |
pts | -5.153 |
percentage | -5.125 |
unfavorable | -5.013 |
Token | out |
Token ID | 503 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
percentages | +18.279 |
percentage | +17.105 |
fewer | +16.982 |
percentile | +16.603 |
percent | +16.263 |
Neg logit contributions | |
civilisation | -17.107 |
Construction | -16.339 |
ufact | -15.898 |
paradise | -15.602 |
Built | -15.477 |
Token | tens |
Token ID | 11192 |
Feature activation | +3.48e+01 |
Pos logit contributions | |
percentages | +23.717 |
percentage | +22.260 |
fewer | +22.207 |
tweets | +21.880 |
unfavorable | +21.687 |
Neg logit contributions | |
civilisation | -18.234 |
Construction | -17.336 |
Located | -16.773 |
ufact | -16.726 |
issance | -16.584 |
Token | of |
Token ID | 286 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
of | +20.197 |
percentages | +20.072 |
fewer | +19.611 |
percent | +19.529 |
percentage | +18.995 |
Neg logit contributions | |
civilisation | -26.108 |
ufact | -24.022 |
Construction | -23.546 |
paradise | -23.519 |
issance | -23.240 |
Token | thousands |
Token ID | 4138 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
percentages | +11.331 |
percentage | +10.264 |
percent | +9.929 |
percentile | +9.894 |
fewer | +9.573 |
Neg logit contributions | |
civilisation | -18.326 |
Construction | -17.418 |
paradise | -17.250 |
Located | -16.957 |
Built | -16.902 |
Token | of |
Token ID | 286 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
percentages | +16.332 |
fewer | +15.540 |
percentile | +15.151 |
percent | +15.054 |
percentage | +15.007 |
Neg logit contributions | |
civilisation | -19.584 |
Construction | -18.063 |
paradise | -18.043 |
Located | -17.803 |
ufact | -17.659 |
Token | broch |
Token ID | 41978 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
percentages | +15.442 |
percentage | +14.355 |
unfavorable | +14.224 |
percentile | +14.011 |
fewer | +13.931 |
Neg logit contributions | |
civilisation | -14.620 |
Construction | -13.807 |
paradise | -13.427 |
Located | -13.184 |
ufact | -13.139 |
Token | ures |
Token ID | 942 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
percentages | +0.651 |
percentile | +0.612 |
percentage | +0.592 |
unfavorable | +0.577 |
offenses | +0.574 |
Neg logit contributions | |
civilisation | -0.446 |
Construction | -0.433 |
paradise | -0.413 |
Built | -0.400 |
Located | -0.395 |
Token | highest |
Token ID | 4511 |
Feature activation | +9.95e+00 |
Pos logit contributions | |
percentages | +6.524 |
percentile | +6.019 |
percentage | +5.911 |
unfavorable | +5.690 |
offenses | +5.645 |
Neg logit contributions | |
civilisation | -5.604 |
Construction | -5.527 |
paradise | -5.193 |
Built | -5.160 |
Located | -5.109 |
Token | of |
Token ID | 286 |
Feature activation | +8.90e+00 |
Pos logit contributions | |
percentages | +9.156 |
percentile | +8.497 |
percentage | +8.369 |
unfavorable | +7.921 |
offenses | +7.798 |
Neg logit contributions | |
Construction | -8.936 |
civilisation | -8.916 |
ufact | -8.364 |
paradise | -8.362 |
Built | -8.354 |
Token | the |
Token ID | 262 |
Feature activation | +6.34e+00 |
Pos logit contributions | |
percentages | +8.622 |
percentile | +7.834 |
percentage | +7.724 |
offenses | +7.406 |
unfavorable | +7.357 |
Neg logit contributions | |
Construction | -7.817 |
civilisation | -7.703 |
Built | -7.244 |
Located | -7.195 |
paradise | -7.172 |
Token | high |
Token ID | 1029 |
Feature activation | +8.84e+00 |
Pos logit contributions | |
percentages | +5.953 |
percentile | +5.464 |
percentage | +5.323 |
offenses | +5.080 |
unfavorable | +5.079 |
Neg logit contributions | |
civilisation | -5.875 |
Construction | -5.810 |
paradise | -5.483 |
Built | -5.392 |
Located | -5.359 |
Token | in |
Token ID | 287 |
Feature activation | +5.69e+00 |
Pos logit contributions | |
percentages | +8.559 |
percentile | +7.902 |
percentage | +7.742 |
offenses | +7.335 |
unfavorable | +7.331 |
Neg logit contributions | |
civilisation | -7.698 |
Construction | -7.522 |
paradise | -7.152 |
Built | -7.115 |
ufact | -7.099 |
Token | terms |
Token ID | 2846 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
percentages | +5.525 |
percentile | +5.051 |
percentage | +4.999 |
unfavorable | +4.793 |
offenses | +4.755 |
Neg logit contributions | |
civilisation | -5.093 |
Construction | -4.979 |
paradise | -4.716 |
Built | -4.647 |
Located | -4.627 |
Token | of |
Token ID | 286 |
Feature activation | +8.83e+00 |
Pos logit contributions | |
percentages | +19.441 |
of | +19.289 |
percentage | +18.513 |
fewer | +18.126 |
percent | +17.964 |
Neg logit contributions | |
exting | -26.739 |
ufact | -26.543 |
arrang | -26.471 |
civilisation | -25.509 |
Nitrome | -24.718 |
Token | a |
Token ID | 257 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
percentages | +8.687 |
percentage | +7.882 |
percentile | +7.879 |
unfavorable | +7.514 |
offenses | +7.449 |
Neg logit contributions | |
civilisation | -7.594 |
Construction | -7.517 |
paradise | -7.060 |
Built | -7.039 |
Located | -7.014 |
Token | money |
Token ID | 1637 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
civilisation | +1.977 |
Construction | +1.878 |
paradise | +1.851 |
Built | +1.766 |
Located | +1.752 |
Neg logit contributions | |
percentages | -1.856 |
percentile | -1.718 |
percentage | -1.626 |
pts | -1.616 |
unfavorable | -1.603 |
Token | fight |
Token ID | 1907 |
Feature activation | -5.87e+00 |
Pos logit contributions | |
percentages | +0.330 |
percentile | +0.307 |
percentage | +0.296 |
pts | +0.289 |
unfavorable | +0.289 |
Neg logit contributions | |
civilisation | -0.279 |
Construction | -0.267 |
paradise | -0.260 |
Built | -0.248 |
Located | -0.247 |
Token | . |
Token ID | 13 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
civilisation | +5.425 |
Construction | +5.148 |
paradise | +5.119 |
Built | +4.829 |
Located | +4.792 |
Neg logit contributions | |
percentages | -5.338 |
percentile | -4.949 |
pts | -4.697 |
percentage | -4.671 |
unfavorable | -4.636 |
Token | or |
Token ID | 393 |
Feature activation | +2.37e+01 |
Pos logit contributions | |
percentages | +17.076 |
percentage | +15.482 |
vs | +15.327 |
offenses | +15.076 |
inaccur | +15.034 |
Neg logit contributions | |
civilisation | -15.190 |
Construction | -14.998 |
ufact | -14.256 |
Building | -14.076 |
Located | -14.071 |
Token | sexist |
Token ID | 24651 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
percentages | +18.826 |
percentage | +17.513 |
unfavorable | +17.509 |
hate | +17.492 |
inaccurate | +17.250 |
Neg logit contributions | |
ufact | -17.437 |
civilisation | -17.322 |
Construction | -17.017 |
Located | -16.375 |
issance | -16.365 |
Token | . |
Token ID | 13 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
percentages | +19.036 |
percentage | +17.466 |
vs | +17.231 |
inaccur | +17.176 |
offenses | +16.982 |
Neg logit contributions | |
civilisation | -16.593 |
Construction | -16.529 |
Located | -15.846 |
ufact | -15.740 |
Built | -15.519 |
Token | Were |
Token ID | 15176 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
percentages | +14.324 |
percentile | +13.369 |
percentage | +13.301 |
pts | +13.211 |
vs | +13.100 |
Neg logit contributions | |
civilisation | -10.872 |
ufact | -9.708 |
paradise | -9.627 |
Construction | -9.605 |
arrang | -9.284 |
Token | there |
Token ID | 612 |
Feature activation | +3.93e+01 |
Pos logit contributions | |
percentages | +17.192 |
percentage | +15.743 |
unfavorable | +15.234 |
fewer | +15.233 |
percentile | +15.209 |
Neg logit contributions | |
civilisation | -14.502 |
Construction | -14.319 |
ufact | -13.720 |
Located | -13.582 |
paradise | -13.397 |
Token | random |
Token ID | 4738 |
Feature activation | +3.77e+01 |
Pos logit contributions | |
percentages | +29.456 |
fewer | +27.497 |
percentage | +27.352 |
inaccur | +26.882 |
tweets | +26.510 |
Neg logit contributions | |
Construction | -19.648 |
ufact | -19.261 |
civilisation | -18.791 |
Located | -18.269 |
issance | -17.986 |
Token | people |
Token ID | 661 |
Feature activation | +2.73e+01 |
Pos logit contributions | |
percentages | +30.795 |
percentage | +28.649 |
tweets | +27.551 |
bias | +27.094 |
inaccur | +27.002 |
Neg logit contributions | |
Construction | -19.205 |
ufact | -19.183 |
civilisation | -17.969 |
Located | -17.322 |
Building | -16.842 |
Token | on |
Token ID | 319 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
percentages | +22.840 |
inaccur | +21.274 |
percentage | +21.088 |
vs | +20.958 |
statistically | +20.827 |
Neg logit contributions | |
Construction | -17.458 |
ufact | -16.645 |
civilisation | -16.635 |
Located | -16.060 |
Built | -15.760 |
Token | Twitter |
Token ID | 3009 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
percentages | +12.575 |
percentage | +11.437 |
percentile | +11.281 |
unfavorable | +11.208 |
fewer | +11.141 |
Neg logit contributions | |
Construction | -11.621 |
civilisation | -11.482 |
ufact | -10.998 |
Located | -10.862 |
Built | -10.622 |
Token | , |
Token ID | 11 |
Feature activation | +3.67e+01 |
Pos logit contributions | |
percentages | +24.908 |
tweets | +23.150 |
vs | +23.107 |
inaccur | +22.972 |
percentage | +22.580 |
Neg logit contributions | |
Construction | -17.571 |
civilisation | -17.486 |
ufact | -16.570 |
Located | -16.366 |
Built | -15.550 |
Token | claiming |
Token ID | 8512 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
percentages | +28.017 |
tweets | +26.926 |
fewer | +26.019 |
percentage | +25.938 |
hate | +25.712 |
Neg logit contributions | |
Construction | -18.368 |
ufact | -17.524 |
civilisation | -17.297 |
Located | -16.459 |
Built | -15.943 |
Token | . |
Token ID | 13 |
Feature activation | +3.14e+00 |
Pos logit contributions | |
Construction | +2.658 |
civilisation | +2.628 |
paradise | +2.490 |
Located | +2.429 |
Built | +2.418 |
Neg logit contributions | |
percentages | -5.072 |
percentile | -4.676 |
disapprove | -4.570 |
percentage | -4.558 |
unfavorable | -4.556 |
Token | m |
Token ID | 76 |
Feature activation | -5.19e+00 |
Pos logit contributions | |
percentages | +2.989 |
percentile | +2.780 |
percentage | +2.684 |
pts | +2.598 |
unfavorable | +2.592 |
Neg logit contributions | |
civilisation | -2.925 |
Construction | -2.803 |
paradise | -2.726 |
Built | -2.614 |
Located | -2.601 |
Token | .: |
Token ID | 11207 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
civilisation | +3.527 |
Construction | +3.457 |
paradise | +3.278 |
Located | +3.108 |
Built | +3.107 |
Neg logit contributions | |
percentages | -6.024 |
percentile | -5.644 |
percentage | -5.488 |
unfavorable | -5.380 |
inaccur | -5.339 |
Token | CNN |
Token ID | 8100 |
Feature activation | +8.56e+00 |
Pos logit contributions | |
percentages | +14.767 |
percentile | +13.583 |
percentage | +13.575 |
fewer | +13.464 |
pts | +13.448 |
Neg logit contributions | |
civilisation | -11.911 |
paradise | -10.472 |
ufact | -10.464 |
issance | -10.354 |
Construction | -10.285 |
Token | reports |
Token ID | 3136 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
percentages | +8.249 |
percentile | +7.715 |
percentage | +7.492 |
inaccur | +7.367 |
offenses | +7.222 |
Neg logit contributions | |
civilisation | -7.460 |
Construction | -7.060 |
paradise | -6.897 |
Built | -6.690 |
Located | -6.648 |
Token | two |
Token ID | 734 |
Feature activation | +3.41e+01 |
Pos logit contributions | |
percentages | +15.043 |
percentile | +13.677 |
fewer | +13.645 |
percentage | +13.623 |
inaccur | +13.317 |
Neg logit contributions | |
civilisation | -12.931 |
Construction | -12.338 |
ufact | -11.991 |
Built | -11.879 |
issance | -11.784 |
Token | people |
Token ID | 661 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
percentages | +27.157 |
fewer | +25.994 |
percentage | +25.464 |
percent | +25.250 |
tweets | +24.927 |
Neg logit contributions | |
civilisation | -17.556 |
ufact | -17.272 |
issance | -16.651 |
Construction | -16.483 |
Built | -16.298 |
Token | are |
Token ID | 389 |
Feature activation | +7.30e+00 |
Pos logit contributions | |
percentages | +14.804 |
percentage | +13.675 |
percentile | +13.650 |
vs | +13.396 |
fewer | +13.194 |
Neg logit contributions | |
civilisation | -14.187 |
Construction | -13.809 |
Located | -13.009 |
Built | -12.981 |
Building | -12.920 |
Token | confirmed |
Token ID | 4999 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
percentages | +6.072 |
percentile | +5.542 |
percentage | +5.394 |
unfavorable | +5.208 |
pts | +5.192 |
Neg logit contributions | |
civilisation | -7.495 |
Construction | -7.274 |
paradise | -6.964 |
Built | -6.860 |
ufact | -6.796 |
Token | dead |
Token ID | 2636 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
percentages | +7.251 |
percentile | +6.611 |
percentage | +6.331 |
unfavorable | +6.079 |
inaccur | +6.063 |
Neg logit contributions | |
civilisation | -11.685 |
Construction | -11.482 |
paradise | -10.927 |
ufact | -10.793 |
Built | -10.728 |
Token | , |
Token ID | 11 |
Feature activation | +3.29e+01 |
Pos logit contributions | |
percentages | +16.854 |
vs | +15.806 |
percentile | +15.526 |
percentage | +15.453 |
percent | +15.168 |
Neg logit contributions | |
civilisation | -18.430 |
Construction | -17.183 |
ufact | -16.623 |
Built | -16.417 |
Building | -16.334 |
Token | , |
Token ID | 11 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
civilisation | +6.348 |
Construction | +6.293 |
paradise | +6.072 |
Built | +5.827 |
Located | +5.763 |
Neg logit contributions | |
percentages | -5.213 |
percentile | -4.840 |
percentage | -4.545 |
pts | -4.444 |
unfavorable | -4.377 |
Token | Clinton |
Token ID | 2605 |
Feature activation | +8.91e+00 |
Pos logit contributions | |
percentages | +20.525 |
percentage | +18.951 |
fewer | +18.936 |
percentile | +18.625 |
unfavorable | +18.552 |
Neg logit contributions | |
civilisation | -15.154 |
Construction | -14.579 |
ufact | -14.552 |
Located | -14.180 |
Built | -14.172 |
Token | has |
Token ID | 468 |
Feature activation | +6.93e+00 |
Pos logit contributions | |
percentages | +8.995 |
percentile | +8.354 |
percentage | +8.160 |
inaccur | +7.996 |
vs | +7.927 |
Neg logit contributions | |
civilisation | -7.375 |
Construction | -7.026 |
paradise | -6.765 |
Located | -6.601 |
Built | -6.505 |
Token | received |
Token ID | 2722 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
percentages | +6.847 |
percentile | +6.356 |
percentage | +6.197 |
unfavorable | +6.047 |
inaccur | +6.043 |
Neg logit contributions | |
civilisation | -6.025 |
Construction | -5.840 |
paradise | -5.568 |
Located | -5.452 |
Built | -5.421 |
Token | criticism |
Token ID | 7734 |
Feature activation | +2.34e+01 |
Pos logit contributions | |
percentages | +26.954 |
unfavorable | +26.057 |
fewer | +25.863 |
percentage | +25.282 |
hate | +25.107 |
Neg logit contributions | |
Construction | -18.081 |
civilisation | -18.076 |
Located | -17.917 |
Built | -17.754 |
ufact | -17.247 |
Token | from |
Token ID | 422 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
percentages | +17.853 |
unfavorable | +16.371 |
inaccur | +16.360 |
percentile | +16.336 |
percentage | +16.295 |
Neg logit contributions | |
civilisation | -18.591 |
Construction | -17.709 |
Located | -17.268 |
ufact | -16.722 |
paradise | -16.660 |
Token | environmentalists |
Token ID | 40586 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
percentages | +8.941 |
percentile | +8.195 |
percentage | +8.128 |
unfavorable | +7.875 |
fewer | +7.860 |
Neg logit contributions | |
civilisation | -9.218 |
Construction | -8.890 |
paradise | -8.628 |
Located | -8.580 |
Built | -8.513 |
Token | for |
Token ID | 329 |
Feature activation | +6.85e+00 |
Pos logit contributions | |
percentages | +14.207 |
percentile | +13.160 |
inaccur | +12.955 |
vs | +12.828 |
percentage | +12.788 |
Neg logit contributions | |
civilisation | -16.424 |
Construction | -15.697 |
Located | -15.035 |
Built | -14.818 |
ufact | -14.765 |
Token | her |
Token ID | 607 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
percentages | +6.886 |
percentile | +6.379 |
percentage | +6.241 |
unfavorable | +6.153 |
inaccur | +6.153 |
Neg logit contributions | |
civilisation | -5.793 |
Construction | -5.592 |
paradise | -5.352 |
Built | -5.269 |
Located | -5.231 |
Token | support |
Token ID | 1104 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
percentages | +10.912 |
percentage | +9.959 |
percentile | +9.923 |
unfavorable | +9.896 |
offenses | +9.550 |
Neg logit contributions | |
civilisation | -9.824 |
Construction | -9.481 |
Built | -9.076 |
paradise | -9.063 |
ufact | -9.009 |
Token | for |
Token ID | 329 |
Feature activation | -4.76e-01 |
Pos logit contributions | |
percentages | +8.818 |
percentage | +7.756 |
percentile | +7.754 |
unfavorable | +7.522 |
fewer | +7.403 |
Neg logit contributions | |
civilisation | -12.827 |
Construction | -12.198 |
paradise | -11.929 |
issance | -11.701 |
Located | -11.678 |
Token | , |
Token ID | 11 |
Feature activation | -3.95e+00 |
Pos logit contributions | |
percentages | +1.954 |
percentile | +1.799 |
percentage | +1.732 |
unfavorable | +1.669 |
pts | +1.667 |
Neg logit contributions | |
civilisation | -2.280 |
Construction | -2.203 |
paradise | -2.143 |
Built | -2.070 |
Located | -2.061 |
Token | she |
Token ID | 673 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
civilisation | +3.172 |
Construction | +3.033 |
paradise | +2.978 |
Built | +2.790 |
Located | +2.786 |
Neg logit contributions | |
percentages | -4.138 |
percentile | -3.880 |
percentage | -3.715 |
pts | -3.645 |
unfavorable | -3.633 |
Token | was |
Token ID | 373 |
Feature activation | -8.74e+00 |
Pos logit contributions | |
civilisation | +4.436 |
paradise | +4.161 |
Construction | +4.146 |
rebuilt | +3.937 |
Built | +3.829 |
Neg logit contributions | |
percentages | -6.322 |
percentile | -5.942 |
percentage | -5.698 |
unfavorable | -5.606 |
pts | -5.587 |
Token | an |
Token ID | 281 |
Feature activation | +5.36e+00 |
Pos logit contributions | |
civilisation | +7.693 |
Construction | +7.505 |
paradise | +7.268 |
rebuilt | +6.962 |
Built | +6.911 |
Neg logit contributions | |
percentages | -7.913 |
percentile | -7.399 |
offenses | -6.880 |
percentage | -6.875 |
unfavorable | -6.851 |
Token | assistant |
Token ID | 8796 |
Feature activation | -2.38e+00 |
Pos logit contributions | |
percentages | +5.140 |
percentile | +4.769 |
percentage | +4.637 |
unfavorable | +4.507 |
pts | +4.479 |
Neg logit contributions | |
civilisation | -4.868 |
Construction | -4.681 |
paradise | -4.530 |
Built | -4.377 |
Located | -4.365 |
Token | director |
Token ID | 3437 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
civilisation | +1.912 |
Construction | +1.834 |
paradise | +1.778 |
Built | +1.675 |
Located | +1.667 |
Neg logit contributions | |
percentages | -2.527 |
percentile | -2.364 |
percentage | -2.261 |
unfavorable | -2.236 |
pts | -2.223 |
Token | of |
Token ID | 286 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
percentages | +8.361 |
percentile | +7.701 |
percentage | +7.585 |
percent | +7.038 |
vs | +7.018 |
Neg logit contributions | |
civilisation | -12.221 |
Construction | -11.626 |
paradise | -11.395 |
Located | -11.191 |
Built | -11.154 |
Token | the |
Token ID | 262 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
civilisation | +0.526 |
Construction | +0.504 |
paradise | +0.488 |
Built | +0.465 |
Located | +0.462 |
Neg logit contributions | |
percentages | -0.654 |
percentile | -0.612 |
percentage | -0.590 |
unfavorable | -0.575 |
pts | -0.575 |
Token | Women |
Token ID | 6926 |
Feature activation | +7.22e+00 |
Pos logit contributions | |
percentages | +0.822 |
percentile | +0.766 |
percentage | +0.740 |
unfavorable | +0.719 |
pts | +0.718 |
Neg logit contributions | |
civilisation | -0.728 |
Construction | -0.700 |
paradise | -0.678 |
Built | -0.651 |
Located | -0.648 |
Token | 's |
Token ID | 338 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
percentages | +8.020 |
percentile | +7.578 |
percentage | +7.451 |
pts | +7.178 |
vs | +7.175 |
Neg logit contributions | |
civilisation | -5.323 |
Construction | -4.973 |
paradise | -4.827 |
Built | -4.589 |
Located | -4.569 |
Token | Army |
Token ID | 5407 |
Feature activation | -4.15e+00 |
Pos logit contributions | |
percentages | +2.559 |
percentile | +2.395 |
percentage | +2.327 |
unfavorable | +2.256 |
pts | +2.254 |
Neg logit contributions | |
civilisation | -1.945 |
Construction | -1.860 |
paradise | -1.796 |
Built | -1.722 |
Located | -1.713 |
Token | not |
Token ID | 407 |
Feature activation | +7.50e+00 |
Pos logit contributions | |
percentages | +7.415 |
percentile | +6.824 |
percentage | +6.598 |
unfavorable | +6.422 |
fewer | +6.394 |
Neg logit contributions | |
civilisation | -9.329 |
Construction | -9.146 |
paradise | -8.693 |
Built | -8.591 |
ufact | -8.569 |
Token | . |
Token ID | 13 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
percentages | +7.218 |
percentile | +6.727 |
percentage | +6.533 |
unfavorable | +6.345 |
offenses | +6.312 |
Neg logit contributions | |
civilisation | -6.564 |
Construction | -6.360 |
paradise | -6.068 |
Built | -5.909 |
Located | -5.896 |
Token | Here |
Token ID | 3423 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
percentages | +11.757 |
percentile | +11.137 |
percentage | +10.770 |
vs | +10.659 |
pts | +10.610 |
Neg logit contributions | |
civilisation | -9.405 |
Construction | -8.584 |
paradise | -8.501 |
ufact | -8.433 |
issance | -8.107 |
Token | 's |
Token ID | 338 |
Feature activation | +6.24e+00 |
Pos logit contributions | |
percentages | +0.313 |
percentile | +0.291 |
percentage | +0.280 |
unfavorable | +0.272 |
pts | +0.271 |
Neg logit contributions | |
civilisation | -0.301 |
Construction | -0.290 |
paradise | -0.282 |
Built | -0.270 |
Located | -0.269 |
Token | some |
Token ID | 617 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
percentages | +5.748 |
percentile | +5.351 |
percentage | +5.172 |
unfavorable | +4.943 |
fewer | +4.937 |
Neg logit contributions | |
civilisation | -5.890 |
Construction | -5.713 |
paradise | -5.453 |
Built | -5.367 |
Located | -5.352 |
Token | common |
Token ID | 2219 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
percentages | +22.085 |
percentile | +20.589 |
percentage | +20.499 |
tweets | +19.790 |
fewer | +19.595 |
Neg logit contributions | |
civilisation | -15.804 |
Construction | -15.716 |
ufact | -15.588 |
Located | -15.518 |
issance | -15.146 |
Token | questions |
Token ID | 2683 |
Feature activation | +1.03e+01 |
Pos logit contributions | |
percentages | +13.110 |
percentile | +12.226 |
percentage | +11.939 |
offenses | +11.764 |
inaccur | +11.671 |
Neg logit contributions | |
civilisation | -10.452 |
Construction | -10.219 |
ufact | -9.727 |
Built | -9.618 |
Located | -9.569 |
Token | / |
Token ID | 14 |
Feature activation | +9.93e+00 |
Pos logit contributions | |
percentages | +9.685 |
percentile | +9.101 |
percentage | +8.796 |
vs | +8.476 |
offenses | +8.450 |
Neg logit contributions | |
civilisation | -8.996 |
Construction | -8.854 |
ufact | -8.375 |
paradise | -8.355 |
Located | -8.287 |
Token | mis |
Token ID | 25413 |
Feature activation | +5.11e+00 |
Pos logit contributions | |
percentages | +9.844 |
percentile | +8.981 |
percentage | +8.776 |
inaccur | +8.735 |
unfavorable | +8.635 |
Neg logit contributions | |
civilisation | -8.431 |
Construction | -7.662 |
paradise | -7.638 |
ufact | -7.430 |
rebuilt | -7.283 |
Token | con |
Token ID | 1102 |
Feature activation | +5.06e+00 |
Pos logit contributions | |
percentages | +4.753 |
percentile | +4.376 |
percentage | +4.230 |
pts | +4.085 |
inaccur | +4.083 |
Neg logit contributions | |
civilisation | -4.865 |
Construction | -4.611 |
paradise | -4.537 |
Built | -4.309 |
ufact | -4.294 |
Token | ceptions |
Token ID | 11755 |
Feature activation | +1.60e+01 |
Pos logit contributions | |
percentages | +3.646 |
percentile | +3.252 |
percentage | +3.132 |
pts | +2.974 |
inaccur | +2.961 |
Neg logit contributions | |
civilisation | -5.896 |
Construction | -5.665 |
paradise | -5.590 |
Built | -5.365 |
Located | -5.362 |
Token | purge |
Token ID | 35714 |
Feature activation | +7.42e+00 |
Pos logit contributions | |
percentages | +1.315 |
percentile | +1.212 |
percentage | +1.166 |
unfavorable | +1.125 |
pts | +1.123 |
Neg logit contributions | |
civilisation | -1.517 |
Construction | -1.465 |
paradise | -1.426 |
Built | -1.376 |
Located | -1.370 |
Token | . |
Token ID | 13 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
percentages | +6.395 |
percentile | +5.837 |
percentage | +5.731 |
offenses | +5.504 |
unfavorable | +5.452 |
Neg logit contributions | |
civilisation | -7.390 |
Construction | -7.163 |
paradise | -6.867 |
Built | -6.731 |
Located | -6.719 |
Token | But |
Token ID | 887 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
percentages | +1.473 |
percentile | +1.381 |
percentage | +1.339 |
unfavorable | +1.304 |
pts | +1.301 |
Neg logit contributions | |
civilisation | -1.056 |
Construction | -1.012 |
paradise | -0.976 |
Built | -0.933 |
Located | -0.927 |
Token | Powell |
Token ID | 19675 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
civilisation | +1.168 |
Construction | +1.125 |
paradise | +1.098 |
Built | +1.047 |
Located | +1.038 |
Neg logit contributions | |
percentages | -1.214 |
percentile | -1.131 |
percentage | -1.088 |
pts | -1.058 |
unfavorable | -1.057 |
Token | stands |
Token ID | 6296 |
Feature activation | +7.75e+00 |
Pos logit contributions | |
percentages | +3.212 |
percentile | +2.995 |
percentage | +2.904 |
unfavorable | +2.803 |
pts | +2.796 |
Neg logit contributions | |
civilisation | -2.719 |
Construction | -2.592 |
paradise | -2.512 |
Built | -2.407 |
Located | -2.400 |
Token | out |
Token ID | 503 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
percentages | +6.717 |
percentile | +6.220 |
percentage | +6.009 |
fewer | +5.765 |
unfavorable | +5.763 |
Neg logit contributions | |
civilisation | -7.602 |
Construction | -7.400 |
paradise | -7.026 |
ufact | -6.892 |
issance | -6.863 |
Token | : |
Token ID | 25 |
Feature activation | +7.98e+00 |
Pos logit contributions | |
percentages | +8.134 |
percentile | +7.517 |
percentage | +7.218 |
fewer | +6.924 |
statistically | +6.918 |
Neg logit contributions | |
civilisation | -10.491 |
Construction | -10.071 |
paradise | -9.634 |
Built | -9.542 |
ufact | -9.514 |
Token | The |
Token ID | 383 |
Feature activation | +1.06e+01 |
Pos logit contributions | |
percentages | +8.868 |
percentile | +8.316 |
percentage | +8.150 |
fewer | +7.873 |
offenses | +7.859 |
Neg logit contributions | |
civilisation | -5.935 |
Construction | -5.565 |
paradise | -5.343 |
ufact | -5.125 |
Located | -5.078 |
Token | seventh |
Token ID | 14024 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
percentages | +9.895 |
percentile | +9.071 |
percentage | +8.992 |
offenses | +8.614 |
unfavorable | +8.531 |
Neg logit contributions | |
civilisation | -9.317 |
Construction | -9.142 |
ufact | -8.582 |
paradise | -8.572 |
Located | -8.568 |
Token | - |
Token ID | 12 |
Feature activation | +7.53e+00 |
Pos logit contributions | |
percentages | +7.889 |
percentile | +7.635 |
percentage | +7.153 |
percent | +6.862 |
fewer | +6.745 |
Neg logit contributions | |
civilisation | -12.061 |
Construction | -11.819 |
ufact | -11.414 |
paradise | -11.357 |
Located | -11.186 |
Token | year |
Token ID | 1941 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
percentages | +6.810 |
percentile | +6.399 |
percentage | +6.158 |
percent | +5.956 |
fewer | +5.874 |
Neg logit contributions | |
civilisation | -7.150 |
Construction | -6.739 |
paradise | -6.610 |
ufact | -6.345 |
Located | -6.283 |
Token |
|
Token ID | 198 |
Feature activation | -7.35e+00 |
Pos logit contributions | |
Construction | +2.330 |
civilisation | +2.272 |
paradise | +2.180 |
Built | +2.167 |
Located | +2.155 |
Neg logit contributions | |
percentages | -3.105 |
percentile | -2.861 |
disapprove | -2.766 |
unfavorable | -2.753 |
percentage | -2.746 |
Token | Cont |
Token ID | 4264 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
Construction | +5.973 |
Built | +5.551 |
Building | +5.495 |
Located | +5.492 |
civilisation | +5.412 |
Neg logit contributions | |
percentages | -7.721 |
percentile | -7.202 |
unfavorable | -6.917 |
percentage | -6.904 |
offenses | -6.857 |
Token | rad |
Token ID | 6335 |
Feature activation | -8.95e+00 |
Pos logit contributions | |
percentages | +1.499 |
percentile | +1.391 |
percentage | +1.342 |
unfavorable | +1.299 |
pts | +1.297 |
Neg logit contributions | |
civilisation | -1.490 |
Construction | -1.436 |
paradise | -1.393 |
Built | -1.342 |
Located | -1.335 |
Token | ict |
Token ID | 713 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
civilisation | +7.425 |
Construction | +7.218 |
ufact | +6.917 |
paradise | +6.905 |
Built | +6.812 |
Neg logit contributions | |
percentages | -8.508 |
percentile | -7.825 |
unfavorable | -7.651 |
percentage | -7.545 |
inacc | -7.404 |
Token | ing |
Token ID | 278 |
Feature activation | +8.96e+00 |
Pos logit contributions | |
civilisation | +1.147 |
Construction | +1.098 |
paradise | +1.065 |
Built | +1.018 |
Located | +1.004 |
Neg logit contributions | |
percentages | -1.527 |
percentile | -1.440 |
percentage | -1.386 |
pts | -1.351 |
unfavorable | -1.346 |
Token | the |
Token ID | 262 |
Feature activation | +4.99e+00 |
Pos logit contributions | |
percentages | +8.770 |
percentile | +8.018 |
percentage | +7.894 |
unfavorable | +7.620 |
inaccur | +7.591 |
Neg logit contributions | |
civilisation | -7.643 |
Construction | -7.552 |
paradise | -7.128 |
Located | -7.108 |
ufact | -7.062 |
Token | sense |
Token ID | 2565 |
Feature activation | +3.64e+00 |
Pos logit contributions | |
percentages | +5.044 |
percentile | +4.675 |
percentage | +4.568 |
unfavorable | +4.398 |
inaccur | +4.376 |
Neg logit contributions | |
civilisation | -4.286 |
Construction | -4.181 |
paradise | -3.985 |
Located | -3.878 |
Built | -3.878 |
Token | of |
Token ID | 286 |
Feature activation | -5.34e+00 |
Pos logit contributions | |
percentages | +2.487 |
percentile | +2.236 |
percentage | +2.132 |
unfavorable | +2.033 |
pts | +2.016 |
Neg logit contributions | |
civilisation | -4.355 |
Construction | -4.240 |
paradise | -4.131 |
Built | -4.023 |
Located | -4.013 |
Token | isolation |
Token ID | 15133 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
civilisation | +5.174 |
paradise | +4.889 |
Construction | +4.793 |
rebuilt | +4.552 |
Built | +4.539 |
Neg logit contributions | |
percentages | -4.664 |
percentile | -4.359 |
percentage | -4.122 |
pts | -4.101 |
unfavorable | -4.060 |
Token | expressed |
Token ID | 6241 |
Feature activation | +7.59e+00 |
Pos logit contributions | |
civilisation | +1.430 |
Construction | +1.381 |
paradise | +1.351 |
Built | +1.302 |
Located | +1.293 |
Neg logit contributions | |
percentages | -1.138 |
percentile | -1.049 |
percentage | -0.998 |
pts | -0.969 |
unfavorable | -0.963 |
Token | by |
Token ID | 416 |
Feature activation | +1.07e+01 |
Pos logit contributions | |
percentages | +6.272 |
percentile | +5.765 |
percentage | +5.540 |
unfavorable | +5.377 |
inaccur | +5.359 |
Neg logit contributions | |
civilisation | -7.755 |
Construction | -7.573 |
paradise | -7.247 |
Built | -7.186 |
Located | -7.165 |
Token |
|
Token ID | 198 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
Construction | +8.422 |
Built | +7.682 |
Located | +7.578 |
Building | +7.426 |
civilisation | +7.353 |
Neg logit contributions | |
percentages | -13.326 |
unfavorable | -12.439 |
percentile | -12.389 |
regress | -12.300 |
disapprove | -12.293 |
Token |
|
Token ID | 198 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
Construction | +5.643 |
Located | +5.217 |
Built | +5.213 |
civilisation | +5.089 |
Building | +5.072 |
Neg logit contributions | |
percentages | -9.635 |
disapprove | -8.965 |
percentile | -8.813 |
unfavorable | -8.747 |
offenses | -8.609 |
Token | Th |
Token ID | 817 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
Construction | +18.511 |
Built | +17.000 |
Located | +16.863 |
Building | +16.541 |
Laun | +16.024 |
Neg logit contributions | |
percentages | -19.442 |
percentile | -18.299 |
unfavorable | -17.654 |
disapprove | -17.590 |
offenses | -17.013 |
Token | ur |
Token ID | 333 |
Feature activation | -6.45e+00 |
Pos logit contributions | |
civilisation | +7.021 |
Construction | +6.857 |
Built | +6.396 |
paradise | +6.346 |
Building | +6.268 |
Neg logit contributions | |
percentages | -8.390 |
percentile | -7.607 |
percentage | -7.476 |
unfavorable | -7.431 |
inaccur | -7.342 |
Token | rock |
Token ID | 10823 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
civilisation | +4.057 |
Construction | +3.856 |
paradise | +3.635 |
ufact | +3.513 |
Built | +3.452 |
Neg logit contributions | |
percentages | -7.881 |
percentile | -7.323 |
percentage | -7.182 |
unfavorable | -7.118 |
offenses | -7.002 |
Token | Council |
Token ID | 4281 |
Feature activation | -1.56e+01 |
Pos logit contributions | |
civilisation | +20.367 |
Construction | +19.920 |
Harbour | +18.841 |
paradise | +18.700 |
rebuilt | +18.584 |
Neg logit contributions | |
percentages | -13.031 |
percentile | -12.038 |
unfavorable | -11.358 |
pts | -10.628 |
regress | -10.570 |
Token | said |
Token ID | 531 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
civilisation | +15.110 |
Construction | +14.725 |
rebuilt | +14.099 |
paradise | +14.077 |
Built | +13.879 |
Neg logit contributions | |
percentages | -11.015 |
percentile | -10.192 |
unfavorable | -9.583 |
pts | -9.401 |
percentage | -9.259 |
Token | workers |
Token ID | 3259 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
civilisation | +22.909 |
Construction | +21.732 |
paradise | +21.342 |
refurb | +20.885 |
rebuilt | +20.674 |
Neg logit contributions | |
percentages | -12.465 |
percentile | -12.400 |
partName | -11.145 |
percent | -11.024 |
criticize | -10.853 |
Token | had |
Token ID | 550 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
civilisation | +9.886 |
Construction | +9.320 |
paradise | +9.317 |
rebuilt | +9.172 |
refurb | +8.741 |
Neg logit contributions | |
percentages | -9.317 |
percentile | -8.802 |
pts | -8.201 |
percentage | -8.074 |
unfavorable | -8.055 |
Token | begun |
Token ID | 9258 |
Feature activation | -2.56e+01 |
Pos logit contributions | |
civilisation | +18.179 |
rebuilt | +17.755 |
paradise | +17.084 |
refurb | +17.067 |
transformed | +16.912 |
Neg logit contributions | |
percentages | -13.375 |
percentile | -12.514 |
pts | -12.069 |
Percent | -11.779 |
percent | -11.484 |
Token | removing |
Token ID | 10829 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
civilisation | +22.206 |
Construction | +20.752 |
refurb | +20.749 |
paradise | +20.455 |
rebuilt | +20.058 |
Neg logit contributions | |
percentages | -14.544 |
percentile | -13.859 |
pts | -12.941 |
Percent | -12.689 |
percent | -12.484 |
Token | buddies |
Token ID | 35548 |
Feature activation | +6.71e+00 |
Pos logit contributions | |
percentages | +5.944 |
percentile | +5.545 |
percentage | +5.412 |
unfavorable | +5.229 |
pts | +5.204 |
Neg logit contributions | |
civilisation | -5.076 |
Construction | -4.907 |
paradise | -4.654 |
Located | -4.561 |
Built | -4.522 |
Token | " |
Token ID | 1 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
percentages | +6.683 |
percentile | +6.231 |
percentage | +6.088 |
unfavorable | +5.872 |
pts | +5.859 |
Neg logit contributions | |
civilisation | -5.778 |
Construction | -5.573 |
paradise | -5.231 |
Located | -5.138 |
Built | -5.121 |
Token | having |
Token ID | 1719 |
Feature activation | -8.91e+00 |
Pos logit contributions | |
percentages | +9.264 |
percentile | +8.476 |
percentage | +8.319 |
fewer | +8.080 |
inaccur | +7.995 |
Neg logit contributions | |
civilisation | -10.744 |
Construction | -10.553 |
Located | -9.879 |
Built | -9.846 |
ufact | -9.822 |
Token | worked |
Token ID | 3111 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
civilisation | +7.480 |
paradise | +7.135 |
rebuilt | +6.963 |
Construction | +6.907 |
Built | +6.675 |
Neg logit contributions | |
percentages | -8.305 |
percentile | -7.872 |
percentage | -7.424 |
inacc | -7.241 |
pts | -7.228 |
Token | on |
Token ID | 319 |
Feature activation | -5.72e+00 |
Pos logit contributions | |
percentages | +0.196 |
percentile | +0.182 |
percentage | +0.174 |
pts | +0.169 |
unfavorable | +0.169 |
Neg logit contributions | |
civilisation | -0.217 |
Construction | -0.210 |
paradise | -0.205 |
Built | -0.196 |
Located | -0.195 |
Token | cars |
Token ID | 5006 |
Feature activation | -1.10e+01 |
Pos logit contributions | |
civilisation | +5.088 |
Construction | +4.921 |
paradise | +4.832 |
Built | +4.544 |
rebuilt | +4.530 |
Neg logit contributions | |
percentages | -5.387 |
percentile | -5.073 |
percentage | -4.817 |
pts | -4.669 |
unfavorable | -4.639 |
Token | alongside |
Token ID | 7848 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
civilisation | +10.847 |
Construction | +10.674 |
paradise | +10.539 |
Built | +10.355 |
rebuilt | +10.325 |
Neg logit contributions | |
percentages | -8.226 |
percentile | -7.684 |
percentage | -7.176 |
pts | -7.096 |
unfavorable | -6.959 |
Token | Bel |
Token ID | 3944 |
Feature activation | -4.26e+00 |
Pos logit contributions | |
percentages | +5.561 |
percentile | +5.233 |
percentage | +5.102 |
unfavorable | +4.981 |
pts | +4.980 |
Neg logit contributions | |
civilisation | -3.242 |
Construction | -3.118 |
paradise | -2.956 |
Located | -2.830 |
Built | -2.821 |
Token | ton |
Token ID | 1122 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
Construction | +2.689 |
civilisation | +2.668 |
paradise | +2.516 |
Built | +2.501 |
Located | +2.454 |
Neg logit contributions | |
percentages | -5.081 |
percentile | -4.769 |
percentage | -4.584 |
unfavorable | -4.576 |
inacc | -4.544 |
Token | for |
Token ID | 329 |
Feature activation | +5.93e+00 |
Pos logit contributions | |
civilisation | +4.187 |
Construction | +4.067 |
paradise | +3.973 |
Built | +3.781 |
rebuilt | +3.779 |
Neg logit contributions | |
percentages | -4.169 |
percentile | -3.900 |
percentage | -3.699 |
pts | -3.641 |
unfavorable | -3.612 |
Token | over |
Token ID | 625 |
Feature activation | +1.91e+01 |
Pos logit contributions | |
percentages | +4.819 |
percentile | +4.397 |
percentage | +4.277 |
fewer | +4.076 |
unfavorable | +4.069 |
Neg logit contributions | |
civilisation | -6.245 |
Construction | -6.036 |
paradise | -5.869 |
Built | -5.730 |
Located | -5.730 |
Token | was |
Token ID | 373 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
civilisation | +9.456 |
Construction | +9.302 |
paradise | +9.157 |
Built | +8.677 |
rebuilt | +8.676 |
Neg logit contributions | |
percentages | -9.892 |
percentile | -9.260 |
percentage | -8.779 |
disapprove | -8.662 |
pts | -8.660 |
Token | 25 |
Token ID | 1679 |
Feature activation | +9.95e+00 |
Pos logit contributions | |
civilisation | +3.385 |
Construction | +3.270 |
paradise | +3.263 |
Built | +3.077 |
Located | +3.037 |
Neg logit contributions | |
percentages | -3.045 |
percentile | -2.806 |
percentage | -2.684 |
pts | -2.612 |
offenses | -2.594 |
Token | percent |
Token ID | 1411 |
Feature activation | +5.67e+00 |
Pos logit contributions | |
percentages | +8.209 |
percentile | +7.701 |
percentage | +7.410 |
percent | +7.202 |
pts | +7.092 |
Neg logit contributions | |
civilisation | -10.087 |
Construction | -9.565 |
paradise | -9.130 |
Built | -9.030 |
Located | -9.028 |
Token | lower |
Token ID | 2793 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
percentages | +5.709 |
percentile | +5.369 |
percentage | +5.212 |
unfavorable | +5.054 |
fewer | +5.045 |
Neg logit contributions | |
civilisation | -4.876 |
Construction | -4.687 |
paradise | -4.424 |
Built | -4.372 |
Located | -4.350 |
Token | than |
Token ID | 621 |
Feature activation | -5.98e+00 |
Pos logit contributions | |
percentages | +1.961 |
percentile | +1.813 |
percentage | +1.749 |
unfavorable | +1.689 |
pts | +1.685 |
Neg logit contributions | |
civilisation | -2.093 |
Construction | -2.019 |
paradise | -1.960 |
Built | -1.893 |
Located | -1.883 |
Token | average |
Token ID | 2811 |
Feature activation | -6.29e-01 |
Pos logit contributions | |
civilisation | +6.510 |
paradise | +6.227 |
Construction | +6.219 |
Built | +5.914 |
ufact | +5.886 |
Neg logit contributions | |
percentages | -4.354 |
percentile | -3.980 |
percentage | -3.751 |
pts | -3.685 |
inaccur | -3.682 |
Token | yields |
Token ID | 19299 |
Feature activation | +5.65e+00 |
Pos logit contributions | |
civilisation | +0.527 |
Construction | +0.507 |
paradise | +0.492 |
Built | +0.468 |
Located | +0.467 |
Neg logit contributions | |
percentages | -0.650 |
percentile | -0.609 |
percentage | -0.587 |
unfavorable | -0.573 |
pts | -0.573 |
Token | . |
Token ID | 13 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
percentages | +5.773 |
percentile | +5.387 |
percentage | +5.249 |
unfavorable | +5.040 |
pts | +5.016 |
Neg logit contributions | |
civilisation | -4.819 |
Construction | -4.602 |
paradise | -4.435 |
Built | -4.260 |
Located | -4.256 |
Token | I |
Token ID | 314 |
Feature activation | +6.29e+00 |
Pos logit contributions | |
percentages | +3.016 |
percentile | +2.795 |
percentage | +2.701 |
pts | +2.614 |
unfavorable | +2.598 |
Neg logit contributions | |
civilisation | -3.131 |
Construction | -2.991 |
paradise | -2.915 |
Built | -2.802 |
Located | -2.783 |
Token | � |
Token ID | 447 |
Feature activation | -5.61e+00 |
Pos logit contributions | |
percentages | +5.882 |
percentile | +5.454 |
percentage | +5.328 |
unfavorable | +5.098 |
inaccur | +5.062 |
Neg logit contributions | |
civilisation | -5.802 |
Construction | -5.523 |
paradise | -5.357 |
Built | -5.148 |
Located | -5.139 |
Token | � |
Token ID | 247 |
Feature activation | -7.22e+00 |
Pos logit contributions | |
civilisation | +3.930 |
Construction | +3.914 |
paradise | +3.734 |
Built | +3.629 |
Located | +3.582 |
Neg logit contributions | |
percentages | -6.227 |
percentile | -5.784 |
percentage | -5.645 |
pts | -5.556 |
inaccur | -5.549 |
Token | Help |
Token ID | 22087 |
Feature activation | -8.78e+00 |
Pos logit contributions | |
civilisation | +6.863 |
Construction | +6.791 |
paradise | +6.486 |
Built | +6.363 |
Located | +6.311 |
Neg logit contributions | |
percentages | -5.681 |
percentile | -5.213 |
percentage | -4.941 |
unfavorable | -4.904 |
pts | -4.824 |
Token | and |
Token ID | 290 |
Feature activation | +8.46e-01 |
Pos logit contributions | |
civilisation | +8.411 |
Construction | +8.192 |
paradise | +7.876 |
Built | +7.678 |
Located | +7.615 |
Neg logit contributions | |
percentages | -7.562 |
percentile | -6.958 |
unfavorable | -6.634 |
percentage | -6.577 |
inaccur | -6.487 |
Token | # |
Token ID | 1303 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
percentages | +0.581 |
percentile | +0.524 |
percentage | +0.497 |
unfavorable | +0.475 |
pts | +0.473 |
Neg logit contributions | |
civilisation | -1.012 |
Construction | -0.983 |
paradise | -0.960 |
Built | -0.933 |
Located | -0.929 |
Token | C |
Token ID | 34 |
Feature activation | -8.58e+00 |
Pos logit contributions | |
Construction | +10.358 |
civilisation | +10.090 |
Built | +9.851 |
Building | +9.710 |
Located | +9.584 |
Neg logit contributions | |
percentages | -10.924 |
percentile | -9.969 |
percentage | -9.636 |
unfavorable | -9.463 |
inaccur | -9.393 |
Token | hen |
Token ID | 831 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
civilisation | +4.268 |
Construction | +4.106 |
paradise | +3.707 |
Built | +3.657 |
Building | +3.580 |
Neg logit contributions | |
percentages | -11.261 |
percentile | -10.566 |
percentage | -10.317 |
unfavorable | -10.272 |
inaccur | -10.235 |
Token | nai |
Token ID | 38600 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
civilisation | +6.576 |
Construction | +6.314 |
paradise | +6.042 |
Built | +6.018 |
Located | +5.926 |
Neg logit contributions | |
percentages | -7.461 |
percentile | -6.920 |
percentage | -6.616 |
unfavorable | -6.545 |
inaccur | -6.476 |
Token | Fl |
Token ID | 7414 |
Feature activation | -7.84e+00 |
Pos logit contributions | |
Construction | +10.111 |
civilisation | +10.049 |
Built | +9.558 |
Building | +9.380 |
Located | +9.285 |
Neg logit contributions | |
percentages | -10.187 |
percentile | -9.403 |
unfavorable | -9.010 |
percentage | -8.986 |
inaccur | -8.802 |
Token | ood |
Token ID | 702 |
Feature activation | -9.71e+00 |
Pos logit contributions | |
civilisation | +4.369 |
Construction | +4.193 |
paradise | +3.883 |
Located | +3.857 |
Built | +3.856 |
Neg logit contributions | |
percentages | -9.849 |
percentile | -9.198 |
unfavorable | -8.931 |
percentage | -8.880 |
pts | -8.849 |
Token | s |
Token ID | 82 |
Feature activation | -3.17e+00 |
Pos logit contributions | |
Construction | +9.648 |
civilisation | +9.638 |
paradise | +9.170 |
Built | +9.047 |
Building | +8.899 |
Neg logit contributions | |
percentages | -7.671 |
percentile | -7.115 |
unfavorable | -6.681 |
percentage | -6.639 |
inaccur | -6.505 |
Token | have |
Token ID | 423 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
civilisation | +2.922 |
Construction | +2.852 |
paradise | +2.740 |
Built | +2.668 |
Located | +2.640 |
Neg logit contributions | |
percentages | -3.002 |
percentile | -2.791 |
percentage | -2.675 |
unfavorable | -2.634 |
pts | -2.593 |
Token | been |
Token ID | 587 |
Feature activation | -6.63e+00 |
Pos logit contributions | |
civilisation | +8.080 |
paradise | +7.718 |
rebuilt | +7.669 |
Construction | +7.543 |
transformed | +7.384 |
Neg logit contributions | |
percentages | -10.307 |
percentile | -9.706 |
inacc | -9.231 |
percentage | -9.205 |
unfavorable | -9.163 |
Token | answers |
Token ID | 7429 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
percentages | +2.365 |
percentile | +2.203 |
percentage | +2.140 |
unfavorable | +2.071 |
pts | +2.061 |
Neg logit contributions | |
civilisation | -2.051 |
Construction | -1.973 |
paradise | -1.896 |
Built | -1.835 |
Located | -1.828 |
Token | on |
Token ID | 319 |
Feature activation | +4.50e+00 |
Pos logit contributions | |
percentages | +5.584 |
percentile | +5.132 |
percentage | +5.009 |
unfavorable | +4.852 |
pts | +4.823 |
Neg logit contributions | |
civilisation | -5.873 |
Construction | -5.623 |
paradise | -5.420 |
ufact | -5.319 |
Located | -5.284 |
Token | exec |
Token ID | 2452 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
percentages | +4.532 |
percentile | +4.207 |
percentage | +4.114 |
unfavorable | +3.971 |
inaccur | +3.940 |
Neg logit contributions | |
civilisation | -3.924 |
Construction | -3.780 |
paradise | -3.601 |
Built | -3.526 |
Located | -3.511 |
Token | pay |
Token ID | 1414 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
percentages | +9.681 |
percentile | +8.961 |
percentage | +8.753 |
vs | +8.288 |
pts | +8.252 |
Neg logit contributions | |
civilisation | -10.104 |
Construction | -9.902 |
Built | -9.297 |
Located | -9.267 |
ufact | -9.131 |
Token | � |
Token ID | 564 |
Feature activation | +7.37e-01 |
Pos logit contributions | |
percentages | +16.647 |
percentile | +15.225 |
percentage | +15.210 |
inaccur | +14.660 |
vs | +14.653 |
Neg logit contributions | |
civilisation | -14.149 |
Construction | -13.486 |
Located | -12.851 |
ufact | -12.810 |
Built | -12.713 |
Token | � |
Token ID | 250 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
percentages | +0.832 |
percentile | +0.779 |
percentage | +0.757 |
unfavorable | +0.737 |
pts | +0.735 |
Neg logit contributions | |
civilisation | -0.553 |
Construction | -0.532 |
paradise | -0.513 |
Built | -0.490 |
Located | -0.486 |
Token | I |
Token ID | 40 |
Feature activation | +8.07e+00 |
Pos logit contributions | |
civilisation | +1.072 |
Construction | +1.050 |
paradise | +1.014 |
Built | +0.973 |
Located | +0.973 |
Neg logit contributions | |
percentages | -1.078 |
percentile | -1.003 |
percentage | -0.959 |
unfavorable | -0.934 |
pts | -0.927 |
Token | � |
Token ID | 447 |
Feature activation | -5.83e+00 |
Pos logit contributions | |
percentages | +7.687 |
percentile | +7.132 |
percentage | +6.998 |
inaccur | +6.763 |
unfavorable | +6.742 |
Neg logit contributions | |
civilisation | -7.153 |
Construction | -6.800 |
paradise | -6.602 |
Located | -6.348 |
Built | -6.328 |
Token | � |
Token ID | 247 |
Feature activation | -2.96e+00 |
Pos logit contributions | |
Construction | +3.776 |
civilisation | +3.768 |
paradise | +3.537 |
Built | +3.444 |
Located | +3.420 |
Neg logit contributions | |
percentages | -6.765 |
percentile | -6.296 |
percentage | -6.147 |
pts | -6.100 |
unfavorable | -6.059 |
Token | m |
Token ID | 76 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
civilisation | +2.604 |
Construction | +2.557 |
paradise | +2.453 |
Built | +2.376 |
Located | +2.361 |
Neg logit contributions | |
percentages | -2.891 |
percentile | -2.693 |
percentage | -2.583 |
pts | -2.512 |
offenses | -2.506 |
Token | shocked |
Token ID | 11472 |
Feature activation | +3.32e+00 |
Pos logit contributions | |
percentages | +6.059 |
percentile | +5.611 |
percentage | +5.466 |
unfavorable | +5.302 |
inaccur | +5.276 |
Neg logit contributions | |
civilisation | -5.942 |
Construction | -5.657 |
paradise | -5.466 |
Built | -5.297 |
Located | -5.290 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
civilisation | +1.122 |
Construction | +1.085 |
paradise | +1.061 |
Built | +1.023 |
Located | +1.019 |
Neg logit contributions | |
percentages | -0.779 |
percentile | -0.714 |
percentage | -0.677 |
pts | -0.652 |
unfavorable | -0.649 |
Token | travel |
Token ID | 3067 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
civilisation | +1.448 |
Construction | +1.381 |
paradise | +1.347 |
Built | +1.282 |
rebuilt | +1.271 |
Neg logit contributions | |
percentages | -1.460 |
percentile | -1.360 |
percentage | -1.303 |
pts | -1.270 |
unfavorable | -1.263 |
Token | bans |
Token ID | 20075 |
Feature activation | -9.77e+00 |
Pos logit contributions | |
civilisation | +5.200 |
Construction | +4.956 |
paradise | +4.920 |
rebuilt | +4.682 |
Building | +4.651 |
Neg logit contributions | |
percentages | -3.307 |
percentile | -3.043 |
percentage | -2.882 |
pts | -2.801 |
unfavorable | -2.746 |
Token | and |
Token ID | 290 |
Feature activation | -6.96e+00 |
Pos logit contributions | |
civilisation | +10.192 |
Construction | +9.743 |
paradise | +9.615 |
rebuilt | +9.142 |
Built | +9.104 |
Neg logit contributions | |
percentages | -7.221 |
percentile | -6.705 |
percentage | -6.205 |
inacc | -6.122 |
pts | -6.116 |
Token | is |
Token ID | 318 |
Feature activation | -6.11e+00 |
Pos logit contributions | |
civilisation | +7.060 |
Construction | +6.618 |
paradise | +6.556 |
rebuilt | +6.243 |
Building | +6.113 |
Neg logit contributions | |
percentages | -5.674 |
percentile | -5.293 |
percentage | -4.967 |
pts | -4.897 |
inaccur | -4.832 |
Token | expected |
Token ID | 2938 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
civilisation | +5.652 |
Construction | +5.299 |
paradise | +5.247 |
rebuilt | +5.017 |
Building | +4.886 |
Neg logit contributions | |
percentages | -5.563 |
percentile | -5.180 |
percentage | -4.951 |
pts | -4.872 |
offenses | -4.785 |
Token | to |
Token ID | 284 |
Feature activation | -3.28e+00 |
Pos logit contributions | |
civilisation | +19.908 |
paradise | +18.371 |
Construction | +18.320 |
rebuilt | +17.185 |
ufact | +16.841 |
Neg logit contributions | |
percentages | -13.814 |
percentile | -13.014 |
inacc | -11.953 |
percentage | -11.750 |
percent | -11.731 |
Token | advocate |
Token ID | 12811 |
Feature activation | -9.09e+00 |
Pos logit contributions | |
civilisation | +3.413 |
paradise | +3.222 |
Construction | +3.197 |
rebuilt | +3.079 |
Built | +2.992 |
Neg logit contributions | |
percentages | -2.694 |
percentile | -2.437 |
percentage | -2.302 |
pts | -2.283 |
unfavorable | -2.265 |
Token | careful |
Token ID | 8161 |
Feature activation | -9.73e+00 |
Pos logit contributions | |
civilisation | +9.001 |
paradise | +8.286 |
Construction | +8.244 |
rebuilt | +7.828 |
Building | +7.670 |
Neg logit contributions | |
percentages | -7.379 |
percentile | -6.859 |
percentage | -6.494 |
pts | -6.478 |
percent | -6.338 |
Token | medical |
Token ID | 3315 |
Feature activation | -3.60e+00 |
Pos logit contributions | |
civilisation | +9.529 |
Construction | +8.740 |
paradise | +8.546 |
rebuilt | +8.157 |
countryside | +8.119 |
Neg logit contributions | |
percentages | -7.967 |
percentile | -7.494 |
percentage | -7.007 |
pts | -6.961 |
unfavorable | -6.852 |
Token | management |
Token ID | 4542 |
Feature activation | +7.13e-01 |
Pos logit contributions | |
civilisation | +3.458 |
Construction | +3.244 |
paradise | +3.182 |
Located | +2.979 |
Built | +2.970 |
Neg logit contributions | |
percentages | -3.294 |
percentile | -3.080 |
percentage | -2.941 |
unfavorable | -2.870 |
pts | -2.855 |
Token | system |
Token ID | 1080 |
Feature activation | -6.57e+00 |
Pos logit contributions | |
civilisation | +4.881 |
paradise | +4.594 |
Construction | +4.438 |
rebuilt | +4.142 |
Built | +4.101 |
Neg logit contributions | |
percentages | -5.198 |
percentile | -4.876 |
pts | -4.683 |
percentage | -4.611 |
unfavorable | -4.560 |
Token | must |
Token ID | 1276 |
Feature activation | -5.77e+00 |
Pos logit contributions | |
civilisation | +5.965 |
paradise | +5.566 |
Construction | +5.557 |
rebuilt | +5.313 |
Built | +5.164 |
Neg logit contributions | |
percentages | -6.054 |
percentile | -5.642 |
percentage | -5.408 |
pts | -5.327 |
unfavorable | -5.224 |
Token | stay |
Token ID | 2652 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
civilisation | +5.525 |
paradise | +5.235 |
Construction | +5.125 |
rebuilt | +5.010 |
Built | +4.803 |
Neg logit contributions | |
percentages | -5.080 |
percentile | -4.627 |
percentage | -4.393 |
pts | -4.393 |
inacc | -4.300 |
Token | the |
Token ID | 262 |
Feature activation | -9.36e+00 |
Pos logit contributions | |
civilisation | +12.400 |
paradise | +11.847 |
rebuilt | +11.315 |
Construction | +11.269 |
transformed | +10.916 |
Neg logit contributions | |
percentages | -9.473 |
percentile | -8.886 |
pts | -8.591 |
percentage | -8.185 |
percent | -8.122 |
Token | way |
Token ID | 835 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
civilisation | +8.445 |
paradise | +8.116 |
Construction | +7.684 |
rebuilt | +7.362 |
Built | +7.273 |
Neg logit contributions | |
percentages | -8.230 |
percentile | -7.830 |
pts | -7.603 |
inaccur | -7.285 |
percentage | -7.249 |
Token | it |
Token ID | 340 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
civilisation | +17.860 |
paradise | +16.754 |
rebuilt | +15.778 |
Construction | +15.653 |
transformed | +15.091 |
Neg logit contributions | |
percentages | -15.581 |
percentile | -15.084 |
pts | -14.296 |
disapprove | -14.113 |
inacc | -14.085 |
Token | is |
Token ID | 318 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
civilisation | +13.796 |
paradise | +13.295 |
rebuilt | +13.135 |
transformed | +12.389 |
Built | +12.304 |
Neg logit contributions | |
percentages | -18.305 |
percentile | -17.945 |
inacc | -17.508 |
disapprove | -16.937 |
unfavorable | -16.798 |
Token | ." |
Token ID | 526 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
civilisation | +13.273 |
paradise | +12.883 |
Construction | +12.796 |
rebuilt | +12.558 |
Built | +12.156 |
Neg logit contributions | |
percentages | -9.755 |
percentile | -8.788 |
pts | -8.451 |
percentage | -8.424 |
inacc | -8.271 |
Token | ( |
Token ID | 357 |
Feature activation | -5.05e-01 |
Pos logit contributions | |
civilisation | +1.882 |
Construction | +1.840 |
paradise | +1.767 |
Built | +1.711 |
Located | +1.694 |
Neg logit contributions | |
percentages | -2.485 |
percentile | -2.323 |
percentage | -2.232 |
unfavorable | -2.202 |
inaccur | -2.198 |
Token | Me |
Token ID | 5308 |
Feature activation | +6.37e+00 |
Pos logit contributions | |
civilisation | +0.377 |
Construction | +0.367 |
paradise | +0.349 |
Built | +0.338 |
Located | +0.336 |
Neg logit contributions | |
percentages | -0.571 |
percentile | -0.537 |
percentage | -0.520 |
unfavorable | -0.507 |
inaccur | -0.505 |
Token | aning |
Token ID | 7574 |
Feature activation | -5.69e+00 |
Pos logit contributions | |
percentages | +6.166 |
percentile | +5.724 |
percentage | +5.583 |
unfavorable | +5.345 |
pts | +5.338 |
Neg logit contributions | |
civilisation | -5.673 |
Construction | -5.521 |
paradise | -5.285 |
Built | -5.143 |
Located | -5.137 |
Token | its |
Token ID | 663 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
civilisation | +16.772 |
paradise | +15.489 |
Construction | +15.080 |
countryside | +14.478 |
rebuilt | +14.353 |
Neg logit contributions | |
percentages | -10.791 |
percentile | -10.409 |
pts | -9.467 |
inaccur | -9.232 |
disapprove | -9.183 |
Token | being |
Token ID | 852 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
civilisation | +12.411 |
paradise | +11.559 |
Construction | +11.359 |
rebuilt | +10.876 |
countryside | +10.815 |
Neg logit contributions | |
percentages | -8.730 |
percentile | -8.146 |
pts | -7.564 |
percent | -7.439 |
percentage | -7.422 |
Token | , |
Token ID | 11 |
Feature activation | -9.05e+00 |
Pos logit contributions | |
civilisation | +8.349 |
Construction | +8.007 |
paradise | +7.806 |
Built | +7.601 |
rebuilt | +7.573 |
Neg logit contributions | |
percentages | -5.565 |
percentile | -5.104 |
percentage | -4.727 |
pts | -4.649 |
offenses | -4.602 |
Token | but |
Token ID | 4360 |
Feature activation | -2.17e+01 |
Pos logit contributions | |
civilisation | +9.359 |
Construction | +8.938 |
paradise | +8.756 |
Built | +8.473 |
Building | +8.390 |
Neg logit contributions | |
percentages | -6.925 |
percentile | -6.484 |
percentage | -5.985 |
pts | -5.848 |
unfavorable | -5.798 |
Token | also |
Token ID | 635 |
Feature activation | -2.01e+01 |
Pos logit contributions | |
civilisation | +20.781 |
paradise | +19.548 |
Construction | +19.361 |
rebuilt | +18.491 |
transformed | +18.489 |
Neg logit contributions | |
percentages | -12.468 |
percentile | -11.515 |
pts | -10.341 |
percentage | -10.243 |
disapprove | -10.205 |
Token | in |
Token ID | 287 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
civilisation | +19.707 |
Construction | +18.596 |
paradise | +18.395 |
rebuilt | +17.603 |
transformed | +17.600 |
Neg logit contributions | |
percentages | -11.562 |
percentile | -10.646 |
percentage | -9.525 |
pts | -9.506 |
offenses | -9.498 |
Token | its |
Token ID | 663 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
civilisation | +22.655 |
paradise | +21.025 |
Construction | +20.270 |
ufact | +19.756 |
transformed | +19.598 |
Neg logit contributions | |
percentages | -14.688 |
percentile | -13.875 |
pts | -12.730 |
disapprove | -12.480 |
percent | -12.405 |
Token | process |
Token ID | 1429 |
Feature activation | -7.68e+00 |
Pos logit contributions | |
civilisation | +16.093 |
paradise | +14.899 |
Construction | +14.507 |
rebuilt | +13.964 |
countryside | +13.929 |
Neg logit contributions | |
percentages | -10.387 |
percentile | -9.606 |
pts | -9.055 |
percent | -9.026 |
percentage | -8.673 |
Token | . |
Token ID | 13 |
Feature activation | -2.60e+01 |
Pos logit contributions | |
civilisation | +9.987 |
Construction | +9.749 |
paradise | +9.413 |
Built | +9.201 |
Building | +9.160 |
Neg logit contributions | |
percentages | -4.030 |
percentile | -3.556 |
percentage | -3.216 |
unfavorable | -3.104 |
pts | -3.072 |
Token | Contrary |
Token ID | 43607 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
Construction | +22.343 |
Building | +21.585 |
civilisation | +21.501 |
Built | +21.421 |
Located | +21.009 |
Neg logit contributions | |
percentages | -14.989 |
percentile | -13.852 |
inaccur | -12.948 |
unfavorable | -12.720 |
percentage | -12.558 |
Token | to |
Token ID | 284 |
Feature activation | -9.85e+00 |
Pos logit contributions | |
civilisation | +9.965 |
Construction | +9.469 |
paradise | +9.213 |
Built | +8.675 |
issance | +8.640 |
Neg logit contributions | |
percentages | -11.682 |
percentile | -11.195 |
percentage | -10.400 |
inacc | -10.199 |
unfavorable | -10.164 |
Token | works |
Token ID | 2499 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
civilisation | +7.161 |
paradise | +6.881 |
Construction | +6.850 |
rebuilt | +6.797 |
Built | +6.449 |
Neg logit contributions | |
percentages | -9.175 |
percentile | -8.599 |
pts | -8.231 |
percentage | -8.224 |
unfavorable | -8.204 |
Token | hard |
Token ID | 1327 |
Feature activation | -4.78e+00 |
Pos logit contributions | |
civilisation | +1.670 |
Construction | +1.601 |
paradise | +1.588 |
Built | +1.490 |
Located | +1.486 |
Neg logit contributions | |
percentages | -1.653 |
percentile | -1.527 |
percentage | -1.477 |
pts | -1.449 |
unfavorable | -1.436 |
Token | at |
Token ID | 379 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
civilisation | +4.927 |
Construction | +4.775 |
paradise | +4.735 |
rebuilt | +4.460 |
ufact | +4.439 |
Neg logit contributions | |
percentages | -3.813 |
percentile | -3.504 |
percentage | -3.325 |
pts | -3.298 |
unfavorable | -3.281 |
Token | her |
Token ID | 607 |
Feature activation | -7.86e+00 |
Pos logit contributions | |
civilisation | +13.222 |
paradise | +12.768 |
Construction | +12.503 |
rebuilt | +11.848 |
Building | +11.631 |
Neg logit contributions | |
percentages | -10.773 |
percentile | -10.192 |
unfavorable | -9.734 |
disapprove | -9.703 |
pts | -9.618 |
Token | job |
Token ID | 1693 |
Feature activation | +2.86e-01 |
Pos logit contributions | |
civilisation | +5.956 |
paradise | +5.730 |
Construction | +5.725 |
rebuilt | +5.307 |
Located | +5.216 |
Neg logit contributions | |
percentages | -7.834 |
percentile | -7.452 |
pts | -7.181 |
unfavorable | -7.158 |
disapprove | -7.112 |
Token | and |
Token ID | 290 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
percentages | +0.237 |
percentile | +0.218 |
percentage | +0.209 |
pts | +0.202 |
unfavorable | +0.202 |
Neg logit contributions | |
civilisation | -0.300 |
Construction | -0.290 |
paradise | -0.283 |
Built | -0.272 |
Located | -0.271 |
Token | has |
Token ID | 468 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
civilisation | +19.683 |
paradise | +19.246 |
rebuilt | +18.808 |
Construction | +18.314 |
transformed | +17.816 |
Neg logit contributions | |
percentages | -13.791 |
percentile | -12.931 |
disapprove | -12.738 |
pts | -12.573 |
unfavorable | -12.422 |
Token | great |
Token ID | 1049 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
civilisation | +13.226 |
rebuilt | +13.031 |
paradise | +12.968 |
transformed | +12.378 |
Construction | +12.370 |
Neg logit contributions | |
percentages | -12.313 |
percentile | -11.374 |
disapprove | -11.267 |
pts | -11.048 |
percentage | -10.880 |
Token | relationships |
Token ID | 6958 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
civilisation | +4.016 |
Construction | +3.806 |
paradise | +3.764 |
rebuilt | +3.544 |
Located | +3.517 |
Neg logit contributions | |
percentages | -3.977 |
percentile | -3.739 |
percentage | -3.560 |
pts | -3.531 |
unfavorable | -3.524 |
Token | with |
Token ID | 351 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
civilisation | +9.039 |
paradise | +8.819 |
Construction | +8.638 |
rebuilt | +8.420 |
Built | +8.182 |
Neg logit contributions | |
percentages | -9.759 |
percentile | -9.065 |
percentage | -8.675 |
pts | -8.656 |
inacc | -8.594 |
Token | people |
Token ID | 661 |
Feature activation | +3.27e-01 |
Pos logit contributions | |
civilisation | +0.645 |
Construction | +0.615 |
paradise | +0.600 |
Built | +0.573 |
Located | +0.568 |
Neg logit contributions | |
percentages | -0.723 |
percentile | -0.673 |
percentage | -0.650 |
pts | -0.633 |
unfavorable | -0.632 |
Token | only |
Token ID | 691 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
civilisation | +0.920 |
Construction | +0.878 |
paradise | +0.874 |
rebuilt | +0.830 |
Built | +0.830 |
Neg logit contributions | |
percentages | -0.696 |
percentile | -0.630 |
percentage | -0.600 |
unfavorable | -0.590 |
pts | -0.588 |
Token | speculate |
Token ID | 26256 |
Feature activation | -5.04e+00 |
Pos logit contributions | |
civilisation | +1.394 |
Construction | +1.336 |
paradise | +1.331 |
Built | +1.272 |
rebuilt | +1.270 |
Neg logit contributions | |
percentages | -0.775 |
percentile | -0.688 |
percentage | -0.649 |
unfavorable | -0.630 |
pts | -0.630 |
Token | what |
Token ID | 644 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
civilisation | +4.920 |
paradise | +4.658 |
Construction | +4.652 |
rebuilt | +4.332 |
Built | +4.316 |
Neg logit contributions | |
percentages | -4.401 |
percentile | -4.106 |
percentage | -3.910 |
pts | -3.813 |
offenses | -3.783 |
Token | it |
Token ID | 340 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
civilisation | +26.587 |
paradise | +24.502 |
transformed | +23.623 |
rebuilt | +23.050 |
Construction | +22.749 |
Neg logit contributions | |
percentages | -12.180 |
percentile | -11.789 |
pts | -11.647 |
percent | -11.231 |
disapprove | -10.848 |
Token | was |
Token ID | 373 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
civilisation | +16.240 |
paradise | +15.144 |
rebuilt | +15.011 |
transformed | +14.739 |
revital | +14.052 |
Neg logit contributions | |
percentages | -15.815 |
percentile | -14.865 |
inacc | -14.707 |
unfavorable | -14.627 |
pts | -14.372 |
Token | for |
Token ID | 329 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
civilisation | +17.827 |
paradise | +17.141 |
rebuilt | +16.197 |
Construction | +15.972 |
transformed | +15.574 |
Neg logit contributions | |
percentages | -12.939 |
percentile | -11.861 |
pts | -11.522 |
offenses | -11.082 |
percentage | -11.014 |
Token | . |
Token ID | 13 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
civilisation | +20.249 |
paradise | +18.778 |
Construction | +18.524 |
rebuilt | +17.523 |
Harbour | +17.185 |
Neg logit contributions | |
percentages | -13.787 |
percentile | -13.016 |
pts | -11.631 |
disapprove | -11.592 |
percent | -11.560 |
Token | It |
Token ID | 632 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
Construction | +15.931 |
civilisation | +15.161 |
Built | +14.863 |
Harbour | +14.790 |
Building | +14.745 |
Neg logit contributions | |
percentages | -16.944 |
regress | -15.759 |
percentile | -15.741 |
disapprove | -15.583 |
offenses | -15.562 |
Token | might |
Token ID | 1244 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
civilisation | +14.746 |
paradise | +13.872 |
rebuilt | +13.855 |
transformed | +13.603 |
revital | +13.115 |
Neg logit contributions | |
percentages | -15.203 |
percentile | -14.105 |
pts | -13.627 |
inacc | -13.622 |
Percent | -13.536 |
Token | have |
Token ID | 423 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
civilisation | +2.339 |
Construction | +2.219 |
paradise | +2.219 |
Built | +2.114 |
Located | +2.111 |
Neg logit contributions | |
percentages | -1.490 |
percentile | -1.329 |
percentage | -1.255 |
pts | -1.232 |
unfavorable | -1.229 |
Token | been |
Token ID | 587 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
civilisation | +19.182 |
transformed | +18.237 |
rebuilt | +18.064 |
paradise | +17.821 |
revital | +17.338 |
Neg logit contributions | |
percentages | -16.646 |
percentile | -15.733 |
Percent | -15.461 |
percent | -15.386 |
inacc | -15.012 |