Token | good |
Token ID | 922 |
Feature activation | +8.57e-01 |
Pos logit contributions | |
damaging | +9.105 |
meaningful | +8.950 |
categ | +8.731 |
contrasting | +8.728 |
compelling | +8.637 |
Neg logit contributions | |
eers | -11.448 |
culosis | -10.945 |
Transactions | -10.549 |
Companies | -10.081 |
Works | -10.043 |
Token | job |
Token ID | 1693 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
damaging | +4.222 |
meaningful | +4.147 |
categ | +4.090 |
contrasting | +4.073 |
insofar | +4.044 |
Neg logit contributions | |
eers | -4.731 |
culosis | -4.386 |
Transactions | -4.169 |
Works | -4.130 |
Companies | -4.038 |
Token | repeatedly |
Token ID | 7830 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
damaging | +9.830 |
meaningful | +9.560 |
contrasting | +9.540 |
categ | +9.391 |
insofar | +9.365 |
Neg logit contributions | |
eers | -12.110 |
culosis | -11.489 |
Transactions | -11.182 |
Works | -10.686 |
Facility | -10.582 |
Token | pressing |
Token ID | 12273 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
damaging | +9.350 |
contrasting | +9.092 |
meaningful | +8.983 |
ignoring | +8.841 |
categ | +8.826 |
Neg logit contributions | |
eers | -14.084 |
culosis | -13.341 |
Transactions | -13.076 |
Works | -12.517 |
Facility | -12.455 |
Token | on |
Token ID | 319 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
damaging | +9.356 |
meaningful | +9.145 |
contrasting | +8.990 |
categ | +8.958 |
insofar | +8.893 |
Neg logit contributions | |
eers | -10.519 |
culosis | -9.941 |
Transactions | -9.521 |
Works | -9.121 |
Companies | -9.016 |
Token | Trump |
Token ID | 1301 |
Feature activation | +4.37e+00 |
Pos logit contributions | |
damaging | +9.435 |
meaningful | +9.233 |
categ | +9.059 |
contrasting | +9.056 |
insofar | +9.016 |
Neg logit contributions | |
eers | -9.926 |
culosis | -9.313 |
Transactions | -8.929 |
Works | -8.558 |
Companies | -8.454 |
Token | � |
Token ID | 447 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
damaging | +21.465 |
meaningful | +20.736 |
insofar | +20.632 |
whether | +20.579 |
contrasting | +20.474 |
Neg logit contributions | |
eers | -17.153 |
culosis | -16.069 |
Transactions | -15.699 |
Works | -14.346 |
Facility | -14.309 |
Token | � |
Token ID | 247 |
Feature activation | +3.31e-01 |
Pos logit contributions | |
damaging | +1.730 |
meaningful | +1.699 |
categ | +1.672 |
contrasting | +1.669 |
insofar | +1.666 |
Neg logit contributions | |
eers | -1.404 |
culosis | -1.301 |
Transactions | -1.233 |
Works | -1.188 |
Companies | -1.170 |
Token | s |
Token ID | 82 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
damaging | +2.052 |
meaningful | +2.039 |
contrasting | +2.022 |
categ | +2.020 |
insofar | +1.989 |
Neg logit contributions | |
eers | -1.387 |
culosis | -1.280 |
Transactions | -1.169 |
Works | -1.154 |
Companies | -1.122 |
Token | essentially |
Token ID | 6986 |
Feature activation | +2.01e+00 |
Pos logit contributions | |
damaging | +11.932 |
meaningful | +11.525 |
categ | +11.442 |
contrasting | +11.379 |
ignoring | +11.109 |
Neg logit contributions | |
eers | -11.457 |
culosis | -11.022 |
Transactions | -10.486 |
Works | -9.892 |
Queue | -9.830 |
Token | admitted |
Token ID | 6848 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
damaging | +9.007 |
meaningful | +8.759 |
categ | +8.696 |
contrasting | +8.610 |
insofar | +8.477 |
Neg logit contributions | |
eers | -11.678 |
culosis | -11.101 |
Transactions | -10.665 |
Works | -10.279 |
Companies | -10.191 |
Token | criticism |
Token ID | 7734 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
damaging | +8.439 |
meaningful | +8.292 |
categ | +8.205 |
contrasting | +8.152 |
insofar | +8.026 |
Neg logit contributions | |
eers | -10.163 |
culosis | -9.591 |
Transactions | -9.282 |
Works | -8.915 |
Facility | -8.851 |
Token | of |
Token ID | 286 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
damaging | +7.709 |
meaningful | +7.574 |
categ | +7.456 |
contrasting | +7.426 |
insofar | +7.400 |
Neg logit contributions | |
eers | -8.367 |
culosis | -7.791 |
Transactions | -7.453 |
Works | -7.261 |
Companies | -7.169 |
Token | Trump |
Token ID | 1301 |
Feature activation | +2.95e+00 |
Pos logit contributions | |
damaging | +5.976 |
meaningful | +5.864 |
categ | +5.774 |
contrasting | +5.766 |
insofar | +5.763 |
Neg logit contributions | |
eers | -6.856 |
culosis | -6.385 |
Transactions | -6.142 |
Works | -5.991 |
Companies | -5.909 |
Token | on |
Token ID | 319 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
damaging | +17.390 |
contrasting | +16.898 |
meaningful | +16.838 |
insofar | +16.780 |
categ | +16.766 |
Neg logit contributions | |
eers | -11.471 |
culosis | -10.564 |
Transactions | -10.071 |
Works | -9.336 |
Facility | -9.321 |
Token | Thursday |
Token ID | 3635 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
damaging | +7.915 |
meaningful | +7.726 |
contrasting | +7.622 |
categ | +7.613 |
insofar | +7.534 |
Neg logit contributions | |
eers | -8.646 |
culosis | -8.101 |
Transactions | -7.766 |
Works | -7.491 |
Companies | -7.392 |
Token | , |
Token ID | 11 |
Feature activation | +4.26e+00 |
Pos logit contributions | |
damaging | +14.883 |
contrasting | +14.567 |
meaningful | +14.288 |
insofar | +14.256 |
categ | +14.111 |
Neg logit contributions | |
eers | -16.954 |
culosis | -16.211 |
Transactions | -15.730 |
Works | -14.707 |
Facility | -14.690 |
Token | saying |
Token ID | 2282 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
contrasting | +18.473 |
damaging | +18.310 |
ignoring | +17.812 |
categ | +17.685 |
meaningful | +17.395 |
Neg logit contributions | |
eers | -20.832 |
culosis | -19.668 |
Transactions | -19.261 |
Queue | -17.823 |
Works | -17.716 |
Token | he |
Token ID | 339 |
Feature activation | +9.93e-01 |
Pos logit contributions | |
damaging | +6.781 |
meaningful | +6.646 |
categ | +6.540 |
contrasting | +6.533 |
insofar | +6.503 |
Neg logit contributions | |
eers | -7.098 |
culosis | -6.637 |
Transactions | -6.346 |
Works | -6.150 |
Companies | -6.066 |
Token | was |
Token ID | 373 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
damaging | +6.713 |
meaningful | +6.612 |
categ | +6.535 |
contrasting | +6.532 |
insofar | +6.506 |
Neg logit contributions | |
eers | -3.592 |
culosis | -3.249 |
Transactions | -3.047 |
Works | -2.884 |
Companies | -2.833 |
Token | � |
Token ID | 564 |
Feature activation | +2.15e+00 |
Pos logit contributions | |
damaging | +7.381 |
meaningful | +7.158 |
categ | +7.038 |
contrasting | +7.021 |
insofar | +6.908 |
Neg logit contributions | |
eers | -11.734 |
culosis | -11.116 |
Transactions | -10.729 |
Works | -10.405 |
Companies | -10.306 |
Token | � |
Token ID | 250 |
Feature activation | +7.95e-01 |
Pos logit contributions | |
damaging | +12.625 |
meaningful | +12.363 |
contrasting | +12.216 |
categ | +12.174 |
ignoring | +12.151 |
Neg logit contributions | |
eers | -8.803 |
culosis | -8.130 |
Transactions | -7.729 |
Works | -7.273 |
Companies | -7.188 |
Token | is |
Token ID | 318 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
eers | +3.368 |
culosis | +2.883 |
Works | +2.751 |
Transactions | +2.696 |
Companies | +2.562 |
Neg logit contributions | |
damaging | -6.002 |
meaningful | -5.925 |
categ | -5.877 |
contrasting | -5.776 |
insofar | -5.764 |
Token | unclear |
Token ID | 10061 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
damaging | +1.793 |
meaningful | +1.732 |
categ | +1.714 |
contrasting | +1.712 |
insofar | +1.696 |
Neg logit contributions | |
eers | -3.434 |
culosis | -3.207 |
Transactions | -3.126 |
Works | -3.073 |
Companies | -3.034 |
Token | whether |
Token ID | 1771 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
damaging | +4.097 |
meaningful | +3.976 |
categ | +3.909 |
contrasting | +3.888 |
insofar | +3.796 |
Neg logit contributions | |
eers | -7.472 |
culosis | -7.027 |
Transactions | -6.799 |
Works | -6.698 |
Companies | -6.589 |
Token | these |
Token ID | 777 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
damaging | +4.097 |
meaningful | +4.004 |
categ | +3.949 |
insofar | +3.934 |
contrasting | +3.934 |
Neg logit contributions | |
eers | -4.106 |
culosis | -3.775 |
Transactions | -3.624 |
Works | -3.547 |
Companies | -3.489 |
Token | disagreements |
Token ID | 37990 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
damaging | +2.611 |
meaningful | +2.553 |
insofar | +2.513 |
categ | +2.511 |
contrasting | +2.477 |
Neg logit contributions | |
eers | -2.845 |
culosis | -2.611 |
Transactions | -2.530 |
Works | -2.490 |
Companies | -2.429 |
Token | reflect |
Token ID | 4079 |
Feature activation | +4.24e+00 |
Pos logit contributions | |
damaging | +9.289 |
meaningful | +9.145 |
contrasting | +9.054 |
insofar | +9.038 |
categ | +8.970 |
Neg logit contributions | |
eers | -7.061 |
culosis | -6.560 |
Transactions | -6.267 |
Works | -5.943 |
Companies | -5.915 |
Token | a |
Token ID | 257 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
meaningful | +20.379 |
contrasting | +20.054 |
damaging | +19.732 |
categ | +19.627 |
consequential | +19.403 |
Neg logit contributions | |
culosis | -17.580 |
eers | -17.035 |
Transactions | -16.033 |
Facility | -15.288 |
Companies | -15.182 |
Token | real |
Token ID | 1103 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
meaningful | +16.079 |
damaging | +15.898 |
contrasting | +15.814 |
categ | +15.798 |
compelling | +15.319 |
Neg logit contributions | |
eers | -14.919 |
culosis | -14.456 |
Transactions | -13.702 |
Companies | -12.908 |
Queue | -12.864 |
Token | difference |
Token ID | 3580 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
damaging | +12.813 |
meaningful | +12.733 |
categ | +12.590 |
contrasting | +12.588 |
insofar | +12.217 |
Neg logit contributions | |
eers | -12.410 |
culosis | -11.829 |
Transactions | -11.312 |
Companies | -10.792 |
Queue | -10.683 |
Token | in |
Token ID | 287 |
Feature activation | +1.72e+00 |
Pos logit contributions | |
damaging | +4.168 |
meaningful | +4.035 |
categ | +3.972 |
contrasting | +3.937 |
insofar | +3.860 |
Neg logit contributions | |
eers | -6.395 |
culosis | -5.967 |
Transactions | -5.777 |
Works | -5.670 |
Companies | -5.603 |
Token | the |
Token ID | 262 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
damaging | +8.235 |
meaningful | +8.163 |
contrasting | +8.041 |
categ | +7.992 |
insofar | +7.876 |
Neg logit contributions | |
eers | -9.391 |
culosis | -8.933 |
Transactions | -8.510 |
Works | -8.141 |
Companies | -8.121 |
Token | points |
Token ID | 2173 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
eers | +1.268 |
culosis | +1.115 |
Transactions | +1.044 |
Works | +1.028 |
Queue | +1.021 |
Neg logit contributions | |
damaging | -1.781 |
categ | -1.757 |
insofar | -1.748 |
meaningful | -1.742 |
contrasting | -1.722 |
Token | on |
Token ID | 319 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
damaging | +7.699 |
meaningful | +7.531 |
categ | +7.396 |
contrasting | +7.395 |
insofar | +7.355 |
Neg logit contributions | |
eers | -9.887 |
culosis | -9.292 |
Transactions | -8.936 |
Works | -8.688 |
Companies | -8.584 |
Token | criminal |
Token ID | 4301 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
damaging | +6.234 |
meaningful | +6.105 |
categ | +5.994 |
contrasting | +5.993 |
insofar | +5.952 |
Neg logit contributions | |
eers | -7.702 |
culosis | -7.225 |
Transactions | -6.951 |
Works | -6.750 |
Companies | -6.671 |
Token | justice |
Token ID | 5316 |
Feature activation | +8.94e-01 |
Pos logit contributions | |
damaging | +3.372 |
meaningful | +3.303 |
categ | +3.237 |
insofar | +3.215 |
contrasting | +3.186 |
Neg logit contributions | |
eers | -7.732 |
culosis | -7.331 |
Transactions | -7.097 |
Works | -6.951 |
Companies | -6.868 |
Token | reform |
Token ID | 4975 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
damaging | +4.215 |
meaningful | +4.132 |
categ | +4.100 |
insofar | +4.043 |
contrasting | +4.026 |
Neg logit contributions | |
eers | -5.116 |
culosis | -4.741 |
Transactions | -4.555 |
Works | -4.506 |
Companies | -4.395 |
Token | , |
Token ID | 11 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
damaging | +5.593 |
meaningful | +5.470 |
categ | +5.413 |
contrasting | +5.360 |
insofar | +5.349 |
Neg logit contributions | |
eers | -6.742 |
culosis | -6.267 |
Transactions | -5.996 |
Works | -5.891 |
Companies | -5.795 |
Token | job |
Token ID | 1693 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
damaging | +20.184 |
contrasting | +19.999 |
meaningful | +19.752 |
ignoring | +19.470 |
compelling | +19.199 |
Neg logit contributions | |
eers | -17.772 |
culosis | -16.394 |
Transactions | -16.255 |
Queue | -15.370 |
Facility | -15.020 |
Token | creation |
Token ID | 6282 |
Feature activation | -1.92e-03 |
Pos logit contributions | |
damaging | +3.176 |
meaningful | +3.153 |
insofar | +3.128 |
categ | +3.116 |
contrasting | +3.082 |
Neg logit contributions | |
eers | -3.282 |
culosis | -3.009 |
Transactions | -2.879 |
Works | -2.837 |
Companies | -2.761 |
Token | and |
Token ID | 290 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
eers | +0.011 |
culosis | +0.010 |
Works | +0.010 |
Transactions | +0.009 |
Companies | +0.009 |
Neg logit contributions | |
damaging | -0.009 |
meaningful | -0.009 |
categ | -0.009 |
contrasting | -0.009 |
insofar | -0.009 |
Token | increasing |
Token ID | 3649 |
Feature activation | +9.29e-01 |
Pos logit contributions | |
damaging | +9.207 |
meaningful | +9.085 |
contrasting | +8.894 |
categ | +8.796 |
insofar | +8.676 |
Neg logit contributions | |
eers | -10.724 |
culosis | -10.087 |
Transactions | -9.777 |
Works | -9.339 |
Queue | -9.315 |
Token | minimum |
Token ID | 5288 |
Feature activation | +4.17e-01 |
Pos logit contributions | |
damaging | +4.414 |
meaningful | +4.304 |
insofar | +4.257 |
categ | +4.249 |
contrasting | +4.240 |
Neg logit contributions | |
eers | -5.257 |
culosis | -4.890 |
Transactions | -4.707 |
Works | -4.620 |
Companies | -4.535 |
Token | ically |
Token ID | 1146 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
damaging | +3.304 |
meaningful | +3.228 |
categ | +3.191 |
contrasting | +3.186 |
consequential | +3.169 |
Neg logit contributions | |
eers | -2.258 |
culosis | -2.025 |
Transactions | -1.893 |
Works | -1.865 |
Companies | -1.795 |
Token | as |
Token ID | 355 |
Feature activation | +1.68e+00 |
Pos logit contributions | |
damaging | +10.499 |
meaningful | +10.319 |
insofar | +10.157 |
contrasting | +10.148 |
categ | +10.067 |
Neg logit contributions | |
eers | -13.347 |
culosis | -12.673 |
Transactions | -12.098 |
Works | -11.701 |
Companies | -11.604 |
Token | cos |
Token ID | 8615 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
damaging | +8.239 |
meaningful | +8.109 |
categ | +7.962 |
contrasting | +7.949 |
insofar | +7.917 |
Neg logit contributions | |
eers | -9.167 |
culosis | -8.637 |
Transactions | -8.223 |
Works | -7.945 |
Companies | -7.867 |
Token | m |
Token ID | 76 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
damaging | +6.888 |
meaningful | +6.741 |
contrasting | +6.663 |
categ | +6.651 |
insofar | +6.612 |
Neg logit contributions | |
eers | -6.012 |
culosis | -5.549 |
Transactions | -5.294 |
Works | -5.136 |
Companies | -5.061 |
Token | ological |
Token ID | 2770 |
Feature activation | +6.26e-01 |
Pos logit contributions | |
eers | +3.785 |
culosis | +3.377 |
Transactions | +3.159 |
Works | +3.005 |
arium | +2.803 |
Neg logit contributions | |
damaging | -7.512 |
consequential | -7.459 |
ignoring | -7.426 |
wounding | -7.421 |
categ | -7.418 |
Token | , |
Token ID | 11 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
damaging | +2.984 |
meaningful | +2.878 |
contrasting | +2.847 |
categ | +2.824 |
insofar | +2.812 |
Neg logit contributions | |
eers | -3.567 |
culosis | -3.231 |
Transactions | -3.220 |
Works | -3.147 |
Companies | -3.072 |
Token | psychological |
Token ID | 10590 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
meaningful | +19.940 |
damaging | +19.783 |
insofar | +19.691 |
categ | +19.524 |
contrasting | +19.452 |
Neg logit contributions | |
eers | -18.050 |
culosis | -16.926 |
Transactions | -15.597 |
Facility | -15.117 |
Companies | -14.900 |
Token | or |
Token ID | 393 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
damaging | +7.823 |
meaningful | +7.665 |
categ | +7.536 |
contrasting | +7.526 |
insofar | +7.494 |
Neg logit contributions | |
eers | -9.423 |
culosis | -8.847 |
Transactions | -8.480 |
Works | -8.239 |
Companies | -8.146 |
Token | philosophical |
Token ID | 17580 |
Feature activation | +1.75e+00 |
Pos logit contributions | |
damaging | +10.841 |
meaningful | +10.827 |
categ | +10.601 |
contrasting | +10.464 |
insofar | +10.461 |
Neg logit contributions | |
eers | -14.296 |
culosis | -13.440 |
Transactions | -12.819 |
Companies | -12.420 |
Facility | -12.400 |
Token | messages |
Token ID | 6218 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
damaging | +8.713 |
meaningful | +8.580 |
categ | +8.440 |
contrasting | +8.427 |
insofar | +8.419 |
Neg logit contributions | |
eers | -9.319 |
culosis | -8.796 |
Transactions | -8.323 |
Works | -8.046 |
Companies | -7.999 |
Token | .[ |
Token ID | 3693 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
damaging | +5.349 |
meaningful | +5.214 |
categ | +5.143 |
contrasting | +5.092 |
insofar | +5.074 |
Neg logit contributions | |
eers | -7.109 |
culosis | -6.616 |
Transactions | -6.388 |
Works | -6.249 |
Companies | -6.166 |
Token | dinner |
Token ID | 8073 |
Feature activation | -9.16e-02 |
Pos logit contributions | |
damaging | +7.100 |
meaningful | +6.992 |
contrasting | +6.876 |
categ | +6.868 |
insofar | +6.778 |
Neg logit contributions | |
eers | -6.631 |
culosis | -6.194 |
Transactions | -5.895 |
Works | -5.673 |
Companies | -5.618 |
Token | to |
Token ID | 284 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
eers | +0.525 |
culosis | +0.480 |
Transactions | +0.462 |
Works | +0.457 |
Facility | +0.454 |
Neg logit contributions | |
damaging | -0.413 |
categ | -0.405 |
meaningful | -0.401 |
insofar | -0.400 |
contrasting | -0.392 |
Token | discuss |
Token ID | 2112 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
eers | +5.103 |
culosis | +4.708 |
Companies | +4.377 |
Transactions | +4.356 |
Works | +4.292 |
Neg logit contributions | |
damaging | -5.072 |
categ | -5.051 |
insofar | -4.999 |
meaningful | -4.889 |
wounding | -4.830 |
Token | foreign |
Token ID | 3215 |
Feature activation | +9.51e-01 |
Pos logit contributions | |
damaging | +6.451 |
meaningful | +6.327 |
categ | +6.229 |
contrasting | +6.220 |
insofar | +6.196 |
Neg logit contributions | |
eers | -6.802 |
culosis | -6.344 |
Transactions | -6.077 |
Works | -5.895 |
Companies | -5.817 |
Token | policy |
Token ID | 2450 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
damaging | +4.677 |
meaningful | +4.581 |
categ | +4.520 |
insofar | +4.509 |
contrasting | +4.496 |
Neg logit contributions | |
eers | -5.262 |
culosis | -4.900 |
Transactions | -4.724 |
Works | -4.567 |
Companies | -4.523 |
Token | , |
Token ID | 11 |
Feature activation | +4.02e+00 |
Pos logit contributions | |
damaging | +5.985 |
meaningful | +5.861 |
categ | +5.795 |
contrasting | +5.747 |
insofar | +5.720 |
Neg logit contributions | |
eers | -6.573 |
culosis | -6.059 |
Transactions | -5.865 |
Works | -5.680 |
Companies | -5.605 |
Token | including |
Token ID | 1390 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
damaging | +19.648 |
contrasting | +19.210 |
meaningful | +19.064 |
insofar | +18.919 |
ignoring | +18.914 |
Neg logit contributions | |
eers | -15.882 |
culosis | -15.581 |
Transactions | -14.583 |
Queue | -14.353 |
Works | -14.007 |
Token | Russia |
Token ID | 3284 |
Feature activation | +2.29e+00 |
Pos logit contributions | |
damaging | +7.621 |
meaningful | +7.475 |
contrasting | +7.354 |
categ | +7.347 |
insofar | +7.313 |
Neg logit contributions | |
eers | -7.786 |
culosis | -7.279 |
Transactions | -6.959 |
Works | -6.741 |
Companies | -6.653 |
Token | and |
Token ID | 290 |
Feature activation | +8.81e-01 |
Pos logit contributions | |
damaging | +15.069 |
meaningful | +14.795 |
categ | +14.667 |
contrasting | +14.654 |
insofar | +14.644 |
Neg logit contributions | |
eers | -8.181 |
culosis | -7.399 |
Transactions | -6.911 |
Works | -6.536 |
Companies | -6.422 |
Token | EU |
Token ID | 4576 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
damaging | +5.036 |
meaningful | +4.944 |
categ | +4.906 |
insofar | +4.875 |
contrasting | +4.871 |
Neg logit contributions | |
eers | -4.154 |
culosis | -3.797 |
Transactions | -3.616 |
Works | -3.513 |
Companies | -3.459 |
Token | assistance |
Token ID | 6829 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
damaging | +3.449 |
meaningful | +3.390 |
categ | +3.340 |
contrasting | +3.333 |
insofar | +3.323 |
Neg logit contributions | |
eers | -3.409 |
culosis | -3.157 |
Transactions | -3.029 |
Works | -2.942 |
Companies | -2.886 |
Token | of |
Token ID | 286 |
Feature activation | +7.37e-01 |
Pos logit contributions | |
damaging | +3.029 |
meaningful | +3.007 |
contrasting | +2.944 |
categ | +2.943 |
insofar | +2.912 |
Neg logit contributions | |
eers | -3.273 |
culosis | -3.050 |
Transactions | -2.897 |
Companies | -2.845 |
Works | -2.839 |
Token | the |
Token ID | 262 |
Feature activation | +5.42e-01 |
Pos logit contributions | |
damaging | +3.587 |
meaningful | +3.488 |
contrasting | +3.461 |
insofar | +3.456 |
categ | +3.419 |
Neg logit contributions | |
eers | -4.086 |
culosis | -3.809 |
Transactions | -3.675 |
Works | -3.608 |
Companies | -3.555 |
Token | office |
Token ID | 2607 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
damaging | +3.312 |
meaningful | +3.255 |
contrasting | +3.221 |
insofar | +3.219 |
categ | +3.204 |
Neg logit contributions | |
eers | -2.312 |
culosis | -2.114 |
Transactions | -2.017 |
Works | -1.959 |
Companies | -1.913 |
Token | as |
Token ID | 355 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
damaging | +7.726 |
meaningful | +7.620 |
categ | +7.522 |
contrasting | +7.520 |
insofar | +7.489 |
Neg logit contributions | |
eers | -4.298 |
culosis | -3.880 |
Transactions | -3.638 |
Works | -3.479 |
Companies | -3.410 |
Token | dysfunctional |
Token ID | 38127 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
damaging | +5.060 |
meaningful | +4.948 |
contrasting | +4.846 |
categ | +4.836 |
insofar | +4.830 |
Neg logit contributions | |
eers | -8.034 |
culosis | -7.577 |
Transactions | -7.309 |
Works | -7.143 |
Companies | -7.073 |
Token | , |
Token ID | 11 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
damaging | +7.560 |
meaningful | +7.407 |
categ | +7.280 |
contrasting | +7.276 |
insofar | +7.223 |
Neg logit contributions | |
eers | -9.021 |
culosis | -8.431 |
Transactions | -8.105 |
Works | -7.885 |
Companies | -7.793 |
Token | committing |
Token ID | 17222 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
damaging | +20.481 |
ignoring | +19.643 |
meaningful | +19.506 |
categ | +19.500 |
contrasting | +19.348 |
Neg logit contributions | |
eers | -16.179 |
culosis | -15.074 |
Transactions | -14.220 |
Works | -13.257 |
ttes | -12.968 |
Token | to |
Token ID | 284 |
Feature activation | +7.84e-01 |
Pos logit contributions | |
damaging | +2.310 |
meaningful | +2.260 |
insofar | +2.252 |
contrasting | +2.250 |
categ | +2.217 |
Neg logit contributions | |
eers | -2.309 |
culosis | -2.106 |
Transactions | -2.047 |
Works | -2.010 |
Companies | -1.976 |
Token | annual |
Token ID | 5079 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
damaging | +3.602 |
meaningful | +3.502 |
contrasting | +3.461 |
insofar | +3.458 |
categ | +3.457 |
Neg logit contributions | |
eers | -4.556 |
culosis | -4.263 |
Transactions | -4.110 |
Works | -4.007 |
Companies | -3.956 |
Token | surveys |
Token ID | 16255 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
damaging | +3.181 |
meaningful | +3.099 |
insofar | +3.087 |
contrasting | +3.083 |
categ | +3.065 |
Neg logit contributions | |
eers | -2.516 |
culosis | -2.306 |
Transactions | -2.205 |
Works | -2.146 |
Facility | -2.091 |
Token | of |
Token ID | 286 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
damaging | +0.739 |
categ | +0.714 |
meaningful | +0.711 |
contrasting | +0.698 |
consequential | +0.696 |
Neg logit contributions | |
eers | -1.050 |
culosis | -0.969 |
Transactions | -0.939 |
Works | -0.931 |
Companies | -0.924 |
Token | what |
Token ID | 644 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
damaging | +9.442 |
meaningful | +9.311 |
categ | +9.185 |
contrasting | +9.150 |
insofar | +9.026 |
Neg logit contributions | |
eers | -11.216 |
culosis | -10.628 |
Transactions | -10.072 |
Works | -9.718 |
Facility | -9.648 |
Token | constitutes |
Token ID | 19300 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
damaging | +1.983 |
meaningful | +1.933 |
contrasting | +1.911 |
insofar | +1.910 |
categ | +1.909 |
Neg logit contributions | |
eers | -1.733 |
culosis | -1.590 |
Transactions | -1.533 |
Works | -1.494 |
Companies | -1.468 |
Token | the |
Token ID | 262 |
Feature activation | +1.20e+00 |
Pos logit contributions | |
damaging | +5.923 |
meaningful | +5.762 |
categ | +5.668 |
contrasting | +5.668 |
insofar | +5.656 |
Neg logit contributions | |
eers | -8.194 |
culosis | -7.679 |
Transactions | -7.418 |
Works | -7.249 |
Companies | -7.151 |
Token | middle |
Token ID | 3504 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
damaging | +5.467 |
meaningful | +5.351 |
categ | +5.258 |
contrasting | +5.251 |
insofar | +5.225 |
Neg logit contributions | |
eers | -6.967 |
culosis | -6.542 |
Transactions | -6.287 |
Works | -6.115 |
Companies | -6.042 |
Token | class |
Token ID | 1398 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
damaging | +10.002 |
meaningful | +9.878 |
categ | +9.650 |
contrasting | +9.634 |
insofar | +9.568 |
Neg logit contributions | |
eers | -12.384 |
culosis | -11.789 |
Transactions | -11.252 |
Works | -10.907 |
Facility | -10.775 |
Token | , |
Token ID | 11 |
Feature activation | +3.85e+00 |
Pos logit contributions | |
damaging | +7.648 |
meaningful | +7.493 |
categ | +7.360 |
contrasting | +7.349 |
insofar | +7.328 |
Neg logit contributions | |
eers | -10.213 |
culosis | -9.620 |
Transactions | -9.242 |
Works | -8.994 |
Companies | -8.889 |
Token | rather |
Token ID | 2138 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
insofar | +18.774 |
meaningful | +18.570 |
contrasting | +18.550 |
damaging | +18.509 |
ignoring | +18.264 |
Neg logit contributions | |
eers | -16.755 |
culosis | -15.873 |
Transactions | -14.425 |
ttes | -13.994 |
Facility | -13.986 |
Token | than |
Token ID | 621 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
damaging | +3.794 |
meaningful | +3.612 |
contrasting | +3.454 |
insofar | +3.422 |
ignoring | +3.402 |
Neg logit contributions | |
eers | -9.734 |
culosis | -9.582 |
Transactions | -9.118 |
Works | -8.901 |
Facility | -8.792 |
Token | the |
Token ID | 262 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
damaging | +6.615 |
meaningful | +6.475 |
contrasting | +6.373 |
categ | +6.362 |
insofar | +6.323 |
Neg logit contributions | |
eers | -8.983 |
culosis | -8.484 |
Transactions | -8.135 |
Works | -7.910 |
Companies | -7.812 |
Token | median |
Token ID | 14288 |
Feature activation | +4.89e-01 |
Pos logit contributions | |
damaging | +5.626 |
meaningful | +5.517 |
categ | +5.434 |
contrasting | +5.425 |
insofar | +5.377 |
Neg logit contributions | |
eers | -6.545 |
culosis | -6.156 |
Transactions | -5.876 |
Works | -5.702 |
Companies | -5.632 |
Token | 20 |
Token ID | 1160 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
damaging | +2.466 |
meaningful | +2.379 |
contrasting | +2.352 |
insofar | +2.331 |
categ | +2.331 |
Neg logit contributions | |
eers | -2.663 |
culosis | -2.393 |
Transactions | -2.336 |
Works | -2.288 |
Companies | -2.268 |
Token | , |
Token ID | 11 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
eers | +0.638 |
culosis | +0.587 |
Transactions | +0.559 |
Works | +0.552 |
Companies | +0.541 |
Neg logit contributions | |
damaging | -0.802 |
meaningful | -0.785 |
categ | -0.784 |
insofar | -0.776 |
contrasting | -0.774 |
Token | he |
Token ID | 339 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
damaging | +8.030 |
meaningful | +7.872 |
contrasting | +7.744 |
categ | +7.742 |
insofar | +7.711 |
Neg logit contributions | |
eers | -7.837 |
culosis | -7.305 |
Transactions | -6.962 |
Works | -6.723 |
Companies | -6.636 |
Token | gets |
Token ID | 3011 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
damaging | +9.146 |
meaningful | +8.961 |
categ | +8.866 |
contrasting | +8.842 |
insofar | +8.771 |
Neg logit contributions | |
eers | -6.224 |
culosis | -5.775 |
Transactions | -5.487 |
Works | -5.140 |
Facility | -5.134 |
Token | everything |
Token ID | 2279 |
Feature activation | +2.76e-01 |
Pos logit contributions | |
damaging | +9.645 |
meaningful | +9.442 |
categ | +9.296 |
contrasting | +9.235 |
insofar | +9.105 |
Neg logit contributions | |
eers | -11.296 |
culosis | -10.806 |
Transactions | -10.269 |
Works | -9.888 |
Companies | -9.768 |
Token | backward |
Token ID | 19528 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
damaging | +1.226 |
meaningful | +1.199 |
categ | +1.189 |
insofar | +1.180 |
contrasting | +1.179 |
Neg logit contributions | |
eers | -1.622 |
culosis | -1.459 |
Transactions | -1.432 |
Works | -1.431 |
Companies | -1.406 |
Token | , |
Token ID | 11 |
Feature activation | +3.84e+00 |
Pos logit contributions | |
damaging | +4.868 |
meaningful | +4.784 |
categ | +4.753 |
contrasting | +4.718 |
insofar | +4.642 |
Neg logit contributions | |
eers | -5.898 |
culosis | -5.467 |
Transactions | -5.258 |
Works | -5.169 |
Companies | -5.083 |
Token | making |
Token ID | 1642 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
damaging | +18.820 |
ignoring | +18.229 |
contrasting | +18.055 |
meaningful | +17.882 |
categ | +17.810 |
Neg logit contributions | |
eers | -17.141 |
culosis | -16.306 |
Transactions | -15.468 |
Works | -14.281 |
Facility | -14.273 |
Token | it |
Token ID | 340 |
Feature activation | +8.05e-01 |
Pos logit contributions | |
damaging | +5.614 |
meaningful | +5.504 |
categ | +5.416 |
contrasting | +5.411 |
insofar | +5.388 |
Neg logit contributions | |
eers | -6.063 |
culosis | -5.661 |
Transactions | -5.425 |
Works | -5.265 |
Companies | -5.196 |
Token | hard |
Token ID | 1327 |
Feature activation | +1.98e+00 |
Pos logit contributions | |
damaging | +3.355 |
meaningful | +3.263 |
insofar | +3.232 |
contrasting | +3.231 |
categ | +3.227 |
Neg logit contributions | |
eers | -4.998 |
culosis | -4.716 |
Transactions | -4.526 |
Works | -4.445 |
Companies | -4.388 |
Token | for |
Token ID | 329 |
Feature activation | -5.80e-02 |
Pos logit contributions | |
damaging | +7.561 |
meaningful | +7.376 |
categ | +7.205 |
contrasting | +7.203 |
insofar | +7.158 |
Neg logit contributions | |
eers | -12.990 |
culosis | -12.287 |
Transactions | -11.880 |
Works | -11.579 |
Companies | -11.460 |
Token | supporters |
Token ID | 5941 |
Feature activation | +7.69e-01 |
Pos logit contributions | |
eers | +0.316 |
culosis | +0.283 |
Transactions | +0.280 |
Works | +0.274 |
Companies | +0.270 |
Neg logit contributions | |
damaging | -0.280 |
insofar | -0.277 |
categ | -0.274 |
contrasting | -0.273 |
meaningful | -0.272 |
Token | on |
Token ID | 319 |
Feature activation | +8.00e-02 |
Pos logit contributions | |
eers | +5.368 |
Companies | +4.841 |
Transactions | +4.766 |
culosis | +4.698 |
Works | +4.665 |
Neg logit contributions | |
categ | -3.780 |
damaging | -3.770 |
meaningful | -3.735 |
wounding | -3.729 |
pessimistic | -3.728 |
Token | agriculture |
Token ID | 14510 |
Feature activation | -5.29e-01 |
Pos logit contributions | |
damaging | +0.378 |
insofar | +0.376 |
meaningful | +0.374 |
categ | +0.373 |
contrasting | +0.368 |
Neg logit contributions | |
eers | -0.444 |
culosis | -0.397 |
Transactions | -0.392 |
Works | -0.383 |
Companies | -0.380 |
Token | . |
Token ID | 13 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
eers | +3.191 |
Transactions | +2.795 |
Companies | +2.789 |
culosis | +2.770 |
Works | +2.750 |
Neg logit contributions | |
categ | -2.183 |
meaningful | -2.162 |
pessimistic | -2.134 |
damaging | -2.127 |
contrasting | -2.124 |
Token |
|
Token ID | 198 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
eers | +3.834 |
Transactions | +3.507 |
Companies | +3.496 |
culosis | +3.449 |
Works | +3.358 |
Neg logit contributions | |
damaging | -6.293 |
meaningful | -6.277 |
categ | -6.227 |
contrasting | -6.204 |
wounding | -6.189 |
Token |
|
Token ID | 198 |
Feature activation | -7.53e-01 |
Pos logit contributions | |
damaging | +4.832 |
meaningful | +4.740 |
insofar | +4.678 |
ignoring | +4.560 |
compelling | +4.548 |
Neg logit contributions | |
culosis | -6.004 |
eers | -5.935 |
Transactions | -5.475 |
Works | -5.166 |
Facility | -5.114 |
Token | - |
Token ID | 12 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
eers | +3.108 |
Queue | +2.663 |
culosis | +2.606 |
Transactions | +2.577 |
Companies | +2.527 |
Neg logit contributions | |
meaningful | -4.610 |
categ | -4.597 |
damaging | -4.589 |
contrasting | -4.582 |
insofar | -4.488 |
Token | Commit |
Token ID | 35910 |
Feature activation | +7.31e-01 |
Pos logit contributions | |
damaging | +21.870 |
meaningful | +20.957 |
contrasting | +20.757 |
whether | +20.662 |
ignoring | +20.546 |
Neg logit contributions | |
eers | -11.456 |
culosis | -10.903 |
tyard | -9.105 |
atcher | -9.074 |
Queue | -8.761 |
Token | ment |
Token ID | 434 |
Feature activation | +4.51e-01 |
Pos logit contributions | |
damaging | +4.347 |
meaningful | +4.284 |
insofar | +4.266 |
categ | +4.260 |
contrasting | +4.242 |
Neg logit contributions | |
eers | -3.324 |
culosis | -3.037 |
Transactions | -2.911 |
Works | -2.807 |
Companies | -2.751 |
Token | to |
Token ID | 284 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
damaging | +1.790 |
meaningful | +1.765 |
categ | +1.765 |
insofar | +1.762 |
contrasting | +1.746 |
Neg logit contributions | |
eers | -2.905 |
culosis | -2.638 |
Transactions | -2.578 |
Works | -2.549 |
Facility | -2.522 |
Token | NATO |
Token ID | 11332 |
Feature activation | +2.77e-01 |
Pos logit contributions | |
damaging | +5.532 |
meaningful | +5.418 |
categ | +5.344 |
contrasting | +5.340 |
insofar | +5.328 |
Neg logit contributions | |
eers | -5.951 |
culosis | -5.553 |
Transactions | -5.329 |
Works | -5.173 |
Companies | -5.107 |
Token | - |
Token ID | 532 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
damaging | +1.468 |
meaningful | +1.440 |
insofar | +1.435 |
contrasting | +1.430 |
categ | +1.424 |
Neg logit contributions | |
eers | -1.418 |
culosis | -1.280 |
Transactions | -1.246 |
Works | -1.219 |
Facility | -1.198 |
Token | on |
Token ID | 319 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
damaging | +2.158 |
contrasting | +2.074 |
meaningful | +2.073 |
categ | +2.066 |
insofar | +2.057 |
Neg logit contributions | |
eers | -2.932 |
culosis | -2.703 |
Transactions | -2.637 |
Works | -2.611 |
Companies | -2.557 |
Token | it |
Token ID | 340 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
damaging | +0.845 |
meaningful | +0.825 |
contrasting | +0.819 |
categ | +0.817 |
insofar | +0.817 |
Neg logit contributions | |
eers | -0.966 |
culosis | -0.895 |
Transactions | -0.867 |
Works | -0.862 |
Companies | -0.832 |
Token | with |
Token ID | 351 |
Feature activation | +9.41e-01 |
Pos logit contributions | |
damaging | +5.832 |
meaningful | +5.720 |
contrasting | +5.624 |
categ | +5.624 |
insofar | +5.512 |
Neg logit contributions | |
eers | -8.135 |
culosis | -7.630 |
Transactions | -7.329 |
Works | -7.178 |
Companies | -7.077 |
Token | more |
Token ID | 517 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
damaging | +4.336 |
meaningful | +4.229 |
insofar | +4.184 |
contrasting | +4.174 |
categ | +4.171 |
Neg logit contributions | |
eers | -5.443 |
culosis | -5.058 |
Transactions | -4.871 |
Works | -4.780 |
Companies | -4.693 |
Token | creativity |
Token ID | 16389 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
damaging | +4.691 |
meaningful | +4.582 |
contrasting | +4.520 |
insofar | +4.518 |
categ | +4.509 |
Neg logit contributions | |
eers | -6.043 |
culosis | -5.628 |
Transactions | -5.419 |
Works | -5.311 |
Companies | -5.231 |
Token | , |
Token ID | 11 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
damaging | +7.515 |
meaningful | +7.351 |
categ | +7.230 |
contrasting | +7.219 |
insofar | +7.135 |
Neg logit contributions | |
eers | -9.852 |
culosis | -9.198 |
Transactions | -8.854 |
Works | -8.657 |
Companies | -8.540 |
Token | artist |
Token ID | 6802 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
damaging | +18.487 |
meaningful | +18.388 |
insofar | +18.289 |
contrasting | +18.001 |
ignoring | +17.910 |
Neg logit contributions | |
eers | -16.888 |
culosis | -16.165 |
Transactions | -15.281 |
Queue | -14.352 |
Companies | -14.326 |
Token | ically |
Token ID | 1146 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
damaging | +6.712 |
meaningful | +6.561 |
categ | +6.469 |
contrasting | +6.458 |
insofar | +6.399 |
Neg logit contributions | |
eers | -5.465 |
culosis | -5.035 |
Transactions | -4.709 |
Works | -4.640 |
Companies | -4.515 |
Token | forging |
Token ID | 44096 |
Feature activation | +4.91e-01 |
Pos logit contributions | |
damaging | +5.488 |
categ | +5.348 |
meaningful | +5.343 |
contrasting | +5.269 |
insofar | +5.229 |
Neg logit contributions | |
eers | -7.068 |
culosis | -6.531 |
Transactions | -6.309 |
Works | -6.242 |
Companies | -6.123 |
Token | our |
Token ID | 674 |
Feature activation | +4.44e-01 |
Pos logit contributions | |
damaging | +2.183 |
insofar | +2.083 |
meaningful | +2.082 |
categ | +2.071 |
contrasting | +2.062 |
Neg logit contributions | |
eers | -2.890 |
culosis | -2.652 |
Transactions | -2.594 |
Works | -2.574 |
Companies | -2.498 |
Token | own |
Token ID | 898 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
damaging | +2.135 |
meaningful | +2.067 |
insofar | +2.052 |
categ | +2.038 |
contrasting | +2.036 |
Neg logit contributions | |
eers | -2.470 |
culosis | -2.290 |
Transactions | -2.210 |
Works | -2.185 |
Companies | -2.127 |
Token | • |
Token ID | 3581 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
eers | +2.702 |
culosis | +2.384 |
Queue | +2.326 |
Services | +2.151 |
Transactions | +2.143 |
Neg logit contributions | |
damaging | -5.004 |
meaningful | -4.905 |
contrasting | -4.903 |
categ | -4.887 |
insofar | -4.801 |
Token | MP |
Token ID | 4904 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
damaging | +7.592 |
meaningful | +7.454 |
categ | +7.355 |
contrasting | +7.331 |
insofar | +7.311 |
Neg logit contributions | |
eers | -7.460 |
culosis | -6.932 |
Transactions | -6.558 |
Works | -6.326 |
Companies | -6.254 |
Token | P |
Token ID | 47 |
Feature activation | -9.05e-02 |
Pos logit contributions | |
damaging | +5.089 |
meaningful | +5.052 |
insofar | +4.880 |
categ | +4.845 |
compelling | +4.761 |
Neg logit contributions | |
eers | -7.713 |
culosis | -7.443 |
Transactions | -6.974 |
Works | -6.652 |
Companies | -6.574 |
Token | grade |
Token ID | 9559 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
eers | +0.535 |
culosis | +0.501 |
Transactions | +0.480 |
Works | +0.473 |
Companies | +0.466 |
Neg logit contributions | |
damaging | -0.397 |
meaningful | -0.389 |
contrasting | -0.385 |
insofar | -0.381 |
categ | -0.381 |
Token | : |
Token ID | 25 |
Feature activation | +2.97e+00 |
Pos logit contributions | |
damaging | +0.054 |
meaningful | +0.053 |
categ | +0.052 |
contrasting | +0.052 |
insofar | +0.052 |
Neg logit contributions | |
eers | -0.069 |
culosis | -0.065 |
Transactions | -0.062 |
Works | -0.061 |
Companies | -0.060 |
Token | C |
Token ID | 327 |
Feature activation | +3.76e+00 |
Pos logit contributions | |
damaging | +15.179 |
meaningful | +15.028 |
categ | +14.921 |
contrasting | +14.665 |
insofar | +14.537 |
Neg logit contributions | |
eers | -13.300 |
culosis | -12.264 |
Transactions | -11.555 |
Queue | -11.114 |
atcher | -10.719 |
Token | - |
Token ID | 12 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
damaging | +18.310 |
meaningful | +17.937 |
categ | +17.877 |
insofar | +17.524 |
contrasting | +17.456 |
Neg logit contributions | |
eers | -16.498 |
culosis | -15.201 |
Transactions | -14.871 |
Queue | -13.590 |
Facility | -13.553 |
Token |
|
Token ID | 198 |
Feature activation | +6.79e-01 |
Pos logit contributions | |
damaging | +16.661 |
meaningful | +16.465 |
categ | +16.201 |
insofar | +16.178 |
contrasting | +16.150 |
Neg logit contributions | |
eers | -14.323 |
culosis | -13.298 |
Transactions | -12.820 |
Works | -11.756 |
Facility | -11.686 |
Token |
|
Token ID | 198 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
damaging | +3.286 |
meaningful | +3.228 |
insofar | +3.148 |
categ | +3.103 |
compelling | +3.101 |
Neg logit contributions | |
eers | -3.631 |
culosis | -3.573 |
Transactions | -3.314 |
Works | -3.141 |
Companies | -3.099 |
Token | In |
Token ID | 818 |
Feature activation | -3.94e-01 |
Pos logit contributions | |
eers | +7.799 |
Queue | +7.125 |
Services | +6.837 |
culosis | +6.340 |
Companies | +6.086 |
Neg logit contributions | |
damaging | -12.115 |
categ | -12.066 |
contrasting | -11.923 |
meaningful | -11.789 |
consequential | -11.754 |
Token | an |
Token ID | 281 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
eers | +2.073 |
culosis | +1.909 |
Transactions | +1.852 |
Works | +1.807 |
Companies | +1.771 |
Neg logit contributions | |
insofar | -1.908 |
damaging | -1.899 |
meaningful | -1.866 |
categ | -1.857 |
pessimistic | -1.811 |
Token | faults |
Token ID | 31025 |
Feature activation | +9.42e-01 |
Pos logit contributions | |
eers | +1.238 |
culosis | +1.130 |
Transactions | +1.127 |
Works | +1.100 |
Companies | +1.075 |
Neg logit contributions | |
meaningful | -0.925 |
damaging | -0.916 |
insofar | -0.910 |
categ | -0.892 |
contrasting | -0.889 |
Token | , |
Token ID | 11 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
damaging | +5.094 |
meaningful | +5.013 |
categ | +4.941 |
contrasting | +4.925 |
insofar | +4.897 |
Neg logit contributions | |
eers | -4.699 |
culosis | -4.345 |
Transactions | -4.172 |
Works | -4.041 |
Companies | -3.982 |
Token | we |
Token ID | 356 |
Feature activation | +4.16e-01 |
Pos logit contributions | |
damaging | +12.898 |
meaningful | +12.730 |
insofar | +12.678 |
categ | +12.601 |
contrasting | +12.601 |
Neg logit contributions | |
eers | -10.808 |
culosis | -10.123 |
Transactions | -9.293 |
Queue | -8.968 |
Facility | -8.805 |
Token | shall |
Token ID | 2236 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
damaging | +2.343 |
meaningful | +2.301 |
categ | +2.267 |
contrasting | +2.264 |
insofar | +2.255 |
Neg logit contributions | |
eers | -1.976 |
culosis | -1.823 |
Transactions | -1.739 |
Works | -1.682 |
Companies | -1.653 |
Token | try |
Token ID | 1949 |
Feature activation | +8.58e-01 |
Pos logit contributions | |
damaging | +0.971 |
meaningful | +0.951 |
categ | +0.936 |
contrasting | +0.929 |
insofar | +0.920 |
Neg logit contributions | |
eers | -1.077 |
culosis | -0.994 |
Transactions | -0.960 |
Works | -0.937 |
Companies | -0.919 |
Token | , |
Token ID | 11 |
Feature activation | +3.74e+00 |
Pos logit contributions | |
damaging | +3.534 |
meaningful | +3.439 |
categ | +3.372 |
contrasting | +3.343 |
insofar | +3.326 |
Neg logit contributions | |
eers | -5.459 |
culosis | -5.114 |
Transactions | -4.939 |
Works | -4.853 |
Companies | -4.800 |
Token | by |
Token ID | 416 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
insofar | +16.975 |
damaging | +16.743 |
contrasting | +16.554 |
whether | +16.405 |
ignoring | +16.363 |
Neg logit contributions | |
eers | -17.373 |
culosis | -16.345 |
Transactions | -15.394 |
Queue | -14.940 |
Facility | -14.712 |
Token | God |
Token ID | 1793 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
damaging | +7.110 |
meaningful | +6.983 |
contrasting | +6.880 |
categ | +6.867 |
insofar | +6.799 |
Neg logit contributions | |
eers | -8.041 |
culosis | -7.566 |
Transactions | -7.220 |
Works | -6.976 |
Companies | -6.909 |
Token | 's |
Token ID | 338 |
Feature activation | +2.62e-01 |
Pos logit contributions | |
damaging | +10.855 |
meaningful | +10.703 |
categ | +10.580 |
contrasting | +10.566 |
insofar | +10.550 |
Neg logit contributions | |
eers | -5.130 |
culosis | -4.631 |
Transactions | -4.270 |
Works | -4.013 |
Companies | -3.945 |
Token | help |
Token ID | 1037 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
damaging | +1.280 |
insofar | +1.243 |
meaningful | +1.242 |
contrasting | +1.233 |
categ | +1.223 |
Neg logit contributions | |
eers | -1.428 |
culosis | -1.301 |
Transactions | -1.299 |
Works | -1.290 |
Companies | -1.243 |
Token | , |
Token ID | 11 |
Feature activation | +3.15e+00 |
Pos logit contributions | |
damaging | +2.395 |
meaningful | +2.336 |
categ | +2.304 |
contrasting | +2.304 |
consequential | +2.258 |
Neg logit contributions | |
eers | -1.935 |
culosis | -1.718 |
Transactions | -1.672 |
Works | -1.669 |
Companies | -1.617 |
Token | that |
Token ID | 326 |
Feature activation | +9.35e-01 |
Pos logit contributions | |
damaging | +12.816 |
meaningful | +12.619 |
contrasting | +12.420 |
categ | +12.417 |
insofar | +12.367 |
Neg logit contributions | |
eers | -8.554 |
culosis | -7.827 |
Transactions | -7.253 |
Works | -6.815 |
Queue | -6.772 |
Token | the |
Token ID | 262 |
Feature activation | +8.88e-01 |
Pos logit contributions | |
damaging | +4.665 |
meaningful | +4.566 |
categ | +4.506 |
contrasting | +4.501 |
insofar | +4.480 |
Neg logit contributions | |
eers | -5.060 |
culosis | -4.711 |
Transactions | -4.526 |
Works | -4.405 |
Companies | -4.346 |
Token | coalition |
Token ID | 9906 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
damaging | +4.859 |
meaningful | +4.771 |
categ | +4.704 |
contrasting | +4.701 |
insofar | +4.695 |
Neg logit contributions | |
eers | -4.378 |
culosis | -4.048 |
Transactions | -3.876 |
Works | -3.754 |
Companies | -3.697 |
Token | was |
Token ID | 373 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
damaging | +2.456 |
meaningful | +2.424 |
categ | +2.396 |
contrasting | +2.395 |
insofar | +2.389 |
Neg logit contributions | |
eers | -1.560 |
culosis | -1.391 |
Transactions | -1.318 |
Works | -1.279 |
Companies | -1.250 |
Token | illegitimate |
Token ID | 41368 |
Feature activation | +2.62e+00 |
Pos logit contributions | |
damaging | +7.604 |
meaningful | +7.374 |
categ | +7.184 |
contrasting | +7.148 |
insofar | +7.122 |
Neg logit contributions | |
eers | -11.011 |
culosis | -10.494 |
Transactions | -10.097 |
Works | -9.762 |
Companies | -9.666 |
Token | , |
Token ID | 11 |
Feature activation | +3.73e+00 |
Pos logit contributions | |
damaging | +12.263 |
insofar | +12.073 |
meaningful | +12.041 |
categ | +11.824 |
contrasting | +11.763 |
Neg logit contributions | |
eers | -13.919 |
culosis | -13.368 |
Transactions | -12.583 |
Works | -12.166 |
Companies | -12.031 |
Token | divisive |
Token ID | 29656 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
damaging | +18.717 |
meaningful | +17.858 |
insofar | +17.745 |
categ | +17.477 |
ignoring | +17.405 |
Neg logit contributions | |
eers | -16.802 |
culosis | -16.559 |
Transactions | -15.221 |
Facility | -14.289 |
Works | -14.270 |
Token | , |
Token ID | 11 |
Feature activation | +3.55e+00 |
Pos logit contributions | |
damaging | +10.478 |
meaningful | +10.269 |
insofar | +10.093 |
categ | +10.091 |
contrasting | +10.070 |
Neg logit contributions | |
eers | -10.735 |
culosis | -10.114 |
Transactions | -9.598 |
Works | -9.278 |
Companies | -9.158 |
Token | unstable |
Token ID | 21354 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
damaging | +17.216 |
meaningful | +16.350 |
categ | +15.885 |
insofar | +15.878 |
contrasting | +15.848 |
Neg logit contributions | |
eers | -16.976 |
culosis | -16.736 |
Transactions | -15.708 |
Works | -14.900 |
Facility | -14.803 |
Token | and |
Token ID | 290 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
damaging | +9.458 |
meaningful | +9.279 |
categ | +9.134 |
contrasting | +9.124 |
insofar | +9.101 |
Neg logit contributions | |
eers | -9.435 |
culosis | -8.810 |
Transactions | -8.406 |
Works | -8.144 |
Companies | -8.029 |
Token | , |
Token ID | 11 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
damaging | +8.686 |
meaningful | +8.393 |
categ | +8.220 |
contrasting | +8.194 |
insofar | +8.175 |
Neg logit contributions | |
eers | -10.210 |
culosis | -9.765 |
Transactions | -9.322 |
Works | -8.986 |
Companies | -8.886 |
Token |
|
Token ID | 198 |
Feature activation | +1.47e+00 |
Pos logit contributions | |
eers | +2.122 |
culosis | +1.964 |
Transactions | +1.896 |
Works | +1.844 |
Companies | +1.824 |
Neg logit contributions | |
damaging | -3.188 |
meaningful | -3.152 |
categ | -3.077 |
insofar | -3.075 |
contrasting | -3.063 |
Token |
|
Token ID | 198 |
Feature activation | +1.67e-01 |
Pos logit contributions | |
damaging | +6.124 |
meaningful | +6.015 |
insofar | +5.867 |
whether | +5.798 |
compelling | +5.773 |
Neg logit contributions | |
culosis | -8.402 |
eers | -8.243 |
Transactions | -7.644 |
Works | -7.126 |
atcher | -7.125 |
Token | Like |
Token ID | 7594 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
damaging | +1.055 |
meaningful | +1.037 |
categ | +1.024 |
contrasting | +1.024 |
insofar | +1.012 |
Neg logit contributions | |
eers | -0.703 |
culosis | -0.622 |
Queue | -0.596 |
Transactions | -0.592 |
Works | -0.572 |
Token | Bush |
Token ID | 5511 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
damaging | +1.392 |
meaningful | +1.368 |
categ | +1.355 |
contrasting | +1.346 |
insofar | +1.345 |
Neg logit contributions | |
eers | -1.409 |
culosis | -1.299 |
Transactions | -1.246 |
Works | -1.232 |
Facility | -1.205 |
Token | , |
Token ID | 11 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
damaging | +5.856 |
meaningful | +5.775 |
categ | +5.665 |
contrasting | +5.643 |
insofar | +5.631 |
Neg logit contributions | |
eers | -5.083 |
culosis | -4.717 |
Transactions | -4.467 |
Works | -4.365 |
Companies | -4.282 |
Token | Cruz |
Token ID | 8742 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
damaging | +5.603 |
meaningful | +5.503 |
categ | +5.425 |
contrasting | +5.383 |
insofar | +5.362 |
Neg logit contributions | |
eers | -5.717 |
culosis | -5.317 |
Transactions | -5.091 |
Works | -4.985 |
Companies | -4.882 |
Token | smoked |
Token ID | 21603 |
Feature activation | +6.96e-01 |
Pos logit contributions | |
damaging | +18.273 |
contrasting | +18.112 |
categ | +17.890 |
ignoring | +17.729 |
meaningful | +17.716 |
Neg logit contributions | |
eers | -14.438 |
culosis | -13.636 |
Transactions | -13.435 |
Facility | -12.571 |
Queue | -12.041 |
Token | pot |
Token ID | 1787 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
damaging | +3.206 |
meaningful | +3.139 |
categ | +3.120 |
contrasting | +3.097 |
insofar | +3.071 |
Neg logit contributions | |
eers | -4.014 |
culosis | -3.722 |
Transactions | -3.613 |
Works | -3.551 |
Companies | -3.490 |
Token | when |
Token ID | 618 |
Feature activation | -8.65e-01 |
Pos logit contributions | |
damaging | +7.665 |
meaningful | +7.498 |
contrasting | +7.351 |
categ | +7.348 |
insofar | +7.344 |
Neg logit contributions | |
eers | -9.387 |
culosis | -8.817 |
Transactions | -8.487 |
Works | -8.205 |
Companies | -8.118 |
Token | he |
Token ID | 339 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
eers | +3.868 |
culosis | +3.516 |
Works | +3.483 |
Transactions | +3.396 |
Facility | +3.347 |
Neg logit contributions | |
meaningful | -4.471 |
categ | -4.462 |
insofar | -4.438 |
damaging | -4.413 |
pessimistic | -4.267 |
Token | was |
Token ID | 373 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
eers | +1.124 |
culosis | +0.964 |
Works | +0.921 |
Transactions | +0.878 |
Facility | +0.811 |
Neg logit contributions | |
damaging | -3.370 |
meaningful | -3.363 |
categ | -3.343 |
insofar | -3.304 |
contrasting | -3.289 |
Token | The |
Token ID | 383 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
damaging | +9.664 |
meaningful | +9.509 |
contrasting | +9.438 |
categ | +9.414 |
insofar | +9.396 |
Neg logit contributions | |
eers | -6.174 |
culosis | -5.652 |
Transactions | -5.154 |
Queue | -4.897 |
Works | -4.878 |
Token | contemporary |
Token ID | 11811 |
Feature activation | +2.14e-02 |
Pos logit contributions | |
damaging | +2.961 |
meaningful | +2.913 |
insofar | +2.878 |
categ | +2.862 |
contrasting | +2.849 |
Neg logit contributions | |
eers | -2.838 |
culosis | -2.615 |
Transactions | -2.544 |
Works | -2.478 |
Companies | -2.420 |
Token | Bible |
Token ID | 9111 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
damaging | +0.113 |
meaningful | +0.111 |
insofar | +0.110 |
categ | +0.109 |
contrasting | +0.109 |
Neg logit contributions | |
eers | -0.108 |
culosis | -0.097 |
Transactions | -0.096 |
Works | -0.095 |
Companies | -0.092 |
Token | scholar |
Token ID | 15606 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
damaging | +3.322 |
meaningful | +3.271 |
categ | +3.222 |
contrasting | +3.216 |
insofar | +3.200 |
Neg logit contributions | |
eers | -2.288 |
culosis | -2.067 |
Transactions | -1.980 |
Works | -1.925 |
Companies | -1.875 |
Token | , |
Token ID | 11 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
eers | +0.500 |
culosis | +0.459 |
Transactions | +0.449 |
Works | +0.443 |
Companies | +0.427 |
Neg logit contributions | |
damaging | -0.596 |
meaningful | -0.581 |
categ | -0.573 |
contrasting | -0.567 |
insofar | -0.566 |
Token | Y |
Token ID | 575 |
Feature activation | +3.72e+00 |
Pos logit contributions | |
damaging | +12.976 |
meaningful | +12.801 |
contrasting | +12.720 |
categ | +12.662 |
insofar | +12.636 |
Neg logit contributions | |
eers | -10.643 |
culosis | -9.784 |
Transactions | -9.125 |
Queue | -8.739 |
Companies | -8.708 |
Token | air |
Token ID | 958 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
damaging | +18.495 |
meaningful | +18.111 |
categ | +17.940 |
contrasting | +17.606 |
insofar | +17.602 |
Neg logit contributions | |
eers | -14.223 |
culosis | -13.894 |
Transactions | -13.236 |
Facility | -12.071 |
Works | -11.927 |
Token | Zak |
Token ID | 32605 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
damaging | +1.838 |
meaningful | +1.805 |
contrasting | +1.775 |
categ | +1.762 |
insofar | +1.759 |
Neg logit contributions | |
eers | -1.404 |
culosis | -1.291 |
Transactions | -1.248 |
Works | -1.203 |
Companies | -1.184 |
Token | ov |
Token ID | 709 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
damaging | +10.040 |
meaningful | +9.876 |
insofar | +9.780 |
contrasting | +9.773 |
categ | +9.748 |
Neg logit contributions | |
eers | -4.848 |
culosis | -4.384 |
Transactions | -4.121 |
Works | -3.827 |
Companies | -3.783 |
Token | itch |
Token ID | 2007 |
Feature activation | -5.70e-01 |
Pos logit contributions | |
eers | +1.815 |
culosis | +1.657 |
Transactions | +1.597 |
Works | +1.546 |
Companies | +1.517 |
Neg logit contributions | |
damaging | -2.216 |
meaningful | -2.175 |
categ | -2.127 |
contrasting | -2.125 |
insofar | -2.124 |
Token | of |
Token ID | 286 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
eers | +2.519 |
culosis | +2.287 |
Transactions | +2.228 |
Works | +2.200 |
Companies | +2.126 |
Neg logit contributions | |
damaging | -3.259 |
meaningful | -3.175 |
categ | -3.113 |
insofar | -3.099 |
consequential | -3.085 |
Token | wise |
Token ID | 10787 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
damaging | +2.667 |
meaningful | +2.617 |
insofar | +2.610 |
categ | +2.566 |
contrasting | +2.522 |
Neg logit contributions | |
eers | -3.436 |
culosis | -3.167 |
Transactions | -3.018 |
Works | -2.995 |
Companies | -2.946 |
Token | proposals |
Token ID | 11628 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
damaging | +6.246 |
meaningful | +6.118 |
categ | +6.004 |
contrasting | +5.994 |
insofar | +5.987 |
Neg logit contributions | |
eers | -7.447 |
culosis | -6.957 |
Transactions | -6.675 |
Works | -6.506 |
Companies | -6.413 |
Token | for |
Token ID | 329 |
Feature activation | +4.86e-01 |
Pos logit contributions | |
damaging | +5.244 |
meaningful | +5.136 |
categ | +5.065 |
contrasting | +4.997 |
insofar | +4.985 |
Neg logit contributions | |
eers | -7.544 |
culosis | -7.050 |
Transactions | -6.768 |
Works | -6.662 |
Companies | -6.590 |
Token | confronting |
Token ID | 31291 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
damaging | +2.013 |
categ | +1.967 |
insofar | +1.966 |
meaningful | +1.949 |
contrasting | +1.932 |
Neg logit contributions | |
eers | -3.018 |
culosis | -2.784 |
Transactions | -2.677 |
Works | -2.661 |
Companies | -2.610 |
Token | Putin |
Token ID | 8144 |
Feature activation | +3.22e+00 |
Pos logit contributions | |
damaging | +5.274 |
meaningful | +5.170 |
categ | +5.138 |
insofar | +5.115 |
contrasting | +5.107 |
Neg logit contributions | |
eers | -5.340 |
culosis | -4.905 |
Transactions | -4.671 |
Works | -4.571 |
Companies | -4.497 |
Token | , |
Token ID | 11 |
Feature activation | +3.71e+00 |
Pos logit contributions | |
damaging | +18.573 |
meaningful | +18.192 |
insofar | +18.118 |
categ | +17.894 |
contrasting | +17.890 |
Neg logit contributions | |
eers | -12.560 |
culosis | -11.645 |
Transactions | -11.373 |
Works | -10.594 |
Facility | -10.409 |
Token | calling |
Token ID | 4585 |
Feature activation | +8.09e-01 |
Pos logit contributions | |
damaging | +16.814 |
contrasting | +16.676 |
insofar | +16.513 |
ignoring | +16.412 |
meaningful | +16.387 |
Neg logit contributions | |
eers | -17.860 |
culosis | -17.196 |
Transactions | -16.742 |
Works | -15.427 |
Facility | -15.406 |
Token | on |
Token ID | 319 |
Feature activation | +8.92e-01 |
Pos logit contributions | |
damaging | +3.979 |
meaningful | +3.897 |
contrasting | +3.845 |
categ | +3.845 |
insofar | +3.832 |
Neg logit contributions | |
eers | -4.456 |
culosis | -4.119 |
Transactions | -3.943 |
Works | -3.863 |
Companies | -3.806 |
Token | the |
Token ID | 262 |
Feature activation | +8.39e-01 |
Pos logit contributions | |
damaging | +4.710 |
meaningful | +4.614 |
categ | +4.562 |
insofar | +4.553 |
contrasting | +4.549 |
Neg logit contributions | |
eers | -4.610 |
culosis | -4.221 |
Transactions | -4.053 |
Works | -3.946 |
Companies | -3.892 |
Token | United |
Token ID | 1578 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
damaging | +4.729 |
meaningful | +4.647 |
categ | +4.584 |
contrasting | +4.578 |
insofar | +4.571 |
Neg logit contributions | |
eers | -3.990 |
culosis | -3.677 |
Transactions | -3.508 |
Works | -3.398 |
Companies | -3.341 |
Token | States |
Token ID | 1829 |
Feature activation | +2.36e+00 |
Pos logit contributions | |
damaging | +4.589 |
meaningful | +4.510 |
insofar | +4.458 |
contrasting | +4.449 |
categ | +4.442 |
Neg logit contributions | |
eers | -2.654 |
culosis | -2.351 |
Transactions | -2.232 |
Works | -2.168 |
Companies | -2.136 |
Token | times |
Token ID | 1661 |
Feature activation | -7.01e-01 |
Pos logit contributions | |
damaging | +9.117 |
meaningful | +8.953 |
categ | +8.743 |
contrasting | +8.689 |
compelling | +8.575 |
Neg logit contributions | |
eers | -8.795 |
culosis | -8.351 |
Transactions | -7.823 |
Works | -7.596 |
Queue | -7.540 |
Token | cale |
Token ID | 38765 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
eers | +2.807 |
culosis | +2.536 |
Works | +2.466 |
Transactions | +2.416 |
Companies | +2.401 |
Neg logit contributions | |
damaging | -4.109 |
meaningful | -4.064 |
insofar | -4.044 |
categ | -4.000 |
wounding | -3.963 |
Token | you |
Token ID | 345 |
Feature activation | -6.86e-01 |
Pos logit contributions | |
eers | +2.982 |
culosis | +2.597 |
Transactions | +2.570 |
Works | +2.564 |
Companies | +2.537 |
Neg logit contributions | |
categ | -2.147 |
damaging | -2.144 |
insofar | -2.086 |
meaningful | -2.080 |
contrasting | -2.058 |
Token | cannot |
Token ID | 2314 |
Feature activation | +4.46e-03 |
Pos logit contributions | |
eers | +2.946 |
culosis | +2.620 |
Transactions | +2.510 |
Works | +2.425 |
Companies | +2.418 |
Neg logit contributions | |
damaging | -3.975 |
meaningful | -3.950 |
categ | -3.908 |
contrasting | -3.904 |
insofar | -3.898 |
Token | predict |
Token ID | 4331 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
damaging | +0.021 |
meaningful | +0.021 |
contrasting | +0.020 |
categ | +0.020 |
insofar | +0.020 |
Neg logit contributions | |
eers | -0.025 |
culosis | -0.023 |
Transactions | -0.022 |
Works | -0.022 |
Companies | -0.021 |
Token | , |
Token ID | 11 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
damaging | +0.793 |
contrasting | +0.777 |
categ | +0.774 |
meaningful | +0.769 |
insofar | +0.756 |
Neg logit contributions | |
eers | -0.973 |
Transactions | -0.862 |
culosis | -0.861 |
Works | -0.839 |
Companies | -0.833 |
Token | on |
Token ID | 319 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
damaging | +20.186 |
meaningful | +19.375 |
insofar | +18.967 |
compelling | +18.939 |
ignoring | +18.835 |
Neg logit contributions | |
eers | -13.857 |
culosis | -13.642 |
Transactions | -12.617 |
tyard | -11.830 |
Queue | -11.657 |
Token | an |
Token ID | 281 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
damaging | +6.580 |
meaningful | +6.433 |
categ | +6.297 |
contrasting | +6.295 |
insofar | +6.248 |
Neg logit contributions | |
eers | -9.453 |
culosis | -8.924 |
Transactions | -8.591 |
Works | -8.369 |
Companies | -8.262 |
Token | outcome |
Token ID | 8055 |
Feature activation | +1.94e-02 |
Pos logit contributions | |
damaging | +8.250 |
meaningful | +8.101 |
categ | +7.926 |
contrasting | +7.906 |
insofar | +7.889 |
Neg logit contributions | |
eers | -8.096 |
culosis | -7.681 |
Transactions | -7.248 |
Works | -7.007 |
Queue | -6.928 |
Token | that |
Token ID | 326 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
damaging | +0.094 |
categ | +0.093 |
meaningful | +0.092 |
contrasting | +0.091 |
insofar | +0.091 |
Neg logit contributions | |
eers | -0.105 |
culosis | -0.093 |
Transactions | -0.091 |
Companies | -0.089 |
Works | -0.089 |
Token | 's |
Token ID | 338 |
Feature activation | +7.25e-01 |
Pos logit contributions | |
eers | +6.219 |
Works | +5.345 |
culosis | +5.318 |
Companies | +5.216 |
Transactions | +5.200 |
Neg logit contributions | |
damaging | -6.998 |
categ | -6.933 |
contrasting | -6.905 |
insofar | -6.864 |
meaningful | -6.851 |
Token | their |
Token ID | 511 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
damaging | +5.085 |
meaningful | +4.961 |
contrasting | +4.852 |
categ | +4.848 |
insofar | +4.810 |
Neg logit contributions | |
eers | -8.485 |
culosis | -8.038 |
Transactions | -7.776 |
Works | -7.565 |
Companies | -7.487 |
Token | realism |
Token ID | 30787 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
damaging | +7.999 |
meaningful | +7.922 |
categ | +7.769 |
contrasting | +7.722 |
compelling | +7.584 |
Neg logit contributions | |
eers | -9.992 |
culosis | -9.564 |
Transactions | -9.227 |
Works | -8.800 |
Companies | -8.781 |
Token | and |
Token ID | 290 |
Feature activation | +1.63e+00 |
Pos logit contributions | |
damaging | +7.390 |
meaningful | +7.212 |
categ | +7.116 |
contrasting | +7.079 |
insofar | +7.014 |
Neg logit contributions | |
eers | -9.279 |
culosis | -8.649 |
Transactions | -8.306 |
Works | -8.110 |
Companies | -7.995 |
Token | bold |
Token ID | 10758 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
damaging | +7.491 |
meaningful | +7.387 |
categ | +7.240 |
contrasting | +7.222 |
insofar | +7.189 |
Neg logit contributions | |
eers | -9.325 |
culosis | -8.819 |
Transactions | -8.485 |
Works | -8.196 |
Companies | -8.115 |
Token | ness |
Token ID | 1108 |
Feature activation | +1.71e+00 |
Pos logit contributions | |
damaging | +7.848 |
meaningful | +7.727 |
categ | +7.606 |
contrasting | +7.594 |
insofar | +7.526 |
Neg logit contributions | |
eers | -9.490 |
culosis | -8.947 |
Transactions | -8.598 |
Works | -8.309 |
Companies | -8.239 |
Token | , |
Token ID | 11 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
damaging | +7.730 |
meaningful | +7.561 |
categ | +7.431 |
contrasting | +7.416 |
insofar | +7.376 |
Neg logit contributions | |
eers | -10.092 |
culosis | -9.473 |
Transactions | -9.111 |
Works | -8.872 |
Companies | -8.765 |
Token | and |
Token ID | 290 |
Feature activation | +8.92e-01 |
Pos logit contributions | |
meaningful | +16.404 |
insofar | +16.384 |
damaging | +16.298 |
contrasting | +16.274 |
ignoring | +16.072 |
Neg logit contributions | |
eers | -18.110 |
culosis | -17.575 |
Transactions | -17.074 |
Facility | -15.943 |
Works | -15.937 |
Token | hope |
Token ID | 2911 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
damaging | +4.383 |
meaningful | +4.288 |
categ | +4.223 |
contrasting | +4.216 |
insofar | +4.192 |
Neg logit contributions | |
eers | -4.896 |
culosis | -4.572 |
Transactions | -4.378 |
Works | -4.258 |
Companies | -4.208 |
Token | the |
Token ID | 262 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
eers | +0.062 |
culosis | +0.055 |
Works | +0.053 |
Transactions | +0.052 |
Companies | +0.052 |
Neg logit contributions | |
damaging | -0.070 |
categ | -0.068 |
contrasting | -0.068 |
meaningful | -0.068 |
insofar | -0.066 |
Token | Obama |
Token ID | 2486 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
damaging | +0.949 |
insofar | +0.935 |
meaningful | +0.929 |
categ | +0.921 |
contrasting | +0.920 |
Neg logit contributions | |
eers | -0.934 |
culosis | -0.842 |
Transactions | -0.813 |
Works | -0.807 |
Companies | -0.784 |
Token | administration |
Token ID | 3662 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
damaging | +9.159 |
meaningful | +9.019 |
categ | +8.914 |
contrasting | +8.893 |
insofar | +8.846 |
Neg logit contributions | |
eers | -5.617 |
culosis | -5.165 |
Transactions | -4.856 |
Works | -4.626 |
Companies | -4.535 |
Token | ophon |
Token ID | 48982 |
Feature activation | -7.02e-01 |
Pos logit contributions | |
damaging | +8.139 |
meaningful | +8.022 |
categ | +7.929 |
contrasting | +7.900 |
insofar | +7.885 |
Neg logit contributions | |
eers | -4.830 |
culosis | -4.353 |
Transactions | -4.102 |
Works | -3.954 |
Companies | -3.858 |
Token | ist |
Token ID | 396 |
Feature activation | +8.39e-01 |
Pos logit contributions | |
eers | +2.415 |
culosis | +1.907 |
Works | +1.812 |
Transactions | +1.746 |
Facility | +1.719 |
Neg logit contributions | |
meaningful | -4.752 |
categ | -4.747 |
damaging | -4.734 |
insofar | -4.664 |
consequential | -4.632 |
Token | , |
Token ID | 11 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
damaging | +4.873 |
meaningful | +4.792 |
categ | +4.724 |
insofar | +4.672 |
contrasting | +4.664 |
Neg logit contributions | |
eers | -3.888 |
culosis | -3.567 |
Transactions | -3.385 |
Works | -3.337 |
Companies | -3.220 |
Token | seem |
Token ID | 1283 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
damaging | +12.593 |
contrasting | +12.502 |
meaningful | +12.390 |
insofar | +12.340 |
categ | +12.189 |
Neg logit contributions | |
eers | -9.144 |
culosis | -8.711 |
Transactions | -8.080 |
Companies | -7.693 |
Facility | -7.568 |
Token | to |
Token ID | 284 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
damaging | +4.690 |
meaningful | +4.530 |
categ | +4.430 |
contrasting | +4.414 |
insofar | +4.399 |
Neg logit contributions | |
eers | -10.539 |
culosis | -9.994 |
Transactions | -9.692 |
Works | -9.491 |
Companies | -9.389 |
Token | reflect |
Token ID | 4079 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
damaging | +6.607 |
meaningful | +6.499 |
contrasting | +6.417 |
categ | +6.375 |
insofar | +6.363 |
Neg logit contributions | |
eers | -6.756 |
culosis | -6.378 |
Transactions | -6.061 |
Works | -5.850 |
Companies | -5.783 |
Token | a |
Token ID | 257 |
Feature activation | +2.88e+00 |
Pos logit contributions | |
contrasting | +17.657 |
meaningful | +17.429 |
damaging | +17.336 |
categ | +16.896 |
consequential | +16.562 |
Neg logit contributions | |
culosis | -16.562 |
eers | -16.386 |
Transactions | -14.809 |
Queue | -14.323 |
Companies | -14.288 |
Token | stance |
Token ID | 12046 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
damaging | +14.609 |
meaningful | +14.571 |
contrasting | +14.495 |
categ | +14.301 |
compelling | +13.935 |
Neg logit contributions | |
eers | -13.575 |
culosis | -13.003 |
Transactions | -12.253 |
Companies | -11.632 |
Queue | -11.601 |
Token | that |
Token ID | 326 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
damaging | +6.648 |
meaningful | +6.507 |
categ | +6.394 |
contrasting | +6.391 |
insofar | +6.358 |
Neg logit contributions | |
eers | -8.460 |
culosis | -7.946 |
Transactions | -7.637 |
Works | -7.425 |
Companies | -7.336 |
Token | rejects |
Token ID | 28317 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
eers | +0.103 |
culosis | +0.094 |
Transactions | +0.090 |
Works | +0.089 |
Companies | +0.087 |
Neg logit contributions | |
damaging | -0.114 |
meaningful | -0.111 |
categ | -0.109 |
insofar | -0.109 |
contrasting | -0.108 |
Token | straightforward |
Token ID | 15836 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
damaging | +10.013 |
meaningful | +9.909 |
categ | +9.761 |
contrasting | +9.744 |
insofar | +9.561 |
Neg logit contributions | |
eers | -11.385 |
culosis | -10.832 |
Transactions | -10.248 |
Works | -9.857 |
Companies | -9.817 |
Token | Naval |
Token ID | 20818 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
eers | +9.818 |
Works | +8.758 |
culosis | +8.658 |
Facility | +8.642 |
Companies | +8.635 |
Neg logit contributions | |
damaging | -13.458 |
categ | -13.251 |
insofar | -13.210 |
meaningful | -13.141 |
contrasting | -12.981 |
Token | Air |
Token ID | 3701 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
eers | +9.214 |
Facility | +8.624 |
Works | +8.530 |
Exchange | +8.099 |
Facilities | +7.824 |
Neg logit contributions | |
contrasting | -21.806 |
damaging | -21.526 |
pessimistic | -21.406 |
meaningful | -21.389 |
consequential | -21.367 |
Token | Station |
Token ID | 9327 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
Facility | +11.358 |
eers | +11.357 |
Works | +10.590 |
Exchange | +10.429 |
Services | +10.105 |
Neg logit contributions | |
contrasting | -24.375 |
consequential | -24.238 |
pessimistic | -23.926 |
damaging | -23.767 |
meaningful | -23.545 |
Token | in |
Token ID | 287 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
eers | +15.827 |
Works | +13.902 |
Transactions | +13.704 |
culosis | +13.688 |
Facility | +13.666 |
Neg logit contributions | |
damaging | -13.919 |
consequential | -13.849 |
categ | -13.649 |
pessimistic | -13.574 |
contrasting | -13.558 |
Token | South |
Token ID | 2520 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
eers | +9.942 |
Transactions | +9.150 |
Works | +8.967 |
Facility | +8.706 |
culosis | +8.706 |
Neg logit contributions | |
damaging | -15.739 |
categ | -15.668 |
meaningful | -15.593 |
insofar | -15.285 |
contrasting | -15.093 |
Token | We |
Token ID | 775 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
eers | +1.813 |
Transactions | +1.416 |
culosis | +1.388 |
Works | +1.363 |
Companies | +1.253 |
Neg logit contributions | |
damaging | -7.732 |
meaningful | -7.596 |
contrasting | -7.574 |
categ | -7.546 |
ignoring | -7.453 |
Token | ym |
Token ID | 4948 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
eers | +11.228 |
artment | +8.686 |
erville | +8.668 |
ttes | +8.482 |
culosis | +8.474 |
Neg logit contributions | |
consequential | -24.065 |
contrasting | -23.904 |
categ | -23.833 |
damaging | -23.682 |
conced | -23.068 |
Token | outh |
Token ID | 1536 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
eers | +12.698 |
culosis | +11.006 |
swick | +10.632 |
artment | +10.206 |
acas | +10.195 |
Neg logit contributions | |
contrasting | -19.073 |
categ | -18.806 |
consequential | -18.336 |
pessimistic | -18.237 |
damaging | -18.226 |
Token | . |
Token ID | 13 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
eers | +8.148 |
culosis | +7.375 |
Transactions | +7.278 |
Works | +7.247 |
Queue | +7.079 |
Neg logit contributions | |
damaging | -6.083 |
categ | -5.966 |
contrasting | -5.961 |
meaningful | -5.935 |
consequential | -5.852 |
Token | This |
Token ID | 770 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
eers | +2.753 |
culosis | +2.424 |
Works | +2.420 |
Transactions | +2.384 |
Companies | +2.276 |
Neg logit contributions | |
damaging | -7.930 |
meaningful | -7.884 |
categ | -7.867 |
insofar | -7.789 |
contrasting | -7.740 |
Token | is |
Token ID | 318 |
Feature activation | -9.38e-01 |
Pos logit contributions | |
eers | +5.281 |
culosis | +4.408 |
Works | +4.277 |
Transactions | +4.231 |
Facility | +4.127 |
Neg logit contributions | |
damaging | -11.833 |
meaningful | -11.651 |
contrasting | -11.644 |
categ | -11.644 |
insofar | -11.643 |
Token | , |
Token ID | 11 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
eers | +7.022 |
Transactions | +6.038 |
Works | +5.922 |
culosis | +5.908 |
Companies | +5.786 |
Neg logit contributions | |
damaging | -9.595 |
categ | -9.562 |
contrasting | -9.466 |
meaningful | -9.462 |
consequential | -9.363 |
Token | in |
Token ID | 259 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
eers | +0.643 |
culosis | +0.611 |
Transactions | +0.583 |
Works | +0.565 |
Companies | +0.559 |
Neg logit contributions | |
damaging | -0.478 |
meaningful | -0.467 |
categ | -0.457 |
contrasting | -0.457 |
insofar | -0.456 |
Token | the |
Token ID | 262 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
eers | +6.218 |
culosis | +5.621 |
Works | +5.562 |
Transactions | +5.477 |
Facility | +5.440 |
Neg logit contributions | |
damaging | -6.987 |
meaningful | -6.769 |
insofar | -6.741 |
categ | -6.630 |
contrasting | -6.615 |
Token | old |
Token ID | 1468 |
Feature activation | -2.65e+00 |
Pos logit contributions | |
eers | +6.049 |
Works | +5.498 |
culosis | +5.303 |
Facility | +5.170 |
Transactions | +5.108 |
Neg logit contributions | |
damaging | -8.842 |
meaningful | -8.657 |
insofar | -8.558 |
categ | -8.508 |
wounding | -8.461 |
Token | Naval |
Token ID | 20818 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
eers | +9.818 |
Works | +8.758 |
culosis | +8.658 |
Facility | +8.642 |
Companies | +8.635 |
Neg logit contributions | |
damaging | -13.458 |
categ | -13.251 |
insofar | -13.210 |
meaningful | -13.141 |
contrasting | -12.981 |
Token | Air |
Token ID | 3701 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
eers | +9.214 |
Facility | +8.624 |
Works | +8.530 |
Exchange | +8.099 |
Facilities | +7.824 |
Neg logit contributions | |
contrasting | -21.806 |
damaging | -21.526 |
pessimistic | -21.406 |
meaningful | -21.389 |
consequential | -21.367 |
Token | Station |
Token ID | 9327 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
Facility | +11.358 |
eers | +11.357 |
Works | +10.590 |
Exchange | +10.429 |
Services | +10.105 |
Neg logit contributions | |
contrasting | -24.375 |
consequential | -24.238 |
pessimistic | -23.926 |
damaging | -23.767 |
meaningful | -23.545 |
Token | in |
Token ID | 287 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
eers | +15.827 |
Works | +13.902 |
Transactions | +13.704 |
culosis | +13.688 |
Facility | +13.666 |
Neg logit contributions | |
damaging | -13.919 |
consequential | -13.849 |
categ | -13.649 |
pessimistic | -13.574 |
contrasting | -13.558 |
Token | South |
Token ID | 2520 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
eers | +9.942 |
Transactions | +9.150 |
Works | +8.967 |
Facility | +8.706 |
culosis | +8.706 |
Neg logit contributions | |
damaging | -15.739 |
categ | -15.668 |
meaningful | -15.593 |
insofar | -15.285 |
contrasting | -15.093 |
Token | We |
Token ID | 775 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
eers | +1.813 |
Transactions | +1.416 |
culosis | +1.388 |
Works | +1.363 |
Companies | +1.253 |
Neg logit contributions | |
damaging | -7.732 |
meaningful | -7.596 |
contrasting | -7.574 |
categ | -7.546 |
ignoring | -7.453 |
Token | ym |
Token ID | 4948 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
eers | +11.228 |
artment | +8.686 |
erville | +8.668 |
ttes | +8.482 |
culosis | +8.474 |
Neg logit contributions | |
consequential | -24.065 |
contrasting | -23.904 |
categ | -23.833 |
damaging | -23.682 |
conced | -23.068 |
Token | . |
Token ID | 13 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
damaging | +1.122 |
meaningful | +1.095 |
categ | +1.093 |
contrasting | +1.069 |
consequential | +1.057 |
Neg logit contributions | |
eers | -1.816 |
culosis | -1.715 |
Works | -1.661 |
Transactions | -1.648 |
Companies | -1.618 |
Token | ( |
Token ID | 357 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
eers | +8.347 |
Works | +8.291 |
Transactions | +8.025 |
Companies | +7.886 |
Services | +7.654 |
Neg logit contributions | |
wounding | -13.984 |
damaging | -13.958 |
categ | -13.939 |
meaningful | -13.758 |
contrasting | -13.591 |
Token | Wa |
Token ID | 33484 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
eers | +4.664 |
Queue | +4.182 |
culosis | +4.128 |
Transactions | +4.020 |
Works | +4.000 |
Neg logit contributions | |
damaging | -5.889 |
meaningful | -5.778 |
categ | -5.756 |
contrasting | -5.712 |
insofar | -5.657 |
Token | ub |
Token ID | 549 |
Feature activation | -2.48e+00 |
Pos logit contributions | |
eers | +5.979 |
culosis | +5.410 |
Transactions | +5.039 |
Queue | +5.023 |
Works | +4.884 |
Neg logit contributions | |
damaging | -8.479 |
meaningful | -8.232 |
contrasting | -8.216 |
categ | -8.188 |
insofar | -8.082 |
Token | ges |
Token ID | 3212 |
Feature activation | -2.40e+00 |
Pos logit contributions | |
eers | +6.769 |
culosis | +5.670 |
Works | +4.970 |
Transactions | +4.676 |
enges | +4.569 |
Neg logit contributions | |
damaging | -17.411 |
contrasting | -17.339 |
pessimistic | -17.245 |
meaningful | -17.000 |
categ | -16.937 |
Token | hig |
Token ID | 25196 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
eers | +10.208 |
culosis | +9.148 |
Works | +8.161 |
Queue | +8.154 |
acas | +8.154 |
Neg logit contributions | |
damaging | -13.104 |
contrasting | -13.097 |
categ | -12.892 |
meaningful | -12.769 |
consequential | -12.692 |
Token | Rice |
Token ID | 13823 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
eers | +12.360 |
Transactions | +10.963 |
Works | +10.925 |
Services | +10.875 |
Companies | +10.674 |
Neg logit contributions | |
consequential | -20.487 |
damaging | -20.349 |
pessimistic | -20.201 |
categ | -20.155 |
contrasting | -19.975 |
Token | / |
Token ID | 14 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
eers | +7.511 |
Transactions | +6.696 |
culosis | +6.583 |
Works | +6.578 |
Companies | +6.468 |
Neg logit contributions | |
damaging | -8.526 |
categ | -8.382 |
meaningful | -8.365 |
contrasting | -8.328 |
consequential | -8.188 |
Token | CBC |
Token ID | 29208 |
Feature activation | -8.86e-01 |
Pos logit contributions | |
eers | +5.441 |
culosis | +4.693 |
Queue | +4.567 |
Transactions | +4.548 |
Works | +4.320 |
Neg logit contributions | |
damaging | -10.849 |
contrasting | -10.711 |
meaningful | -10.699 |
categ | -10.649 |
consequential | -10.582 |
Token | ) |
Token ID | 8 |
Feature activation | -4.95e-01 |
Pos logit contributions | |
eers | +3.253 |
culosis | +2.922 |
Transactions | +2.898 |
Works | +2.817 |
Companies | +2.709 |
Neg logit contributions | |
damaging | -5.675 |
meaningful | -5.608 |
categ | -5.607 |
insofar | -5.499 |
contrasting | -5.487 |
Token |
|
Token ID | 198 |
Feature activation | +8.74e-01 |
Pos logit contributions | |
eers | +2.180 |
culosis | +1.991 |
Works | +1.969 |
Transactions | +1.967 |
Companies | +1.909 |
Neg logit contributions | |
damaging | -2.901 |
meaningful | -2.853 |
categ | -2.851 |
contrasting | -2.824 |
insofar | -2.797 |
Token | . |
Token ID | 13 |
Feature activation | -6.02e-01 |
Pos logit contributions | |
damaging | +0.802 |
contrasting | +0.767 |
meaningful | +0.766 |
categ | +0.765 |
pessimistic | +0.758 |
Neg logit contributions | |
eers | -1.138 |
culosis | -1.043 |
Transactions | -1.028 |
Works | -1.017 |
Companies | -0.997 |
Token | The |
Token ID | 383 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
eers | +2.296 |
Transactions | +2.066 |
Works | +2.034 |
culosis | +1.996 |
Companies | +1.974 |
Neg logit contributions | |
damaging | -3.887 |
meaningful | -3.818 |
contrasting | -3.767 |
categ | -3.761 |
consequential | -3.726 |
Token | Lac |
Token ID | 23115 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
eers | +1.287 |
culosis | +1.185 |
Transactions | +1.144 |
Works | +1.142 |
Facility | +1.113 |
Neg logit contributions | |
damaging | -1.366 |
insofar | -1.342 |
meaningful | -1.337 |
contrasting | -1.304 |
categ | -1.303 |
Token | anian |
Token ID | 38336 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
damaging | +5.468 |
meaningful | +5.369 |
categ | +5.284 |
contrasting | +5.277 |
insofar | +5.254 |
Neg logit contributions | |
eers | -5.832 |
culosis | -5.452 |
Transactions | -5.221 |
Works | -5.059 |
Companies | -4.990 |
Token | do |
Token ID | 466 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
eers | +1.202 |
culosis | +1.092 |
Transactions | +1.060 |
Works | +1.057 |
Facility | +1.017 |
Neg logit contributions | |
damaging | -1.086 |
meaningful | -1.054 |
insofar | -1.033 |
contrasting | -1.031 |
compelling | -1.013 |
Token | jo |
Token ID | 7639 |
Feature activation | -3.88e+00 |
Pos logit contributions | |
eers | +7.359 |
culosis | +6.359 |
Works | +6.150 |
Transactions | +5.964 |
Facility | +5.927 |
Neg logit contributions | |
damaging | -7.753 |
categ | -7.475 |
contrasting | -7.435 |
meaningful | -7.356 |
wounding | -7.356 |
Token | . |
Token ID | 13 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
eers | +20.132 |
Works | +17.942 |
culosis | +17.517 |
Queue | +17.379 |
Services | +17.072 |
Neg logit contributions | |
damaging | -11.485 |
meaningful | -10.761 |
consequential | -10.454 |
contrasting | -10.422 |
wounding | -10.257 |
Token |
|
Token ID | 198 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
eers | +3.802 |
Works | +3.492 |
Transactions | +3.424 |
culosis | +3.402 |
Companies | +3.308 |
Neg logit contributions | |
damaging | -6.563 |
meaningful | -6.428 |
contrasting | -6.364 |
categ | -6.317 |
consequential | -6.275 |
Token |
|
Token ID | 198 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
damaging | +2.657 |
meaningful | +2.612 |
insofar | +2.564 |
categ | +2.509 |
ignoring | +2.505 |
Neg logit contributions | |
eers | -2.961 |
culosis | -2.938 |
Transactions | -2.697 |
Works | -2.567 |
Facility | -2.535 |
Token | We |
Token ID | 1135 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
eers | +4.080 |
Queue | +3.569 |
culosis | +3.376 |
Works | +3.296 |
Transactions | +3.268 |
Neg logit contributions | |
damaging | -7.304 |
meaningful | -7.177 |
contrasting | -7.176 |
categ | -7.068 |
consequential | -7.021 |
Token | live |
Token ID | 2107 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
eers | +5.962 |
culosis | +5.501 |
Works | +5.193 |
Transactions | +5.181 |
Queue | +5.144 |
Neg logit contributions | |
damaging | -6.372 |
meaningful | -6.239 |
categ | -6.112 |
insofar | -6.085 |
contrasting | -6.042 |
Token | different |
Token ID | 1180 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
eers | +3.793 |
culosis | +3.542 |
Works | +3.479 |
Transactions | +3.449 |
Facility | +3.434 |
Neg logit contributions | |
insofar | -2.896 |
damaging | -2.893 |
categ | -2.800 |
meaningful | -2.780 |
contrasting | -2.764 |
Token | flight |
Token ID | 5474 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
eers | +7.482 |
Facility | +6.823 |
Works | +6.731 |
culosis | +6.701 |
Companies | +6.580 |
Neg logit contributions | |
damaging | -8.192 |
insofar | -8.095 |
contrasting | -7.970 |
categ | -7.902 |
meaningful | -7.891 |
Token | ( |
Token ID | 357 |
Feature activation | +9.54e-03 |
Pos logit contributions | |
eers | +3.864 |
culosis | +3.515 |
Facility | +3.435 |
Works | +3.413 |
Transactions | +3.387 |
Neg logit contributions | |
damaging | -2.929 |
categ | -2.868 |
meaningful | -2.847 |
contrasting | -2.816 |
insofar | -2.761 |
Token | because |
Token ID | 13893 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
damaging | +0.052 |
meaningful | +0.051 |
categ | +0.051 |
contrasting | +0.050 |
insofar | +0.050 |
Neg logit contributions | |
eers | -0.047 |
culosis | -0.043 |
Transactions | -0.041 |
Works | -0.041 |
Queue | -0.040 |
Token | Exp |
Token ID | 5518 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
eers | +11.449 |
Works | +10.519 |
Companies | +10.280 |
Transactions | +10.241 |
Services | +10.208 |
Neg logit contributions | |
damaging | -8.298 |
meaningful | -8.058 |
contrasting | -8.050 |
categ | -8.023 |
pessimistic | -8.001 |
Token | edia |
Token ID | 5507 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
eers | +3.768 |
culosis | +3.189 |
Transactions | +3.007 |
Works | +2.926 |
Services | +2.735 |
Neg logit contributions | |
damaging | -9.278 |
contrasting | -9.193 |
meaningful | -9.082 |
insofar | -9.040 |
categ | -9.013 |
Token | informed |
Token ID | 7981 |
Feature activation | -2.35e+00 |
Pos logit contributions | |
eers | +19.288 |
Services | +17.902 |
Works | +17.692 |
Transactions | +17.612 |
Companies | +17.387 |
Neg logit contributions | |
damaging | -12.235 |
contrasting | -12.088 |
meaningful | -12.072 |
insofar | -11.814 |
wounding | -11.807 |
Token | her |
Token ID | 607 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
eers | +10.842 |
Companies | +9.927 |
Transactions | +9.800 |
Works | +9.651 |
Services | +9.647 |
Neg logit contributions | |
damaging | -10.456 |
contrasting | -10.289 |
meaningful | -10.165 |
categ | -10.160 |
insofar | -10.153 |
Token | that |
Token ID | 326 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
damaging | +0.958 |
meaningful | +0.941 |
contrasting | +0.930 |
categ | +0.929 |
insofar | +0.922 |
Neg logit contributions | |
eers | -0.990 |
culosis | -0.919 |
Transactions | -0.882 |
Works | -0.865 |
Companies | -0.855 |
Token | her |
Token ID | 607 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
eers | +10.454 |
Works | +9.826 |
Companies | +9.665 |
culosis | +9.618 |
Transactions | +9.599 |
Neg logit contributions | |
damaging | -7.942 |
contrasting | -7.810 |
categ | -7.723 |
meaningful | -7.671 |
pessimistic | -7.662 |
Token | original |
Token ID | 2656 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
eers | +3.303 |
culosis | +3.015 |
Transactions | +2.971 |
Works | +2.958 |
Companies | +2.908 |
Neg logit contributions | |
damaging | -3.002 |
insofar | -2.962 |
contrasting | -2.945 |
meaningful | -2.937 |
categ | -2.917 |
Token | . |
Token ID | 13 |
Feature activation | -1.90e+00 |
Pos logit contributions | |
eers | +7.540 |
Works | +6.863 |
culosis | +6.837 |
Companies | +6.658 |
Transactions | +6.636 |
Neg logit contributions | |
contrasting | -5.171 |
meaningful | -5.165 |
categ | -5.161 |
damaging | -5.153 |
pessimistic | -4.973 |
Token | While |
Token ID | 2893 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
eers | +6.445 |
Transactions | +6.044 |
Works | +6.031 |
Companies | +5.952 |
culosis | +5.713 |
Neg logit contributions | |
damaging | -11.999 |
meaningful | -11.859 |
contrasting | -11.751 |
categ | -11.666 |
consequential | -11.627 |
Token | the |
Token ID | 262 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
eers | +8.491 |
culosis | +7.896 |
Works | +7.833 |
Companies | +7.586 |
Transactions | +7.571 |
Neg logit contributions | |
meaningful | -5.795 |
categ | -5.784 |
damaging | -5.709 |
contrasting | -5.616 |
insofar | -5.606 |
Token | c |
Token ID | 269 |
Feature activation | -7.11e-01 |
Pos logit contributions | |
eers | +8.215 |
culosis | +7.386 |
Works | +7.351 |
Transactions | +7.201 |
Companies | +7.156 |
Neg logit contributions | |
damaging | -6.669 |
meaningful | -6.658 |
insofar | -6.608 |
categ | -6.535 |
contrasting | -6.411 |
Token | uck |
Token ID | 1347 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
eers | +2.346 |
culosis | +1.943 |
atcher | +1.825 |
Transactions | +1.734 |
acas | +1.730 |
Neg logit contributions | |
damaging | -5.005 |
meaningful | -4.984 |
contrasting | -4.941 |
categ | -4.894 |
consequential | -4.888 |
Token | oo |
Token ID | 2238 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
eers | +7.297 |
culosis | +5.922 |
atcher | +5.435 |
Works | +5.348 |
Queue | +5.283 |
Neg logit contributions | |
damaging | -13.406 |
categ | -13.285 |
meaningful | -13.164 |
contrasting | -13.099 |
consequential | -13.071 |
Token | is |
Token ID | 318 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
eers | +19.352 |
culosis | +16.360 |
Works | +16.114 |
atcher | +15.718 |
ttes | +15.702 |
Neg logit contributions | |
categ | -12.293 |
meaningful | -12.012 |
consequential | -11.720 |
contrasting | -11.646 |
damaging | -11.358 |
Token | in |
Token ID | 287 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
eers | +8.744 |
culosis | +7.972 |
Works | +7.936 |
Transactions | +7.703 |
Companies | +7.686 |
Neg logit contributions | |
categ | -4.444 |
meaningful | -4.269 |
insofar | -4.268 |
contrasting | -4.200 |
consequential | -4.164 |
Token | the |
Token ID | 262 |
Feature activation | -1.76e+00 |
Pos logit contributions | |
eers | +9.606 |
Works | +8.598 |
Transactions | +8.579 |
culosis | +8.517 |
Companies | +8.390 |
Neg logit contributions | |
categ | -7.789 |
contrasting | -7.787 |
damaging | -7.766 |
meaningful | -7.712 |
insofar | -7.675 |
Token | hospital |
Token ID | 4436 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
eers | +9.224 |
Works | +8.563 |
Transactions | +8.354 |
culosis | +8.104 |
Facility | +8.028 |
Neg logit contributions | |
meaningful | -7.348 |
categ | -7.290 |
damaging | -7.247 |
contrasting | -7.219 |
insofar | -7.203 |
Token | , |
Token ID | 11 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
eers | +12.009 |
culosis | +11.248 |
Works | +10.879 |
Facility | +10.715 |
Transactions | +10.543 |
Neg logit contributions | |
meaningful | -8.042 |
damaging | -7.904 |
categ | -7.895 |
contrasting | -7.861 |
compelling | -7.697 |
Token | . |
Token ID | 13 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
eers | +0.250 |
culosis | +0.228 |
Works | +0.220 |
Transactions | +0.217 |
Companies | +0.213 |
Neg logit contributions | |
damaging | -0.209 |
categ | -0.207 |
meaningful | -0.206 |
pessimistic | -0.202 |
insofar | -0.202 |
Token | ( |
Token ID | 357 |
Feature activation | -7.51e-01 |
Pos logit contributions | |
eers | +6.206 |
Works | +5.976 |
Companies | +5.728 |
Transactions | +5.652 |
Services | +5.523 |
Neg logit contributions | |
damaging | -10.151 |
categ | -10.110 |
consequential | -10.051 |
meaningful | -10.015 |
wounding | -9.986 |
Token | Wa |
Token ID | 33484 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
eers | +3.448 |
culosis | +3.106 |
Queue | +3.062 |
Transactions | +2.987 |
Works | +2.979 |
Neg logit contributions | |
damaging | -4.243 |
meaningful | -4.154 |
categ | -4.143 |
contrasting | -4.109 |
insofar | -4.086 |
Token | ub |
Token ID | 549 |
Feature activation | -2.57e+00 |
Pos logit contributions | |
eers | +5.647 |
culosis | +5.177 |
Transactions | +4.845 |
Queue | +4.773 |
Works | +4.686 |
Neg logit contributions | |
damaging | -7.698 |
meaningful | -7.493 |
contrasting | -7.459 |
categ | -7.454 |
consequential | -7.350 |
Token | ges |
Token ID | 3212 |
Feature activation | -2.51e+00 |
Pos logit contributions | |
eers | +7.189 |
culosis | +6.057 |
Works | +5.269 |
Transactions | +4.980 |
ttes | +4.875 |
Neg logit contributions | |
damaging | -17.810 |
contrasting | -17.755 |
pessimistic | -17.573 |
meaningful | -17.499 |
consequential | -17.358 |
Token | hig |
Token ID | 25196 |
Feature activation | -3.77e+00 |
Pos logit contributions | |
eers | +10.505 |
culosis | +9.370 |
ttes | +8.342 |
acas | +8.319 |
Queue | +8.292 |
Neg logit contributions | |
contrasting | -13.730 |
damaging | -13.681 |
categ | -13.535 |
meaningful | -13.427 |
consequential | -13.324 |
Token | Rice |
Token ID | 13823 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
eers | +12.951 |
Transactions | +11.716 |
Services | +11.614 |
Works | +11.561 |
Companies | +11.407 |
Neg logit contributions | |
consequential | -19.229 |
damaging | -18.996 |
categ | -18.823 |
pessimistic | -18.811 |
meaningful | -18.641 |
Token | / |
Token ID | 14 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
eers | +7.977 |
Transactions | +7.127 |
Works | +7.004 |
culosis | +6.995 |
Companies | +6.892 |
Neg logit contributions | |
damaging | -9.073 |
categ | -8.931 |
meaningful | -8.908 |
contrasting | -8.867 |
consequential | -8.741 |
Token | CBC |
Token ID | 29208 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
eers | +5.154 |
culosis | +4.477 |
Transactions | +4.342 |
Queue | +4.334 |
Works | +4.132 |
Neg logit contributions | |
damaging | -10.015 |
contrasting | -9.880 |
meaningful | -9.867 |
categ | -9.843 |
consequential | -9.754 |
Token | ) |
Token ID | 8 |
Feature activation | -6.55e-01 |
Pos logit contributions | |
eers | +3.809 |
Transactions | +3.345 |
culosis | +3.341 |
Works | +3.236 |
Companies | +3.151 |
Neg logit contributions | |
damaging | -6.239 |
categ | -6.154 |
meaningful | -6.151 |
contrasting | -6.083 |
consequential | -6.042 |
Token | Carter |
Token ID | 10831 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
eers | +2.830 |
Works | +2.604 |
culosis | +2.598 |
Transactions | +2.555 |
Companies | +2.532 |
Neg logit contributions | |
damaging | -3.810 |
categ | -3.760 |
meaningful | -3.735 |
contrasting | -3.721 |
consequential | -3.705 |
Token | It |
Token ID | 632 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
eers | +4.965 |
Transactions | +4.662 |
Companies | +4.485 |
Works | +4.441 |
culosis | +4.267 |
Neg logit contributions | |
damaging | -9.896 |
categ | -9.675 |
meaningful | -9.668 |
wounding | -9.633 |
consequential | -9.576 |
Token | is |
Token ID | 318 |
Feature activation | -5.48e-01 |
Pos logit contributions | |
eers | +9.967 |
culosis | +8.904 |
Works | +8.825 |
Transactions | +8.537 |
Companies | +8.394 |
Neg logit contributions | |
damaging | -10.428 |
meaningful | -10.028 |
consequential | -9.969 |
categ | -9.961 |
wounding | -9.860 |
Token | a |
Token ID | 257 |
Feature activation | +9.31e-02 |
Pos logit contributions | |
eers | +3.472 |
culosis | +3.217 |
Transactions | +3.150 |
Works | +3.133 |
Companies | +3.090 |
Neg logit contributions | |
damaging | -2.031 |
categ | -1.957 |
meaningful | -1.951 |
insofar | -1.944 |
contrasting | -1.913 |
Token | peer |
Token ID | 12720 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
damaging | +0.445 |
insofar | +0.430 |
meaningful | +0.427 |
categ | +0.426 |
contrasting | +0.423 |
Neg logit contributions | |
eers | -0.516 |
culosis | -0.476 |
Transactions | -0.466 |
Works | -0.459 |
Companies | -0.450 |
Token | - |
Token ID | 12 |
Feature activation | -7.33e-02 |
Pos logit contributions | |
eers | +1.293 |
culosis | +1.224 |
Transactions | +1.204 |
Companies | +1.174 |
Works | +1.162 |
Neg logit contributions | |
damaging | -1.408 |
categ | -1.360 |
wounding | -1.360 |
insofar | -1.350 |
contrasting | -1.333 |
Token | to |
Token ID | 1462 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
eers | +0.282 |
culosis | +0.257 |
Transactions | +0.244 |
Works | +0.239 |
Companies | +0.237 |
Neg logit contributions | |
damaging | -0.473 |
categ | -0.464 |
meaningful | -0.460 |
wounding | -0.457 |
contrasting | -0.456 |
Token | - |
Token ID | 12 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
eers | +12.485 |
Queue | +10.455 |
Transactions | +10.128 |
Companies | +10.087 |
Works | +10.071 |
Neg logit contributions | |
contrasting | -19.119 |
categ | -19.007 |
wounding | -18.943 |
damaging | -18.714 |
consequential | -18.480 |
Token | peer |
Token ID | 33350 |
Feature activation | -6.88e-01 |
Pos logit contributions | |
eers | +6.477 |
culosis | +5.867 |
Queue | +5.665 |
Transactions | +5.628 |
Works | +5.536 |
Neg logit contributions | |
damaging | -9.495 |
categ | -9.411 |
contrasting | -9.306 |
wounding | -9.233 |
meaningful | -9.181 |
Token | app |
Token ID | 598 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
eers | +3.528 |
Transactions | +3.208 |
culosis | +3.191 |
Works | +3.133 |
Companies | +3.062 |
Neg logit contributions | |
damaging | -3.406 |
categ | -3.282 |
meaningful | -3.267 |
contrasting | -3.257 |
insofar | -3.242 |
Token | , |
Token ID | 11 |
Feature activation | +8.52e-01 |
Pos logit contributions | |
eers | +8.759 |
culosis | +8.045 |
Works | +7.777 |
Companies | +7.728 |
Exchange | +7.723 |
Neg logit contributions | |
damaging | -6.183 |
categ | -5.986 |
meaningful | -5.870 |
wounding | -5.839 |
consequential | -5.802 |
Token | founded |
Token ID | 9393 |
Feature activation | -9.04e-01 |
Pos logit contributions | |
damaging | +3.586 |
meaningful | +3.486 |
categ | +3.446 |
contrasting | +3.417 |
insofar | +3.388 |
Neg logit contributions | |
eers | -5.280 |
culosis | -4.963 |
Transactions | -4.813 |
Works | -4.719 |
Companies | -4.646 |
Token | April |
Token ID | 3035 |
Feature activation | +9.05e-01 |
Pos logit contributions | |
eers | +5.151 |
Works | +4.595 |
Transactions | +4.539 |
culosis | +4.496 |
Companies | +4.496 |
Neg logit contributions | |
damaging | -6.337 |
insofar | -6.326 |
categ | -6.287 |
meaningful | -6.268 |
contrasting | -6.232 |
Token | 6 |
Token ID | 718 |
Feature activation | +9.04e-01 |
Pos logit contributions | |
damaging | +4.396 |
meaningful | +4.295 |
insofar | +4.202 |
contrasting | +4.201 |
categ | +4.168 |
Neg logit contributions | |
eers | -4.950 |
culosis | -4.760 |
Transactions | -4.426 |
Works | -4.253 |
Companies | -4.237 |
Token | . |
Token ID | 13 |
Feature activation | -2.07e+00 |
Pos logit contributions | |
damaging | +4.067 |
meaningful | +4.001 |
categ | +3.973 |
contrasting | +3.900 |
insofar | +3.874 |
Neg logit contributions | |
eers | -5.382 |
culosis | -5.024 |
Transactions | -4.873 |
Works | -4.778 |
Facility | -4.718 |
Token | That |
Token ID | 1320 |
Feature activation | -3.06e+00 |
Pos logit contributions | |
eers | +6.913 |
Transactions | +6.720 |
Works | +6.684 |
Companies | +6.511 |
Facility | +6.386 |
Neg logit contributions | |
meaningful | -12.206 |
damaging | -12.201 |
categ | -12.091 |
contrasting | -12.040 |
wounding | -11.970 |
Token | spac |
Token ID | 34752 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
eers | +15.404 |
Works | +13.996 |
Facility | +13.828 |
culosis | +13.628 |
Exchange | +13.318 |
Neg logit contributions | |
contrasting | -10.775 |
damaging | -10.580 |
insofar | -10.501 |
meaningful | -10.320 |
conced | -10.226 |
Token | ew |
Token ID | 413 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
eers | +8.202 |
culosis | +7.169 |
Works | +6.654 |
Queue | +6.508 |
Facility | +6.448 |
Neg logit contributions | |
damaging | -12.530 |
categ | -12.217 |
contrasting | -12.192 |
consequential | -12.172 |
meaningful | -12.151 |
Token | alk |
Token ID | 971 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
eers | +12.577 |
atcher | +10.914 |
culosis | +10.344 |
Queue | +10.260 |
acas | +10.254 |
Neg logit contributions | |
consequential | -20.382 |
contrasting | -19.952 |
pessimistic | -19.820 |
categ | -19.719 |
meaningful | -19.688 |
Token | , |
Token ID | 11 |
Feature activation | -6.69e-03 |
Pos logit contributions | |
eers | +14.160 |
Works | +12.244 |
Facility | +12.215 |
culosis | +12.176 |
Queue | +12.005 |
Neg logit contributions | |
meaningful | -12.246 |
damaging | -12.114 |
categ | -12.108 |
contrasting | -12.016 |
insofar | -11.980 |
Token | Gat |
Token ID | 29074 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
eers | +0.036 |
culosis | +0.033 |
Transactions | +0.033 |
Works | +0.033 |
Facility | +0.032 |
Neg logit contributions | |
damaging | -0.032 |
categ | -0.032 |
meaningful | -0.032 |
contrasting | -0.031 |
insofar | -0.031 |
Token | ens |
Token ID | 641 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
eers | +2.553 |
culosis | +2.328 |
Transactions | +2.204 |
Works | +2.156 |
Companies | +2.110 |
Neg logit contributions | |
damaging | -3.261 |
meaningful | -3.205 |
contrasting | -3.179 |
categ | -3.175 |
insofar | -3.153 |
Token | said |
Token ID | 531 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
eers | +0.624 |
culosis | +0.549 |
Works | +0.525 |
Transactions | +0.523 |
Companies | +0.519 |
Neg logit contributions | |
damaging | -0.956 |
meaningful | -0.941 |
insofar | -0.930 |
contrasting | -0.928 |
categ | -0.922 |
Token |
|
Token ID | 198 |
Feature activation | +7.72e-01 |
Pos logit contributions | |
damaging | +1.380 |
meaningful | +1.369 |
insofar | +1.340 |
categ | +1.339 |
contrasting | +1.337 |
Neg logit contributions | |
eers | -1.001 |
culosis | -0.905 |
Transactions | -0.890 |
Works | -0.862 |
Facility | -0.843 |
Token |
|
Token ID | 198 |
Feature activation | -4.59e-01 |
Pos logit contributions | |
damaging | +3.689 |
meaningful | +3.610 |
insofar | +3.543 |
categ | +3.477 |
ignoring | +3.463 |
Neg logit contributions | |
eers | -4.144 |
culosis | -4.103 |
Transactions | -3.771 |
Works | -3.585 |
Companies | -3.543 |
Token | T |
Token ID | 51 |
Feature activation | +8.52e-01 |
Pos logit contributions | |
eers | +1.757 |
culosis | +1.507 |
Queue | +1.500 |
Transactions | +1.486 |
Works | +1.403 |
Neg logit contributions | |
damaging | -2.975 |
meaningful | -2.971 |
contrasting | -2.924 |
categ | -2.915 |
insofar | -2.892 |
Token | ric |
Token ID | 1173 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
damaging | +3.984 |
meaningful | +3.926 |
contrasting | +3.847 |
categ | +3.838 |
insofar | +3.822 |
Neg logit contributions | |
eers | -4.962 |
culosis | -4.650 |
Transactions | -4.436 |
Works | -4.328 |
Companies | -4.259 |
Token | er |
Token ID | 263 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
eers | +4.926 |
culosis | +4.374 |
Transactions | +4.148 |
Works | +4.069 |
Facility | +3.964 |
Neg logit contributions | |
damaging | -6.666 |
meaningful | -6.650 |
categ | -6.603 |
contrasting | -6.559 |
insofar | -6.471 |
Token | at |
Token ID | 265 |
Feature activation | -3.71e+00 |
Pos logit contributions | |
eers | +5.173 |
culosis | +4.631 |
atcher | +3.724 |
Transactions | +3.689 |
acas | +3.567 |
Neg logit contributions | |
damaging | -17.948 |
meaningful | -17.943 |
contrasting | -17.812 |
categ | -17.540 |
consequential | -17.540 |
Token | ops |
Token ID | 2840 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
eers | +5.882 |
culosis | +3.781 |
acas | +3.275 |
Works | +3.202 |
Transactions | +2.839 |
Neg logit contributions | |
contrasting | -27.413 |
pessimistic | -27.076 |
categ | -26.822 |
consequential | -26.747 |
meaningful | -26.728 |
Token | # |
Token ID | 1303 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
eers | +7.035 |
Transactions | +6.331 |
Works | +6.049 |
culosis | +6.035 |
Facility | +6.033 |
Neg logit contributions | |
damaging | -13.793 |
meaningful | -13.706 |
pessimistic | -13.665 |
insofar | -13.522 |
contrasting | -13.521 |
Token | 1 |
Token ID | 16 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
eers | +0.639 |
culosis | +0.590 |
Transactions | +0.580 |
Works | +0.568 |
Companies | +0.557 |
Neg logit contributions | |
damaging | -0.616 |
meaningful | -0.609 |
insofar | -0.596 |
categ | -0.595 |
contrasting | -0.595 |
Token |
|
Token ID | 198 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
damaging | +2.862 |
meaningful | +2.829 |
insofar | +2.779 |
contrasting | +2.774 |
categ | +2.773 |
Neg logit contributions | |
eers | -2.097 |
culosis | -1.909 |
Transactions | -1.853 |
Works | -1.794 |
Facility | -1.758 |
Token |
|
Token ID | 198 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
damaging | +5.619 |
meaningful | +5.491 |
insofar | +5.384 |
ignoring | +5.258 |
compelling | +5.251 |
Neg logit contributions | |
culosis | -7.196 |
eers | -7.093 |
Transactions | -6.540 |
Works | -6.182 |
Companies | -6.114 |
Token | had |
Token ID | 550 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
eers | +1.986 |
culosis | +1.716 |
Transactions | +1.676 |
Works | +1.629 |
Companies | +1.608 |
Neg logit contributions | |
damaging | -3.006 |
meaningful | -2.988 |
contrasting | -2.931 |
categ | -2.926 |
insofar | -2.895 |
Token | noted |
Token ID | 4367 |
Feature activation | +4.04e-01 |
Pos logit contributions | |
eers | +0.924 |
culosis | +0.836 |
Transactions | +0.814 |
Works | +0.799 |
Companies | +0.791 |
Neg logit contributions | |
damaging | -0.911 |
meaningful | -0.900 |
contrasting | -0.879 |
categ | -0.876 |
insofar | -0.864 |
Token | that |
Token ID | 326 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
damaging | +2.045 |
meaningful | +2.014 |
categ | +1.969 |
contrasting | +1.961 |
insofar | +1.957 |
Neg logit contributions | |
eers | -2.148 |
culosis | -1.955 |
Transactions | -1.913 |
Works | -1.865 |
Companies | -1.856 |
Token | the |
Token ID | 262 |
Feature activation | -5.99e-01 |
Pos logit contributions | |
eers | +1.615 |
culosis | +1.446 |
Transactions | +1.437 |
Works | +1.421 |
Companies | +1.406 |
Neg logit contributions | |
damaging | -1.321 |
meaningful | -1.291 |
categ | -1.268 |
contrasting | -1.265 |
insofar | -1.244 |
Token | joint |
Token ID | 6466 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
eers | +3.043 |
Transactions | +2.726 |
culosis | +2.686 |
Works | +2.675 |
Companies | +2.660 |
Neg logit contributions | |
damaging | -3.041 |
meaningful | -2.996 |
insofar | -2.950 |
contrasting | -2.911 |
categ | -2.905 |
Token | venture |
Token ID | 13189 |
Feature activation | -3.68e+00 |
Pos logit contributions | |
eers | +10.610 |
Companies | +9.563 |
Transactions | +9.315 |
Works | +9.155 |
Facility | +9.108 |
Neg logit contributions | |
damaging | -13.170 |
meaningful | -12.882 |
contrasting | -12.854 |
insofar | -12.767 |
ignoring | -12.725 |
Token | was |
Token ID | 373 |
Feature activation | -7.46e-01 |
Pos logit contributions | |
eers | +18.165 |
Companies | +16.050 |
Transactions | +15.835 |
Works | +15.643 |
Facility | +15.610 |
Neg logit contributions | |
damaging | -11.878 |
pessimistic | -11.664 |
categ | -11.642 |
contrasting | -11.457 |
meaningful | -11.363 |
Token | signed |
Token ID | 4488 |
Feature activation | -3.45e-01 |
Pos logit contributions | |
eers | +4.481 |
Transactions | +4.166 |
culosis | +4.120 |
Companies | +4.111 |
Works | +4.096 |
Neg logit contributions | |
damaging | -2.706 |
contrasting | -2.665 |
categ | -2.631 |
insofar | -2.623 |
meaningful | -2.613 |
Token | without |
Token ID | 1231 |
Feature activation | -6.63e-01 |
Pos logit contributions | |
eers | +2.159 |
culosis | +1.997 |
Transactions | +1.961 |
Companies | +1.956 |
Works | +1.953 |
Neg logit contributions | |
damaging | -1.325 |
categ | -1.288 |
meaningful | -1.281 |
contrasting | -1.261 |
pessimistic | -1.242 |
Token | any |
Token ID | 597 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
eers | +3.913 |
Transactions | +3.494 |
Companies | +3.462 |
culosis | +3.436 |
Works | +3.431 |
Neg logit contributions | |
damaging | -2.710 |
insofar | -2.705 |
contrasting | -2.636 |
categ | -2.626 |
pessimistic | -2.609 |
Token | formal |
Token ID | 8766 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
eers | +0.128 |
culosis | +0.115 |
Transactions | +0.114 |
Works | +0.111 |
Companies | +0.111 |
Neg logit contributions | |
damaging | -0.111 |
insofar | -0.109 |
contrasting | -0.108 |
meaningful | -0.107 |
categ | -0.107 |
Token | .' |
Token ID | 2637 |
Feature activation | -6.39e-02 |
Pos logit contributions | |
eers | +2.610 |
culosis | +2.366 |
Works | +2.338 |
Transactions | +2.315 |
Facility | +2.301 |
Neg logit contributions | |
categ | -1.821 |
damaging | -1.809 |
contrasting | -1.789 |
meaningful | -1.743 |
pessimistic | -1.718 |
Token |
|
Token ID | 198 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
eers | +0.270 |
culosis | +0.249 |
Transactions | +0.244 |
Works | +0.237 |
Companies | +0.234 |
Neg logit contributions | |
damaging | -0.384 |
meaningful | -0.381 |
categ | -0.379 |
contrasting | -0.374 |
insofar | -0.373 |
Token |
|
Token ID | 198 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
damaging | +3.876 |
meaningful | +3.799 |
insofar | +3.729 |
ignoring | +3.657 |
compelling | +3.648 |
Neg logit contributions | |
culosis | -4.533 |
eers | -4.505 |
Transactions | -4.144 |
Works | -3.901 |
Facility | -3.869 |
Token | The |
Token ID | 464 |
Feature activation | -7.42e-01 |
Pos logit contributions | |
eers | +5.742 |
Queue | +5.119 |
Services | +4.865 |
Transactions | +4.769 |
Works | +4.691 |
Neg logit contributions | |
categ | -9.608 |
meaningful | -9.520 |
contrasting | -9.498 |
damaging | -9.442 |
consequential | -9.355 |
Token | Gross |
Token ID | 21796 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
eers | +3.852 |
culosis | +3.530 |
Transactions | +3.509 |
Works | +3.447 |
Facility | +3.418 |
Neg logit contributions | |
insofar | -3.557 |
meaningful | -3.511 |
categ | -3.497 |
damaging | -3.475 |
contrasting | -3.434 |
Token | man |
Token ID | 805 |
Feature activation | -3.63e+00 |
Pos logit contributions | |
eers | +5.641 |
culosis | +5.064 |
Transactions | +4.897 |
Works | +4.881 |
Facility | +4.807 |
Neg logit contributions | |
damaging | -6.639 |
categ | -6.592 |
contrasting | -6.572 |
meaningful | -6.557 |
insofar | -6.475 |
Token | Burn |
Token ID | 8942 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
eers | +14.651 |
Facility | +14.432 |
culosis | +14.151 |
Works | +13.879 |
Exchange | +13.123 |
Neg logit contributions | |
meaningful | -14.681 |
insofar | -14.523 |
contrasting | -14.430 |
categ | -14.344 |
damaging | -13.965 |
Token | Center |
Token ID | 3337 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
eers | +10.874 |
Facility | +10.261 |
culosis | +9.855 |
Works | +9.664 |
Services | +9.447 |
Neg logit contributions | |
meaningful | -12.951 |
damaging | -12.882 |
insofar | -12.866 |
contrasting | -12.787 |
categ | -12.714 |
Token | was |
Token ID | 373 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
eers | +16.544 |
Facility | +15.148 |
Works | +14.975 |
Services | +14.804 |
Transactions | +14.570 |
Neg logit contributions | |
damaging | -11.774 |
meaningful | -11.689 |
categ | -11.556 |
contrasting | -11.548 |
consequential | -11.270 |
Token | founded |
Token ID | 9393 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
eers | +10.438 |
culosis | +9.856 |
Facility | +9.821 |
Companies | +9.578 |
Works | +9.566 |
Neg logit contributions | |
damaging | -7.034 |
insofar | -7.030 |
contrasting | -6.934 |
meaningful | -6.921 |
categ | -6.856 |
Token | by |
Token ID | 416 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
eers | +7.999 |
culosis | +7.470 |
Works | +7.361 |
Companies | +7.286 |
Facility | +7.076 |
Neg logit contributions | |
categ | -5.592 |
damaging | -5.569 |
contrasting | -5.392 |
meaningful | -5.390 |
consequential | -5.329 |
Token | Boston |
Token ID | 6182 |
Feature activation | +8.19e-02 |
Pos logit contributions | |
damaging | +1.217 |
meaningful | +1.196 |
categ | +1.183 |
insofar | +1.178 |
contrasting | +1.174 |
Neg logit contributions | |
eers | -0.945 |
culosis | -0.864 |
Transactions | -0.837 |
Works | -0.827 |
Companies | -0.805 |
Token | . |
Token ID | 13 |
Feature activation | -2.26e+00 |
Pos logit contributions | |
damaging | +0.553 |
meaningful | +0.545 |
categ | +0.537 |
insofar | +0.535 |
contrasting | +0.533 |
Neg logit contributions | |
eers | -0.302 |
culosis | -0.276 |
Transactions | -0.263 |
Works | -0.261 |
Companies | -0.253 |
Token | com |
Token ID | 785 |
Feature activation | -2.25e+00 |
Pos logit contributions | |
eers | +9.485 |
culosis | +8.867 |
Works | +8.857 |
Transactions | +8.469 |
Companies | +8.436 |
Neg logit contributions | |
damaging | -11.495 |
meaningful | -11.212 |
categ | -11.187 |
contrasting | -11.141 |
consequential | -10.908 |
Token | The |
Token ID | 383 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
eers | +11.988 |
culosis | +11.196 |
Works | +10.944 |
Companies | +10.633 |
Transactions | +10.521 |
Neg logit contributions | |
categ | -9.101 |
damaging | -8.976 |
meaningful | -8.786 |
contrasting | -8.779 |
consequential | -8.525 |
Token | old |
Token ID | 1468 |
Feature activation | -2.36e+00 |
Pos logit contributions | |
eers | +5.395 |
culosis | +4.640 |
Works | +4.489 |
Facility | +4.358 |
Transactions | +4.340 |
Neg logit contributions | |
damaging | -7.723 |
meaningful | -7.683 |
insofar | -7.547 |
categ | -7.528 |
contrasting | -7.513 |
Token | building |
Token ID | 16894 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
eers | +8.219 |
culosis | +7.236 |
Works | +6.950 |
Exchange | +6.750 |
Facility | +6.611 |
Neg logit contributions | |
damaging | -13.544 |
categ | -13.384 |
contrasting | -13.126 |
meaningful | -13.104 |
insofar | -12.830 |
Token | was |
Token ID | 373 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
eers | +15.408 |
Queue | +14.005 |
culosis | +13.761 |
Companies | +13.436 |
Works | +13.425 |
Neg logit contributions | |
damaging | -14.054 |
meaningful | -13.669 |
categ | -13.610 |
pessimistic | -13.597 |
contrasting | -13.558 |
Token | renamed |
Token ID | 25121 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
eers | +6.423 |
culosis | +5.574 |
Companies | +5.458 |
swick | +5.414 |
Queue | +5.264 |
Neg logit contributions | |
damaging | -10.584 |
contrasting | -10.580 |
wounding | -10.539 |
categ | -10.538 |
pessimistic | -10.300 |
Token | for |
Token ID | 1640 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
eers | +5.158 |
culosis | +4.833 |
Works | +4.587 |
Companies | +4.491 |
Transactions | +4.420 |
Neg logit contributions | |
damaging | -5.051 |
categ | -4.980 |
contrasting | -4.964 |
meaningful | -4.900 |
consequential | -4.818 |
Token | the |
Token ID | 262 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
eers | +6.901 |
culosis | +6.187 |
Works | +6.020 |
Facility | +5.985 |
Transactions | +5.959 |
Neg logit contributions | |
damaging | -8.045 |
insofar | -8.005 |
pessimistic | -7.949 |
meaningful | -7.941 |
categ | -7.926 |
Token | shooting |
Token ID | 4395 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
eers | +6.774 |
culosis | +6.251 |
Transactions | +5.987 |
Facility | +5.964 |
Works | +5.918 |
Neg logit contributions | |
damaging | -4.726 |
meaningful | -4.698 |
categ | -4.697 |
insofar | -4.674 |
contrasting | -4.634 |
Token | facilitate |
Token ID | 15570 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
damaging | +0.202 |
meaningful | +0.202 |
categ | +0.201 |
contrasting | +0.200 |
insofar | +0.198 |
Neg logit contributions | |
eers | -0.231 |
culosis | -0.215 |
Transactions | -0.207 |
Works | -0.201 |
Companies | -0.199 |
Token | construction |
Token ID | 5103 |
Feature activation | -9.87e-01 |
Pos logit contributions | |
eers | +2.018 |
culosis | +1.790 |
Transactions | +1.773 |
Works | +1.737 |
Companies | +1.706 |
Neg logit contributions | |
insofar | -1.575 |
categ | -1.554 |
meaningful | -1.543 |
damaging | -1.536 |
contrasting | -1.529 |
Token | of |
Token ID | 286 |
Feature activation | -8.28e-01 |
Pos logit contributions | |
eers | +5.008 |
Works | +4.271 |
Transactions | +4.265 |
Companies | +4.183 |
culosis | +4.151 |
Neg logit contributions | |
categ | -4.845 |
contrasting | -4.750 |
pessimistic | -4.745 |
damaging | -4.704 |
meaningful | -4.702 |
Token | multi |
Token ID | 5021 |
Feature activation | +9.98e-03 |
Pos logit contributions | |
eers | +4.402 |
Works | +3.939 |
culosis | +3.901 |
Transactions | +3.884 |
Companies | +3.850 |
Neg logit contributions | |
insofar | -3.875 |
damaging | -3.725 |
wounding | -3.672 |
contrasting | -3.670 |
meaningful | -3.665 |
Token | - |
Token ID | 12 |
Feature activation | +7.41e-01 |
Pos logit contributions | |
insofar | +0.053 |
damaging | +0.053 |
meaningful | +0.053 |
contrasting | +0.052 |
categ | +0.052 |
Neg logit contributions | |
eers | -0.049 |
culosis | -0.046 |
Transactions | -0.044 |
Works | -0.043 |
Companies | -0.043 |
Token | store |
Token ID | 8095 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
damaging | +4.636 |
meaningful | +4.568 |
insofar | +4.525 |
contrasting | +4.506 |
categ | +4.500 |
Neg logit contributions | |
eers | -3.096 |
culosis | -2.844 |
Transactions | -2.688 |
Works | -2.605 |
Companies | -2.559 |
Token | y |
Token ID | 88 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
eers | +9.077 |
artment | +7.387 |
culosis | +6.764 |
Transactions | +6.656 |
Companies | +6.595 |
Neg logit contributions | |
insofar | -22.334 |
wounding | -22.122 |
damaging | -22.071 |
pessimistic | -21.580 |
meaningful | -21.518 |
Token | residential |
Token ID | 12420 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
eers | +9.560 |
Works | +8.669 |
Transactions | +8.539 |
Companies | +8.512 |
culosis | +8.472 |
Neg logit contributions | |
insofar | -8.816 |
wounding | -8.612 |
damaging | -8.554 |
meaningful | -8.524 |
pessimistic | -8.463 |
Token | and |
Token ID | 290 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
eers | +5.051 |
culosis | +4.497 |
Transactions | +4.438 |
Works | +4.415 |
Companies | +4.318 |
Neg logit contributions | |
damaging | -5.276 |
insofar | -5.261 |
meaningful | -5.236 |
pessimistic | -5.156 |
wounding | -5.143 |
Token | commercial |
Token ID | 5068 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
eers | +0.657 |
culosis | +0.606 |
Works | +0.587 |
Transactions | +0.585 |
Companies | +0.572 |
Neg logit contributions | |
damaging | -0.779 |
meaningful | -0.765 |
insofar | -0.763 |
contrasting | -0.753 |
ignoring | -0.741 |
Token | buildings |
Token ID | 6832 |
Feature activation | -7.10e-01 |
Pos logit contributions | |
eers | +6.643 |
Transactions | +5.788 |
culosis | +5.754 |
Works | +5.713 |
Companies | +5.645 |
Neg logit contributions | |
insofar | -7.836 |
damaging | -7.788 |
wounding | -7.750 |
meaningful | -7.696 |
pessimistic | -7.664 |
Token | MOR |
Token ID | 35208 |
Feature activation | -9.64e-01 |
Pos logit contributions | |
eers | +0.922 |
culosis | +0.860 |
Transactions | +0.827 |
Works | +0.812 |
Companies | +0.787 |
Neg logit contributions | |
damaging | -1.505 |
insofar | -1.500 |
meaningful | -1.487 |
contrasting | -1.476 |
categ | -1.455 |
Token | PH |
Token ID | 11909 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
eers | +4.337 |
Transactions | +3.894 |
culosis | +3.858 |
Works | +3.746 |
Queue | +3.743 |
Neg logit contributions | |
damaging | -5.421 |
contrasting | -5.395 |
categ | -5.373 |
meaningful | -5.325 |
consequential | -5.278 |
Token | _ |
Token ID | 62 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
eers | +6.173 |
Queue | +5.079 |
Transactions | +5.075 |
Works | +5.015 |
Companies | +4.768 |
Neg logit contributions | |
contrasting | -13.010 |
categ | -12.959 |
consequential | -12.892 |
damaging | -12.870 |
meaningful | -12.715 |
Token | BL |
Token ID | 9148 |
Feature activation | -5.71e-01 |
Pos logit contributions | |
eers | +6.185 |
Queue | +5.482 |
Works | +5.403 |
culosis | +5.373 |
Transactions | +5.305 |
Neg logit contributions | |
categ | -7.548 |
damaging | -7.481 |
consequential | -7.451 |
meaningful | -7.404 |
contrasting | -7.349 |
Token | ACK |
Token ID | 8120 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
eers | +3.212 |
culosis | +2.991 |
Transactions | +2.887 |
Works | +2.826 |
Queue | +2.794 |
Neg logit contributions | |
damaging | -2.673 |
meaningful | -2.627 |
categ | -2.599 |
contrasting | -2.595 |
insofar | -2.560 |
Token | H |
Token ID | 39 |
Feature activation | -3.55e+00 |
Pos logit contributions | |
eers | +5.859 |
Transactions | +5.041 |
Queue | +5.002 |
culosis | +4.957 |
Works | +4.924 |
Neg logit contributions | |
categ | -8.828 |
contrasting | -8.764 |
consequential | -8.733 |
damaging | -8.731 |
meaningful | -8.688 |
Token | AT |
Token ID | 1404 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
eers | +7.950 |
atcher | +7.015 |
Queue | +6.936 |
Facility | +6.320 |
Transactions | +6.160 |
Neg logit contributions | |
consequential | -23.091 |
contrasting | -22.683 |
categ | -22.584 |
meaningful | -22.141 |
conced | -21.945 |
Token | , |
Token ID | 837 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
eers | +10.301 |
Works | +9.164 |
Transactions | +8.978 |
Queue | +8.898 |
Companies | +8.823 |
Neg logit contributions | |
categ | -11.144 |
consequential | -10.989 |
contrasting | -10.975 |
damaging | -10.947 |
pessimistic | -10.688 |
Token | rect |
Token ID | 13621 |
Feature activation | +3.42e-01 |
Pos logit contributions | |
damaging | +4.503 |
meaningful | +4.353 |
categ | +4.252 |
contrasting | +4.242 |
insofar | +4.229 |
Neg logit contributions | |
eers | -9.544 |
culosis | -9.057 |
Transactions | -8.790 |
Works | -8.620 |
Companies | -8.500 |
Token | K |
Token ID | 42 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
damaging | +1.496 |
meaningful | +1.464 |
insofar | +1.426 |
categ | +1.416 |
contrasting | +1.404 |
Neg logit contributions | |
eers | -2.016 |
culosis | -1.962 |
Transactions | -1.842 |
Works | -1.771 |
Companies | -1.767 |
Token | ernel |
Token ID | 7948 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
eers | +2.326 |
culosis | +2.139 |
Transactions | +2.031 |
Works | +1.967 |
Companies | +1.934 |
Neg logit contributions | |
damaging | -2.858 |
meaningful | -2.809 |
contrasting | -2.777 |
categ | -2.776 |
insofar | -2.759 |
Token | math |
Token ID | 11018 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
damaging | +2.541 |
meaningful | +2.491 |
categ | +2.446 |
contrasting | +2.439 |
insofar | +2.437 |
Neg logit contributions | |
eers | -3.074 |
culosis | -2.883 |
Transactions | -2.771 |
Works | -2.684 |
Companies | -2.659 |
Token | . |
Token ID | 13 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
eers | +6.373 |
Works | +5.874 |
culosis | +5.708 |
Facility | +5.675 |
Transactions | +5.642 |
Neg logit contributions | |
damaging | -4.973 |
meaningful | -4.929 |
contrasting | -4.909 |
categ | -4.863 |
pessimistic | -4.830 |
Token | The |
Token ID | 383 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
eers | +6.641 |
Works | +5.976 |
Transactions | +5.809 |
culosis | +5.784 |
Companies | +5.715 |
Neg logit contributions | |
damaging | -10.481 |
categ | -10.380 |
meaningful | -10.282 |
contrasting | -10.133 |
wounding | -10.084 |
Token | B |
Token ID | 347 |
Feature activation | +6.54e-01 |
Pos logit contributions | |
eers | +9.134 |
Works | +8.296 |
Transactions | +8.115 |
Facility | +8.050 |
culosis | +8.002 |
Neg logit contributions | |
damaging | -7.210 |
insofar | -7.097 |
categ | -6.980 |
meaningful | -6.954 |
ignoring | -6.766 |
Token | & |
Token ID | 5 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
damaging | +3.645 |
meaningful | +3.563 |
categ | +3.536 |
contrasting | +3.529 |
insofar | +3.508 |
Neg logit contributions | |
eers | -3.224 |
culosis | -3.004 |
Transactions | -2.818 |
Works | -2.809 |
Companies | -2.727 |
Token | B |
Token ID | 33 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
eers | +6.486 |
Queue | +5.310 |
Works | +5.307 |
culosis | +5.142 |
Transactions | +5.117 |
Neg logit contributions | |
damaging | -11.973 |
meaningful | -11.799 |
insofar | -11.705 |
categ | -11.558 |
contrasting | -11.541 |
Token | � |
Token ID | 447 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
eers | +17.884 |
Works | +16.449 |
culosis | +15.913 |
Facility | +15.810 |
Services | +15.674 |
Neg logit contributions | |
damaging | -12.323 |
meaningful | -11.951 |
insofar | -11.746 |
categ | -11.583 |
wounding | -11.486 |
Token | � |
Token ID | 247 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
eers | +4.002 |
culosis | +3.459 |
Transactions | +3.356 |
Queue | +3.245 |
Works | +3.236 |
Neg logit contributions | |
categ | -7.880 |
damaging | -7.873 |
contrasting | -7.860 |
meaningful | -7.817 |
insofar | -7.781 |
Token | s |
Token ID | 82 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
eers | +8.037 |
culosis | +7.214 |
Works | +6.973 |
Facility | +6.587 |
Transactions | +6.539 |
Neg logit contributions | |
damaging | -10.047 |
meaningful | -9.924 |
insofar | -9.818 |
categ | -9.778 |
contrasting | -9.720 |
Token | breakfast |
Token ID | 12607 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
eers | +14.219 |
culosis | +12.933 |
Works | +12.779 |
Transactions | +12.645 |
Facility | +12.535 |
Neg logit contributions | |
damaging | -9.685 |
meaningful | -9.205 |
insofar | -9.160 |
categ | -9.113 |
wounding | -8.921 |
Token | , |
Token ID | 11 |
Feature activation | +4.65e-01 |
Pos logit contributions | |
eers | +11.201 |
culosis | +9.667 |
Works | +9.649 |
Facility | +9.523 |
Queue | +9.277 |
Neg logit contributions | |
damaging | -9.231 |
meaningful | -9.000 |
categ | -8.893 |
insofar | -8.870 |
consequential | -8.758 |
Token | soft |
Token ID | 2705 |
Feature activation | -8.67e-01 |
Pos logit contributions | |
eers | +6.291 |
culosis | +5.731 |
Works | +5.716 |
Transactions | +5.642 |
Companies | +5.594 |
Neg logit contributions | |
insofar | -4.235 |
damaging | -4.225 |
categ | -4.105 |
contrasting | -4.071 |
wounding | -4.016 |
Token | - |
Token ID | 12 |
Feature activation | +9.90e-01 |
Pos logit contributions | |
eers | +4.499 |
culosis | +4.314 |
Works | +4.096 |
Transactions | +4.048 |
Companies | +4.023 |
Neg logit contributions | |
damaging | -4.072 |
categ | -4.000 |
contrasting | -3.968 |
insofar | -3.946 |
meaningful | -3.928 |
Token | dr |
Token ID | 7109 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
damaging | +4.635 |
meaningful | +4.544 |
categ | +4.497 |
contrasting | +4.469 |
insofar | +4.445 |
Neg logit contributions | |
eers | -5.754 |
culosis | -5.374 |
Transactions | -5.127 |
Works | -5.031 |
Companies | -4.973 |
Token | ink |
Token ID | 676 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
eers | +0.934 |
culosis | +0.883 |
Transactions | +0.819 |
Facility | +0.806 |
Works | +0.795 |
Neg logit contributions | |
damaging | -1.395 |
meaningful | -1.384 |
categ | -1.370 |
contrasting | -1.369 |
consequential | -1.367 |
Token | bott |
Token ID | 3005 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
eers | +13.575 |
culosis | +12.410 |
Works | +11.975 |
Companies | +11.857 |
Facility | +11.655 |
Neg logit contributions | |
damaging | -9.935 |
categ | -9.496 |
wounding | -9.493 |
meaningful | -9.453 |
consequential | -9.413 |
Token | ling |
Token ID | 1359 |
Feature activation | -3.53e+00 |
Pos logit contributions | |
eers | +6.187 |
culosis | +5.609 |
Works | +4.997 |
Transactions | +4.972 |
Facility | +4.867 |
Neg logit contributions | |
meaningful | -9.633 |
categ | -9.582 |
damaging | -9.463 |
consequential | -9.374 |
pessimistic | -9.331 |
Token | company |
Token ID | 1664 |
Feature activation | -2.81e+00 |
Pos logit contributions | |
eers | +15.717 |
Works | +14.435 |
Facility | +13.845 |
Companies | +13.746 |
Company | +13.550 |
Neg logit contributions | |
categ | -13.548 |
damaging | -13.495 |
wounding | -13.178 |
pessimistic | -13.069 |
meaningful | -13.006 |
Token | that |
Token ID | 326 |
Feature activation | -3.37e+00 |
Pos logit contributions | |
eers | +14.783 |
culosis | +12.999 |
Companies | +12.923 |
Works | +12.801 |
Queue | +12.220 |
Neg logit contributions | |
categ | -9.675 |
damaging | -9.441 |
meaningful | -9.169 |
pessimistic | -9.166 |
consequential | -9.150 |
Token | became |
Token ID | 2627 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
eers | +17.125 |
Companies | +15.189 |
Works | +15.104 |
culosis | +14.800 |
Services | +14.352 |
Neg logit contributions | |
damaging | -11.459 |
contrasting | -11.219 |
categ | -11.197 |
meaningful | -11.019 |
wounding | -10.902 |
Token | one |
Token ID | 530 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
eers | +5.153 |
culosis | +4.819 |
Companies | +4.593 |
Works | +4.561 |
Transactions | +4.539 |
Neg logit contributions | |
damaging | -3.566 |
contrasting | -3.547 |
insofar | -3.488 |
categ | -3.481 |
meaningful | -3.439 |
Token | of |
Token ID | 286 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
eers | +1.436 |
culosis | +1.296 |
Transactions | +1.223 |
Companies | +1.214 |
Works | +1.202 |
Neg logit contributions | |
damaging | -1.685 |
meaningful | -1.650 |
categ | -1.642 |
contrasting | -1.641 |
insofar | -1.626 |
Token | � |
Token ID | 250 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
eers | +0.454 |
culosis | +0.402 |
Transactions | +0.394 |
Works | +0.383 |
Facility | +0.380 |
Neg logit contributions | |
damaging | -0.963 |
meaningful | -0.935 |
insofar | -0.932 |
contrasting | -0.925 |
categ | -0.925 |
Token | lot |
Token ID | 26487 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
eers | +8.448 |
culosis | +7.984 |
Transactions | +7.704 |
Facility | +7.637 |
Works | +7.520 |
Neg logit contributions | |
damaging | -8.241 |
contrasting | -8.112 |
meaningful | -8.075 |
consequential | -8.007 |
insofar | -7.955 |
Token | tery |
Token ID | 11471 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
eers | +10.708 |
culosis | +9.813 |
Transactions | +9.473 |
Facility | +9.322 |
Works | +9.309 |
Neg logit contributions | |
damaging | -9.109 |
contrasting | -8.908 |
meaningful | -8.870 |
categ | -8.816 |
consequential | -8.812 |
Token | � |
Token ID | 447 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
eers | +14.479 |
Works | +12.746 |
culosis | +12.662 |
Companies | +12.532 |
Transactions | +12.507 |
Neg logit contributions | |
contrasting | -9.246 |
damaging | -9.206 |
pessimistic | -8.962 |
categ | -8.933 |
meaningful | -8.920 |
Token | � |
Token ID | 251 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
eers | +4.276 |
culosis | +3.588 |
Transactions | +3.423 |
Facility | +3.246 |
Queue | +3.242 |
Neg logit contributions | |
damaging | -9.948 |
categ | -9.930 |
insofar | -9.853 |
contrasting | -9.848 |
meaningful | -9.763 |
Token | that |
Token ID | 326 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
eers | +10.889 |
culosis | +9.950 |
Transactions | +9.757 |
Works | +9.717 |
Facility | +9.664 |
Neg logit contributions | |
damaging | -6.983 |
contrasting | -6.872 |
meaningful | -6.697 |
categ | -6.693 |
pessimistic | -6.671 |
Token | the |
Token ID | 262 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
eers | +17.717 |
Works | +15.765 |
Companies | +15.602 |
Transactions | +15.320 |
Facility | +15.016 |
Neg logit contributions | |
damaging | -12.005 |
contrasting | -11.873 |
insofar | -11.801 |
categ | -11.512 |
meaningful | -11.477 |
Token | city |
Token ID | 1748 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
eers | +6.728 |
Transactions | +6.023 |
culosis | +5.960 |
Works | +5.861 |
Companies | +5.852 |
Neg logit contributions | |
insofar | -6.668 |
damaging | -6.607 |
meaningful | -6.577 |
contrasting | -6.548 |
categ | -6.472 |
Token | held |
Token ID | 2714 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
eers | +5.581 |
culosis | +4.833 |
Transactions | +4.786 |
Works | +4.776 |
Companies | +4.697 |
Neg logit contributions | |
damaging | -5.561 |
contrasting | -5.524 |
meaningful | -5.518 |
categ | -5.424 |
insofar | -5.404 |
Token | . |
Token ID | 13 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
eers | +8.340 |
Companies | +7.305 |
Transactions | +7.254 |
Works | +7.216 |
Facility | +7.157 |
Neg logit contributions | |
damaging | -5.053 |
contrasting | -5.040 |
categ | -4.920 |
pessimistic | -4.902 |
insofar | -4.857 |
Token | The |
Token ID | 383 |
Feature activation | -7.26e-01 |
Pos logit contributions | |
eers | +3.776 |
Transactions | +3.467 |
Companies | +3.395 |
Works | +3.387 |
culosis | +3.345 |
Neg logit contributions | |
damaging | -6.357 |
meaningful | -6.310 |
categ | -6.276 |
contrasting | -6.252 |
consequential | -6.242 |
Token | . |
Token ID | 13 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
eers | +0.308 |
culosis | +0.284 |
Works | +0.280 |
Transactions | +0.274 |
Companies | +0.270 |
Neg logit contributions | |
damaging | -0.236 |
categ | -0.231 |
meaningful | -0.227 |
contrasting | -0.224 |
pessimistic | -0.224 |
Token | ( |
Token ID | 357 |
Feature activation | -9.49e-01 |
Pos logit contributions | |
eers | +5.697 |
Works | +5.334 |
Transactions | +5.145 |
Companies | +5.019 |
Services | +4.992 |
Neg logit contributions | |
damaging | -11.068 |
categ | -11.028 |
wounding | -10.888 |
consequential | -10.887 |
meaningful | -10.848 |
Token | Wa |
Token ID | 33484 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
eers | +4.274 |
Queue | +3.833 |
culosis | +3.799 |
Transactions | +3.686 |
Works | +3.674 |
Neg logit contributions | |
damaging | -5.389 |
meaningful | -5.263 |
categ | -5.246 |
contrasting | -5.209 |
insofar | -5.168 |
Token | ub |
Token ID | 549 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
eers | +6.227 |
culosis | +5.690 |
Transactions | +5.338 |
Queue | +5.300 |
Works | +5.153 |
Neg logit contributions | |
damaging | -8.868 |
contrasting | -8.613 |
meaningful | -8.611 |
categ | -8.596 |
consequential | -8.481 |
Token | ges |
Token ID | 3212 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
eers | +6.602 |
culosis | +5.542 |
Works | +4.813 |
Transactions | +4.561 |
Companies | +4.427 |
Neg logit contributions | |
damaging | -17.387 |
contrasting | -17.328 |
pessimistic | -17.107 |
meaningful | -17.052 |
categ | -16.932 |
Token | hig |
Token ID | 25196 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
eers | +9.827 |
culosis | +8.829 |
Transactions | +7.868 |
ttes | +7.859 |
Queue | +7.845 |
Neg logit contributions | |
contrasting | -12.455 |
damaging | -12.433 |
categ | -12.273 |
meaningful | -12.192 |
consequential | -12.062 |
Token | Rice |
Token ID | 13823 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
eers | +12.137 |
Transactions | +10.913 |
Works | +10.766 |
Services | +10.763 |
Companies | +10.676 |
Neg logit contributions | |
consequential | -18.633 |
damaging | -18.539 |
pessimistic | -18.311 |
categ | -18.267 |
contrasting | -18.237 |
Token | / |
Token ID | 14 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
eers | +8.408 |
Transactions | +7.507 |
Works | +7.392 |
Companies | +7.298 |
culosis | +7.292 |
Neg logit contributions | |
damaging | -9.836 |
categ | -9.690 |
meaningful | -9.651 |
contrasting | -9.641 |
consequential | -9.486 |
Token | CBC |
Token ID | 29208 |
Feature activation | -9.72e-01 |
Pos logit contributions | |
eers | +4.936 |
culosis | +4.308 |
Transactions | +4.165 |
Queue | +4.130 |
Works | +3.975 |
Neg logit contributions | |
damaging | -9.310 |
contrasting | -9.168 |
meaningful | -9.148 |
categ | -9.114 |
consequential | -9.023 |
Token | ) |
Token ID | 8 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
eers | +3.260 |
Transactions | +2.921 |
culosis | +2.893 |
Works | +2.831 |
Companies | +2.752 |
Neg logit contributions | |
damaging | -6.414 |
meaningful | -6.330 |
categ | -6.328 |
consequential | -6.224 |
contrasting | -6.202 |
Token | " |
Token ID | 366 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
eers | +5.436 |
Works | +5.147 |
Companies | +5.021 |
Transactions | +5.019 |
culosis | +4.973 |
Neg logit contributions | |
damaging | -6.372 |
categ | -6.296 |
consequential | -6.260 |
meaningful | -6.186 |
contrasting | -6.171 |
Token | together |
Token ID | 1978 |
Feature activation | -7.32e-01 |
Pos logit contributions | |
eers | +1.157 |
culosis | +1.066 |
Transactions | +1.044 |
Works | +1.024 |
Companies | +1.010 |
Neg logit contributions | |
damaging | -0.772 |
categ | -0.743 |
meaningful | -0.738 |
contrasting | -0.731 |
consequential | -0.725 |
Token | . |
Token ID | 13 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
eers | +4.176 |
culosis | +3.888 |
Transactions | +3.733 |
Works | +3.694 |
Queue | +3.658 |
Neg logit contributions | |
damaging | -3.212 |
categ | -3.089 |
meaningful | -3.074 |
contrasting | -3.058 |
insofar | -2.995 |
Token | The |
Token ID | 383 |
Feature activation | +8.12e-02 |
Pos logit contributions | |
eers | +2.143 |
culosis | +1.944 |
Transactions | +1.878 |
Works | +1.809 |
Companies | +1.738 |
Neg logit contributions | |
damaging | -4.553 |
meaningful | -4.513 |
categ | -4.453 |
insofar | -4.441 |
contrasting | -4.430 |
Token | epic |
Token ID | 12191 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
damaging | +0.382 |
categ | +0.373 |
contrasting | +0.373 |
insofar | +0.372 |
meaningful | +0.372 |
Neg logit contributions | |
eers | -0.452 |
culosis | -0.414 |
Transactions | -0.401 |
Works | -0.393 |
Companies | -0.388 |
Token | ghost |
Token ID | 10905 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
eers | +6.176 |
culosis | +5.783 |
Works | +5.423 |
Queue | +5.354 |
Transactions | +5.328 |
Neg logit contributions | |
categ | -5.792 |
insofar | -5.673 |
damaging | -5.657 |
contrasting | -5.650 |
meaningful | -5.646 |
Token | invasion |
Token ID | 11796 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
eers | +2.340 |
culosis | +2.193 |
Transactions | +2.109 |
Works | +2.052 |
Companies | +2.030 |
Neg logit contributions | |
damaging | -1.815 |
meaningful | -1.778 |
categ | -1.747 |
contrasting | -1.746 |
insofar | -1.735 |
Token | of |
Token ID | 286 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
eers | +12.662 |
Queue | +10.287 |
Works | +10.243 |
Companies | +10.095 |
Facility | +9.982 |
Neg logit contributions | |
consequential | -18.459 |
categ | -18.432 |
contrasting | -18.381 |
pessimistic | -18.336 |
damaging | -18.201 |
Token | the |
Token ID | 262 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
eers | +10.604 |
culosis | +9.166 |
Companies | +9.065 |
Works | +9.060 |
Transactions | +8.976 |
Neg logit contributions | |
contrasting | -11.912 |
damaging | -11.906 |
categ | -11.773 |
meaningful | -11.707 |
insofar | -11.667 |
Token | big |
Token ID | 1263 |
Feature activation | -2.14e+00 |
Pos logit contributions | |
eers | +6.052 |
culosis | +5.498 |
Works | +5.284 |
Companies | +5.199 |
Transactions | +5.081 |
Neg logit contributions | |
damaging | -4.661 |
insofar | -4.632 |
contrasting | -4.576 |
categ | -4.555 |
meaningful | -4.510 |
Token | Apple |
Token ID | 4196 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
eers | +6.695 |
Companies | +5.962 |
culosis | +5.816 |
Works | +5.707 |
Facility | +5.407 |
Neg logit contributions | |
categ | -12.725 |
damaging | -12.545 |
meaningful | -12.536 |
consequential | -12.419 |
wounding | -12.379 |
Token | . |
Token ID | 13 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
eers | +8.297 |
culosis | +7.481 |
Transactions | +7.347 |
Works | +7.312 |
Facility | +7.128 |
Neg logit contributions | |
damaging | -6.248 |
contrasting | -6.159 |
categ | -6.154 |
meaningful | -6.119 |
consequential | -6.027 |
Token | has |
Token ID | 468 |
Feature activation | -2.77e-02 |
Pos logit contributions | |
eers | +3.531 |
culosis | +3.052 |
Transactions | +2.978 |
Works | +2.953 |
Companies | +2.913 |
Neg logit contributions | |
damaging | -3.525 |
meaningful | -3.522 |
contrasting | -3.503 |
categ | -3.440 |
insofar | -3.437 |
Token | unleashed |
Token ID | 28136 |
Feature activation | +4.86e-01 |
Pos logit contributions | |
eers | +0.141 |
culosis | +0.124 |
Transactions | +0.120 |
Works | +0.119 |
Companies | +0.118 |
Neg logit contributions | |
damaging | -0.142 |
meaningful | -0.141 |
contrasting | -0.140 |
categ | -0.140 |
insofar | -0.138 |
Token | , |
Token ID | 11 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
damaging | +2.530 |
meaningful | +2.514 |
categ | +2.482 |
contrasting | +2.475 |
insofar | +2.438 |
Neg logit contributions | |
eers | -2.492 |
culosis | -2.276 |
Transactions | -2.163 |
Works | -2.142 |
Companies | -2.115 |
Token | he |
Token ID | 339 |
Feature activation | +8.24e-01 |
Pos logit contributions | |
damaging | +9.060 |
meaningful | +8.897 |
contrasting | +8.721 |
insofar | +8.714 |
categ | +8.711 |
Neg logit contributions | |
eers | -9.323 |
culosis | -8.728 |
Transactions | -8.337 |
Works | -8.054 |
Facility | -7.936 |
Token | remains |
Token ID | 3793 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
damaging | +5.448 |
meaningful | +5.368 |
categ | +5.303 |
contrasting | +5.299 |
insofar | +5.281 |
Neg logit contributions | |
eers | -3.118 |
culosis | -2.824 |
Transactions | -2.651 |
Works | -2.533 |
Companies | -2.482 |
Token | un |
Token ID | 555 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
damaging | +9.119 |
meaningful | +8.908 |
categ | +8.728 |
insofar | +8.614 |
contrasting | +8.562 |
Neg logit contributions | |
eers | -13.544 |
culosis | -12.995 |
Transactions | -12.550 |
Works | -12.098 |
Queue | -12.012 |
Token | y |
Token ID | 88 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
damaging | +12.457 |
meaningful | +12.166 |
insofar | +11.918 |
contrasting | +11.893 |
categ | +11.892 |
Neg logit contributions | |
eers | -11.014 |
culosis | -10.505 |
Transactions | -10.304 |
Works | -9.622 |
Companies | -9.601 |
Token | ielding |
Token ID | 30449 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
damaging | +5.708 |
meaningful | +5.561 |
categ | +5.438 |
contrasting | +5.427 |
insofar | +5.410 |
Neg logit contributions | |
eers | -10.033 |
culosis | -9.521 |
Transactions | -9.198 |
Works | -8.964 |
Companies | -8.888 |
Token | in |
Token ID | 287 |
Feature activation | +9.68e-01 |
Pos logit contributions | |
damaging | +7.868 |
meaningful | +7.700 |
categ | +7.567 |
contrasting | +7.567 |
insofar | +7.489 |
Neg logit contributions | |
eers | -9.744 |
culosis | -9.112 |
Transactions | -8.762 |
Works | -8.538 |
Companies | -8.430 |
Token | his |
Token ID | 465 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
damaging | +4.368 |
meaningful | +4.284 |
insofar | +4.215 |
categ | +4.210 |
contrasting | +4.196 |
Neg logit contributions | |
eers | -5.719 |
culosis | -5.323 |
Transactions | -5.121 |
Works | -5.012 |
Companies | -4.947 |
Token | insistence |
Token ID | 30696 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
damaging | +6.745 |
meaningful | +6.600 |
categ | +6.521 |
contrasting | +6.494 |
insofar | +6.404 |
Neg logit contributions | |
eers | -7.913 |
culosis | -7.476 |
Transactions | -7.169 |
Works | -6.921 |
Companies | -6.850 |
Token | off |
Token ID | 572 |
Feature activation | +7.61e-01 |
Pos logit contributions | |
eers | +2.065 |
culosis | +1.930 |
Transactions | +1.877 |
Works | +1.846 |
Queue | +1.834 |
Neg logit contributions | |
damaging | -1.030 |
categ | -0.994 |
insofar | -0.992 |
contrasting | -0.985 |
meaningful | -0.975 |
Token | to |
Token ID | 284 |
Feature activation | -4.38e-01 |
Pos logit contributions | |
damaging | +2.483 |
meaningful | +2.415 |
categ | +2.411 |
contrasting | +2.383 |
insofar | +2.374 |
Neg logit contributions | |
eers | -5.412 |
culosis | -5.063 |
Transactions | -4.980 |
Works | -4.914 |
Companies | -4.865 |
Token | a |
Token ID | 257 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
eers | +2.690 |
culosis | +2.519 |
Transactions | +2.480 |
Companies | +2.401 |
Works | +2.393 |
Neg logit contributions | |
categ | -1.634 |
insofar | -1.628 |
damaging | -1.622 |
contrasting | -1.567 |
meaningful | -1.550 |
Token | rocky |
Token ID | 26898 |
Feature activation | +3.10e-02 |
Pos logit contributions | |
damaging | +4.288 |
meaningful | +4.184 |
categ | +4.120 |
insofar | +4.102 |
contrasting | +4.097 |
Neg logit contributions | |
eers | -7.310 |
culosis | -6.874 |
Transactions | -6.650 |
Works | -6.519 |
Companies | -6.449 |
Token | start |
Token ID | 923 |
Feature activation | +7.50e-01 |
Pos logit contributions | |
damaging | +0.201 |
meaningful | +0.197 |
insofar | +0.196 |
categ | +0.196 |
contrasting | +0.195 |
Neg logit contributions | |
eers | -0.118 |
culosis | -0.105 |
Transactions | -0.099 |
Works | -0.096 |
Companies | -0.096 |
Token | , |
Token ID | 11 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
damaging | +3.231 |
meaningful | +3.179 |
categ | +3.150 |
contrasting | +3.105 |
insofar | +3.041 |
Neg logit contributions | |
eers | -4.549 |
culosis | -4.250 |
Transactions | -4.064 |
Works | -4.025 |
Companies | -3.977 |
Token | after |
Token ID | 706 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
damaging | +9.968 |
meaningful | +9.671 |
insofar | +9.564 |
contrasting | +9.550 |
categ | +9.373 |
Neg logit contributions | |
eers | -14.177 |
culosis | -13.464 |
Transactions | -12.902 |
Works | -12.416 |
Queue | -12.263 |
Token | Ibrahim |
Token ID | 30917 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
damaging | +2.314 |
meaningful | +2.277 |
categ | +2.247 |
insofar | +2.241 |
contrasting | +2.226 |
Neg logit contributions | |
eers | -2.521 |
culosis | -2.326 |
Transactions | -2.239 |
Works | -2.200 |
Companies | -2.171 |
Token | 's |
Token ID | 338 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
damaging | +8.589 |
meaningful | +8.435 |
categ | +8.350 |
contrasting | +8.339 |
insofar | +8.283 |
Neg logit contributions | |
eers | -5.254 |
culosis | -4.803 |
Transactions | -4.534 |
Works | -4.289 |
Facility | -4.214 |
Token | lawyers |
Token ID | 9326 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
damaging | +1.066 |
meaningful | +1.047 |
insofar | +1.038 |
contrasting | +1.030 |
categ | +1.028 |
Neg logit contributions | |
eers | -1.354 |
culosis | -1.254 |
Transactions | -1.216 |
Works | -1.197 |
Companies | -1.180 |
Token | informed |
Token ID | 7981 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
damaging | +0.993 |
meaningful | +0.981 |
categ | +0.965 |
insofar | +0.965 |
contrasting | +0.962 |
Neg logit contributions | |
eers | -0.915 |
culosis | -0.841 |
Transactions | -0.807 |
Works | -0.785 |
Companies | -0.779 |
Token | misleading |
Token ID | 15850 |
Feature activation | +4.74e-01 |
Pos logit contributions | |
damaging | +0.719 |
meaningful | +0.712 |
categ | +0.705 |
contrasting | +0.701 |
insofar | +0.694 |
Neg logit contributions | |
eers | -0.840 |
culosis | -0.771 |
Transactions | -0.747 |
Works | -0.730 |
Companies | -0.726 |
Token | everyone |
Token ID | 2506 |
Feature activation | +8.42e-02 |
Pos logit contributions | |
damaging | +2.232 |
meaningful | +2.170 |
contrasting | +2.161 |
categ | +2.154 |
insofar | +2.137 |
Neg logit contributions | |
eers | -2.713 |
culosis | -2.469 |
Transactions | -2.407 |
Works | -2.345 |
Companies | -2.327 |
Token | else |
Token ID | 2073 |
Feature activation | -4.84e-01 |
Pos logit contributions | |
damaging | +0.364 |
categ | +0.359 |
contrasting | +0.356 |
meaningful | +0.355 |
insofar | +0.343 |
Neg logit contributions | |
eers | -0.497 |
culosis | -0.451 |
Transactions | -0.441 |
Works | -0.439 |
Companies | -0.431 |
Token | . |
Token ID | 13 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
eers | +2.797 |
culosis | +2.548 |
Works | +2.466 |
Transactions | +2.451 |
Companies | +2.446 |
Neg logit contributions | |
damaging | -2.021 |
contrasting | -1.995 |
categ | -1.991 |
meaningful | -1.972 |
pessimistic | -1.912 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
eers | +0.941 |
culosis | +0.838 |
Transactions | +0.819 |
Works | +0.786 |
Companies | +0.775 |
Neg logit contributions | |
damaging | -1.620 |
meaningful | -1.595 |
categ | -1.579 |
contrasting | -1.576 |
insofar | -1.557 |
Token | D |
Token ID | 35 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
eers | +0.602 |
culosis | +0.530 |
Queue | +0.510 |
Transactions | +0.499 |
Works | +0.485 |
Neg logit contributions | |
damaging | -0.932 |
meaningful | -0.919 |
contrasting | -0.919 |
categ | -0.916 |
insofar | -0.901 |
Token | ude |
Token ID | 2507 |
Feature activation | +8.65e-01 |
Pos logit contributions | |
damaging | +15.868 |
meaningful | +15.416 |
categ | +15.291 |
insofar | +15.218 |
contrasting | +15.203 |
Neg logit contributions | |
eers | -10.889 |
culosis | -10.340 |
Transactions | -9.607 |
Works | -9.285 |
Companies | -9.047 |
Token | , |
Token ID | 11 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
damaging | +4.927 |
meaningful | +4.846 |
categ | +4.777 |
contrasting | +4.775 |
insofar | +4.754 |
Neg logit contributions | |
eers | -4.083 |
culosis | -3.786 |
Transactions | -3.599 |
Works | -3.494 |
Companies | -3.423 |
Token | when |
Token ID | 618 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
damaging | +10.875 |
meaningful | +10.720 |
insofar | +10.509 |
categ | +10.500 |
contrasting | +10.477 |
Neg logit contributions | |
eers | -8.132 |
culosis | -7.523 |
Transactions | -7.048 |
Queue | -6.620 |
Works | -6.605 |
Token | even |
Token ID | 772 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
eers | +2.354 |
culosis | +2.190 |
Transactions | +2.088 |
Works | +2.055 |
Companies | +2.010 |
Neg logit contributions | |
damaging | -3.266 |
meaningful | -3.230 |
insofar | -3.207 |
categ | -3.204 |
contrasting | -3.183 |
Token | the |
Token ID | 262 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
damaging | +1.506 |
meaningful | +1.475 |
categ | +1.468 |
contrasting | +1.456 |
insofar | +1.449 |
Neg logit contributions | |
eers | -1.678 |
culosis | -1.569 |
Transactions | -1.517 |
Works | -1.480 |
Companies | -1.463 |
Token | and |
Token ID | 290 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
damaging | +2.841 |
categ | +2.762 |
meaningful | +2.758 |
insofar | +2.729 |
contrasting | +2.719 |
Neg logit contributions | |
eers | -3.666 |
culosis | -3.430 |
Transactions | -3.322 |
Works | -3.266 |
Companies | -3.206 |
Token | mourn |
Token ID | 25722 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
damaging | +3.723 |
meaningful | +3.646 |
categ | +3.597 |
contrasting | +3.578 |
insofar | +3.569 |
Neg logit contributions | |
eers | -4.405 |
culosis | -4.122 |
Transactions | -3.956 |
Works | -3.845 |
Companies | -3.803 |
Token | the |
Token ID | 262 |
Feature activation | -6.71e-02 |
Pos logit contributions | |
damaging | +6.023 |
meaningful | +5.905 |
categ | +5.818 |
contrasting | +5.809 |
insofar | +5.784 |
Neg logit contributions | |
eers | -6.302 |
culosis | -5.876 |
Transactions | -5.629 |
Works | -5.464 |
Companies | -5.389 |
Token | death |
Token ID | 1918 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
eers | +0.402 |
culosis | +0.371 |
Transactions | +0.366 |
Works | +0.364 |
Companies | +0.357 |
Neg logit contributions | |
damaging | -0.279 |
insofar | -0.279 |
categ | -0.274 |
meaningful | -0.272 |
contrasting | -0.269 |
Token | of |
Token ID | 286 |
Feature activation | +7.95e-01 |
Pos logit contributions | |
damaging | +1.963 |
categ | +1.927 |
meaningful | +1.905 |
contrasting | +1.896 |
insofar | +1.890 |
Neg logit contributions | |
eers | -1.819 |
culosis | -1.668 |
Transactions | -1.585 |
Works | -1.558 |
Companies | -1.528 |
Token | O |
Token ID | 440 |
Feature activation | +2.19e+00 |
Pos logit contributions | |
damaging | +4.111 |
meaningful | +4.020 |
categ | +3.979 |
insofar | +3.973 |
contrasting | +3.962 |
Neg logit contributions | |
eers | -4.160 |
culosis | -3.874 |
Transactions | -3.706 |
Works | -3.619 |
Companies | -3.561 |
Token | der |
Token ID | 1082 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
damaging | +6.248 |
meaningful | +6.239 |
compelling | +5.934 |
albeit | +5.832 |
categ | +5.767 |
Neg logit contributions | |
eers | -14.062 |
Transactions | -13.871 |
culosis | -13.797 |
Facility | -13.235 |
Works | -13.157 |
Token | us |
Token ID | 385 |
Feature activation | +6.54e-01 |
Pos logit contributions | |
eers | +2.701 |
culosis | +2.443 |
Transactions | +2.306 |
Works | +2.242 |
Companies | +2.187 |
Neg logit contributions | |
damaging | -4.065 |
meaningful | -3.997 |
contrasting | -3.968 |
categ | -3.963 |
insofar | -3.918 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
damaging | +3.569 |
meaningful | +3.484 |
categ | +3.473 |
contrasting | +3.456 |
insofar | +3.389 |
Neg logit contributions | |
eers | -3.253 |
culosis | -3.028 |
Transactions | -2.903 |
Works | -2.854 |
Queue | -2.789 |
Token | who |
Token ID | 508 |
Feature activation | -8.48e-01 |
Pos logit contributions | |
damaging | +10.517 |
meaningful | +10.312 |
contrasting | +10.205 |
insofar | +10.159 |
categ | +10.056 |
Neg logit contributions | |
eers | -10.427 |
culosis | -9.740 |
Transactions | -9.247 |
Works | -8.863 |
Companies | -8.793 |
Token | in |
Token ID | 287 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
eers | +4.201 |
culosis | +3.775 |
Works | +3.642 |
Transactions | +3.562 |
Companies | +3.520 |
Neg logit contributions | |
damaging | -4.370 |
categ | -4.274 |
meaningful | -4.247 |
contrasting | -4.237 |
insofar | -4.165 |
Token | Party |
Token ID | 3615 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
damaging | +7.340 |
meaningful | +7.216 |
contrasting | +7.106 |
categ | +7.106 |
insofar | +7.091 |
Neg logit contributions | |
eers | -5.392 |
culosis | -4.980 |
Transactions | -4.704 |
Works | -4.519 |
Companies | -4.447 |
Token | if |
Token ID | 611 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
damaging | +5.641 |
meaningful | +5.515 |
categ | +5.430 |
contrasting | +5.412 |
insofar | +5.349 |
Neg logit contributions | |
eers | -8.015 |
culosis | -7.489 |
Transactions | -7.232 |
Works | -7.068 |
Companies | -6.986 |
Token | they |
Token ID | 484 |
Feature activation | -6.49e-02 |
Pos logit contributions | |
eers | +1.446 |
culosis | +1.270 |
Works | +1.205 |
Transactions | +1.204 |
Companies | +1.191 |
Neg logit contributions | |
damaging | -1.894 |
categ | -1.868 |
contrasting | -1.862 |
meaningful | -1.842 |
insofar | -1.817 |
Token | do |
Token ID | 466 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
eers | +0.302 |
culosis | +0.276 |
Transactions | +0.262 |
Works | +0.256 |
Companies | +0.251 |
Neg logit contributions | |
damaging | -0.367 |
meaningful | -0.360 |
categ | -0.358 |
contrasting | -0.357 |
insofar | -0.353 |
Token | lose |
Token ID | 4425 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
damaging | +0.421 |
categ | +0.417 |
contrasting | +0.414 |
meaningful | +0.408 |
insofar | +0.402 |
Neg logit contributions | |
eers | -0.762 |
culosis | -0.703 |
Transactions | -0.686 |
Works | -0.679 |
Companies | -0.671 |
Token | , |
Token ID | 11 |
Feature activation | +2.45e+00 |
Pos logit contributions | |
damaging | +5.761 |
meaningful | +5.617 |
categ | +5.595 |
contrasting | +5.575 |
insofar | +5.497 |
Neg logit contributions | |
eers | -7.308 |
culosis | -6.783 |
Transactions | -6.541 |
Works | -6.394 |
Companies | -6.319 |
Token | but |
Token ID | 475 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
damaging | +12.667 |
meaningful | +12.428 |
insofar | +12.327 |
contrasting | +12.095 |
categ | +12.068 |
Neg logit contributions | |
eers | -11.900 |
culosis | -11.321 |
Transactions | -10.695 |
Works | -10.151 |
Queue | -10.121 |
Token | it |
Token ID | 340 |
Feature activation | -6.23e-01 |
Pos logit contributions | |
eers | +1.674 |
culosis | +1.515 |
Transactions | +1.458 |
Works | +1.446 |
Companies | +1.427 |
Neg logit contributions | |
damaging | -1.568 |
meaningful | -1.538 |
categ | -1.526 |
contrasting | -1.520 |
insofar | -1.478 |
Token | is |
Token ID | 318 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
eers | +2.323 |
culosis | +1.976 |
Works | +1.891 |
Transactions | +1.805 |
Companies | +1.779 |
Neg logit contributions | |
damaging | -3.971 |
meaningful | -3.947 |
categ | -3.922 |
contrasting | -3.888 |
insofar | -3.870 |
Token | an |
Token ID | 281 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
damaging | +3.930 |
meaningful | +3.836 |
contrasting | +3.774 |
categ | +3.768 |
insofar | +3.749 |
Neg logit contributions | |
eers | -6.362 |
culosis | -5.964 |
Transactions | -5.769 |
Works | -5.649 |
Companies | -5.587 |
Token | " |
Token ID | 366 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
damaging | +5.492 |
meaningful | +5.373 |
categ | +5.300 |
contrasting | +5.269 |
insofar | +5.261 |
Neg logit contributions | |
eers | -5.833 |
culosis | -5.508 |
Transactions | -5.249 |
Works | -5.079 |
Companies | -5.015 |
Token | ā |
Token ID | 10235 |
Feature activation | -8.37e-01 |
Pos logit contributions | |
eers | +6.302 |
culosis | +5.794 |
Transactions | +5.381 |
Queue | +5.323 |
atcher | +5.213 |
Neg logit contributions | |
damaging | -9.872 |
meaningful | -9.843 |
categ | -9.667 |
consequential | -9.619 |
contrasting | -9.610 |
Token | p |
Token ID | 79 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
eers | +3.947 |
culosis | +3.767 |
Works | +3.550 |
Transactions | +3.521 |
Queue | +3.480 |
Neg logit contributions | |
damaging | -4.356 |
meaningful | -4.264 |
contrasting | -4.233 |
categ | -4.181 |
insofar | -4.160 |
Token | ā |
Token ID | 10235 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
eers | +8.437 |
culosis | +7.736 |
Transactions | +7.270 |
Queue | +7.228 |
Works | +7.006 |
Neg logit contributions | |
damaging | -13.265 |
meaningful | -13.160 |
categ | -13.133 |
contrasting | -13.064 |
pessimistic | -12.990 |
Token | |
Token ID | 220 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
damaging | +4.857 |
meaningful | +4.754 |
contrasting | +4.677 |
categ | +4.669 |
insofar | +4.646 |
Neg logit contributions | |
eers | -5.818 |
culosis | -5.451 |
Transactions | -5.229 |
Works | -5.103 |
Companies | -5.021 |
Token | � |
Token ID | 134 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
damaging | +6.549 |
meaningful | +6.448 |
contrasting | +6.363 |
categ | +6.358 |
insofar | +6.327 |
Neg logit contributions | |
eers | -4.875 |
culosis | -4.477 |
Transactions | -4.222 |
Works | -4.102 |
Queue | -4.008 |
Token | � |
Token ID | 119 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
damaging | +7.663 |
meaningful | +7.547 |
categ | +7.448 |
contrasting | +7.411 |
insofar | +7.369 |
Neg logit contributions | |
eers | -6.442 |
culosis | -5.926 |
Transactions | -5.655 |
Works | -5.441 |
Companies | -5.393 |
Token | o |
Token ID | 78 |
Feature activation | +2.22e-01 |
Pos logit contributions | |
damaging | +7.951 |
meaningful | +7.809 |
categ | +7.719 |
insofar | +7.697 |
contrasting | +7.685 |
Neg logit contributions | |
eers | -5.798 |
culosis | -5.368 |
Transactions | -5.120 |
Works | -4.893 |
Companies | -4.851 |
Token | |
Token ID | 220 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
damaging | +1.085 |
meaningful | +1.072 |
contrasting | +1.052 |
insofar | +1.042 |
categ | +1.040 |
Neg logit contributions | |
eers | -1.205 |
culosis | -1.126 |
Transactions | -1.084 |
Works | -1.072 |
Queue | -1.044 |
Token | ia |
Token ID | 544 |
Feature activation | +9.72e-01 |
Pos logit contributions | |
damaging | +12.604 |
meaningful | +12.406 |
categ | +12.272 |
insofar | +12.249 |
contrasting | +12.198 |
Neg logit contributions | |
eers | -10.093 |
culosis | -9.441 |
Transactions | -9.108 |
Companies | -8.689 |
Facility | -8.584 |
Token | i |
Token ID | 1312 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
damaging | +4.718 |
meaningful | +4.620 |
contrasting | +4.548 |
categ | +4.535 |
insofar | +4.518 |
Neg logit contributions | |
eers | -5.419 |
culosis | -5.065 |
Transactions | -4.864 |
Works | -4.745 |
Companies | -4.663 |
Token | lan |
Token ID | 26992 |
Feature activation | +5.08e-01 |
Pos logit contributions | |
damaging | +5.237 |
meaningful | +5.122 |
categ | +5.028 |
contrasting | +5.023 |
insofar | +4.998 |
Neg logit contributions | |
eers | -7.083 |
culosis | -6.660 |
Transactions | -6.409 |
Works | -6.242 |
Companies | -6.167 |
Token | board |
Token ID | 3096 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
eers | +9.105 |
Companies | +8.815 |
Works | +8.604 |
Transactions | +8.463 |
Services | +8.252 |
Neg logit contributions | |
damaging | -10.270 |
insofar | -10.068 |
meaningful | -10.052 |
categ | -10.024 |
contrasting | -9.976 |
Token | is |
Token ID | 318 |
Feature activation | -4.88e-02 |
Pos logit contributions | |
eers | +9.711 |
culosis | +8.697 |
Works | +8.633 |
Companies | +8.575 |
Transactions | +8.542 |
Neg logit contributions | |
damaging | -8.261 |
contrasting | -7.940 |
meaningful | -7.915 |
categ | -7.833 |
insofar | -7.811 |
Token | here |
Token ID | 994 |
Feature activation | -7.08e-02 |
Pos logit contributions | |
eers | +0.323 |
culosis | +0.301 |
Transactions | +0.292 |
Works | +0.290 |
Companies | +0.288 |
Neg logit contributions | |
damaging | -0.178 |
meaningful | -0.171 |
insofar | -0.171 |
contrasting | -0.169 |
categ | -0.168 |
Token | to |
Token ID | 284 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
eers | +0.465 |
culosis | +0.433 |
Companies | +0.421 |
Works | +0.421 |
Facility | +0.418 |
Neg logit contributions | |
damaging | -0.254 |
meaningful | -0.249 |
categ | -0.246 |
contrasting | -0.243 |
consequential | -0.241 |
Token | watch |
Token ID | 2342 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
eers | +5.135 |
culosis | +4.505 |
Transactions | +4.454 |
Works | +4.376 |
Companies | +4.354 |
Neg logit contributions | |
damaging | -6.852 |
contrasting | -6.708 |
categ | -6.669 |
meaningful | -6.652 |
insofar | -6.633 |
Token | out |
Token ID | 503 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
eers | +2.073 |
culosis | +1.893 |
Works | +1.863 |
Transactions | +1.854 |
Companies | +1.839 |
Neg logit contributions | |
damaging | -1.447 |
contrasting | -1.434 |
categ | -1.421 |
meaningful | -1.402 |
insofar | -1.381 |
Token | for |
Token ID | 329 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
damaging | +1.311 |
categ | +1.288 |
contrasting | +1.285 |
meaningful | +1.281 |
compelling | +1.231 |
Neg logit contributions | |
eers | -2.020 |
culosis | -1.859 |
Works | -1.808 |
Transactions | -1.795 |
Companies | -1.784 |
Token | workers |
Token ID | 3259 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
eers | +0.732 |
culosis | +0.669 |
Transactions | +0.648 |
Works | +0.645 |
Companies | +0.636 |
Neg logit contributions | |
damaging | -0.701 |
categ | -0.692 |
contrasting | -0.692 |
meaningful | -0.688 |
insofar | -0.687 |
Token | by |
Token ID | 416 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
eers | +1.751 |
culosis | +1.613 |
Transactions | +1.585 |
Works | +1.576 |
Companies | +1.568 |
Neg logit contributions | |
categ | -0.899 |
meaningful | -0.882 |
contrasting | -0.876 |
damaging | -0.859 |
insofar | -0.838 |
Token | sc |
Token ID | 629 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
eers | +0.987 |
culosis | +0.931 |
Companies | +0.897 |
Works | +0.896 |
Transactions | +0.895 |
Neg logit contributions | |
damaging | -0.436 |
meaningful | -0.424 |
insofar | -0.421 |
categ | -0.417 |
consequential | -0.404 |
Token | aring |
Token ID | 1723 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
damaging | +3.663 |
meaningful | +3.623 |
categ | +3.574 |
insofar | +3.560 |
contrasting | +3.557 |
Neg logit contributions | |
eers | -2.357 |
culosis | -2.150 |
Transactions | -2.000 |
Works | -1.944 |
Companies | -1.920 |
Token | 000 |
Token ID | 830 |
Feature activation | +3.66e-01 |
Pos logit contributions | |
damaging | +5.321 |
meaningful | +5.212 |
categ | +5.136 |
contrasting | +5.106 |
insofar | +5.092 |
Neg logit contributions | |
eers | -7.059 |
culosis | -6.653 |
Transactions | -6.412 |
Works | -6.252 |
Companies | -6.170 |
Token | books |
Token ID | 3835 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
damaging | +1.888 |
insofar | +1.835 |
contrasting | +1.834 |
categ | +1.833 |
meaningful | +1.832 |
Neg logit contributions | |
eers | -1.939 |
culosis | -1.740 |
Transactions | -1.736 |
Works | -1.698 |
Companies | -1.653 |
Token | a |
Token ID | 257 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
damaging | +4.224 |
meaningful | +4.102 |
contrasting | +4.024 |
categ | +4.014 |
insofar | +3.992 |
Neg logit contributions | |
eers | -7.672 |
culosis | -7.252 |
Transactions | -7.023 |
Works | -6.874 |
Companies | -6.796 |
Token | month |
Token ID | 1227 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
eers | +0.762 |
culosis | +0.690 |
Transactions | +0.684 |
Works | +0.674 |
Companies | +0.654 |
Neg logit contributions | |
insofar | -0.937 |
damaging | -0.935 |
contrasting | -0.933 |
meaningful | -0.912 |
categ | -0.910 |
Token | , |
Token ID | 11 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
damaging | +3.337 |
meaningful | +3.260 |
contrasting | +3.228 |
categ | +3.227 |
insofar | +3.181 |
Neg logit contributions | |
eers | -4.084 |
culosis | -3.778 |
Transactions | -3.669 |
Works | -3.608 |
Companies | -3.547 |
Token | and |
Token ID | 290 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
damaging | +10.231 |
meaningful | +10.024 |
contrasting | +9.866 |
categ | +9.866 |
insofar | +9.817 |
Neg logit contributions | |
eers | -8.825 |
culosis | -8.207 |
Transactions | -7.789 |
Works | -7.410 |
Facility | -7.384 |
Token | nets |
Token ID | 31720 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
damaging | +0.564 |
meaningful | +0.553 |
contrasting | +0.547 |
categ | +0.547 |
insofar | +0.544 |
Neg logit contributions | |
eers | -0.438 |
culosis | -0.401 |
Transactions | -0.381 |
Works | -0.375 |
Companies | -0.366 |
Token | $ |
Token ID | 720 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
eers | +1.662 |
culosis | +1.518 |
Transactions | +1.505 |
Works | +1.471 |
Companies | +1.463 |
Neg logit contributions | |
damaging | -1.187 |
insofar | -1.173 |
contrasting | -1.157 |
categ | -1.149 |
meaningful | -1.144 |
Token | 150 |
Token ID | 8628 |
Feature activation | +8.28e-01 |
Pos logit contributions | |
damaging | +7.313 |
meaningful | +7.118 |
insofar | +6.985 |
contrasting | +6.889 |
compelling | +6.801 |
Neg logit contributions | |
eers | -10.993 |
culosis | -10.722 |
Transactions | -9.976 |
Works | -9.615 |
Companies | -9.567 |
Token | , |
Token ID | 11 |
Feature activation | +7.74e-01 |
Pos logit contributions | |
damaging | +4.141 |
meaningful | +4.045 |
contrasting | +4.003 |
categ | +3.982 |
insofar | +3.974 |
Neg logit contributions | |
eers | -4.502 |
culosis | -4.205 |
Transactions | -4.063 |
Works | -3.946 |
Companies | -3.887 |
Token | 000 |
Token ID | 830 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
damaging | +3.737 |
meaningful | +3.675 |
categ | +3.653 |
insofar | +3.611 |
contrasting | +3.605 |
Neg logit contributions | |
eers | -4.303 |
culosis | -4.071 |
Transactions | -3.939 |
Works | -3.880 |
Companies | -3.772 |
Token | in |
Token ID | 287 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
eers | +0.869 |
culosis | +0.788 |
Transactions | +0.779 |
Works | +0.773 |
Companies | +0.757 |
Neg logit contributions | |
damaging | -0.574 |
meaningful | -0.554 |
categ | -0.548 |
contrasting | -0.535 |
insofar | -0.532 |
Token | the |
Token ID | 262 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
damaging | +0.444 |
meaningful | +0.430 |
insofar | +0.425 |
categ | +0.424 |
contrasting | +0.418 |
Neg logit contributions | |
eers | -0.491 |
culosis | -0.455 |
Transactions | -0.445 |
Works | -0.434 |
Companies | -0.425 |
Token | , |
Token ID | 11 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
damaging | +0.992 |
meaningful | +0.967 |
insofar | +0.957 |
categ | +0.955 |
contrasting | +0.945 |
Neg logit contributions | |
eers | -0.933 |
culosis | -0.856 |
Transactions | -0.840 |
Works | -0.826 |
Companies | -0.802 |
Token | for |
Token ID | 329 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
damaging | +10.127 |
meaningful | +9.992 |
insofar | +9.896 |
contrasting | +9.884 |
categ | +9.819 |
Neg logit contributions | |
eers | -8.977 |
culosis | -8.433 |
Transactions | -7.900 |
Works | -7.543 |
Queue | -7.519 |
Token | example |
Token ID | 1672 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
eers | +0.486 |
culosis | +0.443 |
Transactions | +0.424 |
Works | +0.413 |
Companies | +0.406 |
Neg logit contributions | |
damaging | -0.674 |
meaningful | -0.654 |
contrasting | -0.647 |
categ | -0.644 |
insofar | -0.641 |
Token | , |
Token ID | 11 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
damaging | +1.310 |
meaningful | +1.281 |
categ | +1.271 |
contrasting | +1.258 |
insofar | +1.246 |
Neg logit contributions | |
eers | -1.148 |
culosis | -1.056 |
Transactions | -1.011 |
Works | -0.989 |
Companies | -0.974 |
Token | Steve |
Token ID | 6542 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
damaging | +7.110 |
meaningful | +7.001 |
contrasting | +6.906 |
categ | +6.889 |
insofar | +6.881 |
Neg logit contributions | |
eers | -6.290 |
culosis | -5.838 |
Transactions | -5.521 |
Works | -5.313 |
Companies | -5.253 |
Token | Reich |
Token ID | 24560 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
damaging | +1.513 |
meaningful | +1.483 |
contrasting | +1.466 |
categ | +1.465 |
insofar | +1.457 |
Neg logit contributions | |
eers | -1.104 |
culosis | -0.997 |
Transactions | -0.987 |
Works | -0.962 |
Companies | -0.928 |
Token | En |
Token ID | 2039 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
damaging | +1.316 |
meaningful | +1.287 |
categ | +1.273 |
contrasting | +1.264 |
insofar | +1.256 |
Neg logit contributions | |
eers | -1.152 |
culosis | -1.033 |
Transactions | -1.008 |
Works | -0.994 |
Companies | -0.969 |
Token | semble |
Token ID | 15140 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
damaging | +3.721 |
meaningful | +3.665 |
categ | +3.613 |
contrasting | +3.607 |
insofar | +3.598 |
Neg logit contributions | |
eers | -2.618 |
culosis | -2.397 |
Transactions | -2.274 |
Works | -2.233 |
Queue | -2.167 |
Token | . |
Token ID | 13 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
eers | +9.270 |
Works | +8.505 |
Transactions | +8.281 |
Facility | +8.139 |
Companies | +8.118 |
Neg logit contributions | |
damaging | -6.477 |
categ | -6.246 |
meaningful | -6.245 |
consequential | -6.143 |
contrasting | -6.060 |
Token | happening |
Token ID | 5836 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
eers | +7.856 |
culosis | +7.275 |
Facility | +7.004 |
Transactions | +6.999 |
Works | +6.948 |
Neg logit contributions | |
categ | -5.218 |
insofar | -5.145 |
meaningful | -5.133 |
damaging | -5.057 |
pessimistic | -5.018 |
Token | when |
Token ID | 618 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
eers | +2.410 |
culosis | +2.225 |
Transactions | +2.175 |
Works | +2.132 |
Companies | +2.092 |
Neg logit contributions | |
damaging | -1.687 |
categ | -1.674 |
meaningful | -1.665 |
contrasting | -1.614 |
pessimistic | -1.600 |
Token | it |
Token ID | 340 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
eers | +5.691 |
Transactions | +5.243 |
culosis | +5.210 |
Works | +5.002 |
Companies | +4.986 |
Neg logit contributions | |
damaging | -5.662 |
categ | -5.659 |
meaningful | -5.658 |
insofar | -5.623 |
pessimistic | -5.524 |
Token | breaks |
Token ID | 9457 |
Feature activation | -9.83e-02 |
Pos logit contributions | |
eers | +5.745 |
culosis | +5.188 |
Works | +4.970 |
Transactions | +4.928 |
Companies | +4.758 |
Neg logit contributions | |
meaningful | -6.294 |
categ | -6.255 |
damaging | -6.208 |
contrasting | -6.184 |
insofar | -6.167 |
Token | off |
Token ID | 572 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
eers | +0.606 |
culosis | +0.561 |
Transactions | +0.552 |
Works | +0.537 |
Companies | +0.534 |
Neg logit contributions | |
damaging | -0.391 |
meaningful | -0.387 |
categ | -0.385 |
insofar | -0.375 |
contrasting | -0.375 |
Token | , |
Token ID | 11 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
damaging | +2.370 |
meaningful | +2.325 |
categ | +2.310 |
contrasting | +2.284 |
insofar | +2.275 |
Neg logit contributions | |
eers | -2.691 |
culosis | -2.493 |
Transactions | -2.417 |
Works | -2.344 |
Companies | -2.323 |
Token | it |
Token ID | 340 |
Feature activation | -9.90e-01 |
Pos logit contributions | |
damaging | +4.651 |
meaningful | +4.574 |
categ | +4.534 |
contrasting | +4.499 |
insofar | +4.495 |
Neg logit contributions | |
eers | -3.510 |
culosis | -3.216 |
Transactions | -3.071 |
Works | -2.969 |
Companies | -2.918 |
Token | might |
Token ID | 1244 |
Feature activation | +1.46e-01 |
Pos logit contributions | |
eers | +3.069 |
culosis | +2.506 |
Works | +2.432 |
Transactions | +2.336 |
Companies | +2.248 |
Neg logit contributions | |
damaging | -6.769 |
meaningful | -6.630 |
insofar | -6.620 |
categ | -6.599 |
consequential | -6.544 |
Token | look |
Token ID | 804 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
damaging | +0.747 |
meaningful | +0.728 |
categ | +0.726 |
insofar | +0.719 |
contrasting | +0.718 |
Neg logit contributions | |
eers | -0.759 |
culosis | -0.701 |
Transactions | -0.669 |
Works | -0.656 |
Companies | -0.647 |
Token | like |
Token ID | 588 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
damaging | +4.190 |
meaningful | +4.047 |
categ | +3.964 |
contrasting | +3.947 |
insofar | +3.937 |
Neg logit contributions | |
eers | -9.709 |
culosis | -9.202 |
Transactions | -8.930 |
Works | -8.754 |
Companies | -8.677 |
Token | cutting |
Token ID | 7720 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
damaging | +2.859 |
meaningful | +2.806 |
categ | +2.783 |
insofar | +2.770 |
contrasting | +2.760 |
Neg logit contributions | |
eers | -3.022 |
culosis | -2.793 |
Transactions | -2.695 |
Works | -2.629 |
Companies | -2.591 |
Token | PJ |
Token ID | 44941 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
eers | +2.576 |
Transactions | +2.287 |
culosis | +2.245 |
Works | +2.211 |
Companies | +2.207 |
Neg logit contributions | |
damaging | -5.065 |
meaningful | -4.971 |
contrasting | -4.940 |
categ | -4.920 |
insofar | -4.864 |
Token | RC |
Token ID | 7397 |
Feature activation | -1.98e+00 |
Pos logit contributions | |
damaging | +1.846 |
meaningful | +1.812 |
contrasting | +1.791 |
categ | +1.788 |
insofar | +1.784 |
Neg logit contributions | |
eers | -1.231 |
culosis | -1.114 |
Transactions | -1.080 |
Works | -1.059 |
Companies | -1.037 |
Token | � |
Token ID | 447 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
eers | +10.544 |
Works | +9.531 |
Transactions | +9.508 |
Companies | +9.364 |
culosis | +9.218 |
Neg logit contributions | |
damaging | -8.450 |
contrasting | -8.165 |
meaningful | -8.141 |
insofar | -7.995 |
consequential | -7.982 |
Token | � |
Token ID | 247 |
Feature activation | -7.99e-01 |
Pos logit contributions | |
eers | +3.018 |
culosis | +2.669 |
Transactions | +2.572 |
Works | +2.494 |
Queue | +2.481 |
Neg logit contributions | |
damaging | -5.017 |
contrasting | -4.953 |
meaningful | -4.948 |
categ | -4.938 |
insofar | -4.897 |
Token | s |
Token ID | 82 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
eers | +3.549 |
culosis | +3.224 |
Transactions | +3.063 |
Works | +3.049 |
Companies | +2.971 |
Neg logit contributions | |
damaging | -4.660 |
meaningful | -4.575 |
contrasting | -4.536 |
insofar | -4.512 |
categ | -4.503 |
Token | main |
Token ID | 1388 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
eers | +8.789 |
Transactions | +8.113 |
Works | +8.039 |
Companies | +7.896 |
culosis | +7.876 |
Neg logit contributions | |
damaging | -6.410 |
insofar | -6.180 |
meaningful | -6.137 |
contrasting | -6.133 |
consequential | -5.974 |
Token | focus |
Token ID | 2962 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
eers | +6.947 |
Transactions | +6.315 |
culosis | +6.226 |
Works | +6.198 |
Facility | +6.148 |
Neg logit contributions | |
damaging | -6.616 |
insofar | -6.432 |
contrasting | -6.349 |
meaningful | -6.337 |
consequential | -6.207 |
Token | is |
Token ID | 318 |
Feature activation | +8.63e-01 |
Pos logit contributions | |
eers | +5.425 |
culosis | +4.868 |
Works | +4.823 |
Transactions | +4.681 |
Facility | +4.632 |
Neg logit contributions | |
damaging | -5.661 |
meaningful | -5.420 |
contrasting | -5.362 |
categ | -5.331 |
consequential | -5.268 |
Token | developing |
Token ID | 5922 |
Feature activation | +8.77e-01 |
Pos logit contributions | |
damaging | +4.043 |
meaningful | +3.948 |
contrasting | +3.904 |
categ | +3.891 |
insofar | +3.873 |
Neg logit contributions | |
eers | -4.941 |
culosis | -4.595 |
Transactions | -4.475 |
Works | -4.355 |
Companies | -4.301 |
Token | technology |
Token ID | 3037 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
damaging | +4.608 |
meaningful | +4.494 |
contrasting | +4.461 |
insofar | +4.453 |
categ | +4.449 |
Neg logit contributions | |
eers | -4.526 |
culosis | -4.158 |
Transactions | -4.048 |
Works | -3.934 |
Companies | -3.875 |
Token | for |
Token ID | 329 |
Feature activation | -6.02e-01 |
Pos logit contributions | |
damaging | +0.965 |
contrasting | +0.939 |
categ | +0.937 |
meaningful | +0.927 |
insofar | +0.921 |
Neg logit contributions | |
eers | -1.317 |
culosis | -1.195 |
Transactions | -1.182 |
Works | -1.166 |
Companies | -1.165 |
Token | refugees |
Token ID | 8015 |
Feature activation | +4.01e-01 |
Pos logit contributions | |
eers | +0.993 |
culosis | +0.926 |
Transactions | +0.895 |
Works | +0.890 |
Facility | +0.868 |
Neg logit contributions | |
damaging | -0.860 |
meaningful | -0.852 |
contrasting | -0.843 |
categ | -0.841 |
insofar | -0.839 |
Token | hiding |
Token ID | 11816 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
meaningful | +1.551 |
damaging | +1.542 |
categ | +1.532 |
contrasting | +1.484 |
insofar | +1.483 |
Neg logit contributions | |
eers | -2.583 |
culosis | -2.409 |
Transactions | -2.304 |
Works | -2.279 |
Facility | -2.272 |
Token | on |
Token ID | 319 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
eers | +1.357 |
culosis | +1.258 |
Companies | +1.191 |
Facility | +1.185 |
Transactions | +1.184 |
Neg logit contributions | |
categ | -0.850 |
damaging | -0.842 |
meaningful | -0.833 |
contrasting | -0.828 |
consequential | -0.818 |
Token | Mount |
Token ID | 5628 |
Feature activation | -9.38e-01 |
Pos logit contributions | |
eers | +5.628 |
culosis | +5.112 |
Companies | +5.088 |
Facility | +5.032 |
Works | +4.978 |
Neg logit contributions | |
insofar | -5.667 |
categ | -5.493 |
damaging | -5.470 |
meaningful | -5.460 |
contrasting | -5.352 |
Token | Sin |
Token ID | 10884 |
Feature activation | +4.83e-01 |
Pos logit contributions | |
eers | +2.940 |
culosis | +2.854 |
Works | +2.652 |
Transactions | +2.625 |
Companies | +2.558 |
Neg logit contributions | |
damaging | -6.278 |
categ | -6.258 |
contrasting | -6.244 |
meaningful | -6.230 |
insofar | -6.194 |
Token | jar |
Token ID | 9491 |
Feature activation | -5.25e-01 |
Pos logit contributions | |
damaging | +2.941 |
contrasting | +2.892 |
meaningful | +2.870 |
categ | +2.857 |
ignoring | +2.804 |
Neg logit contributions | |
eers | -2.046 |
culosis | -1.919 |
Transactions | -1.815 |
Works | -1.762 |
Companies | -1.750 |
Token | from |
Token ID | 422 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
eers | +2.966 |
culosis | +2.830 |
Facility | +2.636 |
Works | +2.623 |
Transactions | +2.616 |
Neg logit contributions | |
meaningful | -2.299 |
categ | -2.295 |
damaging | -2.257 |
pessimistic | -2.211 |
contrasting | -2.201 |
Token | Islamic |
Token ID | 5533 |
Feature activation | -3.08e-02 |
Pos logit contributions | |
eers | +3.153 |
culosis | +2.743 |
Companies | +2.715 |
Works | +2.668 |
Transactions | +2.625 |
Neg logit contributions | |
categ | -2.945 |
insofar | -2.945 |
damaging | -2.931 |
contrasting | -2.931 |
meaningful | -2.909 |
Token | State |
Token ID | 1812 |
Feature activation | +3.53e-01 |
Pos logit contributions | |
eers | +0.136 |
culosis | +0.121 |
Transactions | +0.117 |
Works | +0.116 |
Companies | +0.116 |
Neg logit contributions | |
damaging | -0.179 |
meaningful | -0.177 |
contrasting | -0.176 |
insofar | -0.175 |
categ | -0.173 |
Token | in |
Token ID | 287 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
damaging | +1.793 |
meaningful | +1.774 |
contrasting | +1.763 |
categ | +1.744 |
insofar | +1.720 |
Neg logit contributions | |
eers | -1.893 |
culosis | -1.697 |
Transactions | -1.640 |
Companies | -1.602 |
Works | -1.588 |
Token | Iraq |
Token ID | 3908 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
eers | +5.311 |
Transactions | +4.497 |
Works | +4.473 |
Companies | +4.454 |
Facility | +4.333 |
Neg logit contributions | |
insofar | -7.904 |
pessimistic | -7.874 |
categ | -7.827 |
damaging | -7.813 |
meaningful | -7.780 |
Token | disappointing |
Token ID | 17185 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
damaging | +8.757 |
meaningful | +8.599 |
contrasting | +8.405 |
categ | +8.397 |
insofar | +8.384 |
Neg logit contributions | |
eers | -9.450 |
culosis | -8.911 |
Transactions | -8.460 |
Works | -8.157 |
Queue | -8.062 |
Token | , |
Token ID | 11 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
damaging | +2.360 |
meaningful | +2.293 |
categ | +2.269 |
contrasting | +2.264 |
consequential | +2.211 |
Neg logit contributions | |
eers | -2.647 |
culosis | -2.424 |
Transactions | -2.370 |
Works | -2.309 |
Companies | -2.294 |
Token | and |
Token ID | 290 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
damaging | +7.436 |
meaningful | +7.299 |
categ | +7.180 |
contrasting | +7.178 |
insofar | +7.152 |
Neg logit contributions | |
eers | -6.967 |
culosis | -6.482 |
Transactions | -6.183 |
Works | -5.977 |
Companies | -5.886 |
Token | the |
Token ID | 262 |
Feature activation | -6.58e-01 |
Pos logit contributions | |
damaging | +3.089 |
meaningful | +3.032 |
categ | +2.989 |
contrasting | +2.980 |
insofar | +2.964 |
Neg logit contributions | |
eers | -4.065 |
culosis | -3.804 |
Transactions | -3.667 |
Works | -3.571 |
Companies | -3.535 |
Token | final |
Token ID | 2457 |
Feature activation | -7.05e-01 |
Pos logit contributions | |
eers | +3.555 |
Transactions | +3.227 |
culosis | +3.217 |
Works | +3.160 |
Companies | +3.112 |
Neg logit contributions | |
damaging | -3.030 |
insofar | -3.014 |
meaningful | -2.985 |
categ | -2.948 |
contrasting | -2.928 |
Token | project |
Token ID | 1628 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
eers | +3.782 |
culosis | +3.485 |
Transactions | +3.375 |
Works | +3.308 |
Companies | +3.249 |
Neg logit contributions | |
damaging | -3.224 |
contrasting | -3.161 |
meaningful | -3.152 |
categ | -3.146 |
insofar | -3.142 |
Token | is |
Token ID | 318 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
eers | +8.333 |
culosis | +7.458 |
Companies | +7.168 |
Works | +7.153 |
Transactions | +7.142 |
Neg logit contributions | |
damaging | -5.856 |
categ | -5.815 |
contrasting | -5.714 |
meaningful | -5.708 |
wounding | -5.585 |
Token | rarely |
Token ID | 8365 |
Feature activation | +6.85e-01 |
Pos logit contributions | |
damaging | +0.047 |
contrasting | +0.046 |
insofar | +0.046 |
meaningful | +0.046 |
categ | +0.046 |
Neg logit contributions | |
eers | -0.078 |
culosis | -0.072 |
Transactions | -0.070 |
Works | -0.069 |
Companies | -0.068 |
Token | better |
Token ID | 1365 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
damaging | +3.076 |
meaningful | +2.984 |
contrasting | +2.970 |
categ | +2.970 |
insofar | +2.950 |
Neg logit contributions | |
eers | -4.019 |
culosis | -3.745 |
Transactions | -3.633 |
Works | -3.552 |
Companies | -3.498 |
Token | than |
Token ID | 621 |
Feature activation | -6.21e-01 |
Pos logit contributions | |
damaging | +2.644 |
meaningful | +2.578 |
categ | +2.569 |
contrasting | +2.528 |
insofar | +2.501 |
Neg logit contributions | |
eers | -3.602 |
culosis | -3.375 |
Transactions | -3.254 |
Works | -3.215 |
Companies | -3.174 |
Token | the |
Token ID | 262 |
Feature activation | -6.84e-01 |
Pos logit contributions | |
eers | +3.561 |
culosis | +3.255 |
Works | +3.234 |
Transactions | +3.199 |
Companies | +3.149 |
Neg logit contributions | |
damaging | -2.586 |
categ | -2.567 |
meaningful | -2.518 |
contrasting | -2.513 |
insofar | -2.509 |
Token | relative |
Token ID | 3585 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
eers | +4.386 |
culosis | +4.069 |
Works | +3.942 |
Transactions | +3.894 |
Companies | +3.826 |
Neg logit contributions | |
insofar | -3.610 |
categ | -3.507 |
damaging | -3.492 |
meaningful | -3.487 |
contrasting | -3.482 |
Token | was |
Token ID | 373 |
Feature activation | -5.58e-01 |
Pos logit contributions | |
eers | +6.008 |
Works | +5.419 |
culosis | +5.380 |
Companies | +5.193 |
Transactions | +5.179 |
Neg logit contributions | |
meaningful | -6.776 |
categ | -6.708 |
damaging | -6.697 |
insofar | -6.694 |
contrasting | -6.666 |
Token | also |
Token ID | 635 |
Feature activation | -3.76e-03 |
Pos logit contributions | |
eers | +3.253 |
culosis | +2.980 |
Works | +2.944 |
Transactions | +2.934 |
Facility | +2.909 |
Neg logit contributions | |
insofar | -2.209 |
meaningful | -2.188 |
damaging | -2.171 |
contrasting | -2.161 |
categ | -2.111 |
Token | hit |
Token ID | 2277 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
eers | +0.022 |
culosis | +0.020 |
Works | +0.019 |
Transactions | +0.019 |
Facility | +0.019 |
Neg logit contributions | |
meaningful | -0.016 |
insofar | -0.016 |
damaging | -0.016 |
contrasting | -0.016 |
categ | -0.016 |
Token | with |
Token ID | 351 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
contrasting | +0.720 |
categ | +0.717 |
meaningful | +0.716 |
damaging | +0.705 |
pessimistic | +0.702 |
Neg logit contributions | |
eers | -1.128 |
culosis | -1.037 |
Works | -1.005 |
Companies | -0.979 |
Transactions | -0.975 |
Token | the |
Token ID | 262 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
eers | +2.275 |
culosis | +2.099 |
Works | +2.043 |
Transactions | +2.001 |
Facility | +1.977 |
Neg logit contributions | |
insofar | -1.415 |
categ | -1.377 |
meaningful | -1.372 |
contrasting | -1.335 |
compelling | -1.326 |
Token | item |
Token ID | 2378 |
Feature activation | -8.07e-01 |
Pos logit contributions | |
eers | +1.981 |
culosis | +1.814 |
Works | +1.753 |
Transactions | +1.725 |
Facility | +1.672 |
Neg logit contributions | |
insofar | -1.794 |
categ | -1.780 |
meaningful | -1.778 |
damaging | -1.738 |
contrasting | -1.737 |
Token | and |
Token ID | 290 |
Feature activation | -5.65e-01 |
Pos logit contributions | |
eers | +4.909 |
culosis | +4.499 |
Works | +4.351 |
Transactions | +4.217 |
Companies | +4.186 |
Neg logit contributions | |
categ | -3.125 |
meaningful | -2.999 |
contrasting | -2.917 |
pessimistic | -2.917 |
consequential | -2.856 |
Token | suffered |
Token ID | 6989 |
Feature activation | +3.11e-02 |
Pos logit contributions | |
eers | +2.907 |
culosis | +2.623 |
Works | +2.529 |
Transactions | +2.516 |
Companies | +2.455 |
Neg logit contributions | |
meaningful | -2.792 |
contrasting | -2.770 |
damaging | -2.769 |
categ | -2.760 |
insofar | -2.738 |
Token | a |
Token ID | 257 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
insofar | +0.110 |
categ | +0.110 |
contrasting | +0.108 |
meaningful | +0.108 |
damaging | +0.108 |
Neg logit contributions | |
eers | -0.206 |
culosis | -0.189 |
Works | -0.184 |
Transactions | -0.184 |
Companies | -0.180 |
Token | cut |
Token ID | 2005 |
Feature activation | +9.02e-02 |
Pos logit contributions | |
damaging | +3.960 |
meaningful | +3.857 |
categ | +3.774 |
contrasting | +3.769 |
insofar | +3.746 |
Neg logit contributions | |
eers | -6.743 |
culosis | -6.377 |
Transactions | -6.161 |
Works | -6.010 |
Companies | -5.949 |
Token | will |
Token ID | 481 |
Feature activation | -8.29e-01 |
Pos logit contributions | |
eers | +3.626 |
culosis | +3.379 |
Transactions | +3.185 |
Works | +3.162 |
Queue | +3.105 |
Neg logit contributions | |
damaging | -3.961 |
meaningful | -3.852 |
insofar | -3.822 |
categ | -3.813 |
contrasting | -3.800 |
Token | understand |
Token ID | 1833 |
Feature activation | +8.92e-02 |
Pos logit contributions | |
eers | +4.312 |
culosis | +3.942 |
Transactions | +3.846 |
Works | +3.804 |
Companies | +3.725 |
Neg logit contributions | |
damaging | -4.008 |
categ | -3.877 |
meaningful | -3.858 |
contrasting | -3.857 |
consequential | -3.792 |
Token | it |
Token ID | 340 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
damaging | +0.478 |
meaningful | +0.463 |
categ | +0.459 |
contrasting | +0.459 |
insofar | +0.453 |
Neg logit contributions | |
eers | -0.446 |
culosis | -0.406 |
Transactions | -0.399 |
Works | -0.392 |
Companies | -0.384 |
Token | differently |
Token ID | 10338 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
damaging | +2.229 |
meaningful | +2.136 |
contrasting | +2.122 |
categ | +2.108 |
insofar | +2.077 |
Neg logit contributions | |
eers | -3.914 |
culosis | -3.695 |
Transactions | -3.571 |
Works | -3.524 |
Companies | -3.466 |
Token | five |
Token ID | 1936 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
damaging | +6.309 |
meaningful | +6.185 |
categ | +6.057 |
contrasting | +6.044 |
insofar | +6.036 |
Neg logit contributions | |
eers | -8.489 |
culosis | -7.998 |
Transactions | -7.690 |
Works | -7.464 |
Companies | -7.385 |
Token | years |
Token ID | 812 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
damaging | +6.321 |
meaningful | +6.162 |
categ | +6.088 |
insofar | +6.064 |
contrasting | +6.057 |
Neg logit contributions | |
eers | -8.258 |
culosis | -7.723 |
Transactions | -7.456 |
Works | -7.295 |
Companies | -7.220 |
Token | from |
Token ID | 422 |
Feature activation | -7.98e-01 |
Pos logit contributions | |
eers | +1.122 |
culosis | +1.039 |
Works | +0.999 |
Transactions | +0.983 |
Facility | +0.972 |
Neg logit contributions | |
damaging | -0.820 |
categ | -0.795 |
meaningful | -0.791 |
contrasting | -0.780 |
insofar | -0.776 |
Token | now |
Token ID | 783 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
eers | +3.714 |
culosis | +3.358 |
Transactions | +3.270 |
Companies | +3.265 |
Works | +3.260 |
Neg logit contributions | |
damaging | -4.215 |
contrasting | -4.148 |
categ | -4.145 |
meaningful | -4.120 |
insofar | -4.041 |
Token | . |
Token ID | 13 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
damaging | +3.170 |
meaningful | +3.093 |
categ | +3.078 |
contrasting | +3.054 |
pessimistic | +2.972 |
Neg logit contributions | |
eers | -3.978 |
culosis | -3.725 |
Transactions | -3.608 |
Works | -3.555 |
Companies | -3.497 |
Token | The |
Token ID | 383 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
eers | +2.599 |
Transactions | +2.318 |
culosis | +2.253 |
Works | +2.246 |
Companies | +2.242 |
Neg logit contributions | |
damaging | -5.677 |
meaningful | -5.565 |
contrasting | -5.518 |
categ | -5.510 |
pessimistic | -5.428 |
Token | book |
Token ID | 1492 |
Feature activation | -7.50e-01 |
Pos logit contributions | |
eers | +2.079 |
culosis | +1.891 |
Transactions | +1.866 |
Works | +1.843 |
Companies | +1.835 |
Neg logit contributions | |
damaging | -1.843 |
insofar | -1.816 |
meaningful | -1.777 |
categ | -1.772 |
contrasting | -1.749 |
Token | … |
Token ID | 1399 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
damaging | +2.191 |
meaningful | +2.170 |
categ | +2.147 |
contrasting | +2.106 |
consequential | +2.076 |
Neg logit contributions | |
eers | -2.751 |
culosis | -2.530 |
Transactions | -2.422 |
Companies | -2.394 |
Works | -2.378 |
Token | The |
Token ID | 464 |
Feature activation | +4.19e-02 |
Pos logit contributions | |
damaging | +1.111 |
meaningful | +1.091 |
categ | +1.086 |
contrasting | +1.079 |
insofar | +1.072 |
Neg logit contributions | |
eers | -0.713 |
culosis | -0.652 |
Transactions | -0.615 |
Works | -0.594 |
Companies | -0.590 |
Token | running |
Token ID | 2491 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
damaging | +0.203 |
insofar | +0.201 |
meaningful | +0.199 |
categ | +0.197 |
contrasting | +0.196 |
Neg logit contributions | |
eers | -0.227 |
culosis | -0.208 |
Transactions | -0.202 |
Works | -0.199 |
Companies | -0.196 |
Token | of |
Token ID | 286 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
eers | +8.556 |
culosis | +8.108 |
Transactions | +7.614 |
Companies | +7.518 |
Works | +7.462 |
Neg logit contributions | |
damaging | -7.454 |
meaningful | -7.407 |
insofar | -7.375 |
compelling | -7.122 |
categ | -7.101 |
Token | joint |
Token ID | 6466 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
eers | +7.785 |
culosis | +7.144 |
Companies | +6.953 |
Transactions | +6.891 |
Works | +6.790 |
Neg logit contributions | |
insofar | -6.554 |
damaging | -6.174 |
categ | -6.152 |
wounding | -6.107 |
meaningful | -5.973 |
Token | venture |
Token ID | 13189 |
Feature activation | -2.39e+00 |
Pos logit contributions | |
eers | +7.023 |
culosis | +6.493 |
Companies | +6.412 |
Works | +6.347 |
Transactions | +6.335 |
Neg logit contributions | |
damaging | -6.390 |
insofar | -6.330 |
categ | -6.204 |
meaningful | -6.194 |
contrasting | -6.144 |
Token | hospitals |
Token ID | 11301 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
eers | +12.888 |
Companies | +12.011 |
culosis | +11.865 |
Transactions | +11.638 |
Works | +11.323 |
Neg logit contributions | |
damaging | -8.898 |
categ | -8.824 |
wounding | -8.592 |
contrasting | -8.580 |
meaningful | -8.556 |
Token | will |
Token ID | 481 |
Feature activation | -9.81e-01 |
Pos logit contributions | |
eers | +11.017 |
culosis | +10.295 |
Companies | +9.864 |
Works | +9.788 |
Transactions | +9.671 |
Neg logit contributions | |
categ | -6.849 |
damaging | -6.840 |
meaningful | -6.810 |
consequential | -6.626 |
pessimistic | -6.490 |
Token | also |
Token ID | 635 |
Feature activation | -7.69e-01 |
Pos logit contributions | |
eers | +5.231 |
culosis | +4.799 |
Transactions | +4.507 |
Companies | +4.456 |
Works | +4.450 |
Neg logit contributions | |
categ | -4.458 |
contrasting | -4.424 |
damaging | -4.404 |
meaningful | -4.387 |
consequential | -4.281 |
Token | be |
Token ID | 307 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
eers | +3.909 |
culosis | +3.548 |
Transactions | +3.330 |
Companies | +3.298 |
Works | +3.292 |
Neg logit contributions | |
categ | -3.767 |
contrasting | -3.715 |
damaging | -3.711 |
meaningful | -3.695 |
insofar | -3.606 |
Token | an |
Token ID | 281 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
damaging | +1.875 |
meaningful | +1.846 |
categ | +1.843 |
insofar | +1.843 |
contrasting | +1.829 |
Neg logit contributions | |
eers | -2.887 |
culosis | -2.694 |
Transactions | -2.598 |
Works | -2.558 |
Companies | -2.536 |
Token | ' |
Token ID | 705 |
Feature activation | +8.85e-01 |
Pos logit contributions | |
eers | +4.364 |
Works | +4.164 |
culosis | +4.012 |
Transactions | +3.970 |
Facility | +3.904 |
Neg logit contributions | |
damaging | -4.542 |
categ | -4.484 |
insofar | -4.482 |
consequential | -4.403 |
contrasting | -4.380 |
Token | H |
Token ID | 39 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
damaging | +5.507 |
meaningful | +5.415 |
categ | +5.363 |
contrasting | +5.347 |
insofar | +5.333 |
Neg logit contributions | |
eers | -3.739 |
culosis | -3.427 |
Transactions | -3.227 |
Works | -3.144 |
Companies | -3.061 |
Token | KC |
Token ID | 36222 |
Feature activation | -2.49e+00 |
Pos logit contributions | |
damaging | +2.760 |
meaningful | +2.710 |
insofar | +2.699 |
contrasting | +2.690 |
categ | +2.686 |
Neg logit contributions | |
eers | -2.045 |
culosis | -1.876 |
Transactions | -1.759 |
Works | -1.722 |
Companies | -1.698 |
Token | U |
Token ID | 52 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
Queue | +5.815 |
eers | +5.722 |
Works | +5.598 |
Transactions | +5.579 |
Services | +5.508 |
Neg logit contributions | |
insofar | -15.788 |
wounding | -15.283 |
damaging | -15.213 |
meaningful | -15.181 |
categ | -15.169 |
Token | :\ |
Token ID | 7479 |
Feature activation | -9.77e-01 |
Pos logit contributions | |
eers | +7.371 |
culosis | +6.895 |
Works | +6.759 |
Services | +6.535 |
Companies | +6.378 |
Neg logit contributions | |
insofar | -11.479 |
pessimistic | -11.445 |
meaningful | -11.431 |
damaging | -11.387 |
contrasting | -11.285 |
Token | Control |
Token ID | 15988 |
Feature activation | -2.60e+00 |
Pos logit contributions | |
eers | +3.260 |
culosis | +2.805 |
Works | +2.785 |
Transactions | +2.690 |
Companies | +2.670 |
Neg logit contributions | |
damaging | -6.498 |
meaningful | -6.367 |
categ | -6.354 |
insofar | -6.353 |
contrasting | -6.300 |
Token | Panel |
Token ID | 18810 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
eers | +7.483 |
Works | +6.965 |
Queue | +6.687 |
Services | +6.563 |
Facility | +6.544 |
Neg logit contributions | |
insofar | -16.174 |
damaging | -16.103 |
categ | -15.950 |
meaningful | -15.948 |
consequential | -15.942 |
Token | \ |
Token ID | 59 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
eers | +6.776 |
Works | +6.243 |
Services | +5.823 |
Transactions | +5.710 |
Facility | +5.645 |
Neg logit contributions | |
categ | -12.251 |
damaging | -12.219 |
meaningful | -12.140 |
contrasting | -12.093 |
insofar | -12.064 |
Token | Desktop |
Token ID | 36881 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
eers | +1.239 |
culosis | +1.064 |
Works | +1.044 |
Transactions | +1.018 |
Queue | +1.008 |
Neg logit contributions | |
damaging | -2.340 |
categ | -2.316 |
meaningful | -2.312 |
contrasting | -2.299 |
insofar | -2.284 |
Token | ' |
Token ID | 6 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
eers | +4.557 |
Works | +4.193 |
Transactions | +4.006 |
Services | +4.000 |
Queue | +3.980 |
Neg logit contributions | |
damaging | -6.943 |
categ | -6.933 |
meaningful | -6.839 |
contrasting | -6.817 |
insofar | -6.800 |
Token | - |
Token ID | 532 |
Feature activation | +8.56e-01 |
Pos logit contributions | |
damaging | +1.472 |
categ | +1.455 |
contrasting | +1.447 |
meaningful | +1.434 |
insofar | +1.434 |
Neg logit contributions | |
eers | -1.235 |
culosis | -1.142 |
Transactions | -1.109 |
Works | -1.106 |
Facility | -1.075 |
Token | - |
Token ID | 12 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
eers | +7.617 |
Transactions | +7.383 |
Works | +7.361 |
Companies | +7.327 |
Services | +7.119 |
Neg logit contributions | |
damaging | -9.553 |
meaningful | -9.451 |
wounding | -9.405 |
categ | -9.397 |
contrasting | -9.341 |
Token | N |
Token ID | 45 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
eers | +3.032 |
culosis | +2.683 |
Transactions | +2.661 |
Companies | +2.634 |
Works | +2.622 |
Neg logit contributions | |
damaging | -3.926 |
meaningful | -3.853 |
categ | -3.838 |
contrasting | -3.833 |
insofar | -3.774 |
Token | op |
Token ID | 404 |
Feature activation | -1.92e+00 |
Pos logit contributions | |
eers | +3.689 |
culosis | +3.348 |
Companies | +3.315 |
Transactions | +3.254 |
Works | +3.240 |
Neg logit contributions | |
damaging | -4.228 |
meaningful | -4.191 |
contrasting | -4.178 |
categ | -4.157 |
insofar | -4.075 |
Token | ec |
Token ID | 721 |
Feature activation | -2.41e+00 |
Pos logit contributions | |
eers | +8.689 |
Works | +7.811 |
culosis | +7.768 |
Companies | +7.599 |
Queue | +7.469 |
Neg logit contributions | |
damaging | -9.847 |
wounding | -9.668 |
meaningful | -9.518 |
contrasting | -9.516 |
consequential | -9.494 |
Token | Ge |
Token ID | 2269 |
Feature activation | -6.04e-01 |
Pos logit contributions | |
eers | +11.654 |
Works | +11.254 |
Companies | +11.193 |
Services | +11.117 |
Transactions | +11.088 |
Neg logit contributions | |
damaging | -9.930 |
categ | -9.794 |
wounding | -9.781 |
meaningful | -9.745 |
contrasting | -9.717 |
Token | ophysical |
Token ID | 41789 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
eers | +1.943 |
culosis | +1.669 |
Transactions | +1.624 |
Works | +1.568 |
Companies | +1.524 |
Neg logit contributions | |
damaging | -4.303 |
meaningful | -4.272 |
contrasting | -4.234 |
categ | -4.225 |
insofar | -4.196 |
Token | Co |
Token ID | 1766 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
eers | +13.992 |
Services | +13.960 |
Works | +13.669 |
Transactions | +13.542 |
Facility | +13.426 |
Neg logit contributions | |
categ | -11.552 |
meaningful | -11.496 |
contrasting | -11.301 |
consequential | -11.238 |
damaging | -11.152 |
Token | ASA |
Token ID | 49599 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
eers | +7.778 |
Works | +7.171 |
Transactions | +7.151 |
Services | +7.056 |
Companies | +7.045 |
Neg logit contributions | |
damaging | -8.573 |
categ | -8.538 |
meaningful | -8.434 |
contrasting | -8.393 |
consequential | -8.248 |
Token | . |
Token ID | 13 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
eers | +3.356 |
Transactions | +3.055 |
Companies | +3.006 |
Works | +2.991 |
culosis | +2.972 |
Neg logit contributions | |
damaging | -3.331 |
meaningful | -3.255 |
categ | -3.201 |
contrasting | -3.183 |
consequential | -3.163 |
Token |
|
Token ID | 198 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
eers | +5.712 |
Transactions | +5.645 |
Companies | +5.467 |
Works | +5.366 |
Services | +5.063 |
Neg logit contributions | |
damaging | -9.611 |
wounding | -9.473 |
meaningful | -9.468 |
categ | -9.404 |
consequential | -9.348 |
Token |
|
Token ID | 198 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
damaging | +4.083 |
meaningful | +4.006 |
insofar | +3.933 |
ignoring | +3.845 |
compelling | +3.845 |
Neg logit contributions | |
culosis | -4.903 |
eers | -4.885 |
Transactions | -4.483 |
Works | -4.250 |
Facility | -4.187 |
Token | Rom |
Token ID | 3570 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
damaging | +5.827 |
meaningful | +5.645 |
contrasting | +5.583 |
insofar | +5.551 |
categ | +5.511 |
Neg logit contributions | |
eers | -7.721 |
culosis | -7.533 |
Transactions | -6.840 |
atcher | -6.618 |
Companies | -6.596 |
Token | ano |
Token ID | 5733 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
eers | +4.129 |
culosis | +3.667 |
Transactions | +3.441 |
Works | +3.363 |
Companies | +3.345 |
Neg logit contributions | |
damaging | -6.793 |
categ | -6.744 |
meaningful | -6.736 |
contrasting | -6.711 |
insofar | -6.627 |
Token | 2006 |
Token ID | 4793 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
eers | +5.449 |
culosis | +4.999 |
Transactions | +4.800 |
Works | +4.753 |
Facility | +4.618 |
Neg logit contributions | |
meaningful | -10.160 |
damaging | -9.971 |
categ | -9.917 |
contrasting | -9.816 |
consequential | -9.774 |
Token | Tony |
Token ID | 8832 |
Feature activation | -6.95e-02 |
Pos logit contributions | |
damaging | +2.118 |
meaningful | +2.093 |
categ | +2.078 |
insofar | +2.072 |
contrasting | +2.058 |
Neg logit contributions | |
eers | -1.686 |
culosis | -1.511 |
Transactions | -1.472 |
Works | -1.438 |
Companies | -1.403 |
Token | Shal |
Token ID | 47974 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
eers | +0.311 |
culosis | +0.289 |
Transactions | +0.270 |
Works | +0.259 |
Companies | +0.255 |
Neg logit contributions | |
damaging | -0.412 |
meaningful | -0.405 |
categ | -0.399 |
insofar | -0.398 |
contrasting | -0.398 |
Token | h |
Token ID | 71 |
Feature activation | -3.25e+00 |
Pos logit contributions | |
eers | +5.588 |
culosis | +4.807 |
Works | +4.512 |
Transactions | +4.504 |
Facility | +4.365 |
Neg logit contributions | |
contrasting | -10.703 |
damaging | -10.674 |
categ | -10.564 |
meaningful | -10.509 |
consequential | -10.443 |
Token | oub |
Token ID | 12944 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
eers | +12.360 |
culosis | +11.567 |
acas | +10.703 |
atcher | +10.621 |
Facility | +10.584 |
Neg logit contributions | |
contrasting | -16.467 |
categ | -16.354 |
consequential | -16.148 |
damaging | -16.060 |
wounding | -15.822 |
Token |
|
Token ID | 198 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
eers | +5.448 |
Transactions | +4.728 |
culosis | +4.720 |
Works | +4.641 |
Facility | +4.555 |
Neg logit contributions | |
damaging | -7.936 |
meaningful | -7.916 |
categ | -7.909 |
contrasting | -7.848 |
consequential | -7.695 |
Token |
|
Token ID | 198 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
damaging | +4.379 |
meaningful | +4.284 |
insofar | +4.196 |
ignoring | +4.121 |
compelling | +4.112 |
Neg logit contributions | |
culosis | -5.507 |
eers | -5.407 |
Transactions | -5.027 |
Works | -4.719 |
Companies | -4.684 |
Token | 2006 |
Token ID | 13330 |
Feature activation | +5.70e-01 |
Pos logit contributions | |
eers | +5.131 |
Queue | +4.556 |
culosis | +4.245 |
Services | +3.828 |
Transactions | +3.752 |
Neg logit contributions | |
categ | -16.182 |
meaningful | -16.084 |
contrasting | -15.730 |
damaging | -15.579 |
consequential | -15.539 |
Token | Steve |
Token ID | 6542 |
Feature activation | -2.03e-01 |
Pos logit contributions | |
damaging | +3.297 |
meaningful | +3.248 |
categ | +3.215 |
insofar | +3.205 |
contrasting | +3.198 |
Neg logit contributions | |
eers | -2.682 |
culosis | -2.435 |
Transactions | -2.348 |
Works | -2.290 |
Companies | -2.241 |
Token | Truth |
Token ID | 14056 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
eers | +3.948 |
Transactions | +3.588 |
culosis | +3.520 |
Works | +3.500 |
Companies | +3.457 |
Neg logit contributions | |
damaging | -6.835 |
meaningful | -6.794 |
categ | -6.744 |
contrasting | -6.738 |
insofar | -6.654 |
Token | be |
Token ID | 307 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
eers | +0.692 |
culosis | +0.650 |
Transactions | +0.622 |
Works | +0.621 |
Companies | +0.601 |
Neg logit contributions | |
damaging | -0.745 |
meaningful | -0.726 |
categ | -0.725 |
contrasting | -0.722 |
insofar | -0.714 |
Token | known |
Token ID | 1900 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
eers | +0.948 |
culosis | +0.830 |
Works | +0.786 |
Transactions | +0.781 |
Companies | +0.756 |
Neg logit contributions | |
damaging | -1.881 |
insofar | -1.869 |
contrasting | -1.863 |
meaningful | -1.849 |
categ | -1.840 |
Token | , |
Token ID | 11 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
eers | +7.036 |
culosis | +6.667 |
Transactions | +6.286 |
Works | +6.269 |
Companies | +6.267 |
Neg logit contributions | |
damaging | -6.983 |
contrasting | -6.937 |
meaningful | -6.894 |
categ | -6.858 |
pessimistic | -6.770 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
damaging | +0.959 |
meaningful | +0.945 |
categ | +0.939 |
contrasting | +0.936 |
insofar | +0.930 |
Neg logit contributions | |
eers | -0.941 |
culosis | -0.872 |
Transactions | -0.844 |
Works | -0.826 |
Companies | -0.816 |
Token | majority |
Token ID | 3741 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
eers | +5.327 |
Transactions | +4.877 |
culosis | +4.844 |
Works | +4.833 |
Companies | +4.741 |
Neg logit contributions | |
insofar | -5.001 |
damaging | -4.882 |
meaningful | -4.832 |
contrasting | -4.764 |
categ | -4.751 |
Token | are |
Token ID | 389 |
Feature activation | -2.15e-01 |
Pos logit contributions | |
eers | +11.329 |
culosis | +10.338 |
Transactions | +9.993 |
Works | +9.963 |
Companies | +9.659 |
Neg logit contributions | |
damaging | -11.463 |
insofar | -11.093 |
meaningful | -11.036 |
contrasting | -10.994 |
consequential | -10.871 |
Token | not |
Token ID | 407 |
Feature activation | +3.81e-01 |
Pos logit contributions | |
eers | +1.358 |
culosis | +1.246 |
Transactions | +1.228 |
Works | +1.222 |
Companies | +1.196 |
Neg logit contributions | |
damaging | -0.829 |
meaningful | -0.820 |
insofar | -0.818 |
contrasting | -0.811 |
categ | -0.798 |
Token | riding |
Token ID | 10311 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
damaging | +1.559 |
meaningful | +1.529 |
contrasting | +1.518 |
insofar | +1.513 |
categ | +1.509 |
Neg logit contributions | |
eers | -2.391 |
culosis | -2.215 |
Transactions | -2.159 |
Works | -2.129 |
Companies | -2.090 |
Token | bikes |
Token ID | 16715 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
eers | +3.033 |
Works | +2.672 |
culosis | +2.661 |
Transactions | +2.619 |
Companies | +2.618 |
Neg logit contributions | |
damaging | -3.127 |
contrasting | -3.119 |
categ | -3.046 |
meaningful | -3.028 |
wounding | -3.022 |
Token | . |
Token ID | 13 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
damaging | +1.916 |
contrasting | +1.865 |
meaningful | +1.864 |
categ | +1.854 |
insofar | +1.813 |
Neg logit contributions | |
eers | -2.700 |
culosis | -2.525 |
Transactions | -2.425 |
Works | -2.412 |
Companies | -2.366 |