Token | and |
Token ID | 290 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
thanking | +26.193 |
chatting | +25.823 |
reading | +25.209 |
learning | +25.178 |
monitor | +25.144 |
Neg logit contributions | |
Percentage | -17.137 |
サーティワン | -15.693 |
Worse | -15.572 |
Killed | -15.273 |
Percent | -15.089 |
Token | shared |
Token ID | 4888 |
Feature activation | -6.56e+00 |
Pos logit contributions | |
blogs | +11.986 |
learning | +11.779 |
thanking | +11.747 |
reading | +11.704 |
chatting | +11.695 |
Neg logit contributions | |
Percentage | -10.546 |
Worse | -9.523 |
Killed | -9.385 |
Percent | -9.293 |
Millions | -9.237 |
Token | some |
Token ID | 617 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
learning | +5.645 |
blogs | +5.635 |
reading | +5.612 |
monitor | +5.538 |
thanking | +5.447 |
Neg logit contributions | |
Percentage | -7.578 |
Killed | -6.926 |
Worse | -6.926 |
Percent | -6.829 |
Millions | -6.812 |
Token | results |
Token ID | 2482 |
Feature activation | -7.59e+00 |
Pos logit contributions | |
blogs | +6.400 |
learning | +6.397 |
reading | +6.367 |
monitor | +6.285 |
thanking | +6.214 |
Neg logit contributions | |
Percentage | -5.827 |
Worse | -5.214 |
Killed | -5.206 |
Millions | -5.146 |
Percent | -5.138 |
Token | : |
Token ID | 25 |
Feature activation | +2.48e+01 |
Pos logit contributions | |
blogs | +8.286 |
reading | +8.285 |
learning | +8.247 |
monitor | +8.184 |
thanking | +8.148 |
Neg logit contributions | |
Percentage | -6.875 |
Worse | -6.148 |
Killed | -6.135 |
Millions | -6.048 |
Percent | -6.038 |
Token | 3 |
Token ID | 513 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
Percentage | +26.264 |
Only | +24.497 |
Worse | +24.060 |
Millions | +24.011 |
Percent | +23.826 |
Neg logit contributions | |
learning | -14.235 |
reading | -14.222 |
blogs | -14.194 |
reader | -13.827 |
monitor | -13.682 |
Token | Million |
Token ID | 23425 |
Feature activation | +3.26e+01 |
Pos logit contributions | |
Percentage | +32.478 |
Millions | +31.274 |
Percent | +31.162 |
Killed | +30.002 |
Worse | +29.615 |
Neg logit contributions | |
reading | -15.632 |
learning | -15.403 |
thanking | -15.361 |
blogs | -15.171 |
chatting | -14.907 |
Token | Storage |
Token ID | 20514 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
Percentage | +31.761 |
Percent | +29.743 |
Millions | +28.958 |
Killed | +28.877 |
Only | +28.722 |
Neg logit contributions | |
learning | -16.861 |
reading | -16.590 |
thanking | -15.725 |
blogs | -15.570 |
monitor | -15.545 |
Token | I |
Token ID | 314 |
Feature activation | +5.16e+00 |
Pos logit contributions | |
Percentage | +15.098 |
Percent | +13.670 |
Millions | +13.399 |
Only | +13.385 |
Killed | +13.384 |
Neg logit contributions | |
learning | -13.993 |
reading | -13.632 |
thanking | -13.431 |
blogs | -13.361 |
monitor | -13.306 |
Token | OPS |
Token ID | 30737 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
Percentage | +5.930 |
Killed | +5.407 |
Worse | +5.390 |
Only | +5.386 |
Percent | +5.369 |
Neg logit contributions | |
learning | -4.569 |
reading | -4.536 |
monitor | -4.483 |
blogs | -4.456 |
thanking | -4.428 |
Token | on |
Token ID | 319 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Percentage | +23.917 |
Percent | +22.085 |
Only | +22.057 |
Killed | +21.966 |
Worse | +21.728 |
Neg logit contributions | |
learning | -15.435 |
blogs | -14.969 |
reading | -14.856 |
monitor | -14.780 |
reader | -14.603 |
Token | ) |
Token ID | 8 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
learning | +1.204 |
reading | +1.204 |
blogs | +1.200 |
monitor | +1.191 |
thanking | +1.167 |
Neg logit contributions | |
Percentage | -0.843 |
Worse | -0.742 |
Killed | -0.741 |
Percent | -0.725 |
Millions | -0.721 |
Token | tot |
Token ID | 2006 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
learning | +2.242 |
reading | +2.241 |
blogs | +2.235 |
monitor | +2.219 |
thanking | +2.176 |
Neg logit contributions | |
Percentage | -1.889 |
Killed | -1.682 |
Worse | -1.681 |
Percent | -1.651 |
Millions | -1.647 |
Token | alled |
Token ID | 4262 |
Feature activation | +2.42e+01 |
Pos logit contributions | |
Percentage | +13.568 |
Only | +12.513 |
Millions | +12.408 |
Percent | +12.234 |
Killed | +12.223 |
Neg logit contributions | |
monitor | -14.081 |
learning | -13.976 |
blogs | -13.841 |
thanking | -13.754 |
chatting | -13.599 |
Token | 2 |
Token ID | 362 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
Percentage | +20.997 |
Only | +20.216 |
Millions | +20.172 |
Approximately | +19.516 |
Twice | +19.508 |
Neg logit contributions | |
learning | -18.036 |
reading | -17.863 |
blogs | -17.747 |
monitor | -17.637 |
forums | -17.322 |
Token | . |
Token ID | 13 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
Percentage | +23.568 |
Percent | +22.156 |
Millions | +21.921 |
Thirty | +20.650 |
Only | +20.648 |
Neg logit contributions | |
reading | -19.798 |
monitor | -19.562 |
learning | -19.525 |
blogs | -19.365 |
reader | -18.926 |
Token | 07 |
Token ID | 2998 |
Feature activation | +3.37e+01 |
Pos logit contributions | |
Percentage | +21.268 |
Only | +19.908 |
Millions | +19.543 |
Worse | +19.262 |
Percent | +19.070 |
Neg logit contributions | |
chatting | -20.537 |
blogs | -20.370 |
reading | -20.367 |
learning | -20.274 |
monitor | -20.162 |
Token | % |
Token ID | 4 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
Percentage | +26.068 |
Millions | +25.129 |
Percent | +24.831 |
Only | +23.607 |
Twice | +22.952 |
Neg logit contributions | |
monitor | -20.890 |
reading | -20.575 |
learning | -20.561 |
reader | -19.920 |
thanking | -19.796 |
Token | of |
Token ID | 286 |
Feature activation | +1.55e+01 |
Pos logit contributions | |
Percentage | +19.854 |
Percent | +17.762 |
Only | +17.415 |
(- | +17.363 |
Killed | +17.280 |
Neg logit contributions | |
learning | -17.374 |
monitor | -17.270 |
blogs | -17.058 |
reading | -16.887 |
thanking | -16.534 |
Token | its |
Token ID | 663 |
Feature activation | +1.61e+01 |
Pos logit contributions | |
Percentage | +13.416 |
Only | +11.943 |
Killed | +11.711 |
Percent | +11.696 |
(- | +11.631 |
Neg logit contributions | |
learning | -14.990 |
blogs | -14.916 |
monitor | -14.787 |
reading | -14.483 |
thanking | -14.115 |
Token | gross |
Token ID | 10319 |
Feature activation | +7.85e+00 |
Pos logit contributions | |
Percentage | +12.913 |
Only | +11.523 |
Killed | +11.265 |
Millions | +11.218 |
(- | +11.115 |
Neg logit contributions | |
learning | -16.881 |
blogs | -16.685 |
monitor | -16.320 |
reading | -16.267 |
forums | -15.955 |
Token | domestic |
Token ID | 5928 |
Feature activation | +2.17e+00 |
Pos logit contributions | |
Percentage | +7.018 |
Only | +6.290 |
Killed | +6.272 |
Millions | +6.250 |
Percent | +6.088 |
Neg logit contributions | |
learning | -8.687 |
blogs | -8.611 |
reading | -8.469 |
monitor | -8.432 |
forums | -8.210 |
Token | shared |
Token ID | 4888 |
Feature activation | -6.56e+00 |
Pos logit contributions | |
blogs | +11.986 |
learning | +11.779 |
thanking | +11.747 |
reading | +11.704 |
chatting | +11.695 |
Neg logit contributions | |
Percentage | -10.546 |
Worse | -9.523 |
Killed | -9.385 |
Percent | -9.293 |
Millions | -9.237 |
Token | some |
Token ID | 617 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
learning | +5.645 |
blogs | +5.635 |
reading | +5.612 |
monitor | +5.538 |
thanking | +5.447 |
Neg logit contributions | |
Percentage | -7.578 |
Killed | -6.926 |
Worse | -6.926 |
Percent | -6.829 |
Millions | -6.812 |
Token | results |
Token ID | 2482 |
Feature activation | -7.59e+00 |
Pos logit contributions | |
blogs | +6.400 |
learning | +6.397 |
reading | +6.367 |
monitor | +6.285 |
thanking | +6.214 |
Neg logit contributions | |
Percentage | -5.827 |
Worse | -5.214 |
Killed | -5.206 |
Millions | -5.146 |
Percent | -5.138 |
Token | : |
Token ID | 25 |
Feature activation | +2.48e+01 |
Pos logit contributions | |
blogs | +8.286 |
reading | +8.285 |
learning | +8.247 |
monitor | +8.184 |
thanking | +8.148 |
Neg logit contributions | |
Percentage | -6.875 |
Worse | -6.148 |
Killed | -6.135 |
Millions | -6.048 |
Percent | -6.038 |
Token | 3 |
Token ID | 513 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
Percentage | +26.264 |
Only | +24.497 |
Worse | +24.060 |
Millions | +24.011 |
Percent | +23.826 |
Neg logit contributions | |
learning | -14.235 |
reading | -14.222 |
blogs | -14.194 |
reader | -13.827 |
monitor | -13.682 |
Token | Million |
Token ID | 23425 |
Feature activation | +3.26e+01 |
Pos logit contributions | |
Percentage | +32.478 |
Millions | +31.274 |
Percent | +31.162 |
Killed | +30.002 |
Worse | +29.615 |
Neg logit contributions | |
reading | -15.632 |
learning | -15.403 |
thanking | -15.361 |
blogs | -15.171 |
chatting | -14.907 |
Token | Storage |
Token ID | 20514 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
Percentage | +31.761 |
Percent | +29.743 |
Millions | +28.958 |
Killed | +28.877 |
Only | +28.722 |
Neg logit contributions | |
learning | -16.861 |
reading | -16.590 |
thanking | -15.725 |
blogs | -15.570 |
monitor | -15.545 |
Token | I |
Token ID | 314 |
Feature activation | +5.16e+00 |
Pos logit contributions | |
Percentage | +15.098 |
Percent | +13.670 |
Millions | +13.399 |
Only | +13.385 |
Killed | +13.384 |
Neg logit contributions | |
learning | -13.993 |
reading | -13.632 |
thanking | -13.431 |
blogs | -13.361 |
monitor | -13.306 |
Token | OPS |
Token ID | 30737 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
Percentage | +5.930 |
Killed | +5.407 |
Worse | +5.390 |
Only | +5.386 |
Percent | +5.369 |
Neg logit contributions | |
learning | -4.569 |
reading | -4.536 |
monitor | -4.483 |
blogs | -4.456 |
thanking | -4.428 |
Token | on |
Token ID | 319 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Percentage | +23.917 |
Percent | +22.085 |
Only | +22.057 |
Killed | +21.966 |
Worse | +21.728 |
Neg logit contributions | |
learning | -15.435 |
blogs | -14.969 |
reading | -14.856 |
monitor | -14.780 |
reader | -14.603 |
Token | AWS |
Token ID | 30865 |
Feature activation | +1.09e+01 |
Pos logit contributions | |
Percentage | +10.476 |
Only | +9.441 |
Worse | +9.394 |
Killed | +9.378 |
Millions | +9.348 |
Neg logit contributions | |
learning | -10.271 |
reading | -10.224 |
blogs | -10.116 |
monitor | -10.077 |
thanking | -9.958 |
Token | growth |
Token ID | 3349 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
Percentage | +9.518 |
Worse | +8.662 |
Millions | +8.608 |
Percent | +8.605 |
Killed | +8.574 |
Neg logit contributions | |
blogs | -6.052 |
learning | -6.034 |
monitor | -5.912 |
reading | -5.852 |
forums | -5.764 |
Token | estimate |
Token ID | 8636 |
Feature activation | +1.05e+01 |
Pos logit contributions | |
Percentage | +4.404 |
Worse | +3.980 |
Killed | +3.949 |
Percent | +3.931 |
Only | +3.922 |
Neg logit contributions | |
blogs | -3.501 |
learning | -3.496 |
reading | -3.431 |
monitor | -3.428 |
thanking | -3.350 |
Token | of |
Token ID | 286 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
Percentage | +11.211 |
Worse | +10.171 |
Only | +10.050 |
Killed | +9.951 |
Percent | +9.884 |
Neg logit contributions | |
learning | -9.513 |
blogs | -9.389 |
reading | -9.161 |
monitor | -9.160 |
forums | -8.869 |
Token | 7 |
Token ID | 767 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
Percentage | +16.364 |
Only | +15.033 |
(- | +14.674 |
Worse | +14.646 |
Killed | +14.601 |
Neg logit contributions | |
learning | -15.243 |
reading | -14.985 |
blogs | -14.822 |
monitor | -14.792 |
reader | -14.424 |
Token | . |
Token ID | 13 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
Percentage | +23.111 |
Percent | +21.418 |
Millions | +20.290 |
Killed | +20.114 |
Only | +19.972 |
Neg logit contributions | |
learning | -17.400 |
monitor | -17.041 |
reading | -16.978 |
blogs | -16.909 |
reader | -16.815 |
Token | 8 |
Token ID | 23 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
Percentage | +19.365 |
Only | +17.559 |
Killed | +17.263 |
Percent | +17.257 |
Millions | +17.253 |
Neg logit contributions | |
chatting | -19.973 |
learning | -19.802 |
thanking | -19.671 |
blogs | -19.655 |
reading | -19.599 |
Token | percent |
Token ID | 1411 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
Percentage | +28.554 |
Percent | +27.167 |
Millions | +25.813 |
Only | +24.976 |
Worse | +24.833 |
Neg logit contributions | |
learning | -18.908 |
monitor | -18.221 |
reader | -17.835 |
reading | -17.823 |
chatting | -17.699 |
Token | � |
Token ID | 564 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
Percentage | +21.774 |
(- | +19.854 |
Percent | +19.728 |
Worse | +19.480 |
Only | +19.392 |
Neg logit contributions | |
learning | -16.241 |
blogs | -16.195 |
monitor | -15.627 |
reading | -15.173 |
reader | -15.136 |
Token | � |
Token ID | 250 |
Feature activation | +9.42e+00 |
Pos logit contributions | |
Percentage | +3.342 |
Worse | +2.918 |
Killed | +2.917 |
Percent | +2.879 |
Millions | +2.863 |
Neg logit contributions | |
learning | -4.830 |
reading | -4.813 |
blogs | -4.805 |
monitor | -4.778 |
thanking | -4.675 |
Token | le |
Token ID | 293 |
Feature activation | +8.50e+00 |
Pos logit contributions | |
Percentage | +11.181 |
Worse | +10.197 |
Percent | +10.059 |
Only | +10.032 |
Killed | +10.032 |
Neg logit contributions | |
learning | -7.401 |
blogs | -7.367 |
reading | -7.214 |
monitor | -7.141 |
chatting | -7.031 |
Token | pre |
Token ID | 3866 |
Feature activation | +6.88e+00 |
Pos logit contributions | |
Percentage | +10.516 |
Worse | +9.648 |
Killed | +9.631 |
Percent | +9.582 |
Only | +9.512 |
Neg logit contributions | |
reading | -6.243 |
monitor | -6.156 |
learning | -6.154 |
blogs | -6.125 |
thanking | -5.965 |
Token | deficit |
Token ID | 11807 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
Percentage | +8.808 |
Millions | +7.902 |
Killed | +7.901 |
Percent | +7.884 |
Worse | +7.884 |
Neg logit contributions | |
learning | -6.728 |
blogs | -6.668 |
monitor | -6.576 |
reading | -6.571 |
thanking | -6.306 |
Token | down |
Token ID | 866 |
Feature activation | +7.23e+00 |
Pos logit contributions | |
Percentage | +10.814 |
Worse | +9.879 |
Only | +9.560 |
Millions | +9.477 |
(- | +9.439 |
Neg logit contributions | |
learning | -12.326 |
blogs | -12.031 |
reading | -11.960 |
monitor | -11.600 |
reader | -11.493 |
Token | to |
Token ID | 284 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
Percentage | +7.822 |
Worse | +7.104 |
Killed | +6.972 |
Only | +6.955 |
Millions | +6.943 |
Neg logit contributions | |
learning | -6.697 |
blogs | -6.681 |
reading | -6.653 |
monitor | -6.597 |
reader | -6.388 |
Token | 6 |
Token ID | 718 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
Percentage | +17.482 |
Worse | +16.074 |
Only | +16.016 |
Millions | +16.007 |
Percent | +15.828 |
Neg logit contributions | |
learning | -13.483 |
reading | -13.346 |
blogs | -13.202 |
monitor | -13.057 |
reader | -12.453 |
Token | . |
Token ID | 13 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
Percentage | +24.278 |
Percent | +23.060 |
Millions | +22.031 |
Only | +21.197 |
Worse | +21.005 |
Neg logit contributions | |
monitor | -18.983 |
learning | -18.942 |
reading | -18.767 |
blogs | -18.460 |
thanking | -18.385 |
Token | 3 |
Token ID | 18 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
Percentage | +22.608 |
Percent | +20.859 |
Only | +20.808 |
Millions | +20.628 |
Worse | +20.460 |
Neg logit contributions | |
learning | -22.334 |
blogs | -22.143 |
chatting | -22.080 |
reading | -21.936 |
monitor | -21.796 |
Token | percent |
Token ID | 1411 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
Percentage | +25.794 |
Percent | +24.756 |
Millions | +23.282 |
Only | +22.181 |
Worse | +22.042 |
Neg logit contributions | |
learning | -21.590 |
monitor | -20.860 |
thanking | -20.421 |
reading | -20.273 |
chatting | -20.247 |
Token | of |
Token ID | 286 |
Feature activation | +1.67e+01 |
Pos logit contributions | |
Percentage | +19.575 |
(- | +17.561 |
Percent | +17.516 |
Worse | +17.442 |
Only | +17.397 |
Neg logit contributions | |
learning | -15.789 |
blogs | -15.683 |
monitor | -15.326 |
reading | -15.095 |
reader | -14.566 |
Token | GDP |
Token ID | 12396 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
Percentage | +12.981 |
(- | +11.279 |
Percent | +11.268 |
Only | +11.255 |
Killed | +11.161 |
Neg logit contributions | |
learning | -17.802 |
blogs | -17.767 |
monitor | -17.185 |
reading | -17.167 |
thanking | -16.604 |
Token | by |
Token ID | 416 |
Feature activation | +7.27e+00 |
Pos logit contributions | |
Percentage | +13.955 |
Worse | +12.483 |
Only | +12.448 |
Percent | +12.341 |
(- | +12.246 |
Neg logit contributions | |
learning | -11.250 |
blogs | -11.198 |
reading | -11.081 |
monitor | -10.851 |
reader | -10.756 |
Token | the |
Token ID | 262 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
Percentage | +6.238 |
Worse | +5.451 |
Killed | +5.447 |
Percent | +5.376 |
Only | +5.374 |
Neg logit contributions | |
blogs | -8.403 |
learning | -8.396 |
reading | -8.358 |
monitor | -8.328 |
reader | -8.108 |
Token |
|
Token ID | 198 |
Feature activation | -9.34e+00 |
Pos logit contributions | |
reading | +14.004 |
learning | +13.770 |
blogs | +13.733 |
monitor | +13.660 |
via | +13.584 |
Neg logit contributions | |
Percentage | -8.433 |
サーティワン | -7.651 |
Percent | -7.266 |
Worse | -7.240 |
Killed | -7.193 |
Token | City |
Token ID | 14941 |
Feature activation | -3.43e-01 |
Pos logit contributions | |
reading | +6.790 |
learning | +6.782 |
blogs | +6.775 |
monitor | +6.672 |
forums | +6.359 |
Neg logit contributions | |
Percentage | -11.850 |
Killed | -10.995 |
Worse | -10.816 |
Percent | -10.791 |
Millions | -10.683 |
Token | Council |
Token ID | 4281 |
Feature activation | +5.87e+00 |
Pos logit contributions | |
learning | +0.399 |
reading | +0.398 |
blogs | +0.398 |
monitor | +0.395 |
thanking | +0.387 |
Neg logit contributions | |
Percentage | -0.305 |
Killed | -0.270 |
Worse | -0.269 |
Percent | -0.265 |
Millions | -0.264 |
Token | — |
Token ID | 960 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
Percentage | +6.191 |
Killed | +5.632 |
Worse | +5.607 |
Only | +5.562 |
Percent | +5.513 |
Neg logit contributions | |
learning | -5.699 |
reading | -5.665 |
blogs | -5.656 |
monitor | -5.607 |
thanking | -5.503 |
Token | F |
Token ID | 37 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
Percentage | +3.566 |
Worse | +3.286 |
Killed | +3.279 |
Only | +3.262 |
Millions | +3.250 |
Neg logit contributions | |
learning | -2.159 |
blogs | -2.157 |
reading | -2.146 |
monitor | -2.123 |
chatting | -2.101 |
Token | ifty |
Token ID | 24905 |
Feature activation | +3.17e+01 |
Pos logit contributions | |
Percentage | +7.440 |
Worse | +6.882 |
Only | +6.840 |
Millions | +6.829 |
Killed | +6.793 |
Neg logit contributions | |
learning | -4.511 |
blogs | -4.478 |
monitor | -4.412 |
chatting | -4.411 |
reading | -4.400 |
Token | / |
Token ID | 14 |
Feature activation | +1.39e+01 |
Pos logit contributions | |
Percentage | +29.777 |
Percent | +29.040 |
Millions | +27.855 |
Killed | +27.309 |
Worse | +27.203 |
Neg logit contributions | |
monitor | -18.829 |
chatting | -18.472 |
learning | -18.218 |
reading | -18.080 |
thanking | -17.878 |
Token | F |
Token ID | 37 |
Feature activation | +1.62e+01 |
Pos logit contributions | |
Percentage | +15.530 |
Percent | +14.358 |
Only | +14.279 |
Worse | +14.206 |
Killed | +14.111 |
Neg logit contributions | |
blogs | -10.881 |
chatting | -10.727 |
learning | -10.714 |
monitor | -10.568 |
reading | -10.522 |
Token | ifty |
Token ID | 24905 |
Feature activation | +2.92e+01 |
Pos logit contributions | |
Percentage | +15.353 |
Worse | +13.974 |
Only | +13.967 |
Percent | +13.886 |
Millions | +13.782 |
Neg logit contributions | |
thanking | -14.497 |
chatting | -14.433 |
monitor | -14.390 |
blogs | -14.326 |
learning | -14.258 |
Token | Plan |
Token ID | 5224 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
Percentage | +29.435 |
Percent | +27.750 |
Worse | +27.537 |
Only | +27.243 |
Votes | +27.092 |
Neg logit contributions | |
monitor | -16.483 |
learning | -16.322 |
blogs | -16.240 |
chatting | -16.058 |
reading | -15.891 |
Token |
|
Token ID | 198 |
Feature activation | -7.26e+00 |
Pos logit contributions | |
Percentage | +14.352 |
Worse | +13.219 |
Only | +13.188 |
Killed | +13.177 |
Percent | +12.904 |
Neg logit contributions | |
blogs | -11.872 |
learning | -11.831 |
monitor | -11.816 |
reading | -11.612 |
chatting | -11.537 |
Token | Andromeda |
Token ID | 34542 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
Percentage | +8.266 |
Killed | +7.470 |
Only | +7.435 |
Millions | +7.409 |
Worse | +7.408 |
Neg logit contributions | |
blogs | -7.639 |
learning | -7.597 |
reading | -7.572 |
monitor | -7.444 |
thanking | -7.269 |
Token | galaxy |
Token ID | 16161 |
Feature activation | +1.18e+01 |
Pos logit contributions | |
Percentage | +9.704 |
Percent | +8.570 |
Millions | +8.568 |
Worse | +8.539 |
Only | +8.539 |
Neg logit contributions | |
reading | -10.836 |
blogs | -10.816 |
learning | -10.705 |
monitor | -10.457 |
thanking | -10.278 |
Token | ( |
Token ID | 357 |
Feature activation | +5.80e+00 |
Pos logit contributions | |
Percentage | +11.562 |
Millions | +10.456 |
Only | +10.421 |
Killed | +10.333 |
Percent | +10.301 |
Neg logit contributions | |
blogs | -11.725 |
reading | -11.560 |
learning | -11.483 |
monitor | -11.177 |
thanking | -10.932 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.82e+01 |
Pos logit contributions | |
Percentage | +5.629 |
Millions | +5.041 |
Killed | +5.012 |
Only | +5.008 |
Worse | +4.997 |
Neg logit contributions | |
blogs | -6.008 |
reading | -5.983 |
learning | -5.970 |
thanking | -5.884 |
chatting | -5.872 |
Token | , |
Token ID | 11 |
Feature activation | +7.98e+00 |
Pos logit contributions | |
Percentage | +25.935 |
Millions | +24.594 |
Percent | +24.057 |
Only | +23.673 |
Killed | +23.388 |
Neg logit contributions | |
blogs | -19.456 |
reading | -19.384 |
learning | -18.668 |
thanking | -18.099 |
reader | -18.043 |
Token | 000 |
Token ID | 830 |
Feature activation | +3.14e+01 |
Pos logit contributions | |
Percentage | +7.661 |
Killed | +6.888 |
Millions | +6.848 |
Worse | +6.816 |
Only | +6.809 |
Neg logit contributions | |
blogs | -8.264 |
reading | -8.255 |
learning | -8.181 |
monitor | -8.035 |
thanking | -7.952 |
Token | , |
Token ID | 11 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
Percentage | +27.249 |
Millions | +26.070 |
Only | +25.483 |
Percent | +25.189 |
Killed | +24.618 |
Neg logit contributions | |
blogs | -21.143 |
reading | -20.201 |
learning | -19.887 |
monitor | -19.771 |
thanking | -19.364 |
Token | 000 |
Token ID | 830 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
Percentage | +2.741 |
Killed | +2.468 |
Worse | +2.455 |
Millions | +2.442 |
Only | +2.432 |
Neg logit contributions | |
learning | -2.704 |
blogs | -2.701 |
reading | -2.699 |
monitor | -2.660 |
thanking | -2.609 |
Token | Light |
Token ID | 4401 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
Percentage | +23.654 |
Millions | +22.331 |
Only | +22.073 |
Percent | +21.449 |
Killed | +21.368 |
Neg logit contributions | |
blogs | -21.570 |
reading | -20.698 |
monitor | -20.693 |
learning | -20.502 |
chatting | -20.044 |
Token | Years |
Token ID | 13212 |
Feature activation | +1.58e+01 |
Pos logit contributions | |
Percentage | +5.804 |
Millions | +4.749 |
Only | +4.474 |
Killed | +4.337 |
Percent | +4.311 |
Neg logit contributions | |
monitor | -23.813 |
learning | -23.599 |
reading | -23.372 |
chatting | -23.165 |
thanking | -23.138 |
Token | ) |
Token ID | 8 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
Percentage | +13.001 |
Only | +11.824 |
Millions | +11.442 |
Killed | +11.426 |
Worse | +11.426 |
Neg logit contributions | |
blogs | -16.681 |
learning | -16.490 |
reading | -16.371 |
monitor | -16.190 |
thanking | -16.009 |
Token | cannot |
Token ID | 2314 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
Percentage | +13.569 |
Only | +12.299 |
Worse | +12.097 |
Percent | +11.845 |
Millions | +11.799 |
Neg logit contributions | |
learning | -13.303 |
blogs | -13.096 |
reading | -12.827 |
monitor | -12.712 |
thanking | -12.418 |
Token | exceed |
Token ID | 7074 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
Percentage | +17.210 |
Only | +15.849 |
(- | +15.558 |
Approximately | +15.422 |
Worse | +15.384 |
Neg logit contributions | |
learning | -19.386 |
blogs | -18.488 |
reading | -18.485 |
reader | -17.965 |
thanking | -17.921 |
Token | $ |
Token ID | 720 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
Percentage | +23.352 |
Millions | +21.538 |
Thirty | +21.384 |
Approximately | +21.287 |
Percent | +21.265 |
Neg logit contributions | |
learning | -21.431 |
monitor | -21.145 |
blogs | -20.841 |
reading | -20.420 |
forums | -20.121 |
Token | 16 |
Token ID | 1433 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
Percentage | +17.793 |
Millions | +16.469 |
Only | +15.985 |
Worse | +15.666 |
Percent | +15.580 |
Neg logit contributions | |
chatting | -18.610 |
arranging | -18.295 |
learning | -18.285 |
workspace | -18.249 |
monitor | -18.167 |
Token | . |
Token ID | 13 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
Percentage | +25.234 |
Percent | +23.886 |
Only | +23.564 |
Worse | +23.058 |
Millions | +22.946 |
Neg logit contributions | |
reading | -19.752 |
learning | -19.056 |
blogs | -18.979 |
thanking | -18.933 |
monitor | -18.837 |
Token | 7 |
Token ID | 22 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
Percentage | +22.192 |
Only | +20.839 |
Millions | +20.470 |
Percent | +20.337 |
Worse | +20.151 |
Neg logit contributions | |
blogs | -23.061 |
learning | -22.899 |
chatting | -22.846 |
arranging | -22.525 |
reading | -22.520 |
Token | trillion |
Token ID | 12989 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
Percentage | +23.347 |
Percent | +22.142 |
Only | +21.727 |
Millions | +21.568 |
Worse | +20.968 |
Neg logit contributions | |
reading | -21.606 |
monitor | -21.582 |
learning | -21.542 |
thanking | -21.302 |
asking | -21.279 |
Token |
|
Token ID | 198 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
Percentage | +22.788 |
Only | +20.932 |
(- | +20.731 |
Worse | +20.720 |
Percent | +20.712 |
Neg logit contributions | |
blogs | -16.639 |
learning | -16.416 |
monitor | -16.398 |
reader | -16.213 |
reading | -16.119 |
Token |
|
Token ID | 198 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
reading | +7.653 |
learning | +7.593 |
blogs | +7.572 |
monitor | +7.534 |
thanking | +7.398 |
Neg logit contributions | |
Percentage | -3.623 |
Worse | -3.049 |
Killed | -3.030 |
Percent | -3.017 |
Millions | -2.909 |
Token | Tre |
Token ID | 31055 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
reading | +3.681 |
blogs | +3.659 |
learning | +3.655 |
monitor | +3.598 |
thanking | +3.445 |
Neg logit contributions | |
Percentage | -6.019 |
Killed | -5.556 |
Worse | -5.522 |
Percent | -5.466 |
Millions | -5.401 |
Token | asury |
Token ID | 11579 |
Feature activation | +8.22e+00 |
Pos logit contributions | |
Percentage | +1.491 |
Worse | +1.365 |
Killed | +1.365 |
Percent | +1.347 |
Millions | +1.345 |
Neg logit contributions | |
learning | -0.983 |
reading | -0.980 |
blogs | -0.976 |
monitor | -0.967 |
thanking | -0.943 |
Token | Debt |
Token ID | 30319 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
Percentage | +20.907 |
Percent | +18.930 |
Only | +18.372 |
Worse | +18.161 |
Millions | +18.104 |
Neg logit contributions | |
reading | -15.046 |
learning | -14.982 |
blogs | -14.904 |
monitor | -14.574 |
chatting | -14.468 |
Token | - |
Token ID | 12 |
Feature activation | +6.81e+00 |
Pos logit contributions | |
Percentage | +24.529 |
Percent | +22.585 |
Only | +21.757 |
Worse | +21.754 |
Millions | +21.428 |
Neg logit contributions | |
learning | -15.080 |
blogs | -14.947 |
reading | -14.898 |
chatting | -14.448 |
monitor | -14.363 |
Token | to |
Token ID | 1462 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
Percentage | +9.186 |
Percent | +8.403 |
Killed | +8.329 |
Worse | +8.326 |
Millions | +8.298 |
Neg logit contributions | |
blogs | -4.616 |
learning | -4.548 |
reading | -4.509 |
chatting | -4.485 |
thanking | -4.433 |
Token | - |
Token ID | 12 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
Percentage | +10.034 |
Percent | +8.849 |
Worse | +8.698 |
Killed | +8.689 |
Millions | +8.661 |
Neg logit contributions | |
blogs | -11.622 |
learning | -11.554 |
reading | -11.480 |
monitor | -11.402 |
chatting | -11.209 |
Token | G |
Token ID | 38 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
Percentage | +6.136 |
Killed | +5.560 |
Worse | +5.555 |
Millions | +5.554 |
Percent | +5.552 |
Neg logit contributions | |
blogs | -3.966 |
learning | -3.928 |
reading | -3.877 |
chatting | -3.847 |
monitor | -3.817 |
Token | DP |
Token ID | 6322 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
Percentage | +5.531 |
Only | +5.018 |
Percent | +5.004 |
Killed | +4.999 |
Worse | +4.970 |
Neg logit contributions | |
learning | -3.708 |
blogs | -3.669 |
reading | -3.592 |
monitor | -3.575 |
chatting | -3.514 |
Token | Ratio |
Token ID | 33956 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
Percentage | +31.060 |
Percent | +28.725 |
Only | +27.280 |
Millions | +27.267 |
Ratio | +27.255 |
Neg logit contributions | |
learning | -17.834 |
blogs | -17.804 |
reading | -17.231 |
forums | -16.894 |
chatting | -16.811 |
Token | 1 |
Token ID | 352 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
Percentage | +30.699 |
Percent | +28.373 |
Only | +27.531 |
Worse | +26.894 |
Average | +26.778 |
Neg logit contributions | |
learning | -17.416 |
blogs | -16.846 |
reading | -16.834 |
chatting | -16.386 |
forums | -16.353 |
Token | Mac |
Token ID | 4100 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
Percentage | +11.750 |
Only | +10.320 |
Percent | +10.319 |
Worse | +10.250 |
Killed | +10.175 |
Neg logit contributions | |
blogs | -13.115 |
learning | -13.097 |
reading | -13.085 |
monitor | -12.852 |
forums | -12.666 |
Token | ao |
Token ID | 5488 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
Percentage | +4.580 |
Killed | +4.154 |
Millions | +4.138 |
Only | +4.111 |
Percent | +4.106 |
Neg logit contributions | |
blogs | -3.934 |
learning | -3.925 |
reading | -3.870 |
monitor | -3.818 |
thanking | -3.747 |
Token | SAR |
Token ID | 47341 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
Percentage | +21.626 |
Only | +19.590 |
Percent | +19.405 |
Worse | +19.329 |
Millions | +19.178 |
Neg logit contributions | |
blogs | -15.945 |
reading | -15.892 |
learning | -15.874 |
forums | -15.302 |
monitor | -15.284 |
Token | its |
Token ID | 663 |
Feature activation | +9.49e+00 |
Pos logit contributions | |
Percentage | +7.909 |
Millions | +7.249 |
Worse | +7.220 |
Killed | +7.196 |
Only | +7.144 |
Neg logit contributions | |
blogs | -6.605 |
learning | -6.589 |
monitor | -6.556 |
reading | -6.553 |
thanking | -6.347 |
Token | intellectual |
Token ID | 9028 |
Feature activation | +7.08e+00 |
Pos logit contributions | |
Percentage | +11.204 |
Killed | +10.393 |
Worse | +10.368 |
Millions | +10.320 |
Only | +10.275 |
Neg logit contributions | |
learning | -7.342 |
blogs | -7.336 |
monitor | -7.265 |
reading | -7.188 |
thanking | -7.039 |
Token | protagonists |
Token ID | 39558 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
Percentage | +8.530 |
Killed | +7.929 |
Worse | +7.859 |
Only | +7.841 |
Millions | +7.799 |
Neg logit contributions | |
learning | -5.569 |
blogs | -5.497 |
monitor | -5.410 |
reading | -5.366 |
thanking | -5.241 |
Token | would |
Token ID | 561 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
Percentage | +13.040 |
Killed | +12.028 |
Only | +11.991 |
Millions | +11.956 |
Worse | +11.942 |
Neg logit contributions | |
learning | -9.470 |
blogs | -9.401 |
monitor | -9.342 |
reading | -9.280 |
forums | -8.987 |
Token | not |
Token ID | 407 |
Feature activation | +2.22e+01 |
Pos logit contributions | |
Percentage | +18.832 |
Only | +18.103 |
Worse | +17.786 |
Killed | +17.659 |
Millions | +17.591 |
Neg logit contributions | |
learning | -13.839 |
blogs | -13.573 |
reading | -13.141 |
monitor | -12.956 |
reader | -12.824 |
Token | have |
Token ID | 423 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
Percentage | +21.786 |
Only | +21.185 |
Killed | +20.400 |
Worse | +20.336 |
Millions | +20.222 |
Neg logit contributions | |
blogs | -15.166 |
learning | -15.091 |
reading | -14.714 |
reader | -14.527 |
forums | -14.491 |
Token | had |
Token ID | 550 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
Percentage | +27.090 |
Killed | +26.512 |
Only | +25.331 |
Worse | +24.881 |
Millions | +24.864 |
Neg logit contributions | |
learning | -18.093 |
blogs | -17.465 |
reading | -17.390 |
forums | -17.188 |
monitor | -17.107 |
Token | a |
Token ID | 257 |
Feature activation | +2.00e+01 |
Pos logit contributions | |
Percentage | +24.994 |
Killed | +24.080 |
Worse | +23.609 |
Millions | +23.403 |
Only | +23.308 |
Neg logit contributions | |
learning | -15.467 |
monitor | -15.095 |
blogs | -15.028 |
reading | -14.916 |
forums | -14.723 |
Token | tangible |
Token ID | 24607 |
Feature activation | +2.39e+01 |
Pos logit contributions | |
Percentage | +21.582 |
Worse | +20.255 |
Killed | +20.110 |
Percent | +19.927 |
Millions | +19.846 |
Neg logit contributions | |
blogs | -13.142 |
monitor | -12.817 |
learning | -12.757 |
reading | -12.519 |
forums | -12.516 |
Token |
|
Token ID | 198 |
Feature activation | -6.44e+00 |
Pos logit contributions | |
Percentage | +24.420 |
Killed | +22.396 |
Only | +22.263 |
Percent | +22.249 |
Worse | +22.187 |
Neg logit contributions | |
blogs | -15.005 |
forums | -14.625 |
monitor | -14.408 |
learning | -14.323 |
reading | -13.911 |
Token |
|
Token ID | 198 |
Feature activation | -6.51e+00 |
Pos logit contributions | |
reading | +8.669 |
learning | +8.636 |
blogs | +8.572 |
monitor | +8.559 |
thanking | +8.393 |
Neg logit contributions | |
Percentage | -4.265 |
Worse | -3.595 |
Killed | -3.574 |
Percent | -3.564 |
サーティワン | -3.440 |
Token | Immigration |
Token ID | 18204 |
Feature activation | +1.44e+01 |
Pos logit contributions | |
Percentage | +8.253 |
Killed | +7.440 |
Percent | +7.406 |
Worse | +7.401 |
Only | +7.327 |
Neg logit contributions | |
reading | -8.185 |
learning | -8.171 |
monitor | -8.166 |
blogs | -8.118 |
chatting | -7.931 |
Token | P |
Token ID | 350 |
Feature activation | +7.48e+00 |
Pos logit contributions | |
Percentage | +15.241 |
Killed | +14.136 |
Worse | +14.120 |
Percent | +13.822 |
Only | +13.817 |
Neg logit contributions | |
learning | -12.158 |
reading | -11.948 |
monitor | -11.943 |
blogs | -11.883 |
reader | -11.655 |
Token | uts |
Token ID | 5500 |
Feature activation | +2.51e+01 |
Pos logit contributions | |
Percentage | +8.553 |
Millions | +8.015 |
Killed | +7.881 |
Worse | +7.873 |
Only | +7.828 |
Neg logit contributions | |
learning | -5.919 |
monitor | -5.879 |
chatting | -5.855 |
blogs | -5.844 |
reading | -5.717 |
Token | Half |
Token ID | 13139 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
Percentage | +23.957 |
Millions | +23.481 |
Worse | +22.921 |
Only | +22.780 |
Killed | +22.529 |
Neg logit contributions | |
monitor | -17.790 |
reading | -17.493 |
blogs | -17.466 |
reader | -17.094 |
learning | -16.936 |
Token | a |
Token ID | 257 |
Feature activation | +2.31e+01 |
Pos logit contributions | |
Percentage | +25.646 |
Millions | +24.077 |
Percent | +23.903 |
Worse | +23.513 |
Killed | +23.511 |
Neg logit contributions | |
blogs | -16.891 |
chatting | -16.626 |
thanking | -16.591 |
monitor | -16.428 |
learning | -16.307 |
Token | Million |
Token ID | 23425 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
Percentage | +21.623 |
Percent | +20.658 |
Millions | +20.359 |
Killed | +19.769 |
Worse | +19.498 |
Neg logit contributions | |
blogs | -18.490 |
reading | -17.919 |
learning | -17.864 |
monitor | -17.777 |
chatting | -17.760 |
Token | U |
Token ID | 471 |
Feature activation | +6.11e+00 |
Pos logit contributions | |
Percentage | +29.187 |
Millions | +28.146 |
Worse | +27.910 |
Percent | +27.818 |
Killed | +27.552 |
Neg logit contributions | |
monitor | -18.042 |
chatting | -17.766 |
blogs | -17.479 |
thanking | -17.287 |
workspace | -17.234 |
Token | . |
Token ID | 13 |
Feature activation | +6.88e+00 |
Pos logit contributions | |
Percentage | +5.506 |
Worse | +4.990 |
Killed | +4.910 |
Only | +4.848 |
Millions | +4.817 |
Neg logit contributions | |
learning | -6.623 |
blogs | -6.620 |
monitor | -6.592 |
chatting | -6.537 |
reading | -6.532 |
Token | S |
Token ID | 50 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
Percentage | +7.366 |
Killed | +6.729 |
Millions | +6.676 |
Only | +6.633 |
Worse | +6.616 |
Neg logit contributions | |
learning | -6.543 |
blogs | -6.510 |
monitor | -6.460 |
reading | -6.355 |
chatting | -6.331 |
Token | . |
Token ID | 13 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
Percentage | +13.504 |
Millions | +12.378 |
Percent | +12.309 |
Killed | +12.137 |
Worse | +11.983 |
Neg logit contributions | |
chatting | -16.998 |
thanking | -16.874 |
blogs | -16.792 |
monitor | -16.679 |
reading | -16.602 |
Token | Girls |
Token ID | 12002 |
Feature activation | +1.64e+01 |
Pos logit contributions | |
Percentage | +17.485 |
Millions | +16.384 |
Killed | +16.242 |
Percent | +16.140 |
Only | +15.944 |
Neg logit contributions | |
monitor | -17.848 |
chatting | -17.789 |
thanking | -17.655 |
learning | -17.587 |
blogs | -17.541 |
Token | national |
Token ID | 2260 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Percentage | +7.134 |
Only | +6.380 |
Millions | +6.374 |
Worse | +6.359 |
Percent | +6.310 |
Neg logit contributions | |
learning | -6.802 |
monitor | -6.732 |
reading | -6.716 |
blogs | -6.714 |
thanking | -6.484 |
Token | debt |
Token ID | 5057 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
learning | +1.183 |
reading | +1.180 |
blogs | +1.178 |
monitor | +1.165 |
thanking | +1.134 |
Neg logit contributions | |
Percentage | -1.712 |
Killed | -1.565 |
Worse | -1.563 |
Percent | -1.544 |
Millions | -1.541 |
Token | cannot |
Token ID | 2314 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
Percentage | +13.569 |
Only | +12.299 |
Worse | +12.097 |
Percent | +11.845 |
Millions | +11.799 |
Neg logit contributions | |
learning | -13.303 |
blogs | -13.096 |
reading | -12.827 |
monitor | -12.712 |
thanking | -12.418 |
Token | exceed |
Token ID | 7074 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
Percentage | +17.210 |
Only | +15.849 |
(- | +15.558 |
Approximately | +15.422 |
Worse | +15.384 |
Neg logit contributions | |
learning | -19.386 |
blogs | -18.488 |
reading | -18.485 |
reader | -17.965 |
thanking | -17.921 |
Token | $ |
Token ID | 720 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
Percentage | +23.352 |
Millions | +21.538 |
Thirty | +21.384 |
Approximately | +21.287 |
Percent | +21.265 |
Neg logit contributions | |
learning | -21.431 |
monitor | -21.145 |
blogs | -20.841 |
reading | -20.420 |
forums | -20.121 |
Token | 16 |
Token ID | 1433 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
Percentage | +17.793 |
Millions | +16.469 |
Only | +15.985 |
Worse | +15.666 |
Percent | +15.580 |
Neg logit contributions | |
chatting | -18.610 |
arranging | -18.295 |
learning | -18.285 |
workspace | -18.249 |
monitor | -18.167 |
Token | . |
Token ID | 13 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
Percentage | +25.234 |
Percent | +23.886 |
Only | +23.564 |
Worse | +23.058 |
Millions | +22.946 |
Neg logit contributions | |
reading | -19.752 |
learning | -19.056 |
blogs | -18.979 |
thanking | -18.933 |
monitor | -18.837 |
Token | 7 |
Token ID | 22 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
Percentage | +22.192 |
Only | +20.839 |
Millions | +20.470 |
Percent | +20.337 |
Worse | +20.151 |
Neg logit contributions | |
blogs | -23.061 |
learning | -22.899 |
chatting | -22.846 |
arranging | -22.525 |
reading | -22.520 |
Token | trillion |
Token ID | 12989 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
Percentage | +23.347 |
Percent | +22.142 |
Only | +21.727 |
Millions | +21.568 |
Worse | +20.968 |
Neg logit contributions | |
reading | -21.606 |
monitor | -21.582 |
learning | -21.542 |
thanking | -21.302 |
asking | -21.279 |
Token |
|
Token ID | 198 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
Percentage | +22.788 |
Only | +20.932 |
(- | +20.731 |
Worse | +20.720 |
Percent | +20.712 |
Neg logit contributions | |
blogs | -16.639 |
learning | -16.416 |
monitor | -16.398 |
reader | -16.213 |
reading | -16.119 |
Token |
|
Token ID | 198 |
Feature activation | -4.75e+00 |
Pos logit contributions | |
reading | +7.653 |
learning | +7.593 |
blogs | +7.572 |
monitor | +7.534 |
thanking | +7.398 |
Neg logit contributions | |
Percentage | -3.623 |
Worse | -3.049 |
Killed | -3.030 |
Percent | -3.017 |
Millions | -2.909 |
Token | Greenland |
Token ID | 30155 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
Percentage | +5.150 |
Killed | +4.638 |
Worse | +4.617 |
Only | +4.616 |
Millions | +4.599 |
Neg logit contributions | |
reading | -4.446 |
learning | -4.427 |
blogs | -4.376 |
monitor | -4.344 |
reader | -4.212 |
Token | has |
Token ID | 468 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
Percentage | +10.273 |
Only | +9.090 |
Killed | +9.086 |
Millions | +8.980 |
Percent | +8.977 |
Neg logit contributions | |
learning | -10.175 |
reading | -10.148 |
blogs | -9.932 |
monitor | -9.925 |
thanking | -9.803 |
Token | lost |
Token ID | 2626 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
Percentage | +18.810 |
Killed | +17.337 |
Only | +17.188 |
Millions | +16.874 |
(- | +16.289 |
Neg logit contributions | |
learning | -16.500 |
reading | -16.412 |
forums | -15.742 |
reader | -15.706 |
blogs | -15.633 |
Token | some |
Token ID | 617 |
Feature activation | +2.08e+01 |
Pos logit contributions | |
Percentage | +20.635 |
Millions | +19.098 |
Only | +19.045 |
(- | +18.614 |
Approximately | +18.320 |
Neg logit contributions | |
learning | -18.211 |
reading | -17.850 |
monitor | -17.435 |
forums | -17.324 |
blogs | -17.116 |
Token | 7 |
Token ID | 767 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
Percentage | +19.258 |
Only | +17.197 |
Millions | +17.165 |
Percent | +17.116 |
(- | +16.900 |
Neg logit contributions | |
learning | -17.019 |
reading | -16.575 |
blogs | -16.319 |
monitor | -16.220 |
forums | -16.047 |
Token | 39 |
Token ID | 2670 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
Percentage | +24.462 |
Percent | +23.005 |
Millions | +22.468 |
Killed | +21.698 |
Only | +21.482 |
Neg logit contributions | |
learning | -18.647 |
reading | -18.354 |
blogs | -18.126 |
monitor | -17.960 |
reader | -17.828 |
Token | gig |
Token ID | 12526 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
Percentage | +26.972 |
Millions | +25.468 |
Percent | +25.308 |
Killed | +25.136 |
Only | +24.436 |
Neg logit contributions | |
learning | -17.861 |
reading | -17.354 |
thanking | -16.682 |
reader | -16.530 |
monitor | -16.520 |
Token | at |
Token ID | 265 |
Feature activation | +7.23e+00 |
Pos logit contributions | |
Percentage | +20.009 |
Millions | +19.113 |
Percent | +18.683 |
Only | +18.519 |
Worse | +18.126 |
Neg logit contributions | |
monitor | -14.761 |
reading | -14.736 |
learning | -14.686 |
thanking | -14.647 |
blogs | -14.367 |
Token | ons |
Token ID | 684 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
Percentage | +7.351 |
Killed | +6.580 |
Worse | +6.574 |
Percent | +6.553 |
Millions | +6.497 |
Neg logit contributions | |
blogs | -6.926 |
learning | -6.924 |
monitor | -6.845 |
reading | -6.840 |
chatting | -6.818 |
Token | of |
Token ID | 286 |
Feature activation | +1.70e+01 |
Pos logit contributions | |
Percentage | +18.312 |
(- | +16.603 |
Percent | +16.475 |
Killed | +16.279 |
Only | +16.218 |
Neg logit contributions | |
blogs | -16.558 |
learning | -16.353 |
monitor | -16.044 |
reading | -16.044 |
forums | -15.832 |
Token | ice |
Token ID | 4771 |
Feature activation | +7.60e+00 |
Pos logit contributions | |
Percentage | +15.053 |
Only | +13.768 |
(- | +13.571 |
Killed | +13.550 |
Millions | +13.402 |
Neg logit contributions | |
learning | -15.476 |
reading | -15.363 |
blogs | -15.342 |
monitor | -15.117 |
forums | -14.954 |
Token | ) |
Token ID | 8 |
Feature activation | +7.34e+00 |
Pos logit contributions | |
Percentage | +6.638 |
Killed | +5.752 |
Worse | +5.712 |
Only | +5.709 |
Millions | +5.636 |
Neg logit contributions | |
learning | -11.030 |
blogs | -10.979 |
reading | -10.947 |
monitor | -10.926 |
thanking | -10.734 |
Token |
|
Token ID | 198 |
Feature activation | -7.40e+00 |
Pos logit contributions | |
Percentage | +4.878 |
Killed | +4.156 |
Worse | +4.151 |
Only | +4.081 |
Millions | +4.062 |
Neg logit contributions | |
learning | -9.908 |
reading | -9.870 |
blogs | -9.847 |
monitor | -9.815 |
thanking | -9.667 |
Token |
|
Token ID | 198 |
Feature activation | -2.08e+00 |
Pos logit contributions | |
reading | +9.661 |
learning | +9.560 |
blogs | +9.536 |
monitor | +9.483 |
via | +9.284 |
Neg logit contributions | |
Percentage | -5.054 |
サーティワン | -4.317 |
Worse | -4.298 |
Percent | -4.278 |
Killed | -4.247 |
Token | Can |
Token ID | 6090 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
reading | +1.580 |
learning | +1.579 |
blogs | +1.574 |
monitor | +1.555 |
thanking | +1.502 |
Neg logit contributions | |
Percentage | -2.687 |
Killed | -2.472 |
Worse | -2.469 |
Percent | -2.439 |
Millions | -2.432 |
Token | 4 |
Token ID | 604 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
Percentage | +20.805 |
Only | +19.507 |
Worse | +19.479 |
Millions | +19.415 |
Percent | +19.107 |
Neg logit contributions | |
monitor | -14.239 |
thanking | -14.056 |
reading | -14.033 |
blogs | -14.003 |
learning | -13.791 |
Token | % |
Token ID | 4 |
Feature activation | +3.01e+01 |
Pos logit contributions | |
Percentage | +22.846 |
Percent | +21.849 |
Millions | +21.223 |
Worse | +21.014 |
Killed | +20.819 |
Neg logit contributions | |
monitor | -14.252 |
blogs | -14.215 |
thanking | -14.149 |
chatting | -14.142 |
learning | -14.054 |
Token | of |
Token ID | 286 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
Percentage | +28.835 |
Percent | +27.213 |
Worse | +27.092 |
Only | +26.704 |
Millions | +26.240 |
Neg logit contributions | |
blogs | -18.577 |
learning | -18.391 |
monitor | -18.156 |
chatting | -18.035 |
reading | -17.824 |
Token | Home |
Token ID | 5995 |
Feature activation | +9.97e+00 |
Pos logit contributions | |
Percentage | +23.349 |
Millions | +21.612 |
Only | +21.482 |
Percent | +21.427 |
Worse | +21.325 |
Neg logit contributions | |
monitor | -18.260 |
blogs | -18.181 |
reading | -18.170 |
learning | -18.112 |
chatting | -17.438 |
Token | owners |
Token ID | 15605 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
Percentage | +12.235 |
Worse | +11.200 |
Percent | +11.151 |
Only | +11.106 |
Killed | +11.102 |
Neg logit contributions | |
learning | -7.777 |
reading | -7.706 |
blogs | -7.655 |
thanking | -7.552 |
monitor | -7.548 |
Token | S |
Token ID | 311 |
Feature activation | +8.72e+00 |
Pos logit contributions | |
Percentage | +23.640 |
Only | +22.439 |
Worse | +22.370 |
Killed | +22.017 |
Percent | +21.853 |
Neg logit contributions | |
learning | -17.124 |
blogs | -16.843 |
reading | -16.797 |
thanking | -16.618 |
chatting | -16.390 |
Token | ink |
Token ID | 676 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
Percentage | +9.171 |
Millions | +8.389 |
Worse | +8.375 |
Only | +8.358 |
Killed | +8.280 |
Neg logit contributions | |
learning | -8.064 |
blogs | -8.021 |
chatting | -7.888 |
thanking | -7.883 |
reading | -7.807 |
Token | cannot |
Token ID | 2314 |
Feature activation | +1.75e+01 |
Pos logit contributions | |
Percentage | +18.976 |
Worse | +17.609 |
Only | +17.545 |
(- | +17.384 |
Likely | +17.130 |
Neg logit contributions | |
learning | -14.333 |
monitor | -14.042 |
blogs | -13.989 |
reading | -13.919 |
reader | -13.653 |
Token | much |
Token ID | 881 |
Feature activation | +1.50e+01 |
Pos logit contributions | |
Percentage | +16.394 |
Only | +15.138 |
Worse | +15.127 |
(- | +15.092 |
Likely | +14.725 |
Neg logit contributions | |
learning | -14.566 |
blogs | -14.492 |
reading | -14.276 |
thanking | -14.107 |
reader | -13.919 |
Token | exceed |
Token ID | 7074 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
Percentage | +15.197 |
Worse | +14.305 |
Only | +13.733 |
Likely | +13.704 |
(- | +13.655 |
Neg logit contributions | |
learning | -12.073 |
blogs | -12.064 |
reading | -11.746 |
forums | -11.591 |
thanking | -11.556 |
Token | 1 |
Token ID | 352 |
Feature activation | +2.06e+01 |
Pos logit contributions | |
Percentage | +22.833 |
(- | +21.510 |
Likely | +21.015 |
Only | +20.910 |
Percent | +20.620 |
Neg logit contributions | |
learning | -16.259 |
blogs | -16.085 |
reading | -16.083 |
reader | -15.656 |
monitor | -15.629 |
Token | . |
Token ID | 13 |
Feature activation | +2.32e+01 |
Pos logit contributions | |
Percentage | +19.716 |
Percent | +18.282 |
Killed | +17.774 |
Worse | +17.710 |
Millions | +17.610 |
Neg logit contributions | |
learning | -15.523 |
blogs | -15.490 |
thanking | -15.408 |
reading | -15.353 |
chatting | -15.068 |
Token | 2 |
Token ID | 17 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
Percentage | +20.489 |
Only | +19.076 |
Worse | +19.033 |
Killed | +18.501 |
Percent | +18.414 |
Neg logit contributions | |
blogs | -18.775 |
learning | -18.742 |
reading | -18.635 |
chatting | -18.582 |
thanking | -18.514 |
Token | K |
Token ID | 509 |
Feature activation | +1.79e+01 |
Pos logit contributions | |
Percentage | +26.593 |
Percent | +24.672 |
Worse | +24.091 |
Killed | +24.079 |
(- | +24.034 |
Neg logit contributions | |
learning | -18.271 |
reading | -18.156 |
monitor | -17.733 |
blogs | -17.710 |
reader | -17.648 |
Token | . |
Token ID | 13 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
Percentage | +18.934 |
Only | +17.277 |
(- | +17.185 |
Worse | +17.167 |
Percent | +17.137 |
Neg logit contributions | |
learning | -12.885 |
reading | -12.800 |
blogs | -12.677 |
reader | -12.549 |
monitor | -12.410 |
Token |
|
Token ID | 198 |
Feature activation | -5.40e+00 |
Pos logit contributions | |
Percentage | +19.008 |
Worse | +17.935 |
Only | +17.865 |
Millions | +17.378 |
Killed | +16.884 |
Neg logit contributions | |
learning | -17.155 |
monitor | -16.956 |
blogs | -16.937 |
reading | -16.706 |
chatting | -16.557 |
Token |
|
Token ID | 198 |
Feature activation | -6.89e+00 |
Pos logit contributions | |
reading | +7.416 |
learning | +7.365 |
blogs | +7.335 |
monitor | +7.294 |
thanking | +7.180 |
Neg logit contributions | |
Percentage | -3.510 |
Killed | -2.944 |
Worse | -2.929 |
Percent | -2.919 |
Millions | -2.825 |
Token | S |
Token ID | 50 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
reading | +5.261 |
learning | +5.209 |
blogs | +5.188 |
monitor | +5.132 |
reader | +4.905 |
Neg logit contributions | |
Percentage | -8.750 |
Killed | -8.088 |
Worse | -7.974 |
Percent | -7.962 |
Millions | -7.864 |
Token | - |
Token ID | 12 |
Feature activation | +6.81e+00 |
Pos logit contributions | |
Percentage | +24.529 |
Percent | +22.585 |
Only | +21.757 |
Worse | +21.754 |
Millions | +21.428 |
Neg logit contributions | |
learning | -15.080 |
blogs | -14.947 |
reading | -14.898 |
chatting | -14.448 |
monitor | -14.363 |
Token | to |
Token ID | 1462 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
Percentage | +9.186 |
Percent | +8.403 |
Killed | +8.329 |
Worse | +8.326 |
Millions | +8.298 |
Neg logit contributions | |
blogs | -4.616 |
learning | -4.548 |
reading | -4.509 |
chatting | -4.485 |
thanking | -4.433 |
Token | - |
Token ID | 12 |
Feature activation | +4.97e+00 |
Pos logit contributions | |
Percentage | +10.034 |
Percent | +8.849 |
Worse | +8.698 |
Killed | +8.689 |
Millions | +8.661 |
Neg logit contributions | |
blogs | -11.622 |
learning | -11.554 |
reading | -11.480 |
monitor | -11.402 |
chatting | -11.209 |
Token | G |
Token ID | 38 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
Percentage | +6.136 |
Killed | +5.560 |
Worse | +5.555 |
Millions | +5.554 |
Percent | +5.552 |
Neg logit contributions | |
blogs | -3.966 |
learning | -3.928 |
reading | -3.877 |
chatting | -3.847 |
monitor | -3.817 |
Token | DP |
Token ID | 6322 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
Percentage | +5.531 |
Only | +5.018 |
Percent | +5.004 |
Killed | +4.999 |
Worse | +4.970 |
Neg logit contributions | |
learning | -3.708 |
blogs | -3.669 |
reading | -3.592 |
monitor | -3.575 |
chatting | -3.514 |
Token | Ratio |
Token ID | 33956 |
Feature activation | +2.99e+01 |
Pos logit contributions | |
Percentage | +31.060 |
Percent | +28.725 |
Only | +27.280 |
Millions | +27.267 |
Ratio | +27.255 |
Neg logit contributions | |
learning | -17.834 |
blogs | -17.804 |
reading | -17.231 |
forums | -16.894 |
chatting | -16.811 |
Token | 1 |
Token ID | 352 |
Feature activation | +1.28e+01 |
Pos logit contributions | |
Percentage | +30.699 |
Percent | +28.373 |
Only | +27.531 |
Worse | +26.894 |
Average | +26.778 |
Neg logit contributions | |
learning | -17.416 |
blogs | -16.846 |
reading | -16.834 |
chatting | -16.386 |
forums | -16.353 |
Token | Mac |
Token ID | 4100 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
Percentage | +11.750 |
Only | +10.320 |
Percent | +10.319 |
Worse | +10.250 |
Killed | +10.175 |
Neg logit contributions | |
blogs | -13.115 |
learning | -13.097 |
reading | -13.085 |
monitor | -12.852 |
forums | -12.666 |
Token | ao |
Token ID | 5488 |
Feature activation | +2.10e+01 |
Pos logit contributions | |
Percentage | +4.580 |
Killed | +4.154 |
Millions | +4.138 |
Only | +4.111 |
Percent | +4.106 |
Neg logit contributions | |
blogs | -3.934 |
learning | -3.925 |
reading | -3.870 |
monitor | -3.818 |
thanking | -3.747 |
Token | SAR |
Token ID | 47341 |
Feature activation | +2.21e+01 |
Pos logit contributions | |
Percentage | +21.626 |
Only | +19.590 |
Percent | +19.405 |
Worse | +19.329 |
Millions | +19.178 |
Neg logit contributions | |
blogs | -15.945 |
reading | -15.892 |
learning | -15.874 |
forums | -15.302 |
monitor | -15.284 |
Token | 0 |
Token ID | 657 |
Feature activation | +2.29e+01 |
Pos logit contributions | |
Percentage | +23.073 |
Only | +20.987 |
Percent | +20.708 |
Millions | +20.669 |
Worse | +20.565 |
Neg logit contributions | |
blogs | -15.762 |
reading | -15.701 |
learning | -15.672 |
monitor | -15.082 |
forums | -14.965 |
Token |
|
Token ID | 198 |
Feature activation | -8.15e+00 |
Pos logit contributions | |
Percentage | +9.876 |
Worse | +8.821 |
Killed | +8.821 |
Only | +8.785 |
Millions | +8.768 |
Neg logit contributions | |
learning | -11.065 |
monitor | -10.971 |
reading | -10.967 |
blogs | -10.836 |
chatting | -10.667 |
Token |
|
Token ID | 198 |
Feature activation | -6.47e+00 |
Pos logit contributions | |
reading | +10.516 |
blogs | +10.383 |
learning | +10.368 |
monitor | +10.295 |
via | +10.168 |
Neg logit contributions | |
Percentage | -5.571 |
サーティワン | -4.795 |
Worse | -4.738 |
Percent | -4.707 |
Killed | -4.704 |
Token | Will |
Token ID | 8743 |
Feature activation | +1.80e+01 |
Pos logit contributions | |
reading | +5.209 |
blogs | +5.207 |
learning | +5.164 |
monitor | +5.106 |
reader | +4.887 |
Neg logit contributions | |
Percentage | -7.921 |
Killed | -7.268 |
Worse | -7.244 |
Percent | -7.157 |
Millions | -7.094 |
Token | Del |
Token ID | 4216 |
Feature activation | +6.01e+00 |
Pos logit contributions | |
Percentage | +20.326 |
Worse | +19.223 |
Only | +19.036 |
Millions | +18.894 |
Killed | +18.830 |
Neg logit contributions | |
monitor | -11.617 |
learning | -11.580 |
reading | -11.567 |
blogs | -11.498 |
thanking | -11.345 |
Token | inqu |
Token ID | 18934 |
Feature activation | +7.11e+00 |
Pos logit contributions | |
Percentage | +7.279 |
Worse | +6.698 |
Killed | +6.658 |
Millions | +6.617 |
Only | +6.603 |
Neg logit contributions | |
blogs | -4.776 |
reading | -4.699 |
learning | -4.687 |
monitor | -4.655 |
thanking | -4.606 |
Token | encies |
Token ID | 3976 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
Percentage | +7.991 |
Killed | +7.338 |
Worse | +7.269 |
Percent | +7.238 |
Only | +7.233 |
Neg logit contributions | |
learning | -6.123 |
blogs | -6.090 |
reading | -6.032 |
monitor | -6.002 |
thanking | -5.969 |
Token | Trigger |
Token ID | 24593 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
Percentage | +27.720 |
Worse | +26.923 |
Only | +26.731 |
Killed | +26.473 |
Millions | +25.760 |
Neg logit contributions | |
learning | -18.440 |
blogs | -18.240 |
chatting | -17.465 |
monitor | -17.380 |
reader | -17.289 |
Token | a |
Token ID | 257 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
Percentage | +25.159 |
Worse | +24.204 |
Millions | +23.796 |
Only | +23.419 |
Percent | +23.329 |
Neg logit contributions | |
monitor | -17.311 |
chatting | -17.055 |
blogs | -16.965 |
thanking | -16.906 |
reading | -16.884 |
Token | New |
Token ID | 968 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
Percentage | +15.500 |
Worse | +14.200 |
Millions | +14.032 |
Percent | +13.915 |
Killed | +13.779 |
Neg logit contributions | |
blogs | -16.811 |
monitor | -16.809 |
learning | -16.566 |
reading | -16.515 |
chatting | -16.336 |
Token | American |
Token ID | 1605 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
Percentage | +16.747 |
Millions | +15.213 |
Worse | +15.131 |
Percent | +15.024 |
Only | +14.992 |
Neg logit contributions | |
monitor | -17.224 |
blogs | -17.130 |
thanking | -16.976 |
learning | -16.933 |
chatting | -16.807 |
Token | Revolution |
Token ID | 9303 |
Feature activation | +1.83e+01 |
Pos logit contributions | |
Percentage | +12.871 |
Worse | +11.508 |
Percent | +11.402 |
Millions | +11.391 |
Killed | +11.307 |
Neg logit contributions | |
monitor | -16.506 |
blogs | -16.442 |
learning | -16.228 |
reading | -16.177 |
thanking | -16.077 |
Token | Gross |
Token ID | 21796 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
Percentage | +10.549 |
Percent | +9.414 |
Only | +9.347 |
Millions | +9.310 |
Killed | +9.299 |
Neg logit contributions | |
blogs | -8.927 |
learning | -8.787 |
monitor | -8.616 |
reading | -8.545 |
forums | -8.461 |
Token | National |
Token ID | 2351 |
Feature activation | +6.65e+00 |
Pos logit contributions | |
Percentage | +12.067 |
Millions | +10.589 |
Only | +10.576 |
Percent | +10.549 |
Killed | +10.217 |
Neg logit contributions | |
blogs | -17.460 |
learning | -17.352 |
monitor | -16.859 |
reading | -16.836 |
thanking | -16.765 |
Token | Product |
Token ID | 8721 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
Percentage | +3.971 |
Killed | +3.232 |
Millions | +3.169 |
Only | +3.131 |
Worse | +3.126 |
Neg logit contributions | |
blogs | -9.827 |
learning | -9.726 |
reading | -9.654 |
monitor | -9.550 |
thanking | -9.517 |
Token | of |
Token ID | 286 |
Feature activation | +1.95e+01 |
Pos logit contributions | |
Percentage | +21.273 |
Percent | +19.166 |
Only | +18.839 |
(- | +18.694 |
Millions | +18.675 |
Neg logit contributions | |
blogs | -16.609 |
learning | -16.340 |
forums | -15.683 |
monitor | -15.431 |
reading | -15.297 |
Token | $ |
Token ID | 720 |
Feature activation | +1.87e+01 |
Pos logit contributions | |
Percentage | +18.210 |
Only | +17.144 |
Millions | +16.995 |
Approximately | +16.722 |
Worse | +16.349 |
Neg logit contributions | |
blogs | -16.390 |
learning | -16.248 |
reading | -16.097 |
monitor | -15.970 |
forums | -15.709 |
Token | 20 |
Token ID | 1238 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
Percentage | +16.807 |
Millions | +15.459 |
Only | +15.257 |
Worse | +14.954 |
Killed | +14.928 |
Neg logit contributions | |
learning | -16.095 |
blogs | -16.078 |
reading | -16.048 |
monitor | -15.844 |
chatting | -15.713 |
Token | billion |
Token ID | 2997 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
Percentage | +26.772 |
Millions | +25.283 |
Percent | +24.770 |
Only | +24.732 |
Worse | +23.969 |
Neg logit contributions | |
reading | -18.645 |
blogs | -18.325 |
learning | -17.939 |
monitor | -17.713 |
reader | -17.271 |
Token | , |
Token ID | 11 |
Feature activation | +6.55e+00 |
Pos logit contributions | |
Percentage | +22.481 |
Millions | +20.354 |
Only | +20.350 |
(- | +20.334 |
Percent | +20.258 |
Neg logit contributions | |
blogs | -16.184 |
reading | -15.612 |
learning | -15.594 |
monitor | -15.546 |
reader | -15.036 |
Token | more |
Token ID | 517 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
Percentage | +6.636 |
Killed | +5.916 |
Millions | +5.887 |
Only | +5.886 |
Worse | +5.869 |
Neg logit contributions | |
learning | -6.615 |
reading | -6.575 |
blogs | -6.575 |
monitor | -6.522 |
thanking | -6.308 |
Token | than |
Token ID | 621 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
Percentage | +12.876 |
Millions | +11.804 |
Percent | +11.497 |
Killed | +11.490 |
Only | +11.482 |
Neg logit contributions | |
learning | -11.510 |
blogs | -11.373 |
reading | -11.266 |
monitor | -10.977 |
forums | -10.698 |
Token | half |
Token ID | 2063 |
Feature activation | +2.16e+01 |
Pos logit contributions | |
Percentage | +18.879 |
Killed | +17.087 |
Twice | +16.873 |
Millions | +16.758 |
Only | +16.607 |
Neg logit contributions | |
learning | -18.088 |
blogs | -18.036 |
reading | -17.662 |
forums | -17.627 |
monitor | -17.459 |
Token | , |
Token ID | 11 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
Percentage | +10.359 |
Only | +9.335 |
Worse | +9.194 |
Killed | +9.167 |
Percent | +9.116 |
Neg logit contributions | |
blogs | -11.275 |
learning | -11.185 |
monitor | -11.149 |
reading | -11.091 |
forums | -10.837 |
Token | the |
Token ID | 262 |
Feature activation | +6.90e+00 |
Pos logit contributions | |
Percentage | +3.295 |
Worse | +2.961 |
Killed | +2.954 |
Only | +2.952 |
Millions | +2.940 |
Neg logit contributions | |
learning | -3.060 |
reading | -3.055 |
monitor | -3.047 |
blogs | -3.040 |
thanking | -2.913 |
Token | national |
Token ID | 2260 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Percentage | +7.134 |
Only | +6.380 |
Millions | +6.374 |
Worse | +6.359 |
Percent | +6.310 |
Neg logit contributions | |
learning | -6.802 |
monitor | -6.732 |
reading | -6.716 |
blogs | -6.714 |
thanking | -6.484 |
Token | debt |
Token ID | 5057 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
learning | +1.183 |
reading | +1.180 |
blogs | +1.178 |
monitor | +1.165 |
thanking | +1.134 |
Neg logit contributions | |
Percentage | -1.712 |
Killed | -1.565 |
Worse | -1.563 |
Percent | -1.544 |
Millions | -1.541 |
Token | cannot |
Token ID | 2314 |
Feature activation | +2.15e+01 |
Pos logit contributions | |
Percentage | +13.569 |
Only | +12.299 |
Worse | +12.097 |
Percent | +11.845 |
Millions | +11.799 |
Neg logit contributions | |
learning | -13.303 |
blogs | -13.096 |
reading | -12.827 |
monitor | -12.712 |
thanking | -12.418 |
Token | exceed |
Token ID | 7074 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
Percentage | +17.210 |
Only | +15.849 |
(- | +15.558 |
Approximately | +15.422 |
Worse | +15.384 |
Neg logit contributions | |
learning | -19.386 |
blogs | -18.488 |
reading | -18.485 |
reader | -17.965 |
thanking | -17.921 |
Token | $ |
Token ID | 720 |
Feature activation | +2.14e+01 |
Pos logit contributions | |
Percentage | +23.352 |
Millions | +21.538 |
Thirty | +21.384 |
Approximately | +21.287 |
Percent | +21.265 |
Neg logit contributions | |
learning | -21.431 |
monitor | -21.145 |
blogs | -20.841 |
reading | -20.420 |
forums | -20.121 |
Token | 16 |
Token ID | 1433 |
Feature activation | +3.03e+01 |
Pos logit contributions | |
Percentage | +17.793 |
Millions | +16.469 |
Only | +15.985 |
Worse | +15.666 |
Percent | +15.580 |
Neg logit contributions | |
chatting | -18.610 |
arranging | -18.295 |
learning | -18.285 |
workspace | -18.249 |
monitor | -18.167 |
Token | . |
Token ID | 13 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
Percentage | +25.234 |
Percent | +23.886 |
Only | +23.564 |
Worse | +23.058 |
Millions | +22.946 |
Neg logit contributions | |
reading | -19.752 |
learning | -19.056 |
blogs | -18.979 |
thanking | -18.933 |
monitor | -18.837 |
Token | 7 |
Token ID | 22 |
Feature activation | +3.12e+01 |
Pos logit contributions | |
Percentage | +22.192 |
Only | +20.839 |
Millions | +20.470 |
Percent | +20.337 |
Worse | +20.151 |
Neg logit contributions | |
blogs | -23.061 |
learning | -22.899 |
chatting | -22.846 |
arranging | -22.525 |
reading | -22.520 |
Token | trillion |
Token ID | 12989 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
Percentage | +23.347 |
Percent | +22.142 |
Only | +21.727 |
Millions | +21.568 |
Worse | +20.968 |
Neg logit contributions | |
reading | -21.606 |
monitor | -21.582 |
learning | -21.542 |
thanking | -21.302 |
asking | -21.279 |
Token | a |
Token ID | 257 |
Feature activation | -2.59e+00 |
Pos logit contributions | |
Percentage | +1.322 |
Worse | +1.199 |
Killed | +1.197 |
Millions | +1.183 |
Only | +1.175 |
Neg logit contributions | |
reading | -1.233 |
learning | -1.230 |
blogs | -1.222 |
monitor | -1.205 |
thanking | -1.191 |
Token | 2007 |
Token ID | 4343 |
Feature activation | +7.26e+00 |
Pos logit contributions | |
learning | +2.708 |
reading | +2.705 |
blogs | +2.697 |
monitor | +2.682 |
thanking | +2.617 |
Neg logit contributions | |
Percentage | -2.588 |
Killed | -2.321 |
Worse | -2.314 |
Percent | -2.281 |
Millions | -2.271 |
Token | World |
Token ID | 2159 |
Feature activation | +6.62e+00 |
Pos logit contributions | |
Percentage | +9.290 |
Worse | +8.577 |
Millions | +8.530 |
Percent | +8.482 |
Killed | +8.480 |
Neg logit contributions | |
blogs | -5.211 |
learning | -5.181 |
reading | -5.156 |
thanking | -5.053 |
reader | -5.006 |
Token | Bank |
Token ID | 5018 |
Feature activation | +4.81e-01 |
Pos logit contributions | |
Percentage | +3.778 |
Worse | +3.155 |
Killed | +3.154 |
Millions | +3.124 |
Only | +3.057 |
Neg logit contributions | |
reading | -9.586 |
learning | -9.583 |
blogs | -9.528 |
thanking | -9.421 |
chatting | -9.280 |
Token | study |
Token ID | 2050 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
Percentage | +0.659 |
Worse | +0.609 |
Killed | +0.608 |
Percent | +0.602 |
Millions | +0.602 |
Neg logit contributions | |
learning | -0.329 |
blogs | -0.329 |
reading | -0.329 |
monitor | -0.321 |
thanking | -0.313 |
Token | . |
Token ID | 13 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
Percentage | +0.123 |
Killed | +0.110 |
Worse | +0.110 |
Percent | +0.108 |
Millions | +0.108 |
Neg logit contributions | |
learning | -0.137 |
reading | -0.137 |
blogs | -0.137 |
monitor | -0.136 |
thanking | -0.133 |
Token |
|
Token ID | 198 |
Feature activation | -5.03e+00 |
Pos logit contributions | |
Percentage | +26.396 |
Millions | +25.758 |
Worse | +25.433 |
Only | +25.393 |
Percent | +24.211 |
Neg logit contributions | |
learning | -20.338 |
chatting | -20.074 |
workspace | -20.035 |
brainstorm | -19.841 |
blogs | -19.822 |
Token |
|
Token ID | 198 |
Feature activation | -5.66e+00 |
Pos logit contributions | |
reading | +6.948 |
learning | +6.877 |
blogs | +6.851 |
monitor | +6.839 |
thanking | +6.694 |
Neg logit contributions | |
Percentage | -3.250 |
Worse | -2.724 |
Killed | -2.720 |
Percent | -2.700 |
Millions | -2.614 |
Token | Y |
Token ID | 56 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
reading | +4.411 |
blogs | +4.380 |
learning | +4.376 |
monitor | +4.370 |
thanking | +4.116 |
Neg logit contributions | |
Percentage | -7.104 |
Killed | -6.525 |
Worse | -6.466 |
Percent | -6.435 |
Millions | -6.334 |
Token | un |
Token ID | 403 |
Feature activation | +2.62e+00 |
Pos logit contributions | |
reading | +2.184 |
learning | +2.183 |
blogs | +2.176 |
monitor | +2.155 |
thanking | +2.101 |
Neg logit contributions | |
Percentage | -2.842 |
Killed | -2.588 |
Worse | -2.586 |
Percent | -2.550 |
Millions | -2.546 |
Token | Ya |
Token ID | 26421 |
Feature activation | +9.82e+00 |
Pos logit contributions | |
Percentage | +2.998 |
Killed | +2.736 |
Worse | +2.730 |
Percent | +2.691 |
Only | +2.689 |
Neg logit contributions | |
learning | -2.342 |
reading | -2.338 |
blogs | -2.334 |
monitor | -2.301 |
thanking | -2.256 |
Token | twitter |
Token ID | 17044 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
blogs | +8.756 |
reading | +8.599 |
learning | +8.520 |
monitor | +8.487 |
chatting | +8.456 |
Neg logit contributions | |
Percentage | -9.084 |
Worse | -8.256 |
Killed | -8.150 |
Percent | -8.023 |
Millions | -7.946 |
Token | and |
Token ID | 290 |
Feature activation | -2.85e+01 |
Pos logit contributions | |
blogs | +13.233 |
reading | +13.137 |
chatting | +12.870 |
monitor | +12.851 |
thanking | +12.841 |
Neg logit contributions | |
Percentage | -10.846 |
Worse | -9.696 |
Killed | -9.670 |
Percent | -9.431 |
Millions | -9.260 |
Token | social |
Token ID | 1919 |
Feature activation | -1.82e+01 |
Pos logit contributions | |
blogs | +26.441 |
chatting | +26.127 |
reading | +25.499 |
thanking | +25.440 |
forums | +25.306 |
Neg logit contributions | |
Percentage | -18.746 |
サーティワン | -16.272 |
Worse | -15.897 |
Killed | -15.235 |
Percent | -15.213 |
Token | media |
Token ID | 2056 |
Feature activation | -1.78e+01 |
Pos logit contributions | |
blogs | +16.395 |
reading | +16.000 |
chatting | +15.970 |
learning | +15.768 |
thanking | +15.718 |
Neg logit contributions | |
Percentage | -17.051 |
Worse | -15.211 |
Killed | -14.903 |
Percent | -14.637 |
Millions | -14.421 |
Token | pages |
Token ID | 5468 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
blogs | +17.600 |
chatting | +17.411 |
thanking | +17.198 |
reading | +17.092 |
monitor | +16.906 |
Neg logit contributions | |
Percentage | -14.909 |
Worse | -13.265 |
Killed | -13.206 |
Percent | -12.893 |
サーティワン | -12.749 |
Token | , |
Token ID | 11 |
Feature activation | -3.89e+01 |
Pos logit contributions | |
blogs | +15.496 |
reading | +15.385 |
monitor | +15.287 |
chatting | +15.284 |
thanking | +15.256 |
Neg logit contributions | |
Percentage | -11.442 |
Worse | -10.285 |
Killed | -10.275 |
Percent | -10.009 |
サーティワン | -9.787 |
Token | and |
Token ID | 290 |
Feature activation | -2.88e+01 |
Pos logit contributions | |
chatting | +32.363 |
blogs | +31.850 |
thanking | +31.717 |
reading | +31.119 |
brainstorm | +30.836 |
Neg logit contributions | |
Percentage | -20.244 |
サーティワン | -18.600 |
Worse | -17.954 |
Killed | -17.144 |
Percent | -17.140 |
Token | you |
Token ID | 345 |
Feature activation | -8.19e+00 |
Pos logit contributions | |
chatting | +26.211 |
brainstorm | +25.480 |
blogs | +25.420 |
reading | +25.253 |
thanking | +25.247 |
Neg logit contributions | |
Percentage | -18.929 |
サーティワン | -17.451 |
Worse | -16.624 |
Killed | -16.387 |
Percent | -15.793 |
Token | can |
Token ID | 460 |
Feature activation | -1.43e+01 |
Pos logit contributions | |
blogs | +7.630 |
learning | +7.489 |
reading | +7.465 |
monitor | +7.403 |
chatting | +7.267 |
Neg logit contributions | |
Percentage | -8.822 |
Worse | -8.016 |
Percent | -7.908 |
Killed | -7.878 |
Millions | -7.725 |
Token | get |
Token ID | 651 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
chatting | +12.370 |
monitor | +12.268 |
blogs | +12.251 |
reading | +12.199 |
learning | +12.025 |
Neg logit contributions | |
Percentage | -14.738 |
Worse | -13.428 |
Killed | -13.247 |
サーティワン | -13.063 |
Percent | -13.030 |
Token | a |
Token ID | 257 |
Feature activation | -1.53e+01 |
Pos logit contributions | |
chatting | +11.221 |
blogs | +10.969 |
reading | +10.911 |
learning | +10.796 |
thanking | +10.788 |
Neg logit contributions | |
Percentage | -11.186 |
Worse | -9.978 |
Percent | -9.912 |
Killed | -9.719 |
Only | -9.609 |
Token | motivated |
Token ID | 13338 |
Feature activation | -8.10e+00 |
Pos logit contributions | |
learning | +1.692 |
reading | +1.691 |
blogs | +1.687 |
monitor | +1.669 |
thanking | +1.623 |
Neg logit contributions | |
Percentage | -2.664 |
Worse | -2.444 |
Killed | -2.443 |
Percent | -2.414 |
Millions | -2.408 |
Token | to |
Token ID | 284 |
Feature activation | -1.29e+01 |
Pos logit contributions | |
learning | +8.077 |
reading | +8.013 |
blogs | +7.975 |
thanking | +7.884 |
monitor | +7.869 |
Neg logit contributions | |
Percentage | -8.066 |
Worse | -7.384 |
Killed | -7.304 |
Percent | -7.185 |
Millions | -7.165 |
Token | build |
Token ID | 1382 |
Feature activation | -8.06e+00 |
Pos logit contributions | |
monitor | +10.307 |
blogs | +10.291 |
learning | +10.252 |
chatting | +10.208 |
reading | +10.153 |
Neg logit contributions | |
Percentage | -14.095 |
Worse | -12.853 |
Killed | -12.727 |
Percent | -12.641 |
サーティワン | -12.581 |
Token | projects |
Token ID | 4493 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
blogs | +8.299 |
learning | +8.291 |
reading | +8.178 |
monitor | +8.138 |
thanking | +8.030 |
Neg logit contributions | |
Percentage | -7.801 |
Killed | -6.955 |
Worse | -6.946 |
Percent | -6.839 |
Millions | -6.775 |
Token | myself |
Token ID | 3589 |
Feature activation | -1.21e+01 |
Pos logit contributions | |
thanking | +13.244 |
blogs | +13.178 |
reading | +13.158 |
learning | +13.136 |
monitor | +13.033 |
Neg logit contributions | |
Percentage | -12.631 |
Worse | -11.416 |
Killed | -11.373 |
Percent | -11.150 |
Millions | -11.033 |
Token | , |
Token ID | 11 |
Feature activation | -3.70e+01 |
Pos logit contributions | |
learning | +13.714 |
blogs | +13.579 |
reading | +13.526 |
thanking | +13.511 |
monitor | +13.381 |
Neg logit contributions | |
Percentage | -9.601 |
Worse | -8.659 |
Killed | -8.540 |
Percent | -8.342 |
Millions | -8.295 |
Token | or |
Token ID | 393 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
thanking | +32.043 |
chatting | +31.779 |
learning | +31.492 |
researching | +31.443 |
blogs | +31.035 |
Neg logit contributions | |
Percentage | -18.414 |
サーティワン | -16.233 |
Worse | -16.156 |
Percent | -15.819 |
Killed | -15.765 |
Token | contribute |
Token ID | 8676 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
chatting | +19.529 |
blogs | +19.478 |
thanking | +19.234 |
learning | +19.189 |
monitor | +19.169 |
Neg logit contributions | |
Percentage | -16.017 |
Percent | -13.745 |
サーティワン | -13.668 |
Killed | -13.548 |
Worse | -13.342 |
Token | to |
Token ID | 284 |
Feature activation | -1.77e+01 |
Pos logit contributions | |
blogs | +11.640 |
learning | +11.623 |
reading | +11.586 |
thanking | +11.387 |
monitor | +11.379 |
Neg logit contributions | |
Percentage | -12.159 |
Worse | -11.011 |
Killed | -10.898 |
Percent | -10.815 |
Millions | -10.687 |
Token | big |
Token ID | 1263 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
blogs | +18.602 |
learning | +18.306 |
chatting | +17.926 |
reading | +17.899 |
monitor | +17.825 |
Neg logit contributions | |
Percentage | -13.696 |
Worse | -11.913 |
Killed | -11.824 |
Percent | -11.760 |
サーティワン | -11.489 |
Token | projects |
Token ID | 4493 |
Feature activation | -1.81e+01 |
Pos logit contributions | |
learning | +10.332 |
blogs | +10.305 |
reading | +10.132 |
monitor | +10.095 |
forums | +9.844 |
Neg logit contributions | |
Percentage | -10.528 |
Worse | -9.590 |
Killed | -9.525 |
Percent | -9.411 |
Millions | -9.305 |
Token | the |
Token ID | 262 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
blogs | +8.493 |
reading | +8.383 |
learning | +8.382 |
chatting | +8.350 |
monitor | +8.335 |
Neg logit contributions | |
Percentage | -7.424 |
Worse | -6.671 |
Killed | -6.657 |
Percent | -6.460 |
Millions | -6.403 |
Token | match |
Token ID | 2872 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
blogs | +8.338 |
reading | +8.267 |
learning | +8.230 |
monitor | +8.181 |
chatting | +8.157 |
Neg logit contributions | |
Percentage | -6.685 |
Killed | -5.970 |
Worse | -5.946 |
Percent | -5.757 |
Millions | -5.688 |
Token | from |
Token ID | 422 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
blogs | +14.073 |
monitor | +13.805 |
chatting | +13.741 |
learning | +13.691 |
reading | +13.684 |
Neg logit contributions | |
Percentage | -11.747 |
Killed | -10.599 |
Worse | -10.528 |
Percent | -10.351 |
Millions | -10.026 |
Token | your |
Token ID | 534 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
blogs | +13.239 |
learning | +13.125 |
reading | +13.056 |
monitor | +13.053 |
chatting | +13.040 |
Neg logit contributions | |
Percentage | -9.641 |
Worse | -8.388 |
Killed | -8.300 |
Percent | -8.137 |
Millions | -7.894 |
Token | couch |
Token ID | 18507 |
Feature activation | -1.64e+01 |
Pos logit contributions | |
blogs | +14.220 |
monitor | +14.214 |
reading | +14.163 |
chatting | +14.024 |
learning | +13.949 |
Neg logit contributions | |
Percentage | -11.550 |
Worse | -10.476 |
Percent | -10.213 |
Killed | -10.204 |
Millions | -9.801 |
Token | , |
Token ID | 11 |
Feature activation | -3.59e+01 |
Pos logit contributions | |
monitor | +18.189 |
reading | +18.054 |
chatting | +17.930 |
reader | +17.769 |
learning | +17.718 |
Neg logit contributions | |
Percentage | -11.875 |
Killed | -10.809 |
Worse | -10.666 |
Percent | -10.492 |
Millions | -10.190 |
Token | as |
Token ID | 355 |
Feature activation | -7.75e+00 |
Pos logit contributions | |
chatting | +32.499 |
thanking | +31.002 |
monitor | +30.948 |
reading | +30.827 |
blogs | +30.340 |
Neg logit contributions | |
Percentage | -18.638 |
Percent | -17.086 |
Worse | -16.563 |
サーティワン | -16.450 |
Killed | -16.449 |
Token | it |
Token ID | 340 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
blogs | +7.834 |
reading | +7.797 |
learning | +7.754 |
monitor | +7.739 |
chatting | +7.672 |
Neg logit contributions | |
Percentage | -7.612 |
Worse | -6.905 |
Killed | -6.857 |
Percent | -6.684 |
Millions | -6.580 |
Token | will |
Token ID | 481 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
Percentage | +1.706 |
Killed | +1.518 |
Worse | +1.509 |
Millions | +1.496 |
Only | +1.494 |
Neg logit contributions | |
learning | -1.993 |
reading | -1.983 |
blogs | -1.971 |
monitor | -1.960 |
thanking | -1.926 |
Token | be |
Token ID | 307 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
learning | +0.013 |
reading | +0.013 |
blogs | +0.013 |
monitor | +0.013 |
thanking | +0.013 |
Neg logit contributions | |
Percentage | -0.017 |
Killed | -0.015 |
Worse | -0.015 |
Millions | -0.015 |
Percent | -0.015 |
Token | broadcast |
Token ID | 7025 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
blogs | +2.366 |
reading | +2.364 |
learning | +2.363 |
monitor | +2.339 |
thanking | +2.295 |
Neg logit contributions | |
Percentage | -3.118 |
Killed | -2.838 |
Worse | -2.837 |
Percent | -2.804 |
Millions | -2.786 |
Token | of |
Token ID | 286 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
reading | +9.639 |
learning | +9.456 |
blogs | +9.453 |
monitor | +9.138 |
chatting | +9.120 |
Neg logit contributions | |
Percentage | -9.672 |
Worse | -8.761 |
Killed | -8.724 |
Percent | -8.616 |
Millions | -8.575 |
Token | mouth |
Token ID | 5422 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
chatting | +6.315 |
reading | +6.277 |
thanking | +6.226 |
learning | +6.026 |
blogs | +6.021 |
Neg logit contributions | |
Percentage | -21.164 |
Killed | -19.946 |
サーティワン | -19.862 |
Worse | -19.852 |
Percent | -19.795 |
Token | and |
Token ID | 290 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
reading | +15.779 |
thanking | +15.653 |
learning | +15.559 |
blogs | +15.522 |
chatting | +15.277 |
Neg logit contributions | |
Percentage | -13.449 |
Worse | -12.489 |
Killed | -12.408 |
サーティワン | -12.224 |
Percent | -11.932 |
Token | social |
Token ID | 1919 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
chatting | +24.332 |
blogs | +23.953 |
thanking | +23.779 |
brainstorm | +23.357 |
reading | +23.347 |
Neg logit contributions | |
Percentage | -17.239 |
サーティワン | -15.904 |
Worse | -15.265 |
Killed | -14.745 |
Percent | -14.340 |
Token | media |
Token ID | 2056 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
reading | +15.114 |
learning | +15.029 |
blogs | +14.945 |
chatting | +14.870 |
thanking | +14.638 |
Neg logit contributions | |
Percentage | -22.495 |
Worse | -20.989 |
Killed | -20.622 |
サーティワン | -20.321 |
Percent | -19.914 |
Token | , |
Token ID | 11 |
Feature activation | -3.56e+01 |
Pos logit contributions | |
blogs | +17.955 |
chatting | +17.910 |
reading | +17.884 |
thanking | +17.811 |
learning | +17.809 |
Neg logit contributions | |
Percentage | -15.292 |
Worse | -13.916 |
サーティワン | -13.840 |
Killed | -13.808 |
Percent | -13.372 |
Token | and |
Token ID | 290 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
thanking | +31.354 |
chatting | +31.019 |
learning | +29.775 |
arranging | +29.698 |
researching | +29.548 |
Neg logit contributions | |
Percentage | -18.808 |
サーティワン | -17.496 |
Worse | -16.205 |
Killed | -15.852 |
Percent | -15.641 |
Token | Carter |
Token ID | 10831 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
chatting | +19.710 |
thanking | +19.655 |
blogs | +19.370 |
learning | +19.288 |
reading | +19.123 |
Neg logit contributions | |
Percentage | -13.366 |
Worse | -11.733 |
Killed | -11.637 |
サーティワン | -11.443 |
Percent | -11.059 |
Token | expects |
Token ID | 13423 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
thanking | +10.586 |
blogs | +10.526 |
learning | +10.458 |
chatting | +10.444 |
monitor | +10.418 |
Neg logit contributions | |
Percentage | -11.899 |
Worse | -10.851 |
Killed | -10.730 |
Percent | -10.664 |
Millions | -10.535 |
Token | a |
Token ID | 257 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
Percentage | +0.742 |
Killed | +0.670 |
Worse | +0.670 |
Millions | +0.664 |
Percent | +0.663 |
Neg logit contributions | |
learning | -0.647 |
reading | -0.646 |
blogs | -0.644 |
monitor | -0.640 |
thanking | -0.619 |
Token | bump |
Token ID | 13852 |
Feature activation | -4.79e+00 |
Pos logit contributions | |
learning | +3.428 |
reading | +3.426 |
blogs | +3.401 |
monitor | +3.383 |
thanking | +3.326 |
Neg logit contributions | |
Percentage | -3.750 |
Killed | -3.399 |
Worse | -3.394 |
Percent | -3.337 |
Millions | -3.323 |
Token | time |
Token ID | 640 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
reading | +2.220 |
learning | +2.218 |
blogs | +2.212 |
monitor | +2.195 |
thanking | +2.149 |
Neg logit contributions | |
Percentage | -2.324 |
Killed | -2.091 |
Worse | -2.090 |
Percent | -2.062 |
Millions | -2.058 |
Token | to |
Token ID | 284 |
Feature activation | -1.25e+01 |
Pos logit contributions | |
learning | +5.334 |
reading | +5.300 |
monitor | +5.216 |
blogs | +5.215 |
thanking | +5.127 |
Neg logit contributions | |
Percentage | -6.499 |
Worse | -5.957 |
Killed | -5.924 |
Percent | -5.841 |
Millions | -5.822 |
Token | develop |
Token ID | 1205 |
Feature activation | -8.85e+00 |
Pos logit contributions | |
monitor | +10.822 |
chatting | +10.697 |
reading | +10.695 |
learning | +10.624 |
blogs | +10.442 |
Neg logit contributions | |
Percentage | -13.008 |
Worse | -11.857 |
Killed | -11.716 |
Percent | -11.691 |
Millions | -11.673 |
Token | your |
Token ID | 534 |
Feature activation | -9.53e+00 |
Pos logit contributions | |
learning | +8.124 |
reading | +8.102 |
blogs | +8.006 |
monitor | +7.940 |
chatting | +7.932 |
Neg logit contributions | |
Percentage | -9.399 |
Killed | -8.459 |
Worse | -8.452 |
Millions | -8.443 |
Percent | -8.354 |
Token | character |
Token ID | 2095 |
Feature activation | -1.40e+01 |
Pos logit contributions | |
reading | +9.868 |
learning | +9.788 |
monitor | +9.657 |
chatting | +9.630 |
blogs | +9.613 |
Neg logit contributions | |
Percentage | -8.864 |
Worse | -7.983 |
Millions | -7.913 |
Killed | -7.862 |
Percent | -7.767 |
Token | , |
Token ID | 11 |
Feature activation | -3.51e+01 |
Pos logit contributions | |
reading | +15.442 |
learning | +15.403 |
chatting | +15.089 |
blogs | +14.925 |
monitor | +14.921 |
Neg logit contributions | |
Percentage | -11.152 |
Killed | -9.938 |
Worse | -9.824 |
Millions | -9.765 |
Percent | -9.748 |
Token | but |
Token ID | 475 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
chatting | +30.825 |
thanking | +30.686 |
researching | +30.297 |
arranging | +30.048 |
learning | +29.970 |
Neg logit contributions | |
Percentage | -18.294 |
サーティワン | -16.667 |
Percent | -16.346 |
Worse | -16.094 |
Millions | -15.814 |
Token | I |
Token ID | 314 |
Feature activation | -8.79e+00 |
Pos logit contributions | |
learning | +8.181 |
reading | +8.146 |
blogs | +8.017 |
monitor | +8.010 |
thanking | +8.005 |
Neg logit contributions | |
Percentage | -8.872 |
Killed | -7.995 |
Worse | -7.919 |
Millions | -7.863 |
Percent | -7.848 |
Token | wish |
Token ID | 4601 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
blogs | +7.642 |
learning | +7.542 |
reading | +7.536 |
monitor | +7.513 |
chatting | +7.400 |
Neg logit contributions | |
Percentage | -9.748 |
Worse | -8.839 |
Killed | -8.776 |
Millions | -8.774 |
Percent | -8.765 |
Token | it |
Token ID | 340 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
Percentage | +1.864 |
Worse | +1.690 |
Killed | +1.688 |
Percent | +1.662 |
Only | +1.658 |
Neg logit contributions | |
reading | -1.675 |
blogs | -1.674 |
learning | -1.672 |
monitor | -1.658 |
thanking | -1.612 |
Token | had |
Token ID | 550 |
Feature activation | +6.30e+00 |
Pos logit contributions | |
Percentage | +2.493 |
Killed | +2.208 |
Worse | +2.203 |
Only | +2.164 |
Percent | +2.159 |
Neg logit contributions | |
learning | -3.136 |
blogs | -3.131 |
reading | -3.121 |
monitor | -3.103 |
thanking | -3.012 |
Token | involved |
Token ID | 2950 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
learning | +3.697 |
reading | +3.693 |
blogs | +3.686 |
monitor | +3.656 |
thanking | +3.588 |
Neg logit contributions | |
Percentage | -3.808 |
Killed | -3.419 |
Worse | -3.411 |
Percent | -3.392 |
Millions | -3.371 |
Token | in |
Token ID | 287 |
Feature activation | -1.58e+01 |
Pos logit contributions | |
learning | +10.098 |
reading | +9.940 |
monitor | +9.851 |
blogs | +9.850 |
chatting | +9.794 |
Neg logit contributions | |
Percentage | -11.238 |
Killed | -10.151 |
Percent | -10.130 |
Worse | -10.108 |
Millions | -9.935 |
Token | the |
Token ID | 262 |
Feature activation | -1.46e+01 |
Pos logit contributions | |
learning | +16.498 |
chatting | +16.395 |
blogs | +16.259 |
thanking | +16.207 |
reading | +16.189 |
Neg logit contributions | |
Percentage | -13.112 |
Killed | -11.282 |
Worse | -11.224 |
Percent | -11.178 |
サーティワン | -11.082 |
Token | business |
Token ID | 1597 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
learning | +15.522 |
reading | +15.306 |
chatting | +15.294 |
blogs | +15.235 |
thanking | +15.078 |
Neg logit contributions | |
Percentage | -12.019 |
Worse | -10.415 |
Killed | -10.361 |
Percent | -10.273 |
サーティワン | -10.213 |
Token | community |
Token ID | 2055 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
learning | +17.534 |
reading | +17.294 |
blogs | +17.171 |
thanking | +17.162 |
chatting | +17.077 |
Neg logit contributions | |
Percentage | -14.503 |
Killed | -12.909 |
Percent | -12.820 |
Worse | -12.708 |
Millions | -12.411 |
Token | , |
Token ID | 11 |
Feature activation | -3.48e+01 |
Pos logit contributions | |
learning | +16.146 |
thanking | +16.120 |
chatting | +16.104 |
reading | +15.923 |
blogs | +15.875 |
Neg logit contributions | |
Percentage | -13.484 |
Killed | -12.051 |
Percent | -11.971 |
Worse | -11.896 |
サーティワン | -11.802 |
Token | she |
Token ID | 673 |
Feature activation | -1.49e+01 |
Pos logit contributions | |
thanking | +32.393 |
chatting | +31.949 |
learning | +31.319 |
arranging | +31.055 |
educating | +30.787 |
Neg logit contributions | |
Percentage | -16.670 |
サーティワン | -15.942 |
Worse | -14.071 |
Killed | -13.909 |
Percent | -13.694 |
Token | said |
Token ID | 531 |
Feature activation | -7.93e+00 |
Pos logit contributions | |
learning | +10.951 |
blogs | +10.951 |
thanking | +10.874 |
chatting | +10.813 |
reading | +10.812 |
Neg logit contributions | |
Percentage | -16.636 |
Worse | -15.399 |
Percent | -15.069 |
Millions | -14.974 |
Killed | -14.967 |
Token | . |
Token ID | 13 |
Feature activation | +8.60e+00 |
Pos logit contributions | |
learning | +8.018 |
reading | +7.952 |
monitor | +7.818 |
blogs | +7.807 |
thanking | +7.752 |
Neg logit contributions | |
Percentage | -7.695 |
Killed | -7.031 |
Worse | -6.966 |
Percent | -6.761 |
Millions | -6.712 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
Percentage | +5.228 |
Worse | +4.463 |
Only | +4.441 |
Killed | +4.389 |
Millions | +4.330 |
Neg logit contributions | |
blogs | -11.981 |
reading | -11.977 |
learning | -11.934 |
monitor | -11.922 |
thanking | -11.697 |
Token |
|
Token ID | 198 |
Feature activation | -1.83e+01 |
Pos logit contributions | |
reading | +17.952 |
learning | +17.437 |
via | +17.423 |
monitor | +17.382 |
blogs | +17.305 |
Neg logit contributions | |
Percentage | -12.740 |
サーティワン | -12.395 |
Percent | -11.199 |
Worse | -11.183 |
Killed | -10.942 |
Token | significant |
Token ID | 2383 |
Feature activation | +2.52e+00 |
Pos logit contributions | |
learning | +0.571 |
reading | +0.571 |
blogs | +0.569 |
monitor | +0.564 |
thanking | +0.551 |
Neg logit contributions | |
Percentage | -0.615 |
Worse | -0.555 |
Killed | -0.555 |
Percent | -0.547 |
Millions | -0.546 |
Token | time |
Token ID | 640 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
Percentage | +2.564 |
Worse | +2.272 |
Killed | +2.257 |
Percent | +2.256 |
Millions | +2.252 |
Neg logit contributions | |
blogs | -2.588 |
reading | -2.581 |
learning | -2.581 |
monitor | -2.569 |
reader | -2.494 |
Token | on |
Token ID | 319 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
learning | +11.749 |
reading | +11.699 |
monitor | +11.547 |
chatting | +11.539 |
thanking | +11.531 |
Neg logit contributions | |
Percentage | -11.319 |
Killed | -10.372 |
Percent | -10.125 |
Worse | -10.124 |
Millions | -10.051 |
Token | the |
Token ID | 262 |
Feature activation | -9.75e+00 |
Pos logit contributions | |
learning | +13.290 |
reading | +13.236 |
blogs | +13.210 |
monitor | +12.971 |
thanking | +12.895 |
Neg logit contributions | |
Percentage | -10.492 |
Killed | -9.531 |
Worse | -9.265 |
Millions | -9.196 |
Percent | -9.120 |
Token | phone |
Token ID | 3072 |
Feature activation | -1.97e+01 |
Pos logit contributions | |
learning | +10.529 |
reading | +10.469 |
blogs | +10.427 |
monitor | +10.307 |
chatting | +10.157 |
Neg logit contributions | |
Percentage | -8.800 |
Killed | -7.957 |
Worse | -7.800 |
Percent | -7.669 |
Millions | -7.653 |
Token | , |
Token ID | 11 |
Feature activation | -3.46e+01 |
Pos logit contributions | |
chatting | +20.459 |
thanking | +20.349 |
learning | +20.173 |
reading | +20.119 |
monitor | +19.736 |
Neg logit contributions | |
Percentage | -15.106 |
Killed | -14.091 |
Worse | -13.400 |
Percent | -13.326 |
Millions | -13.284 |
Token | responding |
Token ID | 14409 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
chatting | +32.762 |
thanking | +31.656 |
researching | +31.005 |
reading | +30.858 |
brainstorm | +30.773 |
Neg logit contributions | |
Percentage | -19.185 |
サーティワン | -17.290 |
Killed | -16.958 |
Percent | -16.601 |
Worse | -16.059 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
blogs | +10.722 |
reading | +10.687 |
learning | +10.593 |
thanking | +10.586 |
chatting | +10.456 |
Neg logit contributions | |
Percentage | -11.797 |
Killed | -10.879 |
Worse | -10.633 |
Percent | -10.601 |
Millions | -10.352 |
Token | emails |
Token ID | 7237 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
blogs | +13.648 |
thanking | +13.471 |
reading | +13.462 |
chatting | +13.460 |
learning | +13.389 |
Neg logit contributions | |
Percentage | -12.787 |
Killed | -11.527 |
Percent | -11.323 |
Worse | -11.322 |
サーティワン | -11.099 |
Token | , |
Token ID | 11 |
Feature activation | -3.01e+01 |
Pos logit contributions | |
thanking | +17.582 |
chatting | +17.018 |
reading | +16.886 |
blogs | +16.606 |
learning | +16.503 |
Neg logit contributions | |
Percentage | -12.579 |
Killed | -11.374 |
Percent | -11.179 |
Worse | -11.048 |
サーティワン | -10.907 |
Token | and |
Token ID | 290 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
chatting | +29.398 |
thanking | +29.036 |
researching | +28.222 |
reading | +28.197 |
arranging | +28.161 |
Neg logit contributions | |
Percentage | -18.255 |
サーティワン | -16.935 |
Killed | -16.242 |
Percent | -15.794 |
Worse | -15.648 |
Token | on |
Token ID | 319 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
reading | +13.315 |
blogs | +13.219 |
thanking | +13.197 |
learning | +13.143 |
chatting | +13.063 |
Neg logit contributions | |
Percentage | -10.589 |
Killed | -9.392 |
Worse | -9.367 |
Percent | -9.345 |
Millions | -9.040 |
Token | pretty |
Token ID | 2495 |
Feature activation | -4.74e+00 |
Pos logit contributions | |
reading | +11.742 |
blogs | +11.520 |
learning | +11.507 |
monitor | +11.315 |
chatting | +11.245 |
Neg logit contributions | |
Percentage | -10.948 |
Killed | -9.857 |
Worse | -9.652 |
Percent | -9.607 |
Millions | -9.326 |
Token | much |
Token ID | 881 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
reading | +4.087 |
blogs | +4.061 |
monitor | +4.031 |
learning | +4.026 |
thanking | +3.896 |
Neg logit contributions | |
Percentage | -5.613 |
Killed | -5.123 |
Worse | -5.099 |
Percent | -5.038 |
Millions | -4.993 |
Token | any |
Token ID | 597 |
Feature activation | -7.25e+00 |
Pos logit contributions | |
Percentage | +2.247 |
Killed | +2.039 |
Worse | +2.034 |
Only | +2.015 |
Millions | +2.009 |
Neg logit contributions | |
learning | -2.101 |
blogs | -2.083 |
reading | -2.077 |
monitor | -2.073 |
thanking | -2.006 |
Token | device |
Token ID | 3335 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
reading | +6.339 |
learning | +6.158 |
monitor | +6.157 |
blogs | +6.123 |
reader | +5.997 |
Neg logit contributions | |
Percentage | -8.338 |
Killed | -7.653 |
Worse | -7.620 |
Percent | -7.495 |
Millions | -7.458 |
Token | , |
Token ID | 11 |
Feature activation | -3.45e+01 |
Pos logit contributions | |
reading | +11.627 |
blogs | +11.505 |
learning | +11.490 |
monitor | +11.467 |
thanking | +11.369 |
Neg logit contributions | |
Percentage | -8.440 |
Worse | -7.428 |
Killed | -7.425 |
Percent | -7.363 |
Millions | -7.193 |
Token | including |
Token ID | 1390 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
thanking | +30.547 |
chatting | +30.302 |
reading | +30.255 |
blogs | +30.194 |
monitor | +29.725 |
Neg logit contributions | |
Percentage | -18.291 |
サーティワン | -16.809 |
Percent | -15.796 |
Killed | -15.719 |
Worse | -15.507 |
Token | mobile |
Token ID | 5175 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
blogs | +11.931 |
reading | +11.922 |
learning | +11.709 |
monitor | +11.700 |
chatting | +11.670 |
Neg logit contributions | |
Percentage | -10.539 |
Killed | -9.234 |
Worse | -9.164 |
Percent | -9.098 |
Millions | -8.862 |
Token | phones |
Token ID | 9512 |
Feature activation | -7.60e+00 |
Pos logit contributions | |
blogs | +11.909 |
reading | +11.901 |
monitor | +11.676 |
learning | +11.574 |
chatting | +11.513 |
Neg logit contributions | |
Percentage | -11.908 |
Killed | -10.698 |
Worse | -10.625 |
Percent | -10.584 |
Millions | -10.302 |
Token | and |
Token ID | 290 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
reading | +8.621 |
blogs | +8.554 |
learning | +8.512 |
monitor | +8.466 |
thanking | +8.378 |
Neg logit contributions | |
Percentage | -6.585 |
Worse | -5.868 |
Killed | -5.796 |
Percent | -5.773 |
Millions | -5.649 |
Token | net |
Token ID | 2010 |
Feature activation | -8.83e+00 |
Pos logit contributions | |
blogs | +16.447 |
reading | +16.171 |
chatting | +15.994 |
monitor | +15.595 |
learning | +15.566 |
Neg logit contributions | |
Percentage | -15.168 |
Killed | -13.409 |
サーティワン | -13.259 |
Worse | -13.250 |
Percent | -13.121 |
Token | f |
Token ID | 277 |
Feature activation | -5.45e+00 |
Pos logit contributions | |
learning | +9.637 |
blogs | +9.601 |
reading | +9.522 |
monitor | +9.514 |
chatting | +9.383 |
Neg logit contributions | |
Percentage | -10.078 |
Killed | -9.008 |
Percent | -8.963 |
Worse | -8.863 |
Millions | -8.688 |
Token | MRI |
Token ID | 40952 |
Feature activation | -8.76e+00 |
Pos logit contributions | |
learning | +2.982 |
reading | +2.942 |
blogs | +2.909 |
monitor | +2.862 |
reader | +2.667 |
Neg logit contributions | |
Percentage | -8.171 |
Killed | -7.642 |
Worse | -7.599 |
Percent | -7.553 |
Millions | -7.518 |
Token | and |
Token ID | 290 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
learning | +9.615 |
reading | +9.598 |
monitor | +9.496 |
blogs | +9.494 |
chatting | +9.354 |
Neg logit contributions | |
Percentage | -7.900 |
Killed | -7.024 |
Worse | -6.998 |
Percent | -6.896 |
Millions | -6.801 |
Token | medication |
Token ID | 14103 |
Feature activation | -8.56e+00 |
Pos logit contributions | |
learning | +20.670 |
monitor | +20.424 |
chatting | +20.312 |
blogs | +19.982 |
reading | +19.875 |
Neg logit contributions | |
Percentage | -15.357 |
Killed | -13.587 |
Percent | -13.438 |
Worse | -13.230 |
Millions | -12.980 |
Token | studies |
Token ID | 3640 |
Feature activation | -9.56e+00 |
Pos logit contributions | |
learning | +9.637 |
reading | +9.575 |
monitor | +9.505 |
blogs | +9.434 |
chatting | +9.237 |
Neg logit contributions | |
Percentage | -7.653 |
Killed | -6.819 |
Worse | -6.736 |
Percent | -6.701 |
Millions | -6.565 |
Token | , |
Token ID | 11 |
Feature activation | -3.43e+01 |
Pos logit contributions | |
reading | +10.422 |
monitor | +10.380 |
learning | +10.310 |
blogs | +10.231 |
thanking | +10.166 |
Neg logit contributions | |
Percentage | -8.479 |
Killed | -7.584 |
Worse | -7.521 |
Percent | -7.446 |
Millions | -7.307 |
Token | and |
Token ID | 290 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
chatting | +30.068 |
thanking | +29.965 |
researching | +29.957 |
monitor | +29.668 |
brainstorm | +29.342 |
Neg logit contributions | |
Percentage | -19.174 |
Killed | -16.594 |
サーティワン | -16.428 |
Percent | -16.283 |
Millions | -16.016 |
Token | also |
Token ID | 635 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
chatting | +19.672 |
monitor | +19.584 |
thanking | +19.477 |
blogs | +19.393 |
learning | +19.379 |
Neg logit contributions | |
Percentage | -14.044 |
Killed | -12.126 |
Percent | -11.806 |
Worse | -11.763 |
サーティワン | -11.566 |
Token | develop |
Token ID | 1205 |
Feature activation | -7.61e+00 |
Pos logit contributions | |
chatting | +14.834 |
monitor | +14.792 |
blogs | +14.780 |
reading | +14.642 |
learning | +14.590 |
Neg logit contributions | |
Percentage | -15.104 |
Killed | -13.355 |
Percent | -13.318 |
Worse | -13.144 |
Millions | -12.805 |
Token | more |
Token ID | 517 |
Feature activation | -7.18e+00 |
Pos logit contributions | |
learning | +7.006 |
reading | +6.943 |
blogs | +6.914 |
monitor | +6.904 |
chatting | +6.743 |
Neg logit contributions | |
Percentage | -8.361 |
Killed | -7.567 |
Worse | -7.525 |
Percent | -7.499 |
Millions | -7.408 |
Token | advanced |
Token ID | 6190 |
Feature activation | -9.64e+00 |
Pos logit contributions | |
learning | +6.265 |
reading | +6.250 |
monitor | +6.210 |
blogs | +6.186 |
chatting | +6.052 |
Neg logit contributions | |
Percentage | -8.217 |
Worse | -7.508 |
Killed | -7.497 |
Percent | -7.396 |
Millions | -7.310 |
Token | the |
Token ID | 262 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
blogs | +13.182 |
learning | +13.064 |
monitor | +12.942 |
reading | +12.925 |
chatting | +12.810 |
Neg logit contributions | |
Percentage | -11.696 |
Worse | -10.538 |
Killed | -10.461 |
Millions | -10.414 |
Percent | -10.282 |
Token | project |
Token ID | 1628 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
blogs | +11.694 |
reading | +11.675 |
learning | +11.610 |
monitor | +11.599 |
chatting | +11.483 |
Neg logit contributions | |
Percentage | -10.000 |
Worse | -8.962 |
Killed | -8.935 |
Millions | -8.800 |
Percent | -8.769 |
Token | as |
Token ID | 355 |
Feature activation | -5.22e+00 |
Pos logit contributions | |
blogs | +18.443 |
monitor | +18.300 |
chatting | +18.184 |
reading | +18.173 |
thanking | +18.073 |
Neg logit contributions | |
Percentage | -15.228 |
Killed | -13.808 |
Worse | -13.712 |
Millions | -13.407 |
Percent | -13.319 |
Token | it |
Token ID | 340 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
learning | +4.788 |
blogs | +4.783 |
reading | +4.780 |
monitor | +4.738 |
thanking | +4.623 |
Neg logit contributions | |
Percentage | -5.822 |
Killed | -5.295 |
Worse | -5.271 |
Percent | -5.215 |
Millions | -5.199 |
Token | evolves |
Token ID | 43576 |
Feature activation | -5.06e+00 |
Pos logit contributions | |
Percentage | +2.238 |
Killed | +2.033 |
Worse | +2.020 |
Only | +2.002 |
Millions | +1.998 |
Neg logit contributions | |
learning | -2.003 |
blogs | -1.981 |
reading | -1.980 |
monitor | -1.959 |
thanking | -1.923 |
Token | , |
Token ID | 11 |
Feature activation | -3.42e+01 |
Pos logit contributions | |
learning | +5.905 |
reading | +5.902 |
blogs | +5.880 |
monitor | +5.845 |
thanking | +5.754 |
Neg logit contributions | |
Percentage | -4.397 |
Killed | -3.899 |
Worse | -3.881 |
Percent | -3.815 |
Millions | -3.785 |
Token | as |
Token ID | 355 |
Feature activation | -7.53e+00 |
Pos logit contributions | |
chatting | +30.536 |
thanking | +30.112 |
monitor | +29.818 |
blogs | +29.807 |
researching | +29.692 |
Neg logit contributions | |
Percentage | -19.489 |
サーティワン | -18.620 |
Worse | -17.631 |
Killed | -17.511 |
Percent | -16.957 |
Token | inevitable |
Token ID | 13203 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
blogs | +7.179 |
reading | +7.163 |
learning | +7.143 |
monitor | +7.098 |
thanking | +6.948 |
Neg logit contributions | |
Percentage | -7.917 |
Killed | -7.188 |
Worse | -7.163 |
Percent | -7.056 |
Millions | -7.044 |
Token | design |
Token ID | 1486 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
Percentage | +5.520 |
Worse | +5.039 |
Killed | +4.999 |
Only | +4.988 |
Millions | +4.943 |
Neg logit contributions | |
reading | -3.939 |
learning | -3.929 |
monitor | -3.883 |
blogs | -3.860 |
thanking | -3.732 |
Token | changes |
Token ID | 2458 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
learning | +3.879 |
reading | +3.878 |
blogs | +3.876 |
monitor | +3.826 |
thanking | +3.751 |
Neg logit contributions | |
Percentage | -4.093 |
Killed | -3.691 |
Worse | -3.689 |
Percent | -3.644 |
Millions | -3.629 |
Token | are |
Token ID | 389 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
Percentage | +1.888 |
Worse | +1.704 |
Killed | +1.703 |
Only | +1.679 |
Millions | +1.674 |
Neg logit contributions | |
learning | -1.786 |
reading | -1.774 |
blogs | -1.773 |
monitor | -1.756 |
thanking | -1.718 |
Token | Washington |
Token ID | 2669 |
Feature activation | -9.95e+00 |
Pos logit contributions | |
learning | +15.005 |
reading | +14.825 |
blogs | +14.752 |
thanking | +14.731 |
chatting | +14.722 |
Neg logit contributions | |
Percentage | -10.345 |
Killed | -9.116 |
Worse | -9.048 |
Percent | -8.815 |
Millions | -8.809 |
Token | among |
Token ID | 1871 |
Feature activation | -7.73e+00 |
Pos logit contributions | |
learning | +11.139 |
reading | +11.069 |
thanking | +11.013 |
monitor | +10.878 |
blogs | +10.876 |
Neg logit contributions | |
Percentage | -8.432 |
Worse | -7.487 |
Killed | -7.439 |
Millions | -7.295 |
Percent | -7.249 |
Token | his |
Token ID | 465 |
Feature activation | -8.24e+00 |
Pos logit contributions | |
learning | +7.808 |
reading | +7.764 |
blogs | +7.751 |
thanking | +7.683 |
chatting | +7.636 |
Neg logit contributions | |
Percentage | -7.599 |
Worse | -6.811 |
Killed | -6.717 |
Percent | -6.650 |
Millions | -6.536 |
Token | many |
Token ID | 867 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
reading | +8.752 |
learning | +8.709 |
blogs | +8.639 |
thanking | +8.594 |
chatting | +8.565 |
Neg logit contributions | |
Percentage | -7.571 |
Worse | -6.815 |
Killed | -6.708 |
Percent | -6.697 |
Only | -6.486 |
Token | friends |
Token ID | 2460 |
Feature activation | -9.27e+00 |
Pos logit contributions | |
reading | +3.571 |
learning | +3.560 |
blogs | +3.553 |
monitor | +3.494 |
thanking | +3.463 |
Neg logit contributions | |
Percentage | -4.837 |
Worse | -4.417 |
Killed | -4.390 |
Percent | -4.356 |
Millions | -4.310 |
Token | , |
Token ID | 11 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
learning | +10.536 |
reading | +10.451 |
thanking | +10.405 |
chatting | +10.368 |
blogs | +10.310 |
Neg logit contributions | |
Percentage | -7.831 |
Worse | -7.018 |
Percent | -6.882 |
Killed | -6.859 |
Millions | -6.730 |
Token | who |
Token ID | 508 |
Feature activation | -8.87e+00 |
Pos logit contributions | |
thanking | +31.847 |
chatting | +31.385 |
arranging | +29.761 |
learning | +29.404 |
researching | +29.340 |
Neg logit contributions | |
Percentage | -18.499 |
サーティワン | -17.338 |
Percent | -15.786 |
Worse | -15.598 |
Votes | -15.017 |
Token | affection |
Token ID | 17696 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
blogs | +8.805 |
reading | +8.659 |
thanking | +8.651 |
learning | +8.648 |
monitor | +8.599 |
Neg logit contributions | |
Percentage | -8.925 |
Worse | -8.085 |
Percent | -7.972 |
Killed | -7.905 |
Millions | -7.810 |
Token | ately |
Token ID | 1286 |
Feature activation | -5.33e+00 |
Pos logit contributions | |
reading | +2.772 |
blogs | +2.756 |
learning | +2.749 |
monitor | +2.710 |
thanking | +2.629 |
Neg logit contributions | |
Percentage | -4.810 |
Worse | -4.437 |
Killed | -4.408 |
Percent | -4.382 |
Millions | -4.362 |
Token | called |
Token ID | 1444 |
Feature activation | +3.53e+00 |
Pos logit contributions | |
blogs | +4.724 |
reading | +4.715 |
learning | +4.699 |
monitor | +4.657 |
thanking | +4.601 |
Neg logit contributions | |
Percentage | -6.136 |
Worse | -5.592 |
Killed | -5.577 |
Percent | -5.540 |
Millions | -5.491 |
Token | him |
Token ID | 683 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Percentage | +3.323 |
Killed | +2.975 |
Worse | +2.941 |
Only | +2.926 |
Millions | +2.917 |
Neg logit contributions | |
reading | -3.881 |
learning | -3.877 |
monitor | -3.868 |
blogs | -3.860 |
reader | -3.728 |
Token | fighting |
Token ID | 4330 |
Feature activation | -1.03e+01 |
Pos logit contributions | |
learning | +5.410 |
reading | +5.403 |
blogs | +5.386 |
monitor | +5.345 |
thanking | +5.264 |
Neg logit contributions | |
Percentage | -5.711 |
Worse | -5.175 |
Killed | -5.137 |
Percent | -5.051 |
Millions | -5.030 |
Token | game |
Token ID | 983 |
Feature activation | -1.35e+01 |
Pos logit contributions | |
learning | +7.208 |
blogs | +7.133 |
monitor | +7.128 |
reading | +7.114 |
chatting | +7.060 |
Neg logit contributions | |
Percentage | -13.086 |
Worse | -12.107 |
Killed | -12.054 |
Percent | -11.919 |
Millions | -11.799 |
Token | communities |
Token ID | 5348 |
Feature activation | -1.61e+01 |
Pos logit contributions | |
blogs | +12.078 |
reading | +12.024 |
learning | +11.981 |
monitor | +11.928 |
chatting | +11.844 |
Neg logit contributions | |
Percentage | -13.703 |
Worse | -12.585 |
Killed | -12.382 |
Percent | -12.290 |
Millions | -12.069 |
Token | in |
Token ID | 287 |
Feature activation | -2.04e+01 |
Pos logit contributions | |
thanking | +16.130 |
chatting | +15.881 |
reading | +15.859 |
learning | +15.698 |
monitor | +15.664 |
Neg logit contributions | |
Percentage | -13.291 |
Worse | -12.135 |
Killed | -11.974 |
Percent | -11.722 |
サーティワン | -11.707 |
Token | Japan |
Token ID | 2869 |
Feature activation | -1.72e+01 |
Pos logit contributions | |
thanking | +20.324 |
chatting | +20.013 |
researching | +19.826 |
learning | +19.771 |
reading | +19.624 |
Neg logit contributions | |
Percentage | -15.202 |
Killed | -13.847 |
Worse | -13.716 |
サーティワン | -13.305 |
Percent | -13.224 |
Token | , |
Token ID | 11 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
thanking | +17.220 |
learning | +16.926 |
reading | +16.919 |
chatting | +16.916 |
monitor | +16.683 |
Neg logit contributions | |
Percentage | -14.102 |
Worse | -12.896 |
Killed | -12.696 |
Percent | -12.572 |
Millions | -12.087 |
Token | and |
Token ID | 290 |
Feature activation | -1.96e+01 |
Pos logit contributions | |
thanking | +31.628 |
chatting | +30.586 |
arranging | +29.416 |
noting | +29.044 |
researching | +28.906 |
Neg logit contributions | |
Percentage | -18.270 |
サーティワン | -17.684 |
Killed | -16.719 |
Worse | -16.637 |
Percent | -15.906 |
Token | specifically |
Token ID | 5734 |
Feature activation | -6.91e+00 |
Pos logit contributions | |
thanking | +20.250 |
chatting | +20.038 |
reading | +19.531 |
learning | +19.326 |
blogs | +19.222 |
Neg logit contributions | |
Percentage | -14.346 |
Worse | -12.907 |
Killed | -12.624 |
サーティワン | -12.563 |
Millions | -12.375 |
Token | mentioned |
Token ID | 4750 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
learning | +7.730 |
reading | +7.707 |
blogs | +7.681 |
thanking | +7.665 |
monitor | +7.628 |
Neg logit contributions | |
Percentage | -6.090 |
Worse | -5.440 |
Killed | -5.348 |
Millions | -5.290 |
Percent | -5.286 |
Token | the |
Token ID | 262 |
Feature activation | -2.79e+00 |
Pos logit contributions | |
learning | +5.296 |
reading | +5.291 |
blogs | +5.274 |
monitor | +5.241 |
thanking | +5.195 |
Neg logit contributions | |
Percentage | -4.741 |
Worse | -4.271 |
Killed | -4.235 |
Millions | -4.158 |
Percent | -4.154 |
Token | organization |
Token ID | 4009 |
Feature activation | -5.65e+00 |
Pos logit contributions | |
learning | +3.156 |
reading | +3.155 |
blogs | +3.147 |
monitor | +3.124 |
thanking | +3.072 |
Neg logit contributions | |
Percentage | -2.536 |
Worse | -2.256 |
Killed | -2.251 |
Percent | -2.208 |
Millions | -2.196 |
Token | dialogue |
Token ID | 10721 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
reading | +6.861 |
learning | +6.843 |
blogs | +6.811 |
monitor | +6.748 |
chatting | +6.726 |
Neg logit contributions | |
Percentage | -7.250 |
Killed | -6.583 |
Worse | -6.580 |
Percent | -6.486 |
Millions | -6.478 |
Token | between |
Token ID | 1022 |
Feature activation | -4.98e+00 |
Pos logit contributions | |
reading | +13.180 |
learning | +13.177 |
thanking | +13.151 |
blogs | +13.075 |
chatting | +13.009 |
Neg logit contributions | |
Percentage | -13.058 |
Worse | -12.008 |
Killed | -11.781 |
Percent | -11.655 |
Millions | -11.557 |
Token | clubs |
Token ID | 9784 |
Feature activation | -1.74e+01 |
Pos logit contributions | |
reading | +4.234 |
learning | +4.222 |
blogs | +4.209 |
monitor | +4.176 |
thanking | +4.123 |
Neg logit contributions | |
Percentage | -5.873 |
Worse | -5.357 |
Killed | -5.355 |
Percent | -5.293 |
Millions | -5.268 |
Token | and |
Token ID | 290 |
Feature activation | -1.71e+01 |
Pos logit contributions | |
thanking | +17.132 |
chatting | +16.884 |
learning | +16.692 |
reading | +16.655 |
monitor | +16.637 |
Neg logit contributions | |
Percentage | -14.470 |
Worse | -13.188 |
Killed | -12.912 |
Percent | -12.862 |
Millions | -12.575 |
Token | fans |
Token ID | 3296 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
thanking | +16.864 |
chatting | +16.742 |
reading | +16.704 |
learning | +16.527 |
monitor | +16.517 |
Neg logit contributions | |
Percentage | -13.925 |
Killed | -12.429 |
Percent | -12.429 |
Worse | -12.363 |
サーティワン | -12.316 |
Token | , |
Token ID | 11 |
Feature activation | -3.40e+01 |
Pos logit contributions | |
thanking | +20.019 |
chatting | +19.877 |
reading | +19.530 |
learning | +19.495 |
monitor | +19.260 |
Neg logit contributions | |
Percentage | -16.192 |
Worse | -15.128 |
Percent | -14.641 |
Killed | -14.627 |
Millions | -14.187 |
Token | and |
Token ID | 290 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
thanking | +29.285 |
chatting | +28.540 |
arranging | +28.031 |
researching | +27.854 |
educating | +27.779 |
Neg logit contributions | |
Percentage | -20.728 |
サーティワン | -19.004 |
Percent | -18.902 |
Killed | -18.782 |
Worse | -18.753 |
Token | we |
Token ID | 356 |
Feature activation | -6.87e+00 |
Pos logit contributions | |
reading | +13.954 |
thanking | +13.900 |
chatting | +13.846 |
learning | +13.755 |
blogs | +13.755 |
Neg logit contributions | |
Percentage | -12.092 |
Worse | -10.827 |
Killed | -10.789 |
Percent | -10.745 |
サーティワン | -10.480 |
Token | have |
Token ID | 423 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
blogs | +6.434 |
monitor | +6.287 |
reading | +6.271 |
thanking | +6.218 |
learning | +6.215 |
Neg logit contributions | |
Percentage | -7.526 |
Worse | -6.838 |
Killed | -6.750 |
Percent | -6.746 |
Millions | -6.659 |
Token | worked |
Token ID | 3111 |
Feature activation | -9.86e+00 |
Pos logit contributions | |
learning | +2.306 |
blogs | +2.304 |
reading | +2.301 |
monitor | +2.280 |
thanking | +2.249 |
Neg logit contributions | |
Percentage | -2.158 |
Worse | -1.936 |
Killed | -1.927 |
Percent | -1.908 |
Millions | -1.893 |
Token | at |
Token ID | 379 |
Feature activation | -8.49e+00 |
Pos logit contributions | |
blogs | +6.913 |
learning | +6.888 |
reading | +6.887 |
monitor | +6.814 |
thanking | +6.794 |
Neg logit contributions | |
Percentage | -12.579 |
Worse | -11.660 |
Killed | -11.539 |
Percent | -11.537 |
Millions | -11.274 |
Token | and |
Token ID | 290 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
chatting | +17.277 |
thanking | +16.756 |
reading | +16.635 |
learning | +16.332 |
workspace | +16.120 |
Neg logit contributions | |
Percentage | -22.659 |
Killed | -21.599 |
Worse | -21.211 |
Percent | -21.116 |
Millions | -20.314 |
Token | straightforward |
Token ID | 15836 |
Feature activation | -1.80e+01 |
Pos logit contributions | |
chatting | +12.951 |
reading | +12.636 |
thanking | +12.557 |
blogs | +12.103 |
learning | +12.030 |
Neg logit contributions | |
Percentage | -25.483 |
Killed | -23.950 |
Percent | -23.377 |
Worse | -23.136 |
サーティワン | -22.839 |
Token | communication |
Token ID | 6946 |
Feature activation | -1.75e+01 |
Pos logit contributions | |
chatting | +13.794 |
thanking | +13.386 |
reading | +13.269 |
blogs | +12.981 |
monitor | +12.882 |
Neg logit contributions | |
Percentage | -19.170 |
Worse | -18.233 |
Killed | -18.230 |
サーティワン | -17.820 |
Percent | -17.800 |
Token | with |
Token ID | 351 |
Feature activation | -1.88e+01 |
Pos logit contributions | |
learning | +13.493 |
reading | +13.310 |
thanking | +13.309 |
monitor | +13.008 |
chatting | +12.936 |
Neg logit contributions | |
Percentage | -17.573 |
Worse | -16.624 |
Killed | -16.331 |
Percent | -16.023 |
Millions | -15.877 |
Token | staff |
Token ID | 3085 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
chatting | +11.349 |
blogs | +11.165 |
reading | +11.148 |
learning | +11.111 |
thanking | +11.059 |
Neg logit contributions | |
Percentage | -22.168 |
Worse | -20.543 |
Killed | -20.506 |
Percent | -20.496 |
サーティワン | -20.071 |
Token | , |
Token ID | 11 |
Feature activation | -3.39e+01 |
Pos logit contributions | |
learning | +11.146 |
reading | +11.132 |
blogs | +11.074 |
thanking | +11.001 |
monitor | +10.986 |
Neg logit contributions | |
Percentage | -8.796 |
Killed | -7.909 |
Worse | -7.834 |
Percent | -7.772 |
Millions | -7.583 |
Token | clearly |
Token ID | 4084 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
thanking | +30.986 |
monitor | +29.872 |
blogs | +29.725 |
chatting | +29.692 |
reading | +29.594 |
Neg logit contributions | |
Percentage | -18.874 |
Killed | -16.971 |
サーティワン | -16.820 |
Percent | -16.548 |
Worse | -16.278 |
Token | explaining |
Token ID | 11170 |
Feature activation | -5.87e+00 |
Pos logit contributions | |
reading | +11.134 |
thanking | +11.070 |
monitor | +11.012 |
learning | +10.989 |
blogs | +10.959 |
Neg logit contributions | |
Percentage | -12.968 |
Killed | -11.854 |
Worse | -11.819 |
Percent | -11.695 |
Millions | -11.581 |
Token | the |
Token ID | 262 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
reading | +4.863 |
learning | +4.858 |
blogs | +4.842 |
monitor | +4.765 |
thanking | +4.740 |
Neg logit contributions | |
Percentage | -7.016 |
Killed | -6.432 |
Worse | -6.415 |
Percent | -6.357 |
Millions | -6.331 |
Token | reasons |
Token ID | 3840 |
Feature activation | -2.72e+00 |
Pos logit contributions | |
learning | +2.675 |
reading | +2.674 |
blogs | +2.663 |
monitor | +2.634 |
thanking | +2.583 |
Neg logit contributions | |
Percentage | -2.996 |
Killed | -2.711 |
Worse | -2.707 |
Percent | -2.672 |
Millions | -2.661 |
Token | for |
Token ID | 329 |
Feature activation | -5.20e-01 |
Pos logit contributions | |
reading | +2.112 |
learning | +2.110 |
blogs | +2.105 |
monitor | +2.076 |
thanking | +2.028 |
Neg logit contributions | |
Percentage | -3.461 |
Killed | -3.179 |
Worse | -3.178 |
Percent | -3.141 |
Millions | -3.133 |
Token | more |
Token ID | 517 |
Feature activation | -1.44e+01 |
Pos logit contributions | |
reading | +8.941 |
learning | +8.875 |
blogs | +8.832 |
monitor | +8.568 |
chatting | +8.563 |
Neg logit contributions | |
Percentage | -10.009 |
Killed | -9.193 |
Millions | -8.998 |
Worse | -8.925 |
Percent | -8.891 |
Token | deeply |
Token ID | 7744 |
Feature activation | -1.45e+01 |
Pos logit contributions | |
reading | +13.320 |
blogs | +13.183 |
learning | +13.166 |
chatting | +12.973 |
thanking | +12.831 |
Neg logit contributions | |
Percentage | -13.475 |
Killed | -12.362 |
Worse | -12.358 |
Millions | -12.057 |
Percent | -11.779 |
Token | about |
Token ID | 546 |
Feature activation | -9.28e+00 |
Pos logit contributions | |
learning | +13.634 |
reading | +13.479 |
blogs | +13.415 |
thanking | +13.254 |
chatting | +13.110 |
Neg logit contributions | |
Percentage | -13.429 |
Worse | -12.259 |
Killed | -12.171 |
Millions | -12.000 |
Percent | -11.949 |
Token | their |
Token ID | 511 |
Feature activation | -7.91e+00 |
Pos logit contributions | |
learning | +9.185 |
reading | +9.032 |
blogs | +8.966 |
thanking | +8.942 |
monitor | +8.940 |
Neg logit contributions | |
Percentage | -9.100 |
Worse | -8.302 |
Killed | -8.301 |
Millions | -8.154 |
Percent | -8.114 |
Token | training |
Token ID | 3047 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
learning | +7.183 |
reading | +7.050 |
blogs | +6.994 |
monitor | +6.957 |
chatting | +6.854 |
Neg logit contributions | |
Percentage | -8.600 |
Worse | -7.915 |
Killed | -7.866 |
Millions | -7.763 |
Percent | -7.748 |
Token | , |
Token ID | 11 |
Feature activation | -3.38e+01 |
Pos logit contributions | |
learning | +12.101 |
blogs | +11.892 |
reading | +11.826 |
monitor | +11.813 |
thanking | +11.633 |
Neg logit contributions | |
Percentage | -10.105 |
Killed | -9.088 |
Worse | -9.055 |
Millions | -8.955 |
Percent | -8.848 |
Token | balance |
Token ID | 5236 |
Feature activation | -7.55e+00 |
Pos logit contributions | |
learning | +31.539 |
thanking | +30.861 |
reading | +30.497 |
chatting | +30.404 |
blogs | +30.121 |
Neg logit contributions | |
Percentage | -16.725 |
Worse | -14.899 |
Millions | -14.598 |
Percent | -14.549 |
Killed | -14.509 |
Token | and |
Token ID | 290 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
learning | +8.823 |
reading | +8.723 |
blogs | +8.676 |
monitor | +8.646 |
thanking | +8.557 |
Neg logit contributions | |
Percentage | -6.223 |
Killed | -5.550 |
Worse | -5.470 |
Percent | -5.462 |
Millions | -5.460 |
Token | stability |
Token ID | 10159 |
Feature activation | -6.83e+00 |
Pos logit contributions | |
learning | +19.909 |
chatting | +19.502 |
reading | +19.468 |
thanking | +19.465 |
monitor | +19.177 |
Neg logit contributions | |
Percentage | -15.414 |
Millions | -14.054 |
Worse | -13.982 |
Killed | -13.726 |
Percent | -13.614 |
Token | . |
Token ID | 13 |
Feature activation | +4.08e+00 |
Pos logit contributions | |
learning | +7.333 |
blogs | +7.283 |
reading | +7.266 |
monitor | +7.197 |
thanking | +7.057 |
Neg logit contributions | |
Percentage | -6.380 |
Killed | -5.727 |
Worse | -5.722 |
Millions | -5.669 |
Percent | -5.643 |
Token | I |
Token ID | 314 |
Feature activation | -9.52e+00 |
Pos logit contributions | |
Percentage | +2.911 |
Worse | +2.504 |
Killed | +2.496 |
Only | +2.468 |
Percent | +2.443 |
Neg logit contributions | |
reading | -5.426 |
blogs | -5.407 |
learning | -5.405 |
monitor | -5.396 |
thanking | -5.256 |
Token | greets |
Token ID | 45204 |
Feature activation | -3.90e+00 |
Pos logit contributions | |
reading | +4.341 |
blogs | +4.332 |
learning | +4.320 |
monitor | +4.262 |
thanking | +4.216 |
Neg logit contributions | |
Percentage | -3.882 |
Worse | -3.471 |
Killed | -3.456 |
Percent | -3.412 |
Millions | -3.393 |
Token | his |
Token ID | 465 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
learning | +3.960 |
reading | +3.955 |
blogs | +3.951 |
monitor | +3.917 |
thanking | +3.847 |
Neg logit contributions | |
Percentage | -3.998 |
Killed | -3.591 |
Worse | -3.590 |
Percent | -3.538 |
Millions | -3.516 |
Token | producers |
Token ID | 11408 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
reading | +13.894 |
blogs | +13.820 |
chatting | +13.733 |
learning | +13.688 |
thanking | +13.631 |
Neg logit contributions | |
Percentage | -11.361 |
Worse | -10.122 |
Killed | -9.992 |
Percent | -9.983 |
Millions | -9.675 |
Token | and |
Token ID | 290 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
thanking | +14.202 |
chatting | +14.190 |
reading | +14.158 |
blogs | +14.097 |
monitor | +13.977 |
Neg logit contributions | |
Percentage | -11.183 |
Worse | -9.976 |
Killed | -9.961 |
Percent | -9.872 |
Millions | -9.632 |
Token | technicians |
Token ID | 33519 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
chatting | +20.367 |
thanking | +20.148 |
blogs | +20.135 |
reading | +20.096 |
reader | +19.636 |
Neg logit contributions | |
Percentage | -15.431 |
Percent | -13.397 |
Killed | -13.384 |
Worse | -13.363 |
Millions | -13.269 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
chatting | +14.619 |
thanking | +14.527 |
reading | +14.451 |
blogs | +14.447 |
monitor | +14.194 |
Neg logit contributions | |
Percentage | -11.977 |
Worse | -10.746 |
Killed | -10.668 |
Percent | -10.653 |
Millions | -10.336 |
Token | and |
Token ID | 290 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
thanking | +31.662 |
chatting | +31.645 |
reading | +29.985 |
blogs | +29.983 |
arranging | +29.777 |
Neg logit contributions | |
Percentage | -18.352 |
Worse | -16.247 |
Killed | -15.882 |
Percent | -15.777 |
サーティワン | -15.328 |
Token | they |
Token ID | 484 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
chatting | +20.170 |
thanking | +20.166 |
blogs | +19.978 |
reading | +19.708 |
learning | +19.366 |
Neg logit contributions | |
Percentage | -14.785 |
Worse | -12.895 |
Killed | -12.856 |
Percent | -12.575 |
サーティワン | -12.398 |
Token | word |
Token ID | 1573 |
Feature activation | -2.65e+00 |
Pos logit contributions | |
blogs | +10.220 |
chatting | +10.066 |
reading | +10.061 |
thanking | +9.987 |
monitor | +9.917 |
Neg logit contributions | |
Percentage | -12.391 |
Worse | -11.334 |
Killed | -11.231 |
Percent | -11.170 |
Millions | -10.964 |
Token | lessly |
Token ID | 8613 |
Feature activation | -9.21e+00 |
Pos logit contributions | |
learning | +2.533 |
reading | +2.531 |
blogs | +2.527 |
monitor | +2.501 |
thanking | +2.445 |
Neg logit contributions | |
Percentage | -2.908 |
Killed | -2.633 |
Worse | -2.629 |
Percent | -2.594 |
Millions | -2.586 |
Token | pick |
Token ID | 2298 |
Feature activation | -4.72e+00 |
Pos logit contributions | |
blogs | +7.923 |
reading | +7.895 |
thanking | +7.780 |
chatting | +7.774 |
learning | +7.696 |
Neg logit contributions | |
Percentage | -10.486 |
Worse | -9.628 |
Killed | -9.589 |
Percent | -9.457 |
Millions | -9.348 |
Token | the |
Token ID | 262 |
Feature activation | -1.60e+01 |
Pos logit contributions | |
thanking | +21.780 |
chatting | +21.775 |
learning | +21.261 |
reading | +21.050 |
blogs | +21.009 |
Neg logit contributions | |
Percentage | -12.772 |
Killed | -11.010 |
Worse | -10.991 |
サーティワン | -10.740 |
Percent | -10.728 |
Token | Zero |
Token ID | 12169 |
Feature activation | -3.60e+00 |
Pos logit contributions | |
reading | +17.779 |
chatting | +17.735 |
blogs | +17.685 |
learning | +17.667 |
thanking | +17.564 |
Neg logit contributions | |
Percentage | -11.340 |
Worse | -9.873 |
Killed | -9.822 |
Percent | -9.738 |
サーティワン | -9.440 |
Token | Point |
Token ID | 6252 |
Feature activation | -5.35e+00 |
Pos logit contributions | |
learning | +4.740 |
reading | +4.728 |
blogs | +4.727 |
monitor | +4.678 |
chatting | +4.613 |
Neg logit contributions | |
Percentage | -2.561 |
Killed | -2.215 |
Worse | -2.213 |
Millions | -2.132 |
Percent | -2.120 |
Token | Zero |
Token ID | 12169 |
Feature activation | -7.57e+00 |
Pos logit contributions | |
learning | +7.326 |
blogs | +7.314 |
reading | +7.311 |
monitor | +7.247 |
thanking | +7.152 |
Neg logit contributions | |
Percentage | -3.491 |
Killed | -2.977 |
Worse | -2.968 |
Percent | -2.870 |
Millions | -2.859 |
Token | offices |
Token ID | 9730 |
Feature activation | -1.27e+01 |
Pos logit contributions | |
learning | +8.369 |
blogs | +8.366 |
reading | +8.356 |
monitor | +8.241 |
chatting | +8.195 |
Neg logit contributions | |
Percentage | -6.695 |
Worse | -6.012 |
Killed | -5.989 |
Millions | -5.848 |
Percent | -5.823 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
chatting | +13.471 |
reading | +13.438 |
learning | +13.391 |
thanking | +13.349 |
blogs | +13.340 |
Neg logit contributions | |
Percentage | -10.744 |
Worse | -9.779 |
Killed | -9.546 |
Percent | -9.418 |
Millions | -9.381 |
Token | which |
Token ID | 543 |
Feature activation | -6.91e+00 |
Pos logit contributions | |
chatting | +32.798 |
thanking | +31.957 |
reading | +30.742 |
arranging | +30.678 |
monitor | +30.396 |
Neg logit contributions | |
Percentage | -16.337 |
Worse | -15.121 |
サーティワン | -14.524 |
Percent | -14.186 |
Killed | -14.050 |
Token | are |
Token ID | 389 |
Feature activation | -8.04e+00 |
Pos logit contributions | |
blogs | +7.076 |
reading | +7.043 |
monitor | +6.984 |
learning | +6.975 |
chatting | +6.892 |
Neg logit contributions | |
Percentage | -6.718 |
Worse | -6.091 |
Killed | -6.043 |
Percent | -5.918 |
Millions | -5.882 |
Token | in |
Token ID | 287 |
Feature activation | -9.31e+00 |
Pos logit contributions | |
blogs | +7.860 |
reading | +7.760 |
chatting | +7.720 |
learning | +7.716 |
monitor | +7.701 |
Neg logit contributions | |
Percentage | -8.186 |
Worse | -7.462 |
Killed | -7.394 |
Percent | -7.340 |
Millions | -7.277 |
Token | a |
Token ID | 257 |
Feature activation | -8.59e+00 |
Pos logit contributions | |
learning | +10.458 |
reading | +10.351 |
blogs | +10.325 |
monitor | +10.184 |
chatting | +10.144 |
Neg logit contributions | |
Percentage | -7.842 |
Killed | -6.990 |
Worse | -6.893 |
Percent | -6.854 |
Millions | -6.798 |
Token | nond |
Token ID | 30745 |
Feature activation | -5.56e+00 |
Pos logit contributions | |
learning | +9.231 |
reading | +9.202 |
blogs | +9.168 |
monitor | +9.066 |
chatting | +9.033 |
Neg logit contributions | |
Percentage | -7.695 |
Killed | -6.929 |
Worse | -6.901 |
Percent | -6.854 |
Millions | -6.788 |
Token | person |
Token ID | 1048 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
chatting | +21.268 |
thanking | +21.240 |
learning | +20.926 |
reading | +20.779 |
blogs | +20.493 |
Neg logit contributions | |
Percentage | -16.599 |
Killed | -14.620 |
Percent | -14.525 |
Worse | -14.519 |
サーティワン | -14.235 |
Token | and |
Token ID | 290 |
Feature activation | -3.00e+01 |
Pos logit contributions | |
thanking | +21.153 |
chatting | +20.950 |
learning | +20.642 |
reading | +20.506 |
blogs | +20.428 |
Neg logit contributions | |
Percentage | -15.481 |
Worse | -14.415 |
Killed | -14.000 |
Percent | -13.701 |
Millions | -13.278 |
Token | sample |
Token ID | 6291 |
Feature activation | -4.24e+00 |
Pos logit contributions | |
chatting | +25.765 |
brainstorm | +25.586 |
chat | +24.779 |
thanking | +24.515 |
blogs | +23.953 |
Neg logit contributions | |
Percentage | -20.632 |
サーティワン | -18.141 |
Percent | -17.853 |
Worse | -17.791 |
Killed | -17.789 |
Token | their |
Token ID | 511 |
Feature activation | -5.52e+00 |
Pos logit contributions | |
learning | +3.610 |
blogs | +3.610 |
reading | +3.600 |
monitor | +3.535 |
thanking | +3.490 |
Neg logit contributions | |
Percentage | -5.018 |
Worse | -4.582 |
Killed | -4.575 |
Percent | -4.520 |
Millions | -4.483 |
Token | beers |
Token ID | 16800 |
Feature activation | -1.06e+01 |
Pos logit contributions | |
blogs | +4.755 |
learning | +4.753 |
reading | +4.750 |
monitor | +4.646 |
chatting | +4.610 |
Neg logit contributions | |
Percentage | -6.377 |
Worse | -5.839 |
Killed | -5.802 |
Percent | -5.746 |
Millions | -5.684 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
learning | +11.227 |
reading | +11.153 |
blogs | +11.147 |
thanking | +11.083 |
chatting | +11.042 |
Neg logit contributions | |
Percentage | -9.470 |
Worse | -8.590 |
Killed | -8.456 |
Percent | -8.387 |
Millions | -8.129 |
Token | including |
Token ID | 1390 |
Feature activation | -6.90e+00 |
Pos logit contributions | |
chatting | +31.220 |
thanking | +30.033 |
blogs | +30.024 |
reading | +29.641 |
brainstorm | +29.534 |
Neg logit contributions | |
Percentage | -18.711 |
Percent | -16.162 |
サーティワン | -16.155 |
Worse | -16.081 |
Killed | -15.812 |
Token | lots |
Token ID | 6041 |
Feature activation | -2.94e+00 |
Pos logit contributions | |
blogs | +7.372 |
learning | +7.322 |
reading | +7.309 |
chatting | +7.220 |
thanking | +7.193 |
Neg logit contributions | |
Percentage | -6.489 |
Worse | -5.795 |
Killed | -5.769 |
Percent | -5.677 |
Millions | -5.622 |
Token | of |
Token ID | 286 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
reading | +3.193 |
learning | +3.188 |
blogs | +3.183 |
monitor | +3.129 |
thanking | +3.093 |
Neg logit contributions | |
Percentage | -2.819 |
Killed | -2.521 |
Worse | -2.516 |
Percent | -2.482 |
Millions | -2.463 |
Token | exclusive |
Token ID | 8568 |
Feature activation | -6.77e+00 |
Pos logit contributions | |
blogs | +5.832 |
learning | +5.803 |
reading | +5.794 |
chatting | +5.702 |
monitor | +5.684 |
Neg logit contributions | |
Percentage | -6.202 |
Worse | -5.612 |
Killed | -5.576 |
Percent | -5.507 |
Millions | -5.474 |
Token | festival |
Token ID | 10876 |
Feature activation | -1.38e+01 |
Pos logit contributions | |
blogs | +6.837 |
reading | +6.774 |
learning | +6.752 |
chatting | +6.705 |
monitor | +6.631 |
Neg logit contributions | |
Percentage | -6.799 |
Worse | -6.151 |
Killed | -6.094 |
Millions | -6.037 |
Percent | -6.034 |
Token | can |
Token ID | 460 |
Feature activation | -5.99e+00 |
Pos logit contributions | |
learning | +3.276 |
reading | +3.275 |
blogs | +3.273 |
monitor | +3.238 |
thanking | +3.153 |
Neg logit contributions | |
Percentage | -4.070 |
Worse | -3.700 |
Killed | -3.699 |
Percent | -3.652 |
Millions | -3.632 |
Token | do |
Token ID | 466 |
Feature activation | -9.37e+00 |
Pos logit contributions | |
reading | +5.048 |
learning | +5.034 |
blogs | +5.019 |
monitor | +5.015 |
chatting | +4.872 |
Neg logit contributions | |
Percentage | -7.081 |
Killed | -6.495 |
Worse | -6.465 |
Percent | -6.406 |
Millions | -6.322 |
Token | in |
Token ID | 287 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
learning | +9.679 |
reading | +9.657 |
blogs | +9.588 |
monitor | +9.469 |
chatting | +9.416 |
Neg logit contributions | |
Percentage | -8.931 |
Killed | -8.098 |
Worse | -8.037 |
Percent | -7.958 |
Millions | -7.746 |
Token | the |
Token ID | 262 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
learning | +13.578 |
reading | +13.476 |
chatting | +13.343 |
blogs | +13.286 |
thanking | +13.151 |
Neg logit contributions | |
Percentage | -12.207 |
Killed | -11.258 |
Percent | -10.908 |
Worse | -10.888 |
Millions | -10.521 |
Token | classroom |
Token ID | 15806 |
Feature activation | -1.66e+01 |
Pos logit contributions | |
learning | +11.191 |
reading | +11.111 |
blogs | +10.906 |
monitor | +10.852 |
chatting | +10.838 |
Neg logit contributions | |
Percentage | -10.887 |
Killed | -9.890 |
Worse | -9.710 |
Percent | -9.637 |
Millions | -9.389 |
Token | , |
Token ID | 11 |
Feature activation | -3.37e+01 |
Pos logit contributions | |
learning | +17.887 |
reading | +17.472 |
monitor | +17.405 |
chatting | +17.376 |
blogs | +17.376 |
Neg logit contributions | |
Percentage | -12.864 |
Killed | -11.621 |
Worse | -11.555 |
Percent | -11.418 |
Millions | -11.074 |
Token | the |
Token ID | 262 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
chatting | +29.666 |
reading | +29.109 |
learning | +28.998 |
monitor | +28.536 |
researching | +28.502 |
Neg logit contributions | |
Percentage | -19.992 |
Percent | -17.578 |
サーティワン | -17.471 |
Killed | -17.420 |
Worse | -16.732 |
Token | board |
Token ID | 3096 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
learning | +20.938 |
reading | +20.867 |
chatting | +20.682 |
blogs | +20.400 |
workspace | +20.317 |
Neg logit contributions | |
Percentage | -14.752 |
Killed | -13.261 |
Percent | -12.720 |
Worse | -12.599 |
Millions | -12.428 |
Token | room |
Token ID | 3823 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
reading | +15.101 |
learning | +14.914 |
blogs | +14.645 |
chatting | +14.602 |
monitor | +14.592 |
Neg logit contributions | |
Percentage | -15.976 |
Killed | -14.571 |
Worse | -14.463 |
Percent | -14.444 |
Millions | -14.306 |
Token | , |
Token ID | 11 |
Feature activation | -2.84e+01 |
Pos logit contributions | |
reading | +13.594 |
learning | +13.583 |
monitor | +13.533 |
chatting | +13.495 |
blogs | +13.380 |
Neg logit contributions | |
Percentage | -9.263 |
Killed | -8.325 |
Worse | -8.193 |
Percent | -8.067 |
Millions | -7.947 |
Token | maybe |
Token ID | 3863 |
Feature activation | -1.37e+01 |
Pos logit contributions | |
chatting | +25.914 |
reading | +25.300 |
learning | +25.045 |
thanking | +24.785 |
blogs | +24.682 |
Neg logit contributions | |
Percentage | -19.836 |
Percent | -17.369 |
Killed | -17.335 |
Worse | -16.808 |
Millions | -16.585 |
Token | their |
Token ID | 511 |
Feature activation | -4.29e+00 |
Pos logit contributions | |
learning | +5.224 |
reading | +5.194 |
thanking | +5.155 |
monitor | +5.097 |
blogs | +5.092 |
Neg logit contributions | |
Percentage | -8.077 |
Killed | -7.430 |
Worse | -7.382 |
Percent | -7.306 |
Millions | -7.243 |
Token | realism |
Token ID | 30787 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
reading | +3.566 |
learning | +3.563 |
blogs | +3.534 |
monitor | +3.488 |
thanking | +3.443 |
Neg logit contributions | |
Percentage | -5.186 |
Killed | -4.743 |
Worse | -4.743 |
Percent | -4.673 |
Millions | -4.642 |
Token | and |
Token ID | 290 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
reading | +8.340 |
learning | +8.318 |
blogs | +8.240 |
thanking | +8.181 |
monitor | +8.166 |
Neg logit contributions | |
Percentage | -6.761 |
Killed | -6.029 |
Worse | -5.992 |
Percent | -5.965 |
Millions | -5.895 |
Token | bold |
Token ID | 10758 |
Feature activation | -8.33e+00 |
Pos logit contributions | |
thanking | +19.168 |
reading | +18.893 |
learning | +18.713 |
chatting | +18.551 |
blogs | +18.292 |
Neg logit contributions | |
Percentage | -17.558 |
Worse | -15.404 |
Killed | -15.365 |
Percent | -15.185 |
Deaths | -14.654 |
Token | ness |
Token ID | 1108 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
reading | +7.327 |
learning | +7.249 |
blogs | +7.178 |
monitor | +7.123 |
thanking | +6.900 |
Neg logit contributions | |
Percentage | -9.420 |
Killed | -8.595 |
Worse | -8.579 |
Millions | -8.442 |
Percent | -8.423 |
Token | , |
Token ID | 11 |
Feature activation | -3.36e+01 |
Pos logit contributions | |
reading | +11.665 |
learning | +11.632 |
thanking | +11.540 |
blogs | +11.410 |
monitor | +11.352 |
Neg logit contributions | |
Percentage | -9.849 |
Killed | -8.864 |
Worse | -8.829 |
Percent | -8.816 |
Millions | -8.700 |
Token | and |
Token ID | 290 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
thanking | +28.921 |
reading | +27.860 |
chatting | +27.613 |
remembering | +27.499 |
learning | +27.295 |
Neg logit contributions | |
Percentage | -20.427 |
Percent | -18.039 |
Worse | -17.658 |
Killed | -17.545 |
サーティワン | -17.001 |
Token | hope |
Token ID | 2911 |
Feature activation | -8.97e-01 |
Pos logit contributions | |
thanking | +23.067 |
chatting | +21.778 |
reading | +21.735 |
monitor | +21.558 |
learning | +21.480 |
Neg logit contributions | |
Percentage | -18.102 |
Killed | -15.845 |
Percent | -15.412 |
Worse | -15.218 |
サーティワン | -14.869 |
Token | the |
Token ID | 262 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
learning | +0.818 |
reading | +0.816 |
blogs | +0.814 |
monitor | +0.807 |
thanking | +0.787 |
Neg logit contributions | |
Percentage | -1.023 |
Killed | -0.930 |
Worse | -0.929 |
Percent | -0.916 |
Millions | -0.914 |
Token | Obama |
Token ID | 2486 |
Feature activation | -5.95e+00 |
Pos logit contributions | |
learning | +1.257 |
reading | +1.256 |
blogs | +1.254 |
monitor | +1.244 |
thanking | +1.221 |
Neg logit contributions | |
Percentage | -0.994 |
Killed | -0.881 |
Worse | -0.879 |
Percent | -0.864 |
Millions | -0.861 |
Token | administration |
Token ID | 3662 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
reading | +5.008 |
learning | +5.001 |
blogs | +5.000 |
monitor | +4.920 |
thanking | +4.824 |
Neg logit contributions | |
Percentage | -6.977 |
Killed | -6.379 |
Worse | -6.340 |
Percent | -6.254 |
Millions | -6.205 |
Token | also |
Token ID | 635 |
Feature activation | +6.75e-02 |
Pos logit contributions | |
learning | +2.189 |
reading | +2.186 |
blogs | +2.182 |
monitor | +2.162 |
thanking | +2.117 |
Neg logit contributions | |
Percentage | -2.344 |
Killed | -2.114 |
Worse | -2.113 |
Percent | -2.083 |
Millions | -2.077 |
Token | performs |
Token ID | 17706 |
Feature activation | -9.31e-01 |
Pos logit contributions | |
Percentage | +0.069 |
Killed | +0.062 |
Worse | +0.061 |
Millions | +0.060 |
Only | +0.060 |
Neg logit contributions | |
learning | -0.070 |
reading | -0.070 |
blogs | -0.069 |
monitor | -0.069 |
thanking | -0.067 |
Token | " |
Token ID | 366 |
Feature activation | -3.58e+00 |
Pos logit contributions | |
learning | +0.880 |
reading | +0.879 |
blogs | +0.875 |
monitor | +0.869 |
thanking | +0.845 |
Neg logit contributions | |
Percentage | -1.031 |
Killed | -0.937 |
Worse | -0.934 |
Percent | -0.921 |
Millions | -0.920 |
Token | Sm |
Token ID | 7556 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
learning | +2.672 |
reading | +2.669 |
blogs | +2.652 |
monitor | +2.624 |
thanking | +2.542 |
Neg logit contributions | |
Percentage | -4.670 |
Killed | -4.295 |
Worse | -4.294 |
Percent | -4.243 |
Millions | -4.232 |
Token | ells |
Token ID | 19187 |
Feature activation | +1.54e+01 |
Pos logit contributions | |
Percentage | +6.662 |
Killed | +6.154 |
Only | +6.136 |
Worse | +6.135 |
Millions | +6.050 |
Neg logit contributions | |
learning | -3.783 |
blogs | -3.771 |
monitor | -3.761 |
reading | -3.701 |
thanking | -3.699 |
Token | Like |
Token ID | 4525 |
Feature activation | +1.96e+01 |
Pos logit contributions | |
Percentage | +14.504 |
Worse | +14.137 |
Only | +13.817 |
Killed | +13.767 |
Twice | +13.043 |
Neg logit contributions | |
learning | -14.469 |
monitor | -14.331 |
blogs | -14.037 |
reading | -13.892 |
forums | -13.709 |
Token | Teen |
Token ID | 21432 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
Percentage | +15.104 |
Worse | +14.114 |
Only | +14.014 |
Killed | +13.957 |
Millions | +13.530 |
Neg logit contributions | |
learning | -20.571 |
monitor | -20.406 |
blogs | -20.288 |
reading | -19.934 |
reader | -19.526 |
Token | Spirit |
Token ID | 7710 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
Percentage | +8.395 |
Only | +7.525 |
Killed | +7.472 |
Worse | +7.468 |
Millions | +7.333 |
Neg logit contributions | |
blogs | -13.015 |
learning | -12.810 |
reading | -12.753 |
monitor | -12.675 |
forums | -12.400 |
Token | " |
Token ID | 1 |
Feature activation | -3.70e+00 |
Pos logit contributions | |
Percentage | +12.295 |
Only | +11.364 |
Killed | +11.327 |
Worse | +11.208 |
Millions | +10.913 |
Neg logit contributions | |
learning | -12.554 |
blogs | -12.495 |
monitor | -12.465 |
reading | -12.392 |
thanking | -12.026 |
Token | in |
Token ID | 287 |
Feature activation | -4.08e+00 |
Pos logit contributions | |
learning | +3.621 |
reading | +3.620 |
blogs | +3.610 |
monitor | +3.577 |
thanking | +3.507 |
Neg logit contributions | |
Percentage | -3.945 |
Killed | -3.562 |
Worse | -3.559 |
Percent | -3.509 |
Millions | -3.498 |
Token | a |
Token ID | 257 |
Feature activation | -5.01e+00 |
Pos logit contributions | |
learning | +4.444 |
reading | +4.440 |
blogs | +4.437 |
monitor | +4.396 |
thanking | +4.359 |
Neg logit contributions | |
Percentage | -3.838 |
Worse | -3.424 |
Killed | -3.420 |
Percent | -3.359 |
Millions | -3.339 |
Token | at |
Token ID | 379 |
Feature activation | +1.40e+01 |
Pos logit contributions | |
Percentage | +8.825 |
Worse | +8.013 |
Only | +7.956 |
Millions | +7.931 |
Killed | +7.927 |
Neg logit contributions | |
learning | -8.118 |
reading | -8.021 |
blogs | -8.001 |
monitor | -7.967 |
forums | -7.732 |
Token | a |
Token ID | 257 |
Feature activation | +9.91e+00 |
Pos logit contributions | |
Percentage | +13.393 |
Only | +12.318 |
Worse | +12.155 |
Millions | +12.048 |
Killed | +11.882 |
Neg logit contributions | |
learning | -13.044 |
reading | -12.938 |
blogs | -12.886 |
monitor | -12.820 |
reader | -12.298 |
Token | grand |
Token ID | 4490 |
Feature activation | +1.24e+01 |
Pos logit contributions | |
Percentage | +10.367 |
Worse | +9.348 |
Killed | +9.305 |
Only | +9.205 |
Millions | +9.175 |
Neg logit contributions | |
blogs | -9.282 |
learning | -9.165 |
reading | -9.081 |
monitor | -9.074 |
forums | -8.793 |
Token | total |
Token ID | 2472 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
Percentage | +13.346 |
Percent | +11.802 |
Worse | +11.779 |
Killed | +11.565 |
Only | +11.561 |
Neg logit contributions | |
blogs | -10.988 |
learning | -10.610 |
monitor | -10.395 |
forums | -10.283 |
reading | -10.241 |
Token | of |
Token ID | 286 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
Percentage | +10.104 |
Worse | +8.884 |
Only | +8.865 |
Percent | +8.851 |
Millions | +8.714 |
Neg logit contributions | |
blogs | -11.732 |
learning | -11.484 |
monitor | -11.385 |
reading | -11.275 |
forums | -11.160 |
Token | zero |
Token ID | 6632 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
Percentage | +15.311 |
Only | +14.310 |
Millions | +13.854 |
Worse | +13.852 |
Killed | +13.687 |
Neg logit contributions | |
learning | -15.367 |
reading | -15.245 |
blogs | -15.176 |
monitor | -14.952 |
forums | -14.571 |
Token | gig |
Token ID | 12526 |
Feature activation | +1.37e+01 |
Pos logit contributions | |
Percentage | +20.442 |
Percent | +18.986 |
(- | +18.535 |
Killed | +18.289 |
Millions | +18.243 |
Neg logit contributions | |
monitor | -14.564 |
learning | -14.533 |
reading | -14.167 |
blogs | -14.108 |
forums | -13.492 |
Token | awatts |
Token ID | 46684 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
Percentage | +11.699 |
Killed | +10.648 |
Millions | +10.379 |
Only | +10.296 |
Percent | +10.285 |
Neg logit contributions | |
learning | -13.604 |
reading | -13.571 |
thanking | -13.556 |
blogs | -13.488 |
monitor | -13.408 |
Token | . |
Token ID | 13 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
Percentage | +17.641 |
Only | +16.161 |
Worse | +16.022 |
Percent | +16.012 |
(- | +15.999 |
Neg logit contributions | |
blogs | -13.728 |
learning | -13.661 |
reading | -13.318 |
monitor | -13.153 |
forums | -12.867 |
Token | But |
Token ID | 887 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
Percentage | +14.447 |
Worse | +13.559 |
Only | +13.385 |
Millions | +13.071 |
Killed | +12.665 |
Neg logit contributions | |
learning | -18.126 |
blogs | -17.930 |
reading | -17.892 |
monitor | -17.848 |
chatting | -17.559 |
Token | knowing |
Token ID | 6970 |
Feature activation | +4.44e+00 |
Pos logit contributions | |
learning | +0.431 |
reading | +0.430 |
blogs | +0.429 |
monitor | +0.425 |
thanking | +0.413 |
Neg logit contributions | |
Percentage | -0.527 |
Worse | -0.478 |
Killed | -0.478 |
Percent | -0.472 |
Millions | -0.471 |
Token | to |
Token ID | 284 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
Percentage | +2.697 |
Killed | +2.439 |
Worse | +2.439 |
Millions | +2.401 |
Percent | +2.397 |
Neg logit contributions | |
learning | -2.468 |
reading | -2.466 |
blogs | -2.459 |
monitor | -2.441 |
thanking | -2.376 |
Token | put |
Token ID | 1234 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
Percentage | +4.816 |
Killed | +4.443 |
Worse | +4.437 |
Only | +4.395 |
Millions | +4.389 |
Neg logit contributions | |
learning | -3.269 |
reading | -3.252 |
blogs | -3.244 |
monitor | -3.157 |
thanking | -3.051 |
Token | back |
Token ID | 736 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
Percentage | +12.501 |
Millions | +11.583 |
Worse | +11.476 |
Only | +11.304 |
Killed | +11.257 |
Neg logit contributions | |
monitor | -10.890 |
reading | -10.874 |
learning | -10.755 |
blogs | -10.728 |
reader | -10.311 |
Token | the |
Token ID | 262 |
Feature activation | +5.62e+00 |
Pos logit contributions | |
Percentage | +3.045 |
Worse | +2.756 |
Millions | +2.744 |
Killed | +2.742 |
Only | +2.705 |
Neg logit contributions | |
blogs | -2.871 |
learning | -2.868 |
reading | -2.866 |
monitor | -2.853 |
thanking | -2.780 |
Token | $ |
Token ID | 720 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
Percentage | +6.078 |
Millions | +5.555 |
Killed | +5.542 |
Worse | +5.535 |
Only | +5.496 |
Neg logit contributions | |
learning | -5.297 |
blogs | -5.280 |
reading | -5.257 |
monitor | -5.237 |
forums | -5.020 |
Token | 5 |
Token ID | 20 |
Feature activation | +1.82e+01 |
Pos logit contributions | |
Percentage | +9.063 |
Millions | +8.119 |
Killed | +8.046 |
Worse | +8.027 |
Only | +7.988 |
Neg logit contributions | |
reading | -11.114 |
blogs | -11.107 |
learning | -11.085 |
monitor | -10.950 |
chatting | -10.920 |
Token | billion |
Token ID | 2997 |
Feature activation | +1.53e+01 |
Pos logit contributions | |
Percentage | +17.314 |
Percent | +15.727 |
Millions | +15.676 |
Only | +15.556 |
Killed | +15.556 |
Neg logit contributions | |
reading | -15.278 |
blogs | -15.191 |
learning | -15.083 |
monitor | -15.057 |
thanking | -14.438 |
Token | for |
Token ID | 329 |
Feature activation | +3.65e+00 |
Pos logit contributions | |
Percentage | +16.616 |
Millions | +15.357 |
Killed | +15.272 |
Only | +15.234 |
Worse | +15.234 |
Neg logit contributions | |
blogs | -11.960 |
reading | -11.656 |
learning | -11.640 |
monitor | -11.511 |
forums | -11.013 |
Token | food |
Token ID | 2057 |
Feature activation | +7.61e-01 |
Pos logit contributions | |
Percentage | +4.052 |
Worse | +3.706 |
Killed | +3.693 |
Millions | +3.655 |
Only | +3.651 |
Neg logit contributions | |
blogs | -3.363 |
reading | -3.362 |
learning | -3.344 |
monitor | -3.322 |
thanking | -3.212 |
Token | stamps |
Token ID | 25560 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
Percentage | +0.866 |
Killed | +0.790 |
Worse | +0.788 |
Millions | +0.777 |
Percent | +0.776 |
Neg logit contributions | |
learning | -0.692 |
blogs | -0.690 |
reading | -0.690 |
monitor | -0.682 |
thanking | -0.664 |
Token | for |
Token ID | 329 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Percentage | +4.538 |
Worse | +4.144 |
Killed | +4.139 |
Millions | +4.112 |
Only | +4.094 |
Neg logit contributions | |
blogs | -3.388 |
learning | -3.379 |
reading | -3.354 |
monitor | -3.325 |
reader | -3.179 |
Token | have |
Token ID | 423 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
Percentage | +10.193 |
Worse | +9.229 |
Killed | +9.226 |
Only | +9.143 |
Millions | +8.984 |
Neg logit contributions | |
learning | -8.789 |
blogs | -8.719 |
reading | -8.681 |
monitor | -8.528 |
reader | -8.445 |
Token | historically |
Token ID | 15074 |
Feature activation | +1.69e+01 |
Pos logit contributions | |
Percentage | +12.850 |
Killed | +11.958 |
Only | +11.780 |
Worse | +11.566 |
Millions | +11.350 |
Neg logit contributions | |
learning | -12.116 |
reading | -11.919 |
blogs | -11.806 |
monitor | -11.598 |
reader | -11.512 |
Token | been |
Token ID | 587 |
Feature activation | +8.07e+00 |
Pos logit contributions | |
Percentage | +14.631 |
Killed | +13.728 |
Only | +13.600 |
Worse | +13.099 |
Millions | +12.915 |
Neg logit contributions | |
learning | -16.271 |
reading | -15.866 |
reader | -15.537 |
blogs | -15.524 |
monitor | -15.288 |
Token | much |
Token ID | 881 |
Feature activation | +8.04e+00 |
Pos logit contributions | |
Percentage | +8.355 |
Worse | +7.632 |
Killed | +7.549 |
Only | +7.461 |
Millions | +7.328 |
Neg logit contributions | |
learning | -7.835 |
reading | -7.772 |
monitor | -7.571 |
blogs | -7.549 |
reader | -7.365 |
Token | shorter |
Token ID | 12238 |
Feature activation | +8.15e+00 |
Pos logit contributions | |
Percentage | +7.957 |
Worse | +7.422 |
Killed | +7.151 |
Only | +7.097 |
Percent | +6.987 |
Neg logit contributions | |
learning | -8.054 |
blogs | -7.871 |
reading | -7.860 |
monitor | -7.833 |
reader | -7.595 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
Percentage | +8.140 |
Killed | +7.280 |
Worse | +7.253 |
Only | +7.194 |
Percent | +7.147 |
Neg logit contributions | |
learning | -8.026 |
reading | -8.022 |
monitor | -8.007 |
blogs | -7.929 |
reader | -7.768 |
Token | The |
Token ID | 383 |
Feature activation | +5.44e+00 |
Pos logit contributions | |
Percentage | +18.032 |
Only | +17.097 |
Worse | +17.009 |
Millions | +16.594 |
Killed | +16.403 |
Neg logit contributions | |
learning | -18.088 |
reading | -18.035 |
blogs | -17.789 |
chatting | -17.607 |
monitor | -17.528 |
Token | latest |
Token ID | 3452 |
Feature activation | +1.30e+01 |
Pos logit contributions | |
Percentage | +6.030 |
Worse | +5.468 |
Killed | +5.449 |
Only | +5.439 |
Millions | +5.415 |
Neg logit contributions | |
learning | -5.007 |
reading | -4.999 |
blogs | -4.959 |
monitor | -4.874 |
thanking | -4.779 |
Token | dispute |
Token ID | 11047 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
Percentage | +14.536 |
Killed | +13.332 |
Worse | +13.291 |
Millions | +13.165 |
Only | +13.156 |
Neg logit contributions | |
learning | -10.310 |
blogs | -10.232 |
reading | -10.124 |
monitor | -9.727 |
forums | -9.627 |
Token | is |
Token ID | 318 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
Percentage | +3.588 |
Killed | +3.219 |
Worse | +3.211 |
Millions | +3.151 |
Only | +3.149 |
Neg logit contributions | |
learning | -3.829 |
blogs | -3.817 |
reading | -3.807 |
monitor | -3.770 |
thanking | -3.676 |
Token | rooted |
Token ID | 19459 |
Feature activation | +2.10e+00 |
Pos logit contributions | |
Percentage | +0.558 |
Killed | +0.507 |
Worse | +0.507 |
Millions | +0.498 |
Percent | +0.497 |
Neg logit contributions | |
learning | -0.479 |
reading | -0.477 |
blogs | -0.476 |
monitor | -0.471 |
thanking | -0.459 |
Token | � |
Token ID | 564 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
Percentage | +16.854 |
Worse | +15.794 |
Only | +15.646 |
Killed | +15.547 |
Millions | +15.182 |
Neg logit contributions | |
reading | -12.382 |
monitor | -12.369 |
learning | -12.236 |
blogs | -12.042 |
reader | -11.597 |
Token | � |
Token ID | 246 |
Feature activation | +9.48e-01 |
Pos logit contributions | |
Percentage | +0.346 |
Worse | +0.309 |
Killed | +0.309 |
Percent | +0.304 |
Millions | +0.303 |
Neg logit contributions | |
learning | -0.376 |
reading | -0.376 |
blogs | -0.375 |
monitor | -0.372 |
thanking | -0.365 |
Token | evil |
Token ID | 23542 |
Feature activation | +7.65e+00 |
Pos logit contributions | |
Percentage | +1.184 |
Worse | +1.089 |
Killed | +1.088 |
Only | +1.072 |
Percent | +1.071 |
Neg logit contributions | |
reading | -0.747 |
learning | -0.746 |
blogs | -0.745 |
monitor | -0.737 |
thanking | -0.722 |
Token | � |
Token ID | 447 |
Feature activation | +3.66e+00 |
Pos logit contributions | |
Percentage | +7.676 |
Worse | +6.904 |
Killed | +6.860 |
Only | +6.841 |
Percent | +6.777 |
Neg logit contributions | |
reading | -7.581 |
learning | -7.574 |
monitor | -7.530 |
blogs | -7.494 |
thanking | -7.313 |
Token | � |
Token ID | 247 |
Feature activation | +3.12e+00 |
Pos logit contributions | |
Percentage | +2.912 |
Worse | +2.515 |
Killed | +2.514 |
Percent | +2.483 |
Only | +2.468 |
Neg logit contributions | |
reading | -4.565 |
learning | -4.562 |
monitor | -4.544 |
blogs | -4.537 |
thanking | -4.437 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e+01 |
Pos logit contributions | |
Percentage | +3.182 |
Worse | +2.881 |
Killed | +2.863 |
Only | +2.834 |
Millions | +2.815 |
Neg logit contributions | |
learning | -3.173 |
reading | -3.171 |
blogs | -3.166 |
monitor | -3.151 |
thanking | -3.063 |
Token | But |
Token ID | 887 |
Feature activation | -8.75e-01 |
Pos logit contributions | |
Percentage | +17.173 |
Worse | +16.314 |
Only | +16.233 |
Millions | +15.585 |
Killed | +15.553 |
Neg logit contributions | |
monitor | -17.147 |
learning | -16.911 |
blogs | -16.815 |
chatting | -16.667 |
reading | -16.614 |
Token | the |
Token ID | 262 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
learning | +0.845 |
reading | +0.844 |
blogs | +0.842 |
monitor | +0.835 |
thanking | +0.814 |
Neg logit contributions | |
Percentage | -0.950 |
Killed | -0.860 |
Worse | -0.859 |
Percent | -0.846 |
Millions | -0.844 |
Token | � |
Token ID | 564 |
Feature activation | -4.28e+00 |
Pos logit contributions | |
Percentage | +3.591 |
Worse | +3.256 |
Killed | +3.248 |
Only | +3.224 |
Percent | +3.212 |
Neg logit contributions | |
learning | -3.009 |
reading | -3.001 |
blogs | -3.000 |
monitor | -2.991 |
thanking | -2.873 |
Token | � |
Token ID | 246 |
Feature activation | -5.54e+00 |
Pos logit contributions | |
learning | +4.356 |
reading | +4.320 |
blogs | +4.315 |
monitor | +4.253 |
thanking | +4.136 |
Neg logit contributions | |
Percentage | -4.376 |
Killed | -3.966 |
Worse | -3.919 |
Millions | -3.864 |
Percent | -3.849 |
Token | new |
Token ID | 3605 |
Feature activation | +8.36e+00 |
Pos logit contributions | |
learning | +4.145 |
reading | +4.113 |
blogs | +4.073 |
monitor | +4.047 |
reader | +3.843 |
Neg logit contributions | |
Percentage | -7.225 |
Killed | -6.643 |
Worse | -6.612 |
Percent | -6.596 |
Millions | -6.548 |
Token | hard |
Token ID | 1327 |
Feature activation | -8.73e+00 |
Pos logit contributions | |
learning | +10.813 |
reading | +10.763 |
blogs | +10.601 |
thanking | +10.529 |
monitor | +10.462 |
Neg logit contributions | |
Percentage | -11.491 |
Worse | -10.616 |
Killed | -10.435 |
Millions | -10.250 |
Percent | -10.220 |
Token | work |
Token ID | 670 |
Feature activation | -8.21e+00 |
Pos logit contributions | |
learning | +6.236 |
reading | +6.216 |
blogs | +6.185 |
monitor | +5.916 |
chatting | +5.855 |
Neg logit contributions | |
Percentage | -11.345 |
Worse | -10.581 |
Killed | -10.539 |
Millions | -10.370 |
Percent | -10.346 |
Token | . |
Token ID | 13 |
Feature activation | +8.86e+00 |
Pos logit contributions | |
learning | +9.177 |
reading | +9.133 |
blogs | +9.079 |
thanking | +8.919 |
monitor | +8.904 |
Neg logit contributions | |
Percentage | -7.177 |
Worse | -6.468 |
Killed | -6.367 |
Millions | -6.240 |
Percent | -6.240 |
Token | � |
Token ID | 564 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
Percentage | +6.523 |
Worse | +5.720 |
Only | +5.684 |
Killed | +5.678 |
Millions | +5.567 |
Neg logit contributions | |
monitor | -11.269 |
blogs | -11.222 |
reading | -11.212 |
learning | -11.201 |
chatting | -10.878 |
Token | � |
Token ID | 250 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
learning | +1.328 |
reading | +1.326 |
blogs | +1.326 |
monitor | +1.307 |
thanking | +1.290 |
Neg logit contributions | |
Percentage | -0.886 |
Killed | -0.779 |
Worse | -0.776 |
Percent | -0.756 |
Millions | -0.755 |
Token | Being |
Token ID | 18357 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
learning | +1.786 |
reading | +1.783 |
blogs | +1.778 |
monitor | +1.759 |
thanking | +1.709 |
Neg logit contributions | |
Percentage | -2.939 |
Killed | -2.701 |
Worse | -2.699 |
Percent | -2.665 |
Millions | -2.662 |
Token | immigrants |
Token ID | 7971 |
Feature activation | -5.16e+00 |
Pos logit contributions | |
Percentage | +0.507 |
Killed | +0.461 |
Worse | +0.458 |
Percent | +0.454 |
Only | +0.453 |
Neg logit contributions | |
reading | -0.406 |
learning | -0.405 |
blogs | -0.403 |
monitor | -0.402 |
thanking | -0.389 |
Token | , |
Token ID | 11 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
learning | +6.081 |
reading | +6.035 |
blogs | +6.025 |
monitor | +5.964 |
thanking | +5.936 |
Neg logit contributions | |
Percentage | -4.351 |
Worse | -3.904 |
Killed | -3.841 |
Percent | -3.786 |
Millions | -3.776 |
Token | we |
Token ID | 356 |
Feature activation | -5.11e+00 |
Pos logit contributions | |
learning | +17.726 |
reading | +17.237 |
blogs | +17.108 |
chatting | +17.014 |
thanking | +17.001 |
Neg logit contributions | |
Percentage | -12.579 |
Worse | -11.378 |
Killed | -11.201 |
Percent | -10.947 |
Millions | -10.637 |
Token | knew |
Token ID | 2993 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
blogs | +4.821 |
learning | +4.802 |
reading | +4.750 |
monitor | +4.723 |
thanking | +4.615 |
Neg logit contributions | |
Percentage | -5.586 |
Worse | -5.099 |
Killed | -5.054 |
Percent | -5.003 |
Millions | -4.980 |
Token | that |
Token ID | 326 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
Percentage | +1.594 |
Killed | +1.449 |
Worse | +1.442 |
Millions | +1.434 |
Only | +1.433 |
Neg logit contributions | |
reading | -1.223 |
blogs | -1.222 |
learning | -1.221 |
monitor | -1.220 |
thanking | -1.170 |
Token | force |
Token ID | 2700 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
learning | +5.816 |
reading | +5.807 |
blogs | +5.755 |
monitor | +5.750 |
thanking | +5.589 |
Neg logit contributions | |
Percentage | -9.703 |
Killed | -8.911 |
Worse | -8.909 |
Percent | -8.830 |
Millions | -8.694 |
Token | , |
Token ID | 11 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
learning | +3.813 |
reading | +3.804 |
blogs | +3.780 |
monitor | +3.767 |
thanking | +3.714 |
Neg logit contributions | |
Percentage | -3.554 |
Worse | -3.184 |
Killed | -3.179 |
Percent | -3.136 |
Millions | -3.113 |
Token | and |
Token ID | 290 |
Feature activation | -5.20e+00 |
Pos logit contributions | |
thanking | +19.391 |
monitor | +19.059 |
reading | +19.053 |
learning | +19.040 |
chatting | +18.951 |
Neg logit contributions | |
Percentage | -15.688 |
Worse | -13.981 |
Percent | -13.885 |
Killed | -13.672 |
サーティワン | -13.485 |
Token | the |
Token ID | 262 |
Feature activation | +9.56e-02 |
Pos logit contributions | |
reading | +4.996 |
learning | +4.988 |
blogs | +4.961 |
monitor | +4.933 |
thanking | +4.877 |
Neg logit contributions | |
Percentage | -5.543 |
Killed | -4.983 |
Worse | -4.982 |
Percent | -4.925 |
Millions | -4.861 |
Token | policy |
Token ID | 2450 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
Percentage | +0.100 |
Killed | +0.091 |
Worse | +0.090 |
Percent | +0.089 |
Millions | +0.089 |
Neg logit contributions | |
learning | -0.096 |
reading | -0.095 |
blogs | -0.095 |
monitor | -0.094 |
thanking | -0.092 |
Token | of |
Token ID | 286 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
learning | +0.459 |
reading | +0.457 |
blogs | +0.457 |
monitor | +0.455 |
thanking | +0.444 |
Neg logit contributions | |
Percentage | -0.410 |
Killed | -0.367 |
Worse | -0.366 |
Percent | -0.360 |
Millions | -0.360 |
Token | non |
Token ID | 1729 |
Feature activation | -5.39e+00 |
Pos logit contributions | |
Percentage | +2.551 |
Killed | +2.322 |
Worse | +2.322 |
Millions | +2.296 |
Only | +2.295 |
Neg logit contributions | |
blogs | -2.019 |
reading | -2.014 |
learning | -2.013 |
monitor | -1.992 |
thanking | -1.918 |
Token | - |
Token ID | 12 |
Feature activation | -8.68e+00 |
Pos logit contributions | |
reading | +5.146 |
learning | +5.140 |
blogs | +5.062 |
monitor | +5.028 |
thanking | +4.890 |
Neg logit contributions | |
Percentage | -5.839 |
Worse | -5.321 |
Killed | -5.304 |
Percent | -5.211 |
Millions | -5.190 |
Token | al |
Token ID | 282 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
learning | +4.986 |
reading | +4.982 |
monitor | +4.864 |
blogs | +4.825 |
reader | +4.538 |
Neg logit contributions | |
Percentage | -12.444 |
Killed | -11.606 |
Worse | -11.573 |
Percent | -11.471 |
Millions | -11.370 |
Token | ignment |
Token ID | 16747 |
Feature activation | +5.06e+00 |
Pos logit contributions | |
Percentage | +1.669 |
Killed | +1.506 |
Worse | +1.504 |
Percent | +1.484 |
Only | +1.483 |
Neg logit contributions | |
blogs | -1.419 |
learning | -1.415 |
reading | -1.412 |
monitor | -1.400 |
thanking | -1.376 |
Token | is |
Token ID | 318 |
Feature activation | +6.40e+00 |
Pos logit contributions | |
Percentage | +5.376 |
Worse | +4.889 |
Killed | +4.878 |
Only | +4.837 |
Millions | +4.779 |
Neg logit contributions | |
blogs | -4.832 |
learning | -4.813 |
reading | -4.782 |
monitor | -4.769 |
reader | -4.622 |
Token | their |
Token ID | 511 |
Feature activation | -7.35e-01 |
Pos logit contributions | |
learning | +0.952 |
reading | +0.951 |
blogs | +0.949 |
monitor | +0.941 |
thanking | +0.922 |
Neg logit contributions | |
Percentage | -0.862 |
Killed | -0.770 |
Worse | -0.769 |
Percent | -0.757 |
Millions | -0.755 |
Token | first |
Token ID | 717 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
learning | +0.745 |
reading | +0.744 |
blogs | +0.742 |
monitor | +0.736 |
thanking | +0.720 |
Neg logit contributions | |
Percentage | -0.761 |
Killed | -0.686 |
Worse | -0.685 |
Percent | -0.674 |
Millions | -0.673 |
Token | meetings |
Token ID | 8292 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
Percentage | +2.717 |
Killed | +2.489 |
Worse | +2.485 |
Only | +2.463 |
Millions | +2.456 |
Neg logit contributions | |
learning | -1.936 |
blogs | -1.913 |
reading | -1.903 |
monitor | -1.903 |
thanking | -1.825 |
Token | , |
Token ID | 11 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
Percentage | +1.449 |
Killed | +1.306 |
Worse | +1.303 |
Only | +1.283 |
Percent | +1.281 |
Neg logit contributions | |
learning | -1.419 |
blogs | -1.418 |
reading | -1.415 |
monitor | -1.404 |
thanking | -1.362 |
Token | so |
Token ID | 523 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
thanking | +17.271 |
chatting | +17.188 |
learning | +17.022 |
reading | +16.955 |
monitor | +16.797 |
Neg logit contributions | |
Percentage | -12.557 |
Percent | -11.222 |
Killed | -11.138 |
Worse | -11.115 |
Millions | -10.943 |
Token | it |
Token ID | 340 |
Feature activation | +7.11e+00 |
Pos logit contributions | |
learning | +1.818 |
reading | +1.816 |
blogs | +1.810 |
monitor | +1.795 |
thanking | +1.756 |
Neg logit contributions | |
Percentage | -2.101 |
Killed | -1.905 |
Worse | -1.901 |
Percent | -1.875 |
Millions | -1.870 |
Token | � |
Token ID | 447 |
Feature activation | +5.78e+00 |
Pos logit contributions | |
Percentage | +6.098 |
Only | +5.443 |
Killed | +5.437 |
Worse | +5.368 |
Millions | +5.273 |
Neg logit contributions | |
learning | -8.137 |
reading | -8.045 |
blogs | -8.040 |
monitor | -7.994 |
forums | -7.765 |
Token | � |
Token ID | 247 |
Feature activation | +9.62e+00 |
Pos logit contributions | |
Percentage | +4.718 |
Worse | +4.148 |
Killed | +4.107 |
Only | +4.060 |
Millions | +4.048 |
Neg logit contributions | |
reading | -6.988 |
learning | -6.981 |
monitor | -6.932 |
blogs | -6.914 |
thanking | -6.806 |
Token | s |
Token ID | 82 |
Feature activation | +9.16e+00 |
Pos logit contributions | |
Percentage | +10.656 |
Worse | +9.792 |
Only | +9.760 |
Killed | +9.693 |
Millions | +9.575 |
Neg logit contributions | |
learning | -8.076 |
reading | -8.029 |
monitor | -7.926 |
blogs | -7.915 |
thanking | -7.865 |
Token | obviously |
Token ID | 6189 |
Feature activation | +1.13e+01 |
Pos logit contributions | |
Percentage | +9.308 |
Only | +8.590 |
Worse | +8.573 |
Killed | +8.366 |
Millions | +8.328 |
Neg logit contributions | |
reading | -8.687 |
learning | -8.669 |
blogs | -8.594 |
monitor | -8.483 |
reader | -8.274 |
Token | not |
Token ID | 407 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
Percentage | +11.589 |
Only | +10.811 |
Worse | +10.772 |
Killed | +10.503 |
Millions | +10.458 |
Neg logit contributions | |
learning | -10.130 |
reading | -10.095 |
blogs | -9.962 |
monitor | -9.918 |
reader | -9.576 |
Token | 29 |
Token ID | 2808 |
Feature activation | +5.72e+00 |
Pos logit contributions | |
Percentage | +6.480 |
Only | +5.332 |
Killed | +5.223 |
Worse | +5.143 |
Millions | +5.138 |
Neg logit contributions | |
learning | -17.672 |
blogs | -17.531 |
monitor | -17.363 |
reading | -17.336 |
reader | -16.861 |
Token | , |
Token ID | 11 |
Feature activation | -7.83e-01 |
Pos logit contributions | |
Percentage | +3.454 |
Killed | +2.896 |
Only | +2.832 |
Worse | +2.800 |
Millions | +2.795 |
Neg logit contributions | |
learning | -8.063 |
blogs | -8.060 |
reading | -8.022 |
monitor | -7.988 |
thanking | -7.845 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
learning | +1.045 |
reading | +1.044 |
blogs | +1.042 |
monitor | +1.035 |
thanking | +1.017 |
Neg logit contributions | |
Percentage | -0.563 |
Killed | -0.482 |
Worse | -0.480 |
Percent | -0.470 |
Millions | -0.468 |
Token | , |
Token ID | 11 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
Percentage | +4.529 |
Killed | +3.953 |
Worse | +3.919 |
Millions | +3.887 |
Percent | +3.884 |
Neg logit contributions | |
learning | -6.915 |
blogs | -6.901 |
reading | -6.891 |
monitor | -6.824 |
thanking | -6.685 |
Token | in |
Token ID | 287 |
Feature activation | -7.54e+00 |
Pos logit contributions | |
thanking | +15.027 |
reading | +14.889 |
chatting | +14.753 |
learning | +14.751 |
blogs | +14.618 |
Neg logit contributions | |
Percentage | -13.980 |
Worse | -12.977 |
Killed | -12.480 |
Percent | -12.200 |
Millions | -12.176 |
Token | Pasadena |
Token ID | 41010 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
reading | +8.428 |
learning | +8.425 |
blogs | +8.367 |
thanking | +8.265 |
monitor | +8.219 |
Neg logit contributions | |
Percentage | -6.490 |
Killed | -5.798 |
Worse | -5.759 |
Percent | -5.650 |
Millions | -5.599 |
Token | , |
Token ID | 11 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
reading | +0.803 |
learning | +0.802 |
blogs | +0.799 |
monitor | +0.798 |
thanking | +0.786 |
Neg logit contributions | |
Percentage | -0.457 |
Worse | -0.397 |
Killed | -0.395 |
Percent | -0.383 |
Millions | -0.380 |
Token | California |
Token ID | 3442 |
Feature activation | +8.23e-02 |
Pos logit contributions | |
thanking | +14.978 |
reading | +14.687 |
chatting | +14.678 |
blogs | +14.444 |
learning | +14.402 |
Neg logit contributions | |
Percentage | -15.468 |
Worse | -14.543 |
Killed | -14.069 |
サーティワン | -13.878 |
Percent | -13.786 |
Token | . |
Token ID | 13 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
Percentage | +0.079 |
Worse | +0.071 |
Killed | +0.071 |
Percent | +0.069 |
Millions | +0.069 |
Neg logit contributions | |
learning | -0.090 |
reading | -0.090 |
blogs | -0.089 |
monitor | -0.089 |
thanking | -0.087 |
Token | Hide |
Token ID | 10415 |
Feature activation | -7.14e+00 |
Pos logit contributions | |
Percentage | +10.101 |
Only | +9.202 |
Killed | +9.021 |
Millions | +8.960 |
Worse | +8.934 |
Neg logit contributions | |
learning | -15.924 |
reading | -15.629 |
blogs | -15.622 |
monitor | -15.615 |
chatting | -15.218 |
Token | Caption |
Token ID | 11260 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
reading | +7.004 |
blogs | +6.954 |
monitor | +6.890 |
learning | +6.873 |
chatting | +6.795 |
Neg logit contributions | |
Percentage | -6.874 |
Killed | -6.223 |
Worse | -6.178 |
Percent | -6.122 |
サーティワン | -6.089 |
Token | , |
Token ID | 11 |
Feature activation | -4.55e+00 |
Pos logit contributions | |
Percentage | +10.158 |
Only | +8.934 |
Percent | +8.916 |
Worse | +8.882 |
Killed | +8.836 |
Neg logit contributions | |
reading | -9.825 |
blogs | -9.794 |
monitor | -9.712 |
learning | -9.631 |
reader | -9.454 |
Token | Lean |
Token ID | 45661 |
Feature activation | +5.51e+00 |
Pos logit contributions | |
learning | +5.868 |
reading | +5.824 |
blogs | +5.819 |
monitor | +5.781 |
thanking | +5.701 |
Neg logit contributions | |
Percentage | -3.342 |
Killed | -2.935 |
Worse | -2.921 |
Percent | -2.827 |
Millions | -2.824 |
Token | methodology |
Token ID | 20411 |
Feature activation | +5.46e+00 |
Pos logit contributions | |
Percentage | +4.542 |
Worse | +3.923 |
Killed | +3.913 |
Only | +3.893 |
Percent | +3.872 |
Neg logit contributions | |
reading | -6.731 |
blogs | -6.700 |
learning | -6.681 |
monitor | -6.644 |
thanking | -6.504 |
Token | aims |
Token ID | 12031 |
Feature activation | +6.19e+00 |
Pos logit contributions | |
Percentage | +6.050 |
Killed | +5.467 |
Worse | +5.422 |
Only | +5.411 |
Percent | +5.374 |
Neg logit contributions | |
reading | -5.024 |
blogs | -5.012 |
learning | -5.006 |
monitor | -4.964 |
reader | -4.819 |
Token | at |
Token ID | 379 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
Percentage | +6.369 |
Worse | +5.667 |
Killed | +5.664 |
Only | +5.631 |
Percent | +5.619 |
Neg logit contributions | |
learning | -6.164 |
blogs | -6.160 |
reading | -6.156 |
monitor | -6.078 |
thanking | -5.942 |
Token | waste |
Token ID | 7030 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
Percentage | +1.825 |
Killed | +1.686 |
Worse | +1.685 |
Percent | +1.668 |
Millions | +1.665 |
Neg logit contributions | |
blogs | -0.823 |
reading | -0.823 |
learning | -0.820 |
monitor | -0.806 |
thanking | -0.772 |
Token | reduction |
Token ID | 7741 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Percentage | +1.084 |
Worse | +0.966 |
Killed | +0.965 |
Only | +0.948 |
Percent | +0.947 |
Neg logit contributions | |
learning | -1.195 |
reading | -1.194 |
blogs | -1.193 |
monitor | -1.179 |
thanking | -1.156 |
Token | in |
Token ID | 287 |
Feature activation | -6.69e+00 |
Pos logit contributions | |
Percentage | +1.190 |
Killed | +1.071 |
Worse | +1.070 |
Only | +1.055 |
Percent | +1.054 |
Neg logit contributions | |
learning | -1.078 |
reading | -1.075 |
blogs | -1.074 |
monitor | -1.065 |
thanking | -1.037 |
Token | process |
Token ID | 1429 |
Feature activation | -5.44e+00 |
Pos logit contributions | |
learning | +6.385 |
reading | +6.338 |
blogs | +6.336 |
monitor | +6.267 |
thanking | +6.158 |
Neg logit contributions | |
Percentage | -6.935 |
Killed | -6.362 |
Worse | -6.326 |
Percent | -6.240 |
Millions | -6.191 |
Token | , |
Token ID | 11 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
learning | +5.788 |
reading | +5.771 |
blogs | +5.731 |
monitor | +5.696 |
thanking | +5.571 |
Neg logit contributions | |
Percentage | -5.205 |
Killed | -4.695 |
Worse | -4.647 |
Percent | -4.618 |
Millions | -4.586 |
Token | while |
Token ID | 981 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
learning | +24.038 |
reading | +23.791 |
monitor | +23.732 |
thanking | +23.561 |
blogs | +23.456 |
Neg logit contributions | |
Percentage | -11.208 |
Killed | -10.323 |
Percent | -9.860 |
サーティワン | -9.840 |
Worse | -9.633 |
Token | local |
Token ID | 1957 |
Feature activation | -6.07e+00 |
Pos logit contributions | |
thanking | +10.001 |
reading | +9.985 |
learning | +9.956 |
blogs | +9.884 |
chatting | +9.847 |
Neg logit contributions | |
Percentage | -18.056 |
Worse | -16.574 |
Millions | -16.481 |
Killed | -16.400 |
Percent | -16.331 |
Token | powers |
Token ID | 5635 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
learning | +5.896 |
blogs | +5.862 |
reading | +5.840 |
monitor | +5.799 |
thanking | +5.677 |
Neg logit contributions | |
Percentage | -6.374 |
Killed | -5.766 |
Worse | -5.743 |
Percent | -5.669 |
Millions | -5.640 |
Token | has |
Token ID | 468 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
reading | +2.046 |
learning | +2.044 |
blogs | +2.036 |
monitor | +2.023 |
thanking | +1.984 |
Neg logit contributions | |
Percentage | -1.948 |
Killed | -1.748 |
Worse | -1.744 |
Percent | -1.723 |
Millions | -1.712 |
Token | been |
Token ID | 587 |
Feature activation | +6.18e+00 |
Pos logit contributions | |
Percentage | +11.467 |
Killed | +10.624 |
Only | +10.445 |
Millions | +10.315 |
Worse | +10.283 |
Neg logit contributions | |
learning | -11.605 |
blogs | -11.361 |
reading | -11.264 |
monitor | -11.225 |
reader | -10.858 |
Token | a |
Token ID | 257 |
Feature activation | +2.27e+00 |
Pos logit contributions | |
Percentage | +6.613 |
Killed | +5.998 |
Worse | +5.969 |
Only | +5.858 |
Millions | +5.814 |
Neg logit contributions | |
learning | -5.920 |
blogs | -5.843 |
reading | -5.807 |
monitor | -5.749 |
reader | -5.590 |
Token | topic |
Token ID | 7243 |
Feature activation | -4.00e+00 |
Pos logit contributions | |
Percentage | +2.549 |
Killed | +2.326 |
Worse | +2.321 |
Millions | +2.285 |
Only | +2.279 |
Neg logit contributions | |
blogs | -2.087 |
learning | -2.080 |
reading | -2.076 |
monitor | -2.064 |
thanking | -1.990 |
Token | since |
Token ID | 1201 |
Feature activation | +5.33e+00 |
Pos logit contributions | |
reading | +4.325 |
blogs | +4.316 |
learning | +4.301 |
monitor | +4.265 |
thanking | +4.200 |
Neg logit contributions | |
Percentage | -3.848 |
Killed | -3.419 |
Worse | -3.418 |
Percent | -3.372 |
Millions | -3.355 |
Token | Ronald |
Token ID | 14430 |
Feature activation | +1.71e+01 |
Pos logit contributions | |
Percentage | +5.383 |
Worse | +4.874 |
Killed | +4.860 |
Millions | +4.828 |
Only | +4.824 |
Neg logit contributions | |
blogs | -5.353 |
monitor | -5.347 |
learning | -5.338 |
reading | -5.317 |
reader | -5.095 |
Token | Reagan |
Token ID | 12823 |
Feature activation | +8.78e+00 |
Pos logit contributions | |
Percentage | +10.771 |
Only | +9.179 |
Millions | +9.048 |
Worse | +9.010 |
Killed | +8.976 |
Neg logit contributions | |
learning | -21.226 |
blogs | -21.111 |
monitor | -20.919 |
forums | -20.843 |
reading | -20.372 |
Token | � |
Token ID | 447 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
Percentage | +8.898 |
Killed | +8.052 |
Only | +7.959 |
Worse | +7.929 |
Millions | +7.896 |
Neg logit contributions | |
blogs | -8.556 |
learning | -8.520 |
monitor | -8.405 |
reading | -8.357 |
forums | -8.237 |
Token | � |
Token ID | 247 |
Feature activation | +8.13e-01 |
Pos logit contributions | |
Percentage | +0.376 |
Killed | +0.331 |
Worse | +0.331 |
Percent | +0.325 |
Millions | +0.325 |
Neg logit contributions | |
reading | -0.503 |
learning | -0.503 |
blogs | -0.501 |
monitor | -0.499 |
thanking | -0.489 |
Token | according |
Token ID | 1864 |
Feature activation | +4.68e-01 |
Pos logit contributions | |
learning | +7.403 |
reading | +7.398 |
monitor | +7.353 |
blogs | +7.350 |
thanking | +7.263 |
Neg logit contributions | |
Percentage | -6.202 |
Killed | -5.539 |
Worse | -5.500 |
Percent | -5.444 |
Millions | -5.426 |
Token | to |
Token ID | 284 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
Percentage | +0.498 |
Killed | +0.450 |
Worse | +0.448 |
Percent | +0.442 |
Millions | +0.441 |
Neg logit contributions | |
learning | -0.464 |
reading | -0.462 |
blogs | -0.461 |
monitor | -0.457 |
thanking | -0.447 |
Token | a |
Token ID | 257 |
Feature activation | -4.19e+00 |
Pos logit contributions | |
learning | +1.675 |
reading | +1.672 |
blogs | +1.671 |
monitor | +1.657 |
thanking | +1.620 |
Neg logit contributions | |
Percentage | -1.609 |
Killed | -1.445 |
Worse | -1.443 |
Percent | -1.419 |
Millions | -1.415 |
Token | new |
Token ID | 649 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
learning | +4.516 |
reading | +4.515 |
blogs | +4.506 |
monitor | +4.470 |
thanking | +4.374 |
Neg logit contributions | |
Percentage | -3.988 |
Killed | -3.577 |
Worse | -3.563 |
Percent | -3.491 |
Millions | -3.486 |
Token | poll |
Token ID | 3278 |
Feature activation | -5.90e+00 |
Pos logit contributions | |
learning | +2.015 |
reading | +2.012 |
blogs | +2.008 |
monitor | +1.994 |
thanking | +1.949 |
Neg logit contributions | |
Percentage | -1.697 |
Killed | -1.516 |
Worse | -1.511 |
Percent | -1.482 |
Millions | -1.478 |
Token | released |
Token ID | 2716 |
Feature activation | -6.80e+00 |
Pos logit contributions | |
learning | +5.910 |
reading | +5.893 |
blogs | +5.867 |
monitor | +5.835 |
thanking | +5.771 |
Neg logit contributions | |
Percentage | -5.849 |
Killed | -5.304 |
Worse | -5.289 |
Millions | -5.206 |
Percent | -5.149 |
Token | Thursday |
Token ID | 3635 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
reading | +6.159 |
blogs | +6.158 |
learning | +6.148 |
monitor | +6.112 |
thanking | +6.012 |
Neg logit contributions | |
Percentage | -7.436 |
Killed | -6.767 |
Worse | -6.738 |
Percent | -6.633 |
Millions | -6.591 |
Token | by |
Token ID | 416 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
Percentage | +1.017 |
Killed | +0.910 |
Worse | +0.908 |
Percent | +0.897 |
Millions | +0.894 |
Neg logit contributions | |
learning | -1.080 |
reading | -1.079 |
blogs | -1.076 |
monitor | -1.068 |
thanking | -1.043 |
Token | Public |
Token ID | 5094 |
Feature activation | -4.39e+00 |
Pos logit contributions | |
learning | +4.819 |
blogs | +4.801 |
reading | +4.795 |
monitor | +4.775 |
thanking | +4.684 |
Neg logit contributions | |
Percentage | -3.377 |
Killed | -2.968 |
Worse | -2.953 |
Percent | -2.894 |
Millions | -2.886 |
Token | Policy |
Token ID | 7820 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
learning | +5.096 |
reading | +5.092 |
monitor | +5.051 |
blogs | +5.027 |
thanking | +4.899 |
Neg logit contributions | |
Percentage | -3.771 |
Killed | -3.373 |
Worse | -3.340 |
Percent | -3.318 |
Millions | -3.303 |
Token | Poll |
Token ID | 12868 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
Percentage | +0.074 |
Killed | +0.062 |
Worse | +0.062 |
Percent | +0.061 |
Millions | +0.060 |
Neg logit contributions | |
blogs | -0.155 |
reading | -0.155 |
learning | -0.155 |
monitor | -0.154 |
thanking | -0.152 |
Token | member |
Token ID | 2888 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
learning | +0.258 |
reading | +0.258 |
blogs | +0.257 |
monitor | +0.254 |
thanking | +0.247 |
Neg logit contributions | |
Percentage | -0.366 |
Killed | -0.335 |
Worse | -0.335 |
Percent | -0.330 |
Millions | -0.330 |
Token | is |
Token ID | 318 |
Feature activation | +8.42e+00 |
Pos logit contributions | |
Percentage | +6.300 |
Killed | +5.773 |
Worse | +5.661 |
Only | +5.614 |
Millions | +5.525 |
Neg logit contributions | |
reading | -6.071 |
learning | -6.064 |
blogs | -6.015 |
monitor | -5.983 |
forums | -5.704 |
Token | up |
Token ID | 510 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
Percentage | +8.992 |
Killed | +8.378 |
Worse | +8.167 |
Only | +8.061 |
Millions | +7.845 |
Neg logit contributions | |
reading | -7.766 |
blogs | -7.751 |
learning | -7.684 |
monitor | -7.580 |
forums | -7.347 |
Token | for |
Token ID | 329 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
Percentage | +1.191 |
Killed | +1.082 |
Worse | +1.072 |
Percent | +1.056 |
Only | +1.055 |
Neg logit contributions | |
blogs | -1.129 |
learning | -1.128 |
reading | -1.127 |
monitor | -1.116 |
thanking | -1.087 |
Token | discussion |
Token ID | 5114 |
Feature activation | -4.06e+00 |
Pos logit contributions | |
Percentage | +0.198 |
Killed | +0.180 |
Worse | +0.180 |
Percent | +0.177 |
Millions | +0.177 |
Neg logit contributions | |
reading | -0.158 |
learning | -0.158 |
blogs | -0.158 |
monitor | -0.156 |
thanking | -0.152 |
Token | ( |
Token ID | 357 |
Feature activation | -1.57e+01 |
Pos logit contributions | |
reading | +4.790 |
learning | +4.789 |
blogs | +4.779 |
monitor | +4.740 |
thanking | +4.682 |
Neg logit contributions | |
Percentage | -3.490 |
Worse | -3.073 |
Killed | -3.066 |
Percent | -3.019 |
Millions | -3.011 |
Token | even |
Token ID | 10197 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
reading | +15.552 |
learning | +15.525 |
blogs | +15.233 |
monitor | +15.197 |
via | +14.704 |
Neg logit contributions | |
Percentage | -14.341 |
Worse | -12.677 |
Percent | -12.671 |
Millions | -12.653 |
Killed | -12.637 |
Token | mang |
Token ID | 45663 |
Feature activation | -3.34e-01 |
Pos logit contributions | |
learning | +3.147 |
reading | +3.146 |
blogs | +3.137 |
monitor | +3.101 |
thanking | +3.034 |
Neg logit contributions | |
Percentage | -4.780 |
Killed | -4.375 |
Worse | -4.367 |
Percent | -4.321 |
Millions | -4.316 |
Token | achu |
Token ID | 32323 |
Feature activation | +9.24e-01 |
Pos logit contributions | |
learning | +0.262 |
reading | +0.262 |
blogs | +0.261 |
monitor | +0.258 |
thanking | +0.251 |
Neg logit contributions | |
Percentage | -0.422 |
Killed | -0.388 |
Worse | -0.387 |
Percent | -0.382 |
Millions | -0.382 |
Token | or |
Token ID | 393 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
Percentage | +0.947 |
Killed | +0.857 |
Worse | +0.851 |
Only | +0.840 |
Percent | +0.837 |
Neg logit contributions | |
reading | -0.940 |
learning | -0.940 |
blogs | -0.936 |
monitor | -0.931 |
thanking | -0.903 |
Token | bre |
Token ID | 1449 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
learning | +3.417 |
reading | +3.416 |
blogs | +3.400 |
monitor | +3.380 |
thanking | +3.329 |
Neg logit contributions | |
Percentage | -2.841 |
Killed | -2.509 |
Worse | -2.507 |
Millions | -2.473 |
Percent | -2.470 |
Token | or |
Token ID | 393 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
blogs | +14.342 |
learning | +14.239 |
reading | +14.233 |
chatting | +14.104 |
thanking | +14.088 |
Neg logit contributions | |
Percentage | -9.803 |
Worse | -8.635 |
Killed | -8.625 |
Percent | -8.463 |
Millions | -8.176 |
Token | talked |
Token ID | 6619 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
chatting | +23.486 |
blogs | +23.433 |
reading | +23.224 |
thanking | +23.176 |
learning | +22.592 |
Neg logit contributions | |
Percentage | -13.516 |
サーティワン | -11.619 |
Percent | -11.061 |
Worse | -10.691 |
Killed | -10.613 |
Token | to |
Token ID | 284 |
Feature activation | -1.00e+01 |
Pos logit contributions | |
reading | +8.930 |
blogs | +8.891 |
learning | +8.888 |
chatting | +8.820 |
monitor | +8.782 |
Neg logit contributions | |
Percentage | -10.925 |
Killed | -9.905 |
Worse | -9.860 |
Percent | -9.813 |
Millions | -9.649 |
Token | me |
Token ID | 502 |
Feature activation | -1.70e+01 |
Pos logit contributions | |
blogs | +9.880 |
reading | +9.739 |
learning | +9.733 |
chatting | +9.628 |
thanking | +9.575 |
Neg logit contributions | |
Percentage | -9.716 |
Killed | -8.632 |
Worse | -8.607 |
Percent | -8.538 |
Millions | -8.289 |
Token | in |
Token ID | 287 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
blogs | +16.573 |
chatting | +16.443 |
thanking | +16.233 |
reading | +16.173 |
learning | +16.088 |
Neg logit contributions | |
Percentage | -14.550 |
Worse | -13.061 |
Killed | -13.006 |
Percent | -12.773 |
Millions | -12.310 |
Token | person |
Token ID | 1048 |
Feature activation | -1.63e+01 |
Pos logit contributions | |
blogs | +21.200 |
chatting | +21.200 |
reading | +21.092 |
learning | +20.808 |
thanking | +20.582 |
Neg logit contributions | |
Percentage | -14.916 |
Killed | -12.621 |
Percent | -12.577 |
サーティワン | -12.533 |
Worse | -12.450 |
Token | , |
Token ID | 11 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
thanking | +17.788 |
chatting | +17.763 |
blogs | +17.708 |
learning | +17.644 |
reading | +17.586 |
Neg logit contributions | |
Percentage | -11.875 |
Worse | -10.508 |
Percent | -10.425 |
Killed | -10.395 |
Millions | -9.873 |
Token | you |
Token ID | 345 |
Feature activation | -8.05e+00 |
Pos logit contributions | |
learning | +20.072 |
blogs | +19.924 |
reading | +19.891 |
monitor | +19.508 |
thanking | +19.432 |
Neg logit contributions | |
Percentage | -15.028 |
Worse | -13.300 |
Killed | -13.239 |
Percent | -12.993 |
Millions | -12.430 |
Token | probably |
Token ID | 2192 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
blogs | +7.256 |
learning | +7.201 |
reading | +7.163 |
monitor | +7.068 |
thanking | +6.824 |
Neg logit contributions | |
Percentage | -8.968 |
Worse | -8.099 |
Killed | -8.066 |
Percent | -8.044 |
Millions | -7.843 |
Token | know |
Token ID | 760 |
Feature activation | -3.47e+00 |
Pos logit contributions | |
learning | +1.176 |
reading | +1.175 |
blogs | +1.172 |
monitor | +1.158 |
thanking | +1.125 |
Neg logit contributions | |
Percentage | -1.901 |
Killed | -1.745 |
Worse | -1.744 |
Percent | -1.723 |
Millions | -1.719 |
Token | that |
Token ID | 326 |
Feature activation | -3.86e+00 |
Pos logit contributions | |
reading | +3.193 |
blogs | +3.184 |
learning | +3.183 |
monitor | +3.131 |
thanking | +3.097 |
Neg logit contributions | |
Percentage | -3.861 |
Worse | -3.515 |
Killed | -3.510 |
Percent | -3.456 |
Millions | -3.445 |
Token | D |
Token ID | 360 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
Percentage | +6.238 |
Killed | +5.558 |
Worse | +5.514 |
Only | +5.464 |
Millions | +5.448 |
Neg logit contributions | |
blogs | -8.588 |
learning | -8.562 |
reading | -8.528 |
monitor | -8.503 |
thanking | -8.369 |
Token | yer |
Token ID | 9860 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
reading | +3.644 |
learning | +3.619 |
blogs | +3.600 |
monitor | +3.585 |
thanking | +3.475 |
Neg logit contributions | |
Percentage | -4.827 |
Worse | -4.387 |
Killed | -4.384 |
Percent | -4.325 |
Millions | -4.318 |
Token | , |
Token ID | 11 |
Feature activation | -1.32e+01 |
Pos logit contributions | |
Percentage | +0.106 |
Killed | +0.095 |
Worse | +0.095 |
Percent | +0.093 |
Millions | +0.093 |
Neg logit contributions | |
reading | -0.115 |
learning | -0.114 |
blogs | -0.114 |
monitor | -0.113 |
thanking | -0.111 |
Token | from |
Token ID | 422 |
Feature activation | -4.43e+00 |
Pos logit contributions | |
learning | +13.137 |
thanking | +13.061 |
blogs | +13.057 |
reading | +12.961 |
chatting | +12.917 |
Neg logit contributions | |
Percentage | -11.518 |
Worse | -10.354 |
Millions | -10.326 |
Killed | -10.278 |
Percent | -10.209 |
Token | RM |
Token ID | 29820 |
Feature activation | -3.18e+00 |
Pos logit contributions | |
learning | +4.725 |
reading | +4.706 |
blogs | +4.684 |
monitor | +4.638 |
thanking | +4.571 |
Neg logit contributions | |
Percentage | -4.263 |
Worse | -3.802 |
Killed | -3.801 |
Percent | -3.746 |
Millions | -3.730 |
Token | IT |
Token ID | 2043 |
Feature activation | -3.97e+00 |
Pos logit contributions | |
reading | +1.971 |
learning | +1.961 |
blogs | +1.929 |
monitor | +1.907 |
thanking | +1.876 |
Neg logit contributions | |
Percentage | -4.506 |
Killed | -4.195 |
Worse | -4.180 |
Percent | -4.142 |
Millions | -4.130 |
Token | University |
Token ID | 2059 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
learning | +4.212 |
reading | +4.208 |
blogs | +4.187 |
monitor | +4.158 |
thanking | +4.096 |
Neg logit contributions | |
Percentage | -3.878 |
Worse | -3.471 |
Killed | -3.462 |
Percent | -3.406 |
Millions | -3.385 |
Token | , |
Token ID | 11 |
Feature activation | -1.39e+01 |
Pos logit contributions | |
learning | +1.864 |
reading | +1.860 |
blogs | +1.854 |
monitor | +1.841 |
thanking | +1.813 |
Neg logit contributions | |
Percentage | -1.447 |
Worse | -1.283 |
Killed | -1.279 |
Percent | -1.257 |
Millions | -1.252 |
Token | said |
Token ID | 531 |
Feature activation | -1.99e-01 |
Pos logit contributions | |
learning | +14.748 |
blogs | +14.729 |
reading | +14.598 |
thanking | +14.508 |
monitor | +14.424 |
Neg logit contributions | |
Percentage | -11.187 |
Worse | -10.081 |
Killed | -9.822 |
Percent | -9.809 |
Millions | -9.750 |
Token | the |
Token ID | 262 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
reading | +0.205 |
learning | +0.204 |
blogs | +0.204 |
monitor | +0.202 |
thanking | +0.197 |
Neg logit contributions | |
Percentage | -0.203 |
Killed | -0.182 |
Worse | -0.182 |
Millions | -0.179 |
Percent | -0.179 |
Token | findings |
Token ID | 6373 |
Feature activation | +5.67e+00 |
Pos logit contributions | |
learning | +1.386 |
reading | +1.384 |
blogs | +1.380 |
monitor | +1.366 |
thanking | +1.330 |
Neg logit contributions | |
Percentage | -1.934 |
Killed | -1.767 |
Worse | -1.765 |
Percent | -1.742 |
Millions | -1.738 |
Token | residents |
Token ID | 5085 |
Feature activation | -5.70e+00 |
Pos logit contributions | |
learning | +1.618 |
reading | +1.616 |
blogs | +1.610 |
monitor | +1.594 |
thanking | +1.561 |
Neg logit contributions | |
Percentage | -1.846 |
Killed | -1.676 |
Worse | -1.672 |
Percent | -1.649 |
Millions | -1.644 |
Token | and |
Token ID | 290 |
Feature activation | -1.19e+01 |
Pos logit contributions | |
learning | +6.280 |
reading | +6.243 |
blogs | +6.216 |
monitor | +6.186 |
thanking | +6.139 |
Neg logit contributions | |
Percentage | -5.170 |
Killed | -4.660 |
Worse | -4.652 |
Percent | -4.586 |
Millions | -4.519 |
Token | other |
Token ID | 584 |
Feature activation | -4.15e+00 |
Pos logit contributions | |
learning | +11.919 |
thanking | +11.768 |
blogs | +11.757 |
reading | +11.738 |
chatting | +11.713 |
Neg logit contributions | |
Percentage | -10.596 |
Killed | -9.621 |
Percent | -9.512 |
Worse | -9.439 |
Millions | -9.308 |
Token | eligible |
Token ID | 8867 |
Feature activation | -3.68e-01 |
Pos logit contributions | |
learning | +3.979 |
reading | +3.955 |
blogs | +3.952 |
monitor | +3.908 |
thanking | +3.846 |
Neg logit contributions | |
Percentage | -4.440 |
Killed | -4.042 |
Worse | -4.027 |
Percent | -3.983 |
Millions | -3.956 |
Token | groups |
Token ID | 2628 |
Feature activation | -3.93e+00 |
Pos logit contributions | |
learning | +0.348 |
reading | +0.347 |
blogs | +0.346 |
monitor | +0.343 |
thanking | +0.335 |
Neg logit contributions | |
Percentage | -0.408 |
Killed | -0.370 |
Worse | -0.369 |
Percent | -0.364 |
Millions | -0.364 |
Token | , |
Token ID | 11 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
learning | +4.425 |
reading | +4.403 |
blogs | +4.397 |
monitor | +4.370 |
thanking | +4.314 |
Neg logit contributions | |
Percentage | -3.563 |
Worse | -3.181 |
Killed | -3.181 |
Percent | -3.129 |
Millions | -3.096 |
Token | like |
Token ID | 588 |
Feature activation | -5.37e+00 |
Pos logit contributions | |
thanking | +24.628 |
blogs | +24.446 |
chatting | +24.148 |
learning | +24.117 |
monitor | +24.063 |
Neg logit contributions | |
Percentage | -14.249 |
サーティワン | -12.952 |
Percent | -12.742 |
Killed | -12.694 |
Worse | -12.533 |
Token | single |
Token ID | 2060 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
learning | +5.210 |
reading | +5.184 |
blogs | +5.162 |
monitor | +5.092 |
thanking | +5.043 |
Neg logit contributions | |
Percentage | -5.644 |
Killed | -5.122 |
Worse | -5.121 |
Percent | -5.053 |
Millions | -5.024 |
Token | mothers |
Token ID | 12289 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
learning | +1.096 |
reading | +1.094 |
blogs | +1.092 |
monitor | +1.080 |
thanking | +1.054 |
Neg logit contributions | |
Percentage | -1.379 |
Killed | -1.255 |
Worse | -1.254 |
Percent | -1.237 |
Millions | -1.234 |
Token | . |
Token ID | 13 |
Feature activation | +2.03e+01 |
Pos logit contributions | |
Percentage | +2.054 |
Killed | +1.852 |
Worse | +1.847 |
Only | +1.826 |
Millions | +1.823 |
Neg logit contributions | |
reading | -1.765 |
learning | -1.759 |
blogs | -1.759 |
monitor | -1.745 |
thanking | -1.689 |
Token |
|
Token ID | 198 |
Feature activation | -9.34e+00 |
Pos logit contributions | |
Percentage | +18.963 |
Only | +17.807 |
Worse | +17.180 |
Millions | +17.045 |
Percent | +16.761 |
Neg logit contributions | |
learning | -17.917 |
reading | -17.809 |
chatting | -17.574 |
monitor | -17.566 |
blogs | -17.548 |
Token | party |
Token ID | 2151 |
Feature activation | -1.17e+01 |
Pos logit contributions | |
reading | +1.904 |
learning | +1.902 |
blogs | +1.889 |
monitor | +1.872 |
thanking | +1.842 |
Neg logit contributions | |
Percentage | -2.518 |
Killed | -2.298 |
Worse | -2.295 |
Percent | -2.261 |
Millions | -2.247 |
Token | ! |
Token ID | 0 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
thanking | +12.409 |
chatting | +12.351 |
learning | +12.295 |
reading | +12.280 |
blogs | +12.133 |
Neg logit contributions | |
Percentage | -10.214 |
Worse | -9.030 |
Killed | -8.950 |
Percent | -8.926 |
Millions | -8.667 |
Token | Friends |
Token ID | 14213 |
Feature activation | -5.24e+00 |
Pos logit contributions | |
Percentage | +1.368 |
Worse | +1.159 |
Killed | +1.158 |
Only | +1.130 |
Millions | +1.129 |
Neg logit contributions | |
reading | -2.990 |
learning | -2.988 |
blogs | -2.987 |
monitor | -2.974 |
thanking | -2.907 |
Token | , |
Token ID | 11 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
blogs | +5.681 |
reading | +5.675 |
learning | +5.651 |
monitor | +5.583 |
thanking | +5.570 |
Neg logit contributions | |
Percentage | -4.910 |
Worse | -4.382 |
Killed | -4.348 |
Percent | -4.314 |
Millions | -4.286 |
Token | family |
Token ID | 1641 |
Feature activation | -8.08e+00 |
Pos logit contributions | |
thanking | +21.725 |
chatting | +21.683 |
blogs | +21.373 |
reading | +21.371 |
learning | +21.088 |
Neg logit contributions | |
Percentage | -13.890 |
サーティワン | -12.061 |
Worse | -12.038 |
Percent | -11.838 |
Killed | -11.667 |
Token | , |
Token ID | 11 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
blogs | +9.412 |
reading | +9.348 |
thanking | +9.335 |
learning | +9.304 |
chatting | +9.270 |
Neg logit contributions | |
Percentage | -6.583 |
Worse | -5.820 |
Killed | -5.762 |
Percent | -5.710 |
Millions | -5.588 |
Token | fighting |
Token ID | 4330 |
Feature activation | -9.01e+00 |
Pos logit contributions | |
thanking | +22.540 |
reading | +22.378 |
chatting | +22.271 |
blogs | +22.125 |
learning | +22.095 |
Neg logit contributions | |
Percentage | -14.907 |
Percent | -12.852 |
Worse | -12.690 |
サーティワン | -12.371 |
Killed | -12.317 |
Token | , |
Token ID | 11 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
blogs | +9.244 |
learning | +9.239 |
reading | +9.187 |
chatting | +9.126 |
thanking | +9.115 |
Neg logit contributions | |
Percentage | -8.546 |
Worse | -7.657 |
Killed | -7.605 |
Percent | -7.501 |
Only | -7.399 |
Token | and |
Token ID | 290 |
Feature activation | -1.59e+01 |
Pos logit contributions | |
chatting | +22.460 |
thanking | +22.311 |
learning | +21.851 |
reading | +21.784 |
blogs | +21.616 |
Neg logit contributions | |
Percentage | -14.257 |
Worse | -12.169 |
Percent | -12.104 |
サーティワン | -11.987 |
Killed | -11.790 |
Token | FO |
Token ID | 11895 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
chatting | +17.271 |
thanking | +17.196 |
learning | +16.893 |
reading | +16.789 |
blogs | +16.772 |
Neg logit contributions | |
Percentage | -12.355 |
Worse | -10.664 |
Percent | -10.606 |
Killed | -10.456 |
サーティワン | -10.428 |
Token | OD |
Token ID | 3727 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
learning | +0.375 |
reading | +0.374 |
blogs | +0.373 |
monitor | +0.369 |
thanking | +0.358 |
Neg logit contributions | |
Percentage | -0.593 |
Killed | -0.544 |
Worse | -0.543 |
Percent | -0.537 |
Millions | -0.537 |
Token | � |
Token ID | 247 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
Percentage | +4.854 |
Worse | +4.098 |
Killed | +4.076 |
Only | +4.076 |
Millions | +4.068 |
Neg logit contributions | |
monitor | -9.108 |
learning | -9.103 |
reading | -9.103 |
blogs | -8.992 |
thanking | -8.911 |
Token | s |
Token ID | 82 |
Feature activation | +7.08e-01 |
Pos logit contributions | |
Percentage | +5.305 |
Killed | +4.781 |
Worse | +4.764 |
Only | +4.729 |
Millions | +4.701 |
Neg logit contributions | |
learning | -5.020 |
reading | -4.981 |
blogs | -4.957 |
monitor | -4.951 |
thanking | -4.873 |
Token | also |
Token ID | 635 |
Feature activation | -6.00e-01 |
Pos logit contributions | |
Percentage | +0.784 |
Killed | +0.711 |
Worse | +0.710 |
Millions | +0.700 |
Percent | +0.699 |
Neg logit contributions | |
learning | -0.668 |
reading | -0.667 |
blogs | -0.664 |
monitor | -0.660 |
thanking | -0.640 |
Token | just |
Token ID | 655 |
Feature activation | -2.74e+00 |
Pos logit contributions | |
learning | +0.564 |
reading | +0.563 |
blogs | +0.561 |
monitor | +0.556 |
thanking | +0.543 |
Neg logit contributions | |
Percentage | -0.667 |
Killed | -0.605 |
Worse | -0.604 |
Percent | -0.596 |
Millions | -0.595 |
Token | enjoyable |
Token ID | 20050 |
Feature activation | -9.32e+00 |
Pos logit contributions | |
learning | +2.589 |
reading | +2.589 |
blogs | +2.582 |
monitor | +2.554 |
thanking | +2.506 |
Neg logit contributions | |
Percentage | -3.018 |
Killed | -2.737 |
Worse | -2.735 |
Percent | -2.696 |
Millions | -2.687 |
Token | , |
Token ID | 11 |
Feature activation | -2.83e+01 |
Pos logit contributions | |
learning | +10.255 |
reading | +10.249 |
chatting | +10.149 |
blogs | +10.133 |
thanking | +9.980 |
Neg logit contributions | |
Percentage | -8.359 |
Worse | -7.486 |
Killed | -7.467 |
Percent | -7.312 |
Millions | -7.302 |
Token | with |
Token ID | 351 |
Feature activation | -8.46e+00 |
Pos logit contributions | |
chatting | +27.737 |
thanking | +27.146 |
learning | +27.086 |
reading | +27.086 |
blogs | +26.665 |
Neg logit contributions | |
Percentage | -16.835 |
Killed | -14.864 |
Worse | -14.790 |
Percent | -14.594 |
サーティワン | -14.493 |
Token | leaflets |
Token ID | 48409 |
Feature activation | -7.99e+00 |
Pos logit contributions | |
blogs | +8.454 |
reading | +8.446 |
learning | +8.422 |
chatting | +8.334 |
thanking | +8.222 |
Neg logit contributions | |
Percentage | -8.418 |
Worse | -7.544 |
Killed | -7.539 |
Percent | -7.452 |
Millions | -7.296 |
Token | from |
Token ID | 422 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
reading | +8.762 |
thanking | +8.693 |
blogs | +8.614 |
learning | +8.605 |
chatting | +8.560 |
Neg logit contributions | |
Percentage | -7.291 |
Killed | -6.522 |
Worse | -6.519 |
Percent | -6.402 |
Millions | -6.352 |
Token | ex |
Token ID | 409 |
Feature activation | -3.02e+00 |
Pos logit contributions | |
learning | +3.416 |
reading | +3.414 |
blogs | +3.412 |
monitor | +3.367 |
thanking | +3.313 |
Neg logit contributions | |
Percentage | -3.513 |
Killed | -3.156 |
Worse | -3.154 |
Percent | -3.107 |
Millions | -3.088 |
Token | - |
Token ID | 12 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
blogs | +3.037 |
learning | +3.033 |
reading | +3.032 |
monitor | +3.000 |
thanking | +2.937 |
Neg logit contributions | |
Percentage | -3.121 |
Killed | -2.812 |
Worse | -2.808 |
Percent | -2.761 |
Millions | -2.752 |
Token | most |
Token ID | 749 |
Feature activation | +4.74e+00 |
Pos logit contributions | |
Percentage | +1.305 |
Killed | +1.179 |
Worse | +1.173 |
Only | +1.160 |
Percent | +1.159 |
Neg logit contributions | |
learning | -1.211 |
reading | -1.209 |
blogs | -1.205 |
monitor | -1.196 |
thanking | -1.163 |
Token | powerful |
Token ID | 3665 |
Feature activation | +4.16e+00 |
Pos logit contributions | |
Percentage | +5.383 |
Killed | +4.934 |
Worse | +4.832 |
Only | +4.832 |
Percent | +4.828 |
Neg logit contributions | |
learning | -4.264 |
reading | -4.260 |
blogs | -4.214 |
monitor | -4.168 |
reader | -3.999 |
Token | and |
Token ID | 290 |
Feature activation | -7.06e+00 |
Pos logit contributions | |
Percentage | +4.983 |
Killed | +4.562 |
Only | +4.508 |
Worse | +4.508 |
Percent | +4.503 |
Neg logit contributions | |
learning | -3.513 |
reading | -3.507 |
blogs | -3.489 |
monitor | -3.452 |
reader | -3.326 |
Token | fastest |
Token ID | 14162 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
learning | +6.143 |
blogs | +6.138 |
reading | +6.122 |
monitor | +6.075 |
thanking | +6.060 |
Neg logit contributions | |
Percentage | -7.919 |
Worse | -7.246 |
Killed | -7.211 |
Millions | -7.070 |
Percent | -7.061 |
Token | off |
Token ID | 572 |
Feature activation | -1.36e+01 |
Pos logit contributions | |
Percentage | +4.533 |
Killed | +4.144 |
Worse | +4.092 |
Only | +4.083 |
Percent | +4.082 |
Neg logit contributions | |
reading | -3.613 |
learning | -3.601 |
blogs | -3.575 |
monitor | -3.562 |
reader | -3.427 |
Token | - |
Token ID | 12 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
blogs | +10.956 |
learning | +10.818 |
reading | +10.766 |
forums | +10.416 |
monitor | +10.331 |
Neg logit contributions | |
Percentage | -14.783 |
Worse | -13.428 |
Killed | -13.283 |
Percent | -13.182 |
Millions | -13.152 |
Token | road |
Token ID | 6344 |
Feature activation | -8.60e+00 |
Pos logit contributions | |
learning | +16.993 |
blogs | +16.856 |
reading | +16.691 |
monitor | +16.572 |
forums | +16.097 |
Neg logit contributions | |
Percentage | -23.687 |
Worse | -21.670 |
Percent | -21.498 |
Killed | -21.168 |
Millions | -21.041 |
Token | pickups |
Token ID | 46462 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
learning | +7.814 |
blogs | +7.804 |
reading | +7.773 |
monitor | +7.677 |
chatting | +7.671 |
Neg logit contributions | |
Percentage | -9.095 |
Worse | -8.298 |
Killed | -8.244 |
Percent | -8.134 |
Millions | -8.079 |
Token | . |
Token ID | 13 |
Feature activation | +1.73e+01 |
Pos logit contributions | |
learning | +2.745 |
reading | +2.738 |
blogs | +2.733 |
monitor | +2.707 |
thanking | +2.665 |
Neg logit contributions | |
Percentage | -2.775 |
Worse | -2.507 |
Killed | -2.496 |
Percent | -2.461 |
Millions | -2.449 |
Token |
|
Token ID | 198 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
Percentage | +15.235 |
Only | +14.247 |
Worse | +13.879 |
Millions | +13.788 |
Killed | +13.717 |
Neg logit contributions | |
learning | -16.842 |
blogs | -16.756 |
monitor | -16.708 |
reading | -16.604 |
chatting | -16.364 |
Token |
|
Token ID | 198 |
Feature activation | -9.60e+00 |
Pos logit contributions | |
reading | +13.517 |
learning | +13.260 |
blogs | +13.206 |
monitor | +13.152 |
via | +13.035 |
Neg logit contributions | |
Percentage | -8.067 |
サーティワン | -7.294 |
Percent | -6.987 |
Worse | -6.987 |
Killed | -6.883 |
Token | spread |
Token ID | 4104 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
Percentage | +1.597 |
Worse | +1.459 |
Killed | +1.453 |
Percent | +1.436 |
Only | +1.435 |
Neg logit contributions | |
learning | -1.164 |
reading | -1.154 |
blogs | -1.154 |
monitor | -1.146 |
thanking | -1.106 |
Token | in |
Token ID | 287 |
Feature activation | -5.62e+00 |
Pos logit contributions | |
reading | +3.050 |
learning | +3.046 |
blogs | +3.036 |
monitor | +3.012 |
thanking | +2.952 |
Neg logit contributions | |
Percentage | -2.859 |
Killed | -2.570 |
Worse | -2.567 |
Percent | -2.526 |
Millions | -2.515 |
Token | the |
Token ID | 262 |
Feature activation | -5.27e+00 |
Pos logit contributions | |
blogs | +5.745 |
reading | +5.742 |
learning | +5.722 |
monitor | +5.647 |
thanking | +5.619 |
Neg logit contributions | |
Percentage | -5.597 |
Killed | -5.053 |
Worse | -5.028 |
Percent | -4.954 |
Millions | -4.887 |
Token | International |
Token ID | 4037 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
reading | +5.534 |
blogs | +5.520 |
learning | +5.496 |
monitor | +5.453 |
thanking | +5.385 |
Neg logit contributions | |
Percentage | -5.127 |
Killed | -4.598 |
Worse | -4.594 |
Percent | -4.530 |
Millions | -4.436 |
Token | League |
Token ID | 4041 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
learning | +1.155 |
reading | +1.153 |
blogs | +1.150 |
monitor | +1.141 |
thanking | +1.118 |
Neg logit contributions | |
Percentage | -1.054 |
Killed | -0.950 |
Worse | -0.948 |
Percent | -0.930 |
Millions | -0.925 |
Token | , |
Token ID | 11 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
learning | +2.899 |
reading | +2.896 |
blogs | +2.890 |
monitor | +2.869 |
thanking | +2.821 |
Neg logit contributions | |
Percentage | -2.133 |
Killed | -1.886 |
Worse | -1.876 |
Percent | -1.847 |
Millions | -1.837 |
Token | on |
Token ID | 319 |
Feature activation | -6.99e+00 |
Pos logit contributions | |
chatting | +25.813 |
thanking | +25.582 |
reading | +24.908 |
monitor | +24.881 |
blogs | +24.747 |
Neg logit contributions | |
Percentage | -14.296 |
Killed | -12.563 |
サーティワン | -12.413 |
Percent | -12.260 |
Worse | -12.231 |
Token | this |
Token ID | 428 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
reading | +7.280 |
blogs | +7.273 |
learning | +7.253 |
monitor | +7.153 |
chatting | +7.053 |
Neg logit contributions | |
Percentage | -6.790 |
Killed | -6.143 |
Worse | -6.068 |
Percent | -5.979 |
Millions | -5.948 |
Token | night |
Token ID | 1755 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
learning | +0.339 |
reading | +0.338 |
blogs | +0.337 |
monitor | +0.334 |
thanking | +0.324 |
Neg logit contributions | |
Percentage | -0.452 |
Killed | -0.412 |
Worse | -0.412 |
Percent | -0.407 |
Millions | -0.406 |
Token | beef |
Token ID | 12023 |
Feature activation | -7.10e-01 |
Pos logit contributions | |
Percentage | +3.050 |
Worse | +2.713 |
Killed | +2.708 |
Only | +2.679 |
Millions | +2.673 |
Neg logit contributions | |
learning | -3.562 |
reading | -3.553 |
blogs | -3.553 |
monitor | -3.535 |
thanking | -3.431 |
Token | tips |
Token ID | 9040 |
Feature activation | +9.49e-02 |
Pos logit contributions | |
learning | +0.598 |
reading | +0.597 |
blogs | +0.596 |
monitor | +0.590 |
thanking | +0.574 |
Neg logit contributions | |
Percentage | -0.858 |
Killed | -0.784 |
Worse | -0.783 |
Percent | -0.773 |
Millions | -0.772 |