Token | treaties |
Token ID | 30734 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
Adds | +4.916 |
Breach | +4.182 |
letters | +3.896 |
arrivals | +3.798 |
oa | +3.757 |
Neg logit contributions | |
intend | -5.982 |
Compton | -5.962 |
percentile | -5.739 |
adelphia | -5.614 |
totality | -5.581 |
Token | , |
Token ID | 11 |
Feature activation | +2.73e+00 |
Pos logit contributions | |
Adds | +1.939 |
Breach | +1.713 |
oa | +1.560 |
letters | +1.557 |
̶ | +1.547 |
Neg logit contributions | |
intend | -1.956 |
Compton | -1.923 |
percentile | -1.922 |
totality | -1.849 |
adelphia | -1.794 |
Token | undermined |
Token ID | 31256 |
Feature activation | -4.64e-01 |
Pos logit contributions | |
Adds | +2.024 |
Breach | +1.797 |
oa | +1.651 |
letters | +1.642 |
̶ | +1.625 |
Neg logit contributions | |
intend | -1.847 |
Compton | -1.812 |
percentile | -1.802 |
totality | -1.732 |
adelphia | -1.680 |
Token | the |
Token ID | 262 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
intend | +0.318 |
Compton | +0.317 |
percentile | +0.317 |
totality | +0.305 |
adelphia | +0.291 |
Neg logit contributions | |
Adds | -0.340 |
Breach | -0.299 |
oa | -0.275 |
letters | -0.275 |
̶ | -0.270 |
Token | International |
Token ID | 4037 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
intend | +0.701 |
Compton | +0.696 |
percentile | +0.695 |
totality | +0.672 |
adelphia | +0.635 |
Neg logit contributions | |
Adds | -0.808 |
Breach | -0.705 |
oa | -0.657 |
letters | -0.654 |
̶ | -0.647 |
Token | Criminal |
Token ID | 15531 |
Feature activation | +1.43e+01 |
Pos logit contributions | |
Adds | +1.740 |
Breach | +1.498 |
oa | +1.296 |
letters | +1.293 |
Newsletter | +1.252 |
Neg logit contributions | |
intend | -3.074 |
percentile | -3.017 |
Compton | -3.015 |
totality | -2.941 |
adelphia | -2.865 |
Token | Court |
Token ID | 3078 |
Feature activation | +9.70e+00 |
Pos logit contributions | |
Adds | +6.214 |
Breach | +5.372 |
letters | +4.985 |
ン | +4.489 |
IER | +4.428 |
Neg logit contributions | |
intend | -12.507 |
percentile | -12.320 |
Compton | -12.210 |
totality | -12.079 |
�� | -12.049 |
Token | , |
Token ID | 11 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
Adds | +6.163 |
Breach | +5.580 |
letters | +4.984 |
Newsletter | +4.963 |
IER | +4.961 |
Neg logit contributions | |
intend | -7.073 |
Compton | -6.895 |
percentile | -6.895 |
adelphia | -6.633 |
totality | -6.626 |
Token | insulted |
Token ID | 40102 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
Adds | +1.666 |
Breach | +1.482 |
oa | +1.366 |
letters | +1.349 |
̶ | +1.341 |
Neg logit contributions | |
intend | -1.525 |
Compton | -1.500 |
percentile | -1.492 |
totality | -1.437 |
adelphia | -1.388 |
Token | the |
Token ID | 262 |
Feature activation | -4.87e-01 |
Pos logit contributions | |
intend | +0.234 |
Compton | +0.233 |
percentile | +0.232 |
totality | +0.223 |
adelphia | +0.213 |
Neg logit contributions | |
Adds | -0.243 |
Breach | -0.214 |
oa | -0.196 |
letters | -0.195 |
̶ | -0.193 |
Token | United |
Token ID | 1578 |
Feature activation | +9.86e-01 |
Pos logit contributions | |
intend | +0.332 |
Compton | +0.331 |
percentile | +0.330 |
totality | +0.319 |
adelphia | +0.302 |
Neg logit contributions | |
Adds | -0.359 |
Breach | -0.314 |
oa | -0.291 |
letters | -0.289 |
̶ | -0.287 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
intend | +0.519 |
Compton | +0.518 |
percentile | +0.511 |
totality | +0.493 |
adelphia | +0.469 |
Neg logit contributions | |
Adds | -0.604 |
Breach | -0.535 |
letters | -0.491 |
oa | -0.491 |
IER | -0.484 |
Token | National |
Token ID | 2351 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
Adds | +0.711 |
Breach | +0.618 |
oa | +0.563 |
letters | +0.563 |
̶ | +0.556 |
Neg logit contributions | |
intend | -0.784 |
Compton | -0.780 |
percentile | -0.773 |
totality | -0.747 |
adelphia | -0.718 |
Token | Ocean |
Token ID | 10692 |
Feature activation | +4.17e+00 |
Pos logit contributions | |
Adds | +1.806 |
Breach | +1.583 |
oa | +1.427 |
letters | +1.422 |
Newsletter | +1.395 |
Neg logit contributions | |
intend | -2.184 |
percentile | -2.152 |
Compton | -2.149 |
totality | -2.079 |
adelphia | -2.015 |
Token | ic |
Token ID | 291 |
Feature activation | +3.88e+00 |
Pos logit contributions | |
Adds | +3.339 |
Breach | +3.068 |
oa | +2.864 |
letters | +2.838 |
Newsletter | +2.802 |
Neg logit contributions | |
intend | -2.505 |
Compton | -2.456 |
percentile | -2.447 |
totality | -2.372 |
adelphia | -2.261 |
Token | and |
Token ID | 290 |
Feature activation | +6.17e+00 |
Pos logit contributions | |
Adds | +2.762 |
Breach | +2.481 |
oa | +2.286 |
letters | +2.246 |
Newsletter | +2.234 |
Neg logit contributions | |
intend | -2.686 |
percentile | -2.651 |
Compton | -2.645 |
totality | -2.555 |
adelphia | -2.468 |
Token | Atmospheric |
Token ID | 41516 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
Adds | +3.890 |
Breach | +3.590 |
oa | +3.231 |
Newsletter | +3.216 |
artisan | +3.106 |
Neg logit contributions | |
intend | -4.630 |
percentile | -4.530 |
totality | -4.440 |
Compton | -4.439 |
adelphia | -4.333 |
Token | Administration |
Token ID | 8694 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
Adds | +5.451 |
Breach | +5.023 |
oa | +4.434 |
artisan | +4.333 |
Newsletter | +4.200 |
Neg logit contributions | |
intend | -12.154 |
percentile | -11.924 |
adelphia | -11.866 |
Compton | -11.814 |
totality | -11.715 |
Token | � |
Token ID | 447 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
Adds | +2.017 |
Breach | +1.789 |
oa | +1.642 |
letters | +1.633 |
Newsletter | +1.613 |
Neg logit contributions | |
intend | -1.924 |
percentile | -1.899 |
Compton | -1.894 |
totality | -1.822 |
adelphia | -1.757 |
Token | � |
Token ID | 247 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
Adds | +1.443 |
Breach | +1.302 |
letters | +1.210 |
oa | +1.209 |
̶ | +1.198 |
Neg logit contributions | |
intend | -0.952 |
Compton | -0.934 |
percentile | -0.928 |
totality | -0.887 |
adelphia | -0.844 |
Token | s |
Token ID | 82 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
Adds | +1.310 |
Breach | +1.110 |
oa | +0.986 |
letters | +0.979 |
̶ | +0.960 |
Neg logit contributions | |
intend | -2.071 |
Compton | -2.051 |
percentile | -2.050 |
totality | -1.986 |
adelphia | -1.928 |
Token | National |
Token ID | 2351 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Adds | +1.348 |
Breach | +1.184 |
oa | +1.081 |
letters | +1.076 |
̶ | +1.061 |
Neg logit contributions | |
intend | -1.411 |
Compton | -1.394 |
percentile | -1.391 |
totality | -1.339 |
adelphia | -1.292 |
Token | . |
Token ID | 13 |
Feature activation | -2.52e+00 |
Pos logit contributions | |
intend | +1.810 |
Compton | +1.772 |
percentile | +1.759 |
adelphia | +1.660 |
totality | +1.644 |
Neg logit contributions | |
Adds | -2.262 |
Breach | -2.039 |
artisan | -1.859 |
oa | -1.858 |
̶ | -1.851 |
Token | S |
Token ID | 50 |
Feature activation | -3.04e+00 |
Pos logit contributions | |
intend | +1.934 |
Compton | +1.915 |
percentile | +1.906 |
totality | +1.808 |
adelphia | +1.782 |
Neg logit contributions | |
Adds | -1.604 |
Breach | -1.410 |
oa | -1.279 |
artisan | -1.273 |
letters | -1.261 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
intend | +1.946 |
Compton | +1.923 |
percentile | +1.908 |
totality | +1.809 |
adelphia | +1.749 |
Neg logit contributions | |
Adds | -2.348 |
Breach | -2.090 |
oa | -1.927 |
̶ | -1.918 |
letters | -1.917 |
Token | Immigration |
Token ID | 18204 |
Feature activation | +5.53e+00 |
Pos logit contributions | |
intend | +0.944 |
Compton | +0.929 |
percentile | +0.922 |
totality | +0.889 |
adelphia | +0.858 |
Neg logit contributions | |
Adds | -0.871 |
Breach | -0.762 |
oa | -0.694 |
letters | -0.690 |
̶ | -0.689 |
Token | and |
Token ID | 290 |
Feature activation | +1.01e+01 |
Pos logit contributions | |
Adds | +3.846 |
Breach | +3.450 |
letters | +3.153 |
oa | +3.148 |
Newsletter | +3.083 |
Neg logit contributions | |
intend | -3.840 |
percentile | -3.813 |
Compton | -3.806 |
totality | -3.720 |
adelphia | -3.544 |
Token | Customs |
Token ID | 23888 |
Feature activation | +1.35e+01 |
Pos logit contributions | |
Adds | +2.903 |
Breach | +2.624 |
oa | +2.031 |
letters | +1.969 |
arrivals | +1.923 |
Neg logit contributions | |
intend | -10.464 |
percentile | -10.286 |
totality | -10.233 |
Compton | -10.215 |
adelphia | -10.182 |
Token | Enforcement |
Token ID | 19198 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
Adds | +6.157 |
Breach | +5.736 |
oa | +4.941 |
Newsletter | +4.927 |
ales | +4.918 |
Neg logit contributions | |
percentile | -11.291 |
intend | -10.993 |
totality | -10.912 |
�� | -10.836 |
Compton | -10.770 |
Token | and |
Token ID | 290 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
Adds | +2.225 |
Breach | +1.997 |
letters | +1.821 |
oa | +1.820 |
Newsletter | +1.797 |
Neg logit contributions | |
intend | -2.285 |
percentile | -2.247 |
Compton | -2.242 |
totality | -2.163 |
adelphia | -2.093 |
Token | the |
Token ID | 262 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
Adds | +2.698 |
Breach | +2.424 |
oa | +2.206 |
letters | +2.197 |
IER | +2.154 |
Neg logit contributions | |
intend | -2.671 |
percentile | -2.626 |
Compton | -2.585 |
totality | -2.504 |
adelphia | -2.435 |
Token | U |
Token ID | 471 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
Adds | +1.199 |
Breach | +1.065 |
oa | +0.974 |
letters | +0.968 |
IER | +0.953 |
Neg logit contributions | |
intend | -1.162 |
percentile | -1.143 |
Compton | -1.141 |
totality | -1.095 |
adelphia | -1.059 |
Token | . |
Token ID | 13 |
Feature activation | -8.89e-01 |
Pos logit contributions | |
intend | +2.124 |
Compton | +2.089 |
percentile | +2.070 |
totality | +1.929 |
adelphia | +1.915 |
Neg logit contributions | |
Adds | -2.619 |
Breach | -2.341 |
oa | -2.147 |
artisan | -2.144 |
letters | -2.135 |
Token | also |
Token ID | 635 |
Feature activation | -5.54e-01 |
Pos logit contributions | |
Compton | +2.327 |
intend | +2.294 |
percentile | +2.293 |
totality | +2.236 |
adelphia | +2.128 |
Neg logit contributions | |
Adds | -2.328 |
Breach | -2.082 |
letters | -1.922 |
artisan | -1.907 |
IER | -1.897 |
Token | brought |
Token ID | 3181 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
intend | +0.430 |
Compton | +0.426 |
percentile | +0.425 |
totality | +0.410 |
adelphia | +0.396 |
Neg logit contributions | |
Adds | -0.355 |
Breach | -0.309 |
oa | -0.279 |
letters | -0.278 |
IER | -0.274 |
Token | Joe |
Token ID | 5689 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
Adds | +1.908 |
Breach | +1.687 |
oa | +1.556 |
letters | +1.539 |
̶ | +1.523 |
Neg logit contributions | |
intend | -1.752 |
percentile | -1.715 |
Compton | -1.698 |
totality | -1.643 |
adelphia | -1.582 |
Token | N |
Token ID | 399 |
Feature activation | -6.38e+00 |
Pos logit contributions | |
Adds | +2.031 |
Breach | +1.850 |
oa | +1.685 |
Newsletter | +1.658 |
̶ | +1.651 |
Neg logit contributions | |
intend | -1.764 |
percentile | -1.728 |
totality | -1.699 |
Compton | -1.677 |
adelphia | -1.590 |
Token | ieu |
Token ID | 22304 |
Feature activation | +6.25e+00 |
Pos logit contributions | |
intend | +3.329 |
percentile | +3.121 |
Compton | +3.074 |
ocl | +2.747 |
adelphia | +2.725 |
Neg logit contributions | |
Adds | -5.731 |
Breach | -5.286 |
letters | -4.893 |
Newsletter | -4.883 |
*/( | -4.809 |
Token | w |
Token ID | 86 |
Feature activation | +1.34e+01 |
Pos logit contributions | |
Adds | +4.983 |
Breach | +4.489 |
oa | +4.267 |
letters | +4.182 |
Newsletter | +4.142 |
Neg logit contributions | |
intend | -3.732 |
percentile | -3.726 |
Compton | -3.635 |
totality | -3.618 |
adelphia | -3.422 |
Token | end |
Token ID | 437 |
Feature activation | +3.82e+00 |
Pos logit contributions | |
Adds | +5.314 |
Breach | +4.593 |
oa | +4.586 |
letters | +4.135 |
ales | +3.914 |
Neg logit contributions | |
totality | -12.263 |
percentile | -12.235 |
intend | -12.154 |
Compton | -11.634 |
adelphia | -11.624 |
Token | yk |
Token ID | 48361 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
Adds | +2.696 |
Breach | +2.394 |
oa | +2.228 |
letters | +2.171 |
artisan | +2.148 |
Neg logit contributions | |
intend | -2.724 |
Compton | -2.661 |
percentile | -2.657 |
totality | -2.587 |
adelphia | -2.474 |
Token | to |
Token ID | 284 |
Feature activation | +3.62e+00 |
Pos logit contributions | |
Adds | +2.570 |
Breach | +2.246 |
oa | +2.106 |
̶ | +2.065 |
letters | +2.059 |
Neg logit contributions | |
intend | -2.538 |
percentile | -2.504 |
Compton | -2.476 |
totality | -2.405 |
adelphia | -2.302 |
Token | the |
Token ID | 262 |
Feature activation | +3.44e+00 |
Pos logit contributions | |
Adds | +2.752 |
Breach | +2.441 |
oa | +2.262 |
letters | +2.218 |
Newsletter | +2.209 |
Neg logit contributions | |
intend | -2.391 |
percentile | -2.350 |
Compton | -2.299 |
totality | -2.213 |
adelphia | -2.123 |
Token | Devils |
Token ID | 26199 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Adds | +2.699 |
Breach | +2.445 |
oa | +2.249 |
letters | +2.215 |
Newsletter | +2.197 |
Neg logit contributions | |
intend | -2.170 |
percentile | -2.118 |
Compton | -2.099 |
totality | -2.011 |
adelphia | -1.928 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
intend | +0.996 |
Compton | +0.982 |
percentile | +0.972 |
totality | +0.906 |
adelphia | +0.904 |
Neg logit contributions | |
Adds | -1.228 |
Breach | -1.104 |
artisan | -1.011 |
letters | -1.007 |
oa | -1.006 |
Token | S |
Token ID | 50 |
Feature activation | -4.65e+00 |
Pos logit contributions | |
intend | +1.026 |
Compton | +1.015 |
percentile | +1.013 |
totality | +0.965 |
adelphia | +0.945 |
Neg logit contributions | |
Adds | -0.829 |
Breach | -0.726 |
oa | -0.657 |
artisan | -0.650 |
letters | -0.650 |
Token | . |
Token ID | 13 |
Feature activation | -7.35e-01 |
Pos logit contributions | |
intend | +2.834 |
Compton | +2.821 |
percentile | +2.799 |
totality | +2.604 |
adelphia | +2.533 |
Neg logit contributions | |
Adds | -3.673 |
Breach | -3.279 |
̶ | -3.051 |
artisan | -3.039 |
oa | -3.027 |
Token | Immigration |
Token ID | 18204 |
Feature activation | +4.33e+00 |
Pos logit contributions | |
intend | +0.526 |
Compton | +0.519 |
percentile | +0.517 |
totality | +0.497 |
adelphia | +0.479 |
Neg logit contributions | |
Adds | -0.518 |
Breach | -0.455 |
oa | -0.416 |
letters | -0.415 |
̶ | -0.412 |
Token | and |
Token ID | 290 |
Feature activation | +9.10e+00 |
Pos logit contributions | |
Adds | +3.114 |
Breach | +2.786 |
oa | +2.550 |
letters | +2.539 |
Newsletter | +2.497 |
Neg logit contributions | |
intend | -2.963 |
Compton | -2.933 |
percentile | -2.925 |
totality | -2.832 |
adelphia | -2.720 |
Token | Customs |
Token ID | 23888 |
Feature activation | +1.31e+01 |
Pos logit contributions | |
Adds | +3.013 |
Breach | +2.703 |
oa | +2.150 |
letters | +2.041 |
Newsletter | +1.944 |
Neg logit contributions | |
intend | -9.194 |
percentile | -9.022 |
totality | -8.993 |
Compton | -8.956 |
adelphia | -8.927 |
Token | Enforcement |
Token ID | 19198 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
Adds | +6.149 |
Breach | +5.893 |
letters | +4.996 |
ales | +4.918 |
Newsletter | +4.905 |
Neg logit contributions | |
percentile | -10.593 |
intend | -10.399 |
totality | -10.344 |
adelphia | -10.280 |
�� | -10.272 |
Token | forb |
Token ID | 11747 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Adds | +0.918 |
Breach | +0.813 |
oa | +0.744 |
letters | +0.740 |
Newsletter | +0.730 |
Neg logit contributions | |
intend | -0.909 |
percentile | -0.895 |
Compton | -0.894 |
totality | -0.860 |
adelphia | -0.830 |
Token | ade |
Token ID | 671 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
Adds | +0.728 |
Breach | +0.631 |
oa | +0.573 |
letters | +0.569 |
̶ | +0.559 |
Neg logit contributions | |
intend | -0.917 |
Compton | -0.910 |
percentile | -0.907 |
totality | -0.881 |
adelphia | -0.845 |
Token | his |
Token ID | 465 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
intend | +0.987 |
Compton | +0.986 |
percentile | +0.976 |
totality | +0.947 |
adelphia | +0.905 |
Neg logit contributions | |
Adds | -0.912 |
Breach | -0.795 |
oa | -0.724 |
letters | -0.723 |
̶ | -0.721 |
Token | release |
Token ID | 2650 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
intend | +0.152 |
Compton | +0.150 |
percentile | +0.150 |
totality | +0.144 |
adelphia | +0.139 |
Neg logit contributions | |
Adds | -0.143 |
Breach | -0.125 |
oa | -0.114 |
letters | -0.114 |
̶ | -0.113 |
Token | AM |
Token ID | 2390 |
Feature activation | -3.51e+00 |
Pos logit contributions | |
Adds | +3.100 |
Breach | +2.727 |
IER | +2.544 |
oa | +2.525 |
letters | +2.506 |
Neg logit contributions | |
intend | -2.877 |
percentile | -2.828 |
Compton | -2.814 |
totality | -2.776 |
adelphia | -2.598 |
Token | AR |
Token ID | 1503 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
Compton | +2.389 |
percentile | +2.365 |
intend | +2.357 |
totality | +2.217 |
adelphia | +2.174 |
Neg logit contributions | |
Adds | -2.538 |
Breach | -2.224 |
artisan | -2.078 |
letters | -2.060 |
oa | -2.038 |
Token | Q |
Token ID | 48 |
Feature activation | +5.01e+00 |
Pos logit contributions | |
Adds | +1.020 |
Breach | +0.917 |
oa | +0.852 |
letters | +0.849 |
̶ | +0.840 |
Neg logit contributions | |
intend | -0.717 |
Compton | -0.708 |
percentile | -0.705 |
totality | -0.672 |
adelphia | -0.642 |
Token | UE |
Token ID | 8924 |
Feature activation | +5.64e+00 |
Pos logit contributions | |
Adds | +2.362 |
Breach | +1.943 |
IER | +1.691 |
oa | +1.670 |
letters | +1.655 |
Neg logit contributions | |
intend | -4.764 |
percentile | -4.670 |
Compton | -4.655 |
totality | -4.567 |
adelphia | -4.438 |
Token | / |
Token ID | 14 |
Feature activation | +7.40e+00 |
Pos logit contributions | |
Adds | +4.711 |
Breach | +4.251 |
IER | +3.952 |
oa | +3.898 |
̶ | +3.863 |
Neg logit contributions | |
intend | -3.303 |
percentile | -3.204 |
Compton | -3.145 |
totality | -3.093 |
adelphia | -2.978 |
Token | RE |
Token ID | 2200 |
Feature activation | +1.27e+01 |
Pos logit contributions | |
Adds | +5.094 |
Breach | +4.394 |
letters | +4.049 |
IER | +4.015 |
oa | +3.988 |
Neg logit contributions | |
intend | -5.348 |
percentile | -5.202 |
Compton | -5.133 |
totality | -5.071 |
adelphia | -4.920 |
Token | UTERS |
Token ID | 14974 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
Adds | +1.885 |
IER | +0.417 |
Breach | +0.354 |
PORT | +0.103 |
UTERS | +0.061 |
Neg logit contributions | |
intend | -15.942 |
totality | -15.557 |
percentile | -15.389 |
Compton | -15.282 |
adelphia | -15.152 |
Token | Presidential |
Token ID | 17471 |
Feature activation | -7.41e-02 |
Pos logit contributions | |
Adds | +2.461 |
Breach | +2.196 |
letters | +1.967 |
oa | +1.961 |
IER | +1.928 |
Neg logit contributions | |
intend | -2.738 |
percentile | -2.671 |
Compton | -2.653 |
totality | -2.585 |
adelphia | -2.511 |
Token | candidate |
Token ID | 4540 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
intend | +0.051 |
Compton | +0.050 |
percentile | +0.050 |
totality | +0.048 |
adelphia | +0.047 |
Neg logit contributions | |
Adds | -0.054 |
Breach | -0.048 |
oa | -0.044 |
letters | -0.044 |
̶ | -0.043 |
Token | Senator |
Token ID | 8962 |
Feature activation | -1.96e-01 |
Pos logit contributions | |
intend | +0.931 |
Compton | +0.924 |
percentile | +0.919 |
totality | +0.886 |
adelphia | +0.850 |
Neg logit contributions | |
Adds | -0.977 |
Breach | -0.861 |
oa | -0.789 |
letters | -0.788 |
Newsletter | -0.779 |
Token | Bernie |
Token ID | 10477 |
Feature activation | +9.14e-01 |
Pos logit contributions | |
intend | +0.141 |
Compton | +0.139 |
percentile | +0.139 |
totality | +0.133 |
adelphia | +0.129 |
Neg logit contributions | |
Adds | -0.138 |
Breach | -0.121 |
oa | -0.111 |
letters | -0.110 |
Newsletter | -0.109 |
Token |
|
Token ID | 198 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
Adds | +0.212 |
Breach | +0.189 |
letters | +0.175 |
oa | +0.175 |
Newsletter | +0.172 |
Neg logit contributions | |
intend | -0.164 |
Compton | -0.161 |
percentile | -0.161 |
totality | -0.156 |
adelphia | -0.149 |
Token | Finally |
Token ID | 11158 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
Adds | +0.217 |
Breach | +0.198 |
oa | +0.183 |
letters | +0.182 |
artisan | +0.180 |
Neg logit contributions | |
intend | -0.157 |
Compton | -0.155 |
percentile | -0.153 |
totality | -0.146 |
adelphia | -0.141 |
Token | , |
Token ID | 11 |
Feature activation | +9.30e-01 |
Pos logit contributions | |
Adds | +0.572 |
Breach | +0.505 |
oa | +0.464 |
letters | +0.462 |
̶ | +0.455 |
Neg logit contributions | |
intend | -0.543 |
Compton | -0.538 |
percentile | -0.536 |
totality | -0.516 |
adelphia | -0.495 |
Token | and |
Token ID | 290 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
Adds | +0.696 |
Breach | +0.618 |
oa | +0.568 |
letters | +0.566 |
̶ | +0.559 |
Neg logit contributions | |
intend | -0.622 |
Compton | -0.614 |
percentile | -0.613 |
totality | -0.588 |
adelphia | -0.566 |
Token | most |
Token ID | 749 |
Feature activation | +6.31e+00 |
Pos logit contributions | |
Adds | +0.472 |
Breach | +0.422 |
oa | +0.393 |
letters | +0.392 |
artisan | +0.387 |
Neg logit contributions | |
intend | -0.334 |
Compton | -0.332 |
percentile | -0.330 |
totality | -0.316 |
adelphia | -0.299 |
Token | revealing |
Token ID | 13477 |
Feature activation | +1.26e+01 |
Pos logit contributions | |
Adds | +4.065 |
Breach | +3.574 |
oa | +3.228 |
letters | +3.179 |
IER | +3.172 |
Neg logit contributions | |
intend | -4.741 |
percentile | -4.610 |
Compton | -4.604 |
adelphia | -4.421 |
totality | -4.411 |
Token | ly |
Token ID | 306 |
Feature activation | +7.06e+00 |
Pos logit contributions | |
Adds | +6.813 |
Breach | +6.029 |
oa | +5.552 |
Newsletter | +5.348 |
arrivals | +5.248 |
Neg logit contributions | |
intend | -10.030 |
Compton | -9.498 |
percentile | -9.445 |
adelphia | -9.256 |
laim | -8.974 |
Token | in |
Token ID | 287 |
Feature activation | +3.96e+00 |
Pos logit contributions | |
Adds | +4.540 |
Breach | +3.961 |
oa | +3.643 |
̶ | +3.634 |
Newsletter | +3.625 |
Neg logit contributions | |
intend | -5.325 |
percentile | -5.178 |
Compton | -5.145 |
totality | -4.973 |
adelphia | -4.904 |
Token | my |
Token ID | 616 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
Adds | +2.890 |
Breach | +2.573 |
letters | +2.338 |
oa | +2.336 |
Newsletter | +2.308 |
Neg logit contributions | |
intend | -2.738 |
percentile | -2.661 |
Compton | -2.658 |
totality | -2.523 |
adelphia | -2.501 |
Token | opinion |
Token ID | 4459 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
Adds | +2.052 |
Breach | +1.830 |
oa | +1.676 |
letters | +1.667 |
̶ | +1.644 |
Neg logit contributions | |
intend | -1.892 |
Compton | -1.848 |
percentile | -1.837 |
totality | -1.755 |
adelphia | -1.726 |
Token | , |
Token ID | 11 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
Adds | +3.319 |
Breach | +2.917 |
oa | +2.676 |
̶ | +2.662 |
Newsletter | +2.651 |
Neg logit contributions | |
intend | -3.642 |
percentile | -3.564 |
Compton | -3.546 |
totality | -3.395 |
adelphia | -3.348 |
Token | N |
Token ID | 399 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
Adds | +3.232 |
Breach | +2.890 |
oa | +2.645 |
letters | +2.587 |
Newsletter | +2.550 |
Neg logit contributions | |
intend | -3.411 |
Compton | -3.286 |
percentile | -3.278 |
totality | -3.174 |
adelphia | -3.118 |
Token | f |
Token ID | 69 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Adds | +1.140 |
Breach | +1.007 |
oa | +0.923 |
letters | +0.920 |
̶ | +0.907 |
Neg logit contributions | |
intend | -1.096 |
Compton | -1.082 |
percentile | -1.079 |
totality | -1.037 |
adelphia | -0.999 |
Token | 3 |
Token ID | 18 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
Adds | +0.842 |
Breach | +0.749 |
oa | +0.693 |
letters | +0.686 |
Newsletter | +0.677 |
Neg logit contributions | |
intend | -0.778 |
Compton | -0.769 |
percentile | -0.769 |
totality | -0.745 |
adelphia | -0.713 |
Token | { |
Token ID | 1391 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
Adds | +2.244 |
Breach | +1.993 |
oa | +1.838 |
letters | +1.806 |
Newsletter | +1.779 |
Neg logit contributions | |
intend | -2.228 |
Compton | -2.187 |
percentile | -2.185 |
totality | -2.100 |
adelphia | -2.048 |
Token | ( |
Token ID | 7 |
Feature activation | +3.10e+00 |
Pos logit contributions | |
Adds | +1.332 |
Breach | +1.191 |
oa | +1.124 |
letters | +1.119 |
Newsletter | +1.101 |
Neg logit contributions | |
intend | -0.804 |
percentile | -0.802 |
Compton | -0.795 |
totality | -0.779 |
adelphia | -0.729 |
Token | 0 |
Token ID | 15 |
Feature activation | +1.20e+01 |
Pos logit contributions | |
Adds | +2.196 |
Breach | +1.914 |
oa | +1.776 |
letters | +1.764 |
̶ | +1.740 |
Neg logit contributions | |
intend | -2.191 |
Compton | -2.175 |
percentile | -2.169 |
totality | -2.111 |
adelphia | -2.027 |
Token | s |
Token ID | 82 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
Adds | +4.882 |
Breach | +3.553 |
oa | +3.545 |
letters | +3.540 |
ales | +2.853 |
Neg logit contributions | |
totality | -11.342 |
percentile | -11.226 |
Compton | -11.173 |
intend | -10.953 |
�� | -10.829 |
Token | )} |
Token ID | 38165 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
Adds | +2.463 |
Breach | +2.069 |
oa | +1.883 |
letters | +1.848 |
IER | +1.751 |
Neg logit contributions | |
intend | -3.827 |
percentile | -3.793 |
Compton | -3.765 |
totality | -3.762 |
adelphia | -3.593 |
Token | e |
Token ID | 304 |
Feature activation | +8.23e+00 |
Pos logit contributions | |
Adds | +3.172 |
Breach | +2.843 |
oa | +2.615 |
letters | +2.562 |
Newsletter | +2.516 |
Neg logit contributions | |
intend | -3.197 |
Compton | -3.100 |
percentile | -3.097 |
totality | -2.997 |
adelphia | -2.960 |
Token | 6 |
Token ID | 21 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
Adds | +4.616 |
Breach | +4.064 |
oa | +3.736 |
letters | +3.666 |
̶ | +3.596 |
Neg logit contributions | |
totality | -6.621 |
intend | -6.599 |
percentile | -6.477 |
Compton | -6.427 |
adelphia | -6.242 |
Token | { |
Token ID | 1391 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
Adds | +2.015 |
Breach | +1.783 |
oa | +1.641 |
letters | +1.622 |
Newsletter | +1.598 |
Neg logit contributions | |
intend | -1.966 |
percentile | -1.936 |
Compton | -1.929 |
totality | -1.860 |
adelphia | -1.794 |
Token | The |
Token ID | 383 |
Feature activation | +3.89e+00 |
Pos logit contributions | |
Adds | +1.102 |
Breach | +0.979 |
oa | +0.900 |
letters | +0.896 |
Newsletter | +0.883 |
Neg logit contributions | |
intend | -0.988 |
Compton | -0.973 |
percentile | -0.973 |
totality | -0.933 |
adelphia | -0.897 |
Token | Associated |
Token ID | 10575 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
Adds | +2.547 |
Breach | +2.248 |
letters | +2.031 |
oa | +2.006 |
Newsletter | +1.983 |
Neg logit contributions | |
intend | -2.956 |
percentile | -2.896 |
Compton | -2.866 |
totality | -2.810 |
adelphia | -2.703 |
Token | Press |
Token ID | 4332 |
Feature activation | +5.34e+00 |
Pos logit contributions | |
intend | +1.118 |
Compton | +1.118 |
percentile | +1.111 |
totality | +1.069 |
adelphia | +1.044 |
Neg logit contributions | |
Adds | -0.579 |
Breach | -0.469 |
oa | -0.416 |
̶ | -0.410 |
artisan | -0.408 |
Token | . |
Token ID | 13 |
Feature activation | +6.51e+00 |
Pos logit contributions | |
Adds | +3.566 |
Breach | +3.184 |
letters | +2.957 |
oa | +2.855 |
Newsletter | +2.816 |
Neg logit contributions | |
intend | -3.894 |
Compton | -3.824 |
percentile | -3.796 |
totality | -3.749 |
adelphia | -3.644 |
Token | All |
Token ID | 1439 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
Adds | +4.622 |
Breach | +4.318 |
letters | +3.801 |
Newsletter | +3.772 |
oa | +3.756 |
Neg logit contributions | |
intend | -4.438 |
totality | -4.336 |
percentile | -4.331 |
Compton | -4.198 |
adelphia | -4.088 |
Token | Rights |
Token ID | 6923 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
Adds | +2.820 |
Breach | +2.614 |
letters | +2.292 |
oa | +2.211 |
Newsletter | +2.149 |
Neg logit contributions | |
intend | -4.431 |
percentile | -4.391 |
Compton | -4.347 |
totality | -4.323 |
adelphia | -4.224 |
Token | Reserved |
Token ID | 33876 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
Adds | +5.185 |
Breach | +4.783 |
letters | +4.309 |
Created | +3.703 |
Newsletter | +3.506 |
Neg logit contributions | |
intend | -10.651 |
percentile | -10.287 |
�� | -10.126 |
totality | -10.010 |
Compton | -9.966 |
Token | . |
Token ID | 13 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
Adds | +1.986 |
Breach | +1.762 |
letters | +1.608 |
oa | +1.592 |
Newsletter | +1.585 |
Neg logit contributions | |
intend | -2.061 |
percentile | -2.021 |
Compton | -2.014 |
totality | -1.974 |
adelphia | -1.882 |
Token | This |
Token ID | 770 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
Adds | +2.857 |
Breach | +2.565 |
letters | +2.242 |
oa | +2.194 |
Newsletter | +2.187 |
Neg logit contributions | |
intend | -3.647 |
percentile | -3.525 |
Compton | -3.477 |
totality | -3.471 |
adelphia | -3.312 |
Token | material |
Token ID | 2587 |
Feature activation | +4.69e+00 |
Pos logit contributions | |
intend | +0.245 |
Compton | +0.239 |
percentile | +0.239 |
totality | +0.231 |
adelphia | +0.224 |
Neg logit contributions | |
Adds | -0.246 |
Breach | -0.220 |
oa | -0.200 |
letters | -0.199 |
Newsletter | -0.195 |
Token | may |
Token ID | 743 |
Feature activation | +7.05e+00 |
Pos logit contributions | |
Adds | +3.243 |
Breach | +2.911 |
oa | +2.628 |
letters | +2.526 |
arrivals | +2.488 |
Neg logit contributions | |
intend | -3.384 |
Compton | -3.310 |
percentile | -3.197 |
totality | -3.168 |
adelphia | -3.110 |
Token | Reserved |
Token ID | 33876 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
Adds | +5.217 |
Breach | +4.908 |
letters | +4.282 |
Newsletter | +3.889 |
IER | +3.811 |
Neg logit contributions | |
intend | -10.047 |
percentile | -9.796 |
Compton | -9.483 |
adelphia | -9.404 |
totality | -9.392 |
Token | . |
Token ID | 13 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
Adds | +2.812 |
Breach | +2.485 |
letters | +2.268 |
oa | +2.265 |
Newsletter | +2.251 |
Neg logit contributions | |
intend | -2.760 |
percentile | -2.716 |
Compton | -2.714 |
totality | -2.612 |
adelphia | -2.526 |
Token | Prot |
Token ID | 5038 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
Adds | +1.936 |
Breach | +1.737 |
oa | +1.589 |
letters | +1.584 |
Newsletter | +1.571 |
Neg logit contributions | |
intend | -1.616 |
percentile | -1.582 |
Compton | -1.574 |
totality | -1.522 |
adelphia | -1.461 |
Token | ected |
Token ID | 11197 |
Feature activation | +7.01e+00 |
Pos logit contributions | |
Adds | +1.893 |
Breach | +1.674 |
oa | +1.551 |
letters | +1.540 |
̶ | +1.504 |
Neg logit contributions | |
intend | -1.852 |
Compton | -1.837 |
percentile | -1.835 |
totality | -1.788 |
adelphia | -1.709 |
Token | by |
Token ID | 416 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
Adds | +4.845 |
Breach | +4.450 |
letters | +4.021 |
oa | +3.975 |
Newsletter | +3.921 |
Neg logit contributions | |
intend | -4.909 |
Compton | -4.723 |
percentile | -4.680 |
totality | -4.519 |
adelphia | -4.507 |
Token | copyright |
Token ID | 6634 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
Adds | +1.479 |
Breach | +1.306 |
oa | +1.170 |
letters | +1.167 |
Newsletter | +1.144 |
Neg logit contributions | |
intend | -1.798 |
Compton | -1.759 |
percentile | -1.758 |
totality | -1.700 |
adelphia | -1.655 |
Token | of |
Token ID | 286 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
Adds | +6.985 |
Breach | +6.387 |
oa | +5.834 |
letters | +5.737 |
Newsletter | +5.634 |
Neg logit contributions | |
intend | -8.432 |
Compton | -8.164 |
percentile | -8.147 |
adelphia | -7.876 |
weak | -7.791 |
Token | the |
Token ID | 262 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
Adds | +1.370 |
Breach | +1.217 |
oa | +1.110 |
letters | +1.105 |
Newsletter | +1.091 |
Neg logit contributions | |
intend | -1.338 |
percentile | -1.310 |
Compton | -1.307 |
totality | -1.258 |
adelphia | -1.217 |
Token | United |
Token ID | 1578 |
Feature activation | +3.47e+00 |
Pos logit contributions | |
Adds | +3.575 |
Breach | +3.218 |
letters | +2.916 |
oa | +2.903 |
Newsletter | +2.893 |
Neg logit contributions | |
intend | -3.297 |
percentile | -3.201 |
Compton | -3.177 |
totality | -3.052 |
adelphia | -3.009 |
Token | States |
Token ID | 1829 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
Adds | +1.924 |
Breach | +1.662 |
letters | +1.443 |
oa | +1.429 |
̶ | +1.385 |
Neg logit contributions | |
intend | -3.023 |
percentile | -2.903 |
Compton | -2.900 |
totality | -2.873 |
adelphia | -2.777 |
Token | and |
Token ID | 290 |
Feature activation | +7.72e+00 |
Pos logit contributions | |
Adds | +0.985 |
Breach | +0.867 |
oa | +0.790 |
letters | +0.786 |
Newsletter | +0.774 |
Neg logit contributions | |
intend | -1.037 |
Compton | -1.023 |
percentile | -1.021 |
totality | -0.983 |
adelphia | -0.951 |
Token | B |
Token ID | 347 |
Feature activation | +7.03e-01 |
Pos logit contributions | |
Adds | +0.190 |
Breach | +0.169 |
oa | +0.157 |
letters | +0.156 |
IER | +0.155 |
Neg logit contributions | |
intend | -0.152 |
Compton | -0.151 |
percentile | -0.149 |
totality | -0.143 |
adelphia | -0.137 |
Token | . |
Token ID | 13 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
Adds | +0.535 |
Breach | +0.475 |
letters | +0.437 |
oa | +0.435 |
IER | +0.430 |
Neg logit contributions | |
intend | -0.464 |
Compton | -0.457 |
percentile | -0.454 |
totality | -0.434 |
adelphia | -0.416 |
Token | V |
Token ID | 53 |
Feature activation | +1.33e+00 |
Pos logit contributions | |
Adds | +2.102 |
Breach | +1.793 |
oa | +1.614 |
̶ | +1.590 |
letters | +1.530 |
Neg logit contributions | |
percentile | -2.687 |
intend | -2.650 |
Compton | -2.611 |
totality | -2.602 |
adelphia | -2.551 |
Token | . |
Token ID | 13 |
Feature activation | +4.18e+00 |
Pos logit contributions | |
Adds | +1.020 |
Breach | +0.908 |
oa | +0.838 |
letters | +0.834 |
̶ | +0.824 |
Neg logit contributions | |
intend | -0.869 |
Compton | -0.857 |
percentile | -0.855 |
totality | -0.820 |
adelphia | -0.788 |
Token | All |
Token ID | 1439 |
Feature activation | +5.17e+00 |
Pos logit contributions | |
Adds | +3.145 |
Breach | +2.863 |
oa | +2.628 |
letters | +2.549 |
̶ | +2.526 |
Neg logit contributions | |
intend | -2.766 |
percentile | -2.695 |
Compton | -2.654 |
totality | -2.618 |
adelphia | -2.530 |
Token | rights |
Token ID | 2489 |
Feature activation | +1.17e+01 |
Pos logit contributions | |
Adds | +3.363 |
Breach | +3.005 |
oa | +2.744 |
letters | +2.737 |
Newsletter | +2.678 |
Neg logit contributions | |
intend | -3.878 |
Compton | -3.827 |
percentile | -3.820 |
totality | -3.708 |
adelphia | -3.642 |
Token | reserved |
Token ID | 10395 |
Feature activation | +3.80e+00 |
Pos logit contributions | |
Adds | +2.543 |
Breach | +1.848 |
letters | +1.315 |
oa | +1.074 |
arrivals | +1.071 |
Neg logit contributions | |
intend | -13.021 |
adelphia | -12.410 |
percentile | -12.361 |
Compton | -12.348 |
totality | -12.087 |
Token | . |
Token ID | 13 |
Feature activation | +3.41e+00 |
Pos logit contributions | |
Adds | +2.657 |
Breach | +2.338 |
oa | +2.126 |
letters | +2.120 |
Newsletter | +2.102 |
Neg logit contributions | |
intend | -2.740 |
percentile | -2.681 |
Compton | -2.666 |
totality | -2.609 |
adelphia | -2.522 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
Adds | +2.639 |
Breach | +2.387 |
oa | +2.160 |
letters | +2.154 |
Newsletter | +2.137 |
Neg logit contributions | |
intend | -2.220 |
percentile | -2.135 |
Compton | -2.113 |
totality | -2.100 |
adelphia | -2.032 |
Token | On |
Token ID | 2202 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
intend | +1.366 |
Compton | +1.331 |
percentile | +1.314 |
totality | +1.246 |
adelphia | +1.233 |
Neg logit contributions | |
Adds | -1.511 |
Breach | -1.396 |
oa | -1.252 |
letters | -1.243 |
̶ | -1.239 |
Token | the |
Token ID | 262 |
Feature activation | -2.63e+00 |
Pos logit contributions | |
intend | +0.681 |
Compton | +0.679 |
percentile | +0.675 |
totality | +0.652 |
adelphia | +0.619 |
Neg logit contributions | |
Adds | -0.731 |
Breach | -0.642 |
oa | -0.593 |
letters | -0.592 |
̶ | -0.588 |
Token | the |
Token ID | 262 |
Feature activation | -6.07e-01 |
Pos logit contributions | |
Compton | +0.760 |
intend | +0.758 |
percentile | +0.755 |
totality | +0.729 |
adelphia | +0.693 |
Neg logit contributions | |
Adds | -0.758 |
Breach | -0.662 |
oa | -0.611 |
letters | -0.609 |
̶ | -0.607 |
Token | Syrian |
Token ID | 6318 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Compton | +0.441 |
intend | +0.441 |
percentile | +0.438 |
totality | +0.425 |
adelphia | +0.405 |
Neg logit contributions | |
Adds | -0.416 |
Breach | -0.363 |
oa | -0.334 |
letters | -0.333 |
̶ | -0.331 |
Token | Observatory |
Token ID | 25758 |
Feature activation | +5.24e+00 |
Pos logit contributions | |
Adds | +0.876 |
Breach | +0.741 |
oa | +0.654 |
letters | +0.648 |
Newsletter | +0.636 |
Neg logit contributions | |
intend | -1.411 |
Compton | -1.397 |
percentile | -1.392 |
totality | -1.349 |
adelphia | -1.311 |
Token | for |
Token ID | 329 |
Feature activation | +6.91e+00 |
Pos logit contributions | |
Adds | +3.150 |
Breach | +2.661 |
̶ | +2.371 |
oa | +2.367 |
Newsletter | +2.365 |
Neg logit contributions | |
intend | -4.250 |
Compton | -4.214 |
percentile | -4.175 |
totality | -4.072 |
adelphia | -3.945 |
Token | Human |
Token ID | 5524 |
Feature activation | +9.57e+00 |
Pos logit contributions | |
Adds | +3.707 |
Breach | +3.359 |
Newsletter | +2.847 |
arrivals | +2.782 |
letters | +2.743 |
Neg logit contributions | |
intend | -6.102 |
Compton | -5.830 |
percentile | -5.822 |
totality | -5.674 |
adelphia | -5.613 |
Token | Rights |
Token ID | 6923 |
Feature activation | +1.16e+01 |
Pos logit contributions | |
Adds | +4.526 |
Breach | +4.145 |
oa | +3.317 |
arrivals | +3.283 |
Newsletter | +3.282 |
Neg logit contributions | |
intend | -8.634 |
Compton | -8.528 |
percentile | -8.398 |
totality | -8.375 |
adelphia | -8.169 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
Adds | +7.335 |
Breach | +6.408 |
Newsletter | +5.846 |
oa | +5.747 |
arrivals | +5.720 |
Neg logit contributions | |
intend | -8.322 |
Compton | -8.260 |
percentile | -8.242 |
totality | -7.874 |
adelphia | -7.791 |
Token |
|
Token ID | 198 |
Feature activation | +4.47e-01 |
Pos logit contributions | |
intend | +0.094 |
Compton | +0.093 |
percentile | +0.092 |
totality | +0.088 |
adelphia | +0.084 |
Neg logit contributions | |
Adds | -0.122 |
Breach | -0.109 |
oa | -0.101 |
letters | -0.101 |
artisan | -0.100 |
Token |
|
Token ID | 198 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
Adds | +0.359 |
Breach | +0.319 |
oa | +0.296 |
letters | +0.295 |
Newsletter | +0.292 |
Neg logit contributions | |
intend | -0.278 |
Compton | -0.273 |
percentile | -0.273 |
totality | -0.264 |
adelphia | -0.251 |
Token | � |
Token ID | 447 |
Feature activation | -9.39e-01 |
Pos logit contributions | |
intend | +1.042 |
Compton | +1.011 |
percentile | +1.002 |
totality | +0.952 |
adelphia | +0.947 |
Neg logit contributions | |
Adds | -1.172 |
Breach | -1.090 |
oa | -0.979 |
letters | -0.971 |
̶ | -0.966 |
Token | � |
Token ID | 250 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
intend | +0.542 |
percentile | +0.533 |
Compton | +0.532 |
totality | +0.506 |
adelphia | +0.485 |
Neg logit contributions | |
Adds | -0.787 |
Breach | -0.710 |
oa | -0.661 |
letters | -0.657 |
̶ | -0.652 |
Token | Creative |
Token ID | 17404 |
Feature activation | +3.01e+00 |
Pos logit contributions | |
Adds | +0.779 |
Breach | +0.630 |
oa | +0.527 |
letters | +0.519 |
̶ | +0.505 |
Neg logit contributions | |
intend | -1.894 |
Compton | -1.872 |
percentile | -1.870 |
totality | -1.819 |
adelphia | -1.780 |
Token | Commons |
Token ID | 13815 |
Feature activation | +6.43e+00 |
Pos logit contributions | |
Adds | +2.051 |
Breach | +1.844 |
oa | +1.660 |
letters | +1.651 |
Newsletter | +1.633 |
Neg logit contributions | |
intend | -2.206 |
percentile | -2.153 |
Compton | -2.153 |
totality | -2.065 |
adelphia | -2.007 |
Token | Attribution |
Token ID | 45336 |
Feature activation | +7.82e+00 |
Pos logit contributions | |
Adds | +3.867 |
Breach | +3.480 |
oa | +3.098 |
IER | +2.998 |
artisan | +2.991 |
Neg logit contributions | |
intend | -5.154 |
percentile | -4.985 |
Compton | -4.962 |
adelphia | -4.797 |
totality | -4.759 |
Token | - |
Token ID | 12 |
Feature activation | +6.96e+00 |
Pos logit contributions | |
Adds | +5.439 |
Breach | +4.837 |
oa | +4.484 |
IER | +4.353 |
Newsletter | +4.352 |
Neg logit contributions | |
intend | -5.465 |
Compton | -5.362 |
percentile | -5.311 |
adelphia | -5.050 |
totality | -5.022 |
Token | Non |
Token ID | 15419 |
Feature activation | +7.97e+00 |
Pos logit contributions | |
Adds | +4.610 |
Breach | +3.969 |
oa | +3.729 |
Newsletter | +3.686 |
IER | +3.684 |
Neg logit contributions | |
Compton | -5.103 |
percentile | -5.085 |
intend | -5.064 |
totality | -4.857 |
adelphia | -4.784 |
Token | Commercial |
Token ID | 48401 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
Adds | +5.230 |
Breach | +4.664 |
oa | +4.332 |
̶ | +4.280 |
letters | +4.276 |
Neg logit contributions | |
percentile | -5.752 |
Compton | -5.666 |
intend | -5.626 |
totality | -5.548 |
adelphia | -5.293 |
Token | 3 |
Token ID | 513 |
Feature activation | +6.15e+00 |
Pos logit contributions | |
Adds | +6.966 |
Breach | +6.329 |
oa | +5.776 |
IER | +5.596 |
̶ | +5.521 |
Neg logit contributions | |
intend | -8.666 |
Compton | -8.178 |
percentile | -8.073 |
totality | -7.902 |
adelphia | -7.871 |
Token | . |
Token ID | 13 |
Feature activation | +1.08e+01 |
Pos logit contributions | |
Adds | +4.027 |
Breach | +3.596 |
̶ | +3.236 |
oa | +3.210 |
Newsletter | +3.193 |
Neg logit contributions | |
intend | -4.696 |
Compton | -4.543 |
percentile | -4.471 |
totality | -4.388 |
adelphia | -4.273 |
Token | 0 |
Token ID | 15 |
Feature activation | +8.86e+00 |
Pos logit contributions | |
Adds | +6.154 |
Breach | +5.576 |
oa | +4.961 |
̶ | +4.833 |
letters | +4.638 |
Neg logit contributions | |
intend | -8.934 |
totality | -8.398 |
Compton | -8.369 |
percentile | -8.321 |
adelphia | -8.085 |
Token | Un |
Token ID | 791 |
Feature activation | +6.59e+00 |
Pos logit contributions | |
Adds | +4.860 |
Breach | +4.446 |
oa | +3.878 |
̶ | +3.726 |
ン | +3.622 |
Neg logit contributions | |
intend | -7.623 |
Compton | -7.173 |
percentile | -7.022 |
adelphia | -6.782 |
totality | -6.761 |
Token | ported |
Token ID | 9213 |
Feature activation | +5.66e+00 |
Pos logit contributions | |
Adds | +2.787 |
Breach | +2.330 |
oa | +2.211 |
̶ | +2.009 |
letters | +1.977 |
Neg logit contributions | |
intend | -6.426 |
Compton | -6.397 |
percentile | -6.367 |
totality | -6.272 |
adelphia | -5.911 |
Token | poorly |
Token ID | 13455 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
Adds | +0.646 |
Breach | +0.572 |
oa | +0.525 |
letters | +0.525 |
Newsletter | +0.516 |
Neg logit contributions | |
intend | -0.587 |
Compton | -0.579 |
percentile | -0.578 |
totality | -0.555 |
adelphia | -0.532 |
Token | . |
Token ID | 13 |
Feature activation | +7.95e-01 |
Pos logit contributions | |
Adds | +1.036 |
Breach | +0.919 |
oa | +0.845 |
letters | +0.842 |
̶ | +0.830 |
Neg logit contributions | |
intend | -0.934 |
Compton | -0.922 |
percentile | -0.920 |
totality | -0.883 |
adelphia | -0.849 |
Token |
|
Token ID | 198 |
Feature activation | +1.76e-01 |
Pos logit contributions | |
Adds | +0.658 |
Breach | +0.590 |
oa | +0.548 |
letters | +0.547 |
artisan | +0.541 |
Neg logit contributions | |
intend | -0.469 |
Compton | -0.464 |
percentile | -0.461 |
totality | -0.438 |
adelphia | -0.419 |
Token |
|
Token ID | 198 |
Feature activation | +5.24e-01 |
Pos logit contributions | |
Adds | +0.142 |
Breach | +0.126 |
oa | +0.117 |
letters | +0.117 |
̶ | +0.115 |
Neg logit contributions | |
intend | -0.109 |
Compton | -0.107 |
percentile | -0.107 |
totality | -0.104 |
adelphia | -0.099 |
Token | " |
Token ID | 1 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Adds | +0.312 |
Breach | +0.271 |
oa | +0.240 |
letters | +0.239 |
artisan | +0.236 |
Neg logit contributions | |
intend | -0.430 |
Compton | -0.423 |
percentile | -0.422 |
totality | -0.406 |
adelphia | -0.396 |
Token | Ste |
Token ID | 7447 |
Feature activation | +1.15e+01 |
Pos logit contributions | |
Adds | +1.262 |
Breach | +1.123 |
oa | +1.035 |
letters | +1.031 |
̶ | +1.018 |
Neg logit contributions | |
intend | -1.081 |
Compton | -1.067 |
percentile | -1.064 |
totality | -1.021 |
adelphia | -0.980 |
Token | lla |
Token ID | 8466 |
Feature activation | +5.27e+00 |
Pos logit contributions | |
Adds | +2.543 |
oa | +1.885 |
letters | +1.688 |
ales | +1.505 |
ese | +1.450 |
Neg logit contributions | |
totality | -12.691 |
intend | -12.408 |
Compton | -12.284 |
percentile | -12.259 |
Sunder | -11.954 |
Token | , |
Token ID | 11 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Adds | +3.695 |
Breach | +3.288 |
oa | +3.063 |
letters | +2.974 |
̶ | +2.963 |
Neg logit contributions | |
intend | -3.675 |
Compton | -3.629 |
percentile | -3.627 |
totality | -3.502 |
adelphia | -3.385 |
Token | you |
Token ID | 345 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
Adds | +1.151 |
Breach | +1.019 |
oa | +0.934 |
letters | +0.927 |
̶ | +0.916 |
Neg logit contributions | |
intend | -1.124 |
Compton | -1.110 |
percentile | -1.106 |
totality | -1.064 |
adelphia | -1.028 |
Token | should |
Token ID | 815 |
Feature activation | -2.90e+00 |
Pos logit contributions | |
Adds | +0.966 |
Breach | +0.862 |
oa | +0.790 |
letters | +0.775 |
̶ | +0.768 |
Neg logit contributions | |
intend | -1.012 |
Compton | -1.004 |
percentile | -0.995 |
totality | -0.965 |
adelphia | -0.936 |
Token | und |
Token ID | 3318 |
Feature activation | -2.12e-01 |
Pos logit contributions | |
intend | +1.932 |
percentile | +1.908 |
Compton | +1.884 |
totality | +1.808 |
lé | +1.723 |
Neg logit contributions | |
Adds | -2.197 |
Breach | -1.931 |
letters | -1.797 |
artisan | -1.772 |
oa | -1.771 |
Token | Money |
Token ID | 12911 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
Adds | +2.790 |
Breach | +2.538 |
oa | +2.232 |
letters | +2.213 |
Newsletter | +2.177 |
Neg logit contributions | |
intend | -3.096 |
percentile | -3.000 |
Compton | -2.990 |
totality | -2.888 |
adelphia | -2.857 |
Token | Map |
Token ID | 9347 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
intend | +0.912 |
percentile | +0.896 |
Compton | +0.891 |
totality | +0.847 |
adelphia | +0.810 |
Neg logit contributions | |
Adds | -1.419 |
Breach | -1.271 |
oa | -1.196 |
̶ | -1.184 |
letters | -1.182 |
Token | Press |
Token ID | 4332 |
Feature activation | +4.31e+00 |
Pos logit contributions | |
intend | +0.273 |
Compton | +0.269 |
percentile | +0.268 |
totality | +0.258 |
adelphia | +0.248 |
Neg logit contributions | |
Adds | -0.297 |
Breach | -0.263 |
oa | -0.242 |
letters | -0.241 |
̶ | -0.239 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e+00 |
Pos logit contributions | |
Adds | +3.090 |
Breach | +2.751 |
letters | +2.560 |
oa | +2.505 |
Newsletter | +2.474 |
Neg logit contributions | |
intend | -2.947 |
percentile | -2.929 |
Compton | -2.915 |
totality | -2.810 |
adelphia | -2.711 |
Token | All |
Token ID | 1439 |
Feature activation | +5.26e+00 |
Pos logit contributions | |
Adds | +1.417 |
Breach | +1.270 |
oa | +1.168 |
letters | +1.164 |
Newsletter | +1.151 |
Neg logit contributions | |
intend | -1.153 |
percentile | -1.134 |
Compton | -1.132 |
totality | -1.087 |
adelphia | -1.044 |
Token | Rights |
Token ID | 6923 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
Adds | +3.304 |
Breach | +2.980 |
letters | +2.693 |
oa | +2.676 |
Newsletter | +2.615 |
Neg logit contributions | |
intend | -4.024 |
Compton | -3.953 |
percentile | -3.947 |
totality | -3.825 |
adelphia | -3.750 |
Token | Reserved |
Token ID | 33876 |
Feature activation | +3.95e+00 |
Pos logit contributions | |
Adds | +5.217 |
Breach | +4.908 |
letters | +4.282 |
Newsletter | +3.889 |
IER | +3.811 |
Neg logit contributions | |
intend | -10.047 |
percentile | -9.796 |
Compton | -9.483 |
adelphia | -9.404 |
totality | -9.392 |
Token | . |
Token ID | 13 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
Adds | +2.812 |
Breach | +2.485 |
letters | +2.268 |
oa | +2.265 |
Newsletter | +2.251 |
Neg logit contributions | |
intend | -2.760 |
percentile | -2.716 |
Compton | -2.714 |
totality | -2.612 |
adelphia | -2.526 |
Token | Prot |
Token ID | 5038 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
Adds | +1.936 |
Breach | +1.737 |
oa | +1.589 |
letters | +1.584 |
Newsletter | +1.571 |
Neg logit contributions | |
intend | -1.616 |
percentile | -1.582 |
Compton | -1.574 |
totality | -1.522 |
adelphia | -1.461 |
Token | ected |
Token ID | 11197 |
Feature activation | +7.01e+00 |
Pos logit contributions | |
Adds | +1.893 |
Breach | +1.674 |
oa | +1.551 |
letters | +1.540 |
̶ | +1.504 |
Neg logit contributions | |
intend | -1.852 |
Compton | -1.837 |
percentile | -1.835 |
totality | -1.788 |
adelphia | -1.709 |
Token | by |
Token ID | 416 |
Feature activation | +2.31e+00 |
Pos logit contributions | |
Adds | +4.845 |
Breach | +4.450 |
letters | +4.021 |
oa | +3.975 |
Newsletter | +3.921 |
Neg logit contributions | |
intend | -4.909 |
Compton | -4.723 |
percentile | -4.680 |
totality | -4.519 |
adelphia | -4.507 |
Token | ermott |
Token ID | 46187 |
Feature activation | -9.21e-01 |
Pos logit contributions | |
intend | +1.422 |
Compton | +1.386 |
percentile | +1.379 |
totality | +1.309 |
adelphia | +1.292 |
Neg logit contributions | |
Adds | -1.668 |
Breach | -1.463 |
letters | -1.346 |
Newsletter | -1.345 |
IER | -1.340 |
Token | , |
Token ID | 11 |
Feature activation | -1.22e+00 |
Pos logit contributions | |
intend | +0.611 |
Compton | +0.607 |
percentile | +0.600 |
totality | +0.576 |
adelphia | +0.550 |
Neg logit contributions | |
Adds | -0.699 |
Breach | -0.613 |
letters | -0.568 |
artisan | -0.565 |
oa | -0.563 |
Token | their |
Token ID | 511 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
intend | +0.803 |
Compton | +0.803 |
percentile | +0.798 |
totality | +0.766 |
adelphia | +0.727 |
Neg logit contributions | |
Adds | -0.931 |
Breach | -0.821 |
letters | -0.760 |
oa | -0.756 |
artisan | -0.755 |
Token | kids |
Token ID | 3988 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
Compton | +1.181 |
intend | +1.176 |
percentile | +1.174 |
totality | +1.129 |
adelphia | +1.064 |
Neg logit contributions | |
Adds | -1.499 |
Breach | -1.325 |
letters | -1.236 |
oa | -1.230 |
̶ | -1.228 |
Token | , |
Token ID | 11 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
Adds | +0.351 |
Breach | +0.309 |
letters | +0.285 |
oa | +0.284 |
artisan | +0.281 |
Neg logit contributions | |
intend | -0.318 |
Compton | -0.315 |
percentile | -0.313 |
totality | -0.300 |
adelphia | -0.288 |
Token | Liam |
Token ID | 31684 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
intend | +1.041 |
Compton | +1.039 |
percentile | +1.028 |
totality | +0.986 |
adelphia | +0.935 |
Neg logit contributions | |
Adds | -1.184 |
Breach | -1.037 |
letters | -0.963 |
oa | -0.959 |
artisan | -0.954 |
Token | , |
Token ID | 11 |
Feature activation | +9.56e-01 |
Pos logit contributions | |
Adds | +7.076 |
Breach | +6.629 |
oa | +6.157 |
letters | +5.741 |
̶ | +5.644 |
Neg logit contributions | |
intend | -7.866 |
percentile | -7.810 |
totality | -7.551 |
Compton | -7.281 |
adelphia | -7.168 |
Token | Stella |
Token ID | 45856 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
Adds | +0.683 |
Breach | +0.602 |
oa | +0.552 |
letters | +0.550 |
̶ | +0.542 |
Neg logit contributions | |
intend | -0.672 |
Compton | -0.665 |
percentile | -0.663 |
totality | -0.637 |
adelphia | -0.614 |
Token | , |
Token ID | 11 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Adds | +0.161 |
Breach | +0.142 |
letters | +0.131 |
oa | +0.131 |
artisan | +0.130 |
Neg logit contributions | |
intend | -0.140 |
Compton | -0.140 |
percentile | -0.138 |
totality | -0.132 |
adelphia | -0.128 |
Token | Hatt |
Token ID | 48509 |
Feature activation | -4.84e+00 |
Pos logit contributions | |
intend | +0.339 |
Compton | +0.338 |
percentile | +0.334 |
totality | +0.320 |
adelphia | +0.308 |
Neg logit contributions | |
Adds | -0.363 |
Breach | -0.318 |
letters | -0.294 |
oa | -0.293 |
artisan | -0.290 |
Token | ie |
Token ID | 494 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Compton | +3.212 |
intend | +3.189 |
percentile | +3.110 |
totality | +2.986 |
adelphia | +2.942 |
Neg logit contributions | |
Adds | -3.615 |
Breach | -3.122 |
Newsletter | -2.910 |
̶ | -2.898 |
IER | -2.874 |
Token | the |
Token ID | 262 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
percentile | +0.740 |
intend | +0.737 |
Compton | +0.736 |
totality | +0.713 |
adelphia | +0.669 |
Neg logit contributions | |
Adds | -0.791 |
Breach | -0.698 |
letters | -0.644 |
oa | -0.643 |
artisan | -0.636 |
Token | right |
Token ID | 826 |
Feature activation | -3.43e+00 |
Pos logit contributions | |
percentile | +0.867 |
Compton | +0.865 |
intend | +0.862 |
totality | +0.836 |
adelphia | +0.772 |
Neg logit contributions | |
Adds | -1.293 |
Breach | -1.158 |
letters | -1.084 |
oa | -1.083 |
artisan | -1.075 |
Token | path |
Token ID | 3108 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
percentile | +2.248 |
Compton | +2.227 |
intend | +2.219 |
totality | +2.174 |
indication | +2.054 |
Neg logit contributions | |
Adds | -2.582 |
Breach | -2.294 |
letters | -2.140 |
artisan | -2.118 |
oa | -2.111 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e+00 |
Pos logit contributions | |
intend | +2.338 |
Compton | +2.327 |
percentile | +2.325 |
totality | +2.246 |
indication | +2.085 |
Neg logit contributions | |
Adds | -2.772 |
Breach | -2.483 |
letters | -2.283 |
artisan | -2.256 |
Newsletter | -2.239 |
Token | and |
Token ID | 290 |
Feature activation | +6.84e-01 |
Pos logit contributions | |
Adds | +1.738 |
Breach | +1.540 |
oa | +1.407 |
letters | +1.402 |
̶ | +1.391 |
Neg logit contributions | |
intend | -1.644 |
Compton | -1.619 |
percentile | -1.611 |
totality | -1.548 |
adelphia | -1.505 |
Token | Will |
Token ID | 2561 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
Adds | +0.494 |
Breach | +0.435 |
oa | +0.399 |
letters | +0.398 |
IER | +0.393 |
Neg logit contributions | |
intend | -0.477 |
Compton | -0.471 |
percentile | -0.470 |
totality | -0.452 |
adelphia | -0.434 |
Token | proves |
Token ID | 17021 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
Adds | +7.515 |
Breach | +6.631 |
oa | +6.228 |
letters | +6.117 |
̶ | +6.026 |
Neg logit contributions | |
intend | -7.756 |
percentile | -7.486 |
totality | -7.291 |
Compton | -7.149 |
adelphia | -7.115 |
Token | that |
Token ID | 326 |
Feature activation | +2.68e+00 |
Pos logit contributions | |
Adds | +0.389 |
Breach | +0.345 |
oa | +0.319 |
letters | +0.317 |
Newsletter | +0.315 |
Neg logit contributions | |
intend | -0.335 |
Compton | -0.334 |
percentile | -0.334 |
totality | -0.318 |
adelphia | -0.303 |
Token | anyone |
Token ID | 2687 |
Feature activation | +4.46e+00 |
Pos logit contributions | |
Adds | +1.970 |
Breach | +1.748 |
oa | +1.603 |
letters | +1.595 |
̶ | +1.576 |
Neg logit contributions | |
intend | -1.825 |
Compton | -1.798 |
percentile | -1.788 |
totality | -1.722 |
adelphia | -1.667 |
Token | can |
Token ID | 460 |
Feature activation | +4.20e+00 |
Pos logit contributions | |
Adds | +3.065 |
Breach | +2.726 |
oa | +2.504 |
letters | +2.448 |
̶ | +2.444 |
Neg logit contributions | |
intend | -3.203 |
Compton | -3.140 |
percentile | -3.124 |
totality | -3.036 |
adelphia | -2.959 |
Token | become |
Token ID | 1716 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
Adds | +2.928 |
Breach | +2.611 |
oa | +2.387 |
̶ | +2.341 |
letters | +2.338 |
Neg logit contributions | |
intend | -2.948 |
Compton | -2.948 |
percentile | -2.869 |
totality | -2.826 |
adelphia | -2.737 |
Token | Limited |
Token ID | 15302 |
Feature activation | +9.13e+00 |
Pos logit contributions | |
Adds | +3.152 |
Breach | +2.912 |
letters | +2.693 |
oa | +2.652 |
̶ | +2.611 |
Neg logit contributions | |
intend | -2.731 |
percentile | -2.641 |
Compton | -2.632 |
totality | -2.601 |
adelphia | -2.546 |
Token | , |
Token ID | 11 |
Feature activation | +4.38e+00 |
Pos logit contributions | |
Adds | +5.450 |
Breach | +4.997 |
letters | +4.552 |
oa | +4.493 |
Newsletter | +4.491 |
Neg logit contributions | |
intend | -6.776 |
Compton | -6.699 |
percentile | -6.641 |
totality | -6.486 |
adelphia | -6.307 |
Token | London |
Token ID | 3576 |
Feature activation | +7.33e+00 |
Pos logit contributions | |
Adds | +3.072 |
Breach | +2.733 |
oa | +2.495 |
̶ | +2.449 |
letters | +2.439 |
Neg logit contributions | |
intend | -3.104 |
Compton | -3.065 |
percentile | -3.048 |
totality | -2.967 |
adelphia | -2.880 |
Token | . |
Token ID | 13 |
Feature activation | +4.52e+00 |
Pos logit contributions | |
Adds | +4.891 |
Breach | +4.294 |
letters | +4.011 |
oa | +3.980 |
Newsletter | +3.928 |
Neg logit contributions | |
intend | -5.316 |
percentile | -5.221 |
Compton | -5.185 |
totality | -5.127 |
adelphia | -4.903 |
Token | All |
Token ID | 1439 |
Feature activation | +5.62e+00 |
Pos logit contributions | |
Adds | +3.569 |
Breach | +3.198 |
oa | +2.951 |
letters | +2.947 |
Newsletter | +2.901 |
Neg logit contributions | |
intend | -2.839 |
percentile | -2.782 |
Compton | -2.778 |
totality | -2.697 |
adelphia | -2.582 |
Token | Rights |
Token ID | 6923 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
Adds | +3.500 |
Breach | +3.170 |
letters | +2.944 |
oa | +2.857 |
Newsletter | +2.819 |
Neg logit contributions | |
intend | -4.254 |
percentile | -4.235 |
Compton | -4.196 |
totality | -4.160 |
adelphia | -4.057 |
Token | Reserved |
Token ID | 33876 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
Adds | +4.948 |
Breach | +4.640 |
letters | +4.170 |
Newsletter | +3.633 |
oa | +3.458 |
Neg logit contributions | |
intend | -10.001 |
percentile | -9.680 |
adelphia | -9.459 |
�� | -9.329 |
Compton | -9.323 |
Token | . |
Token ID | 13 |
Feature activation | +3.04e+00 |
Pos logit contributions | |
Adds | +2.584 |
Breach | +2.293 |
oa | +2.102 |
letters | +2.101 |
Newsletter | +2.077 |
Neg logit contributions | |
intend | -2.395 |
percentile | -2.353 |
Compton | -2.350 |
totality | -2.266 |
adelphia | -2.178 |
Token | Rep |
Token ID | 1432 |
Feature activation | +9.79e-01 |
Pos logit contributions | |
Adds | +2.304 |
Breach | +2.075 |
letters | +1.896 |
oa | +1.887 |
Newsletter | +1.870 |
Neg logit contributions | |
intend | -2.002 |
percentile | -1.951 |
Compton | -1.949 |
totality | -1.903 |
adelphia | -1.820 |
Token | rint |
Token ID | 22272 |
Feature activation | +3.68e+00 |
Pos logit contributions | |
Adds | +0.795 |
Breach | +0.712 |
oa | +0.659 |
letters | +0.656 |
IER | +0.650 |
Neg logit contributions | |
intend | -0.595 |
Compton | -0.586 |
percentile | -0.584 |
totality | -0.558 |
adelphia | -0.534 |
Token | ed |
Token ID | 276 |
Feature activation | +4.95e+00 |
Pos logit contributions | |
Adds | +2.450 |
Breach | +2.168 |
oa | +2.045 |
letters | +2.043 |
Newsletter | +1.993 |
Neg logit contributions | |
intend | -2.714 |
Compton | -2.644 |
percentile | -2.630 |
totality | -2.571 |
adelphia | -2.473 |
Token | , |
Token ID | 11 |
Feature activation | +2.82e+00 |
Pos logit contributions | |
Adds | +2.667 |
Breach | +2.375 |
oa | +2.159 |
letters | +2.135 |
̶ | +2.134 |
Neg logit contributions | |
intend | -2.792 |
Compton | -2.754 |
percentile | -2.750 |
totality | -2.641 |
adelphia | -2.575 |
Token | while |
Token ID | 981 |
Feature activation | -4.77e-01 |
Pos logit contributions | |
Adds | +2.101 |
Breach | +1.879 |
oa | +1.714 |
letters | +1.706 |
̶ | +1.687 |
Neg logit contributions | |
intend | -1.905 |
percentile | -1.855 |
Compton | -1.850 |
totality | -1.779 |
adelphia | -1.732 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Compton | +0.331 |
intend | +0.330 |
percentile | +0.328 |
totality | +0.317 |
adelphia | +0.302 |
Neg logit contributions | |
Adds | -0.345 |
Breach | -0.302 |
oa | -0.278 |
letters | -0.277 |
IER | -0.275 |
Token | US |
Token ID | 1294 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
Adds | +0.859 |
Breach | +0.756 |
oa | +0.689 |
letters | +0.686 |
̶ | +0.675 |
Neg logit contributions | |
intend | -0.900 |
Compton | -0.887 |
percentile | -0.886 |
totality | -0.851 |
adelphia | -0.823 |
Token | National |
Token ID | 2351 |
Feature activation | +2.20e+00 |
Pos logit contributions | |
Compton | +1.954 |
intend | +1.953 |
percentile | +1.949 |
totality | +1.875 |
disgr | +1.780 |
Neg logit contributions | |
Adds | -2.077 |
Breach | -1.824 |
letters | -1.693 |
IER | -1.672 |
oa | -1.668 |
Token | Security |
Token ID | 4765 |
Feature activation | +1.12e+01 |
Pos logit contributions | |
Adds | +0.917 |
Breach | +0.738 |
oa | +0.622 |
letters | +0.615 |
̶ | +0.595 |
Neg logit contributions | |
intend | -2.198 |
Compton | -2.179 |
percentile | -2.176 |
totality | -2.116 |
adelphia | -2.067 |
Token | Agency |
Token ID | 7732 |
Feature activation | +8.62e-01 |
Pos logit contributions | |
Adds | +6.598 |
Breach | +6.381 |
letters | +5.513 |
artisan | +5.362 |
IER | +5.354 |
Neg logit contributions | |
intend | -8.186 |
Compton | -7.996 |
percentile | -7.966 |
totality | -7.777 |
adelphia | -7.645 |
Token | ( |
Token ID | 357 |
Feature activation | +5.86e+00 |
Pos logit contributions | |
Adds | +0.649 |
Breach | +0.578 |
oa | +0.531 |
letters | +0.529 |
̶ | +0.522 |
Neg logit contributions | |
intend | -0.574 |
Compton | -0.565 |
percentile | -0.564 |
totality | -0.541 |
adelphia | -0.521 |
Token | NSA |
Token ID | 47549 |
Feature activation | -9.34e-02 |
Pos logit contributions | |
Adds | +2.772 |
Breach | +2.207 |
letters | +1.949 |
oa | +1.914 |
IER | +1.908 |
Neg logit contributions | |
intend | -5.538 |
percentile | -5.452 |
Compton | -5.420 |
totality | -5.297 |
adelphia | -5.207 |
Token | ) |
Token ID | 8 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
intend | +0.056 |
Compton | +0.055 |
percentile | +0.055 |
totality | +0.052 |
adelphia | +0.050 |
Neg logit contributions | |
Adds | -0.077 |
Breach | -0.069 |
oa | -0.064 |
letters | -0.064 |
Newsletter | -0.063 |
Token | wanted |
Token ID | 2227 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
Adds | +2.801 |
Breach | +2.528 |
oa | +2.311 |
letters | +2.290 |
̶ | +2.269 |
Neg logit contributions | |
intend | -2.514 |
Compton | -2.451 |
percentile | -2.448 |
totality | -2.342 |
adelphia | -2.291 |
Token | N |
Token ID | 399 |
Feature activation | -1.64e+00 |
Pos logit contributions | |
Adds | +0.111 |
Breach | +0.098 |
oa | +0.090 |
letters | +0.090 |
̶ | +0.089 |
Neg logit contributions | |
intend | -0.100 |
Compton | -0.099 |
percentile | -0.098 |
totality | -0.094 |
adelphia | -0.091 |
Token | f |
Token ID | 69 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
intend | +1.194 |
Compton | +1.146 |
percentile | +1.140 |
totality | +1.078 |
lé | +1.070 |
Neg logit contributions | |
Adds | -1.138 |
Breach | -1.016 |
IER | -0.901 |
letters | -0.895 |
̶ | -0.892 |
Token | 6 |
Token ID | 21 |
Feature activation | +8.33e-01 |
Pos logit contributions | |
intend | +0.993 |
Compton | +0.980 |
percentile | +0.977 |
totality | +0.932 |
adelphia | +0.901 |
Neg logit contributions | |
Adds | -1.059 |
Breach | -0.936 |
letters | -0.857 |
oa | -0.854 |
IER | -0.849 |
Token | { |
Token ID | 1391 |
Feature activation | +7.31e-01 |
Pos logit contributions | |
Adds | +0.628 |
Breach | +0.559 |
oa | +0.515 |
letters | +0.512 |
̶ | +0.505 |
Neg logit contributions | |
intend | -0.553 |
Compton | -0.545 |
percentile | -0.544 |
totality | -0.522 |
adelphia | -0.502 |
Token | ( |
Token ID | 7 |
Feature activation | +3.67e+00 |
Pos logit contributions | |
Adds | +0.665 |
Breach | +0.603 |
oa | +0.565 |
letters | +0.563 |
IER | +0.557 |
Neg logit contributions | |
intend | -0.372 |
Compton | -0.366 |
percentile | -0.365 |
totality | -0.345 |
adelphia | -0.328 |
Token | 0 |
Token ID | 15 |
Feature activation | +1.11e+01 |
Pos logit contributions | |
Adds | +2.547 |
Breach | +2.216 |
oa | +2.049 |
letters | +2.041 |
̶ | +2.016 |
Neg logit contributions | |
intend | -2.635 |
Compton | -2.605 |
percentile | -2.598 |
totality | -2.543 |
adelphia | -2.433 |
Token | s |
Token ID | 82 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
Adds | +5.751 |
Breach | +4.723 |
oa | +4.511 |
letters | +4.302 |
̶ | +4.050 |
Neg logit contributions | |
intend | -9.330 |
percentile | -9.304 |
Compton | -9.267 |
totality | -9.036 |
adelphia | -8.686 |
Token | )} |
Token ID | 38165 |
Feature activation | +2.08e+00 |
Pos logit contributions | |
Adds | +2.186 |
Breach | +1.859 |
oa | +1.684 |
letters | +1.654 |
IER | +1.586 |
Neg logit contributions | |
intend | -3.171 |
percentile | -3.135 |
Compton | -3.121 |
totality | -3.085 |
adelphia | -2.973 |
Token | 2 |
Token ID | 362 |
Feature activation | +3.06e+00 |
Pos logit contributions | |
Adds | +1.550 |
Breach | +1.384 |
oa | +1.274 |
letters | +1.263 |
IER | +1.246 |
Neg logit contributions | |
intend | -1.395 |
Compton | -1.364 |
percentile | -1.363 |
totality | -1.311 |
adelphia | -1.274 |
Token | . |
Token ID | 13 |
Feature activation | +4.70e+00 |
Pos logit contributions | |
Adds | +2.091 |
Breach | +1.808 |
oa | +1.684 |
letters | +1.676 |
Newsletter | +1.625 |
Neg logit contributions | |
intend | -2.255 |
percentile | -2.210 |
totality | -2.195 |
Compton | -2.195 |
adelphia | -2.080 |
Token | N |
Token ID | 399 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
Adds | +3.232 |
Breach | +2.890 |
oa | +2.645 |
letters | +2.587 |
Newsletter | +2.550 |
Neg logit contributions | |
intend | -3.411 |
Compton | -3.286 |
percentile | -3.278 |
totality | -3.174 |
adelphia | -3.118 |
Token | alo |
Token ID | 7335 |
Feature activation | -7.41e-01 |
Pos logit contributions | |
intend | +0.422 |
percentile | +0.407 |
Compton | +0.406 |
totality | +0.375 |
adelphia | +0.368 |
Neg logit contributions | |
Adds | -1.056 |
Breach | -0.963 |
IER | -0.907 |
letters | -0.907 |
̶ | -0.902 |
Token | Bills |
Token ID | 20209 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
intend | +0.563 |
Compton | +0.558 |
percentile | +0.557 |
totality | +0.536 |
adelphia | +0.521 |
Neg logit contributions | |
Adds | -0.484 |
Breach | -0.422 |
letters | -0.383 |
oa | -0.381 |
Newsletter | -0.378 |
Token | : |
Token ID | 25 |
Feature activation | +6.18e-01 |
Pos logit contributions | |
intend | +0.701 |
Compton | +0.696 |
percentile | +0.696 |
totality | +0.664 |
adelphia | +0.634 |
Neg logit contributions | |
Adds | -0.914 |
Breach | -0.816 |
letters | -0.756 |
oa | -0.755 |
artisan | -0.748 |
Token | G |
Token ID | 402 |
Feature activation | +3.40e+00 |
Pos logit contributions | |
Adds | +0.446 |
Breach | +0.394 |
oa | +0.361 |
letters | +0.360 |
IER | +0.355 |
Neg logit contributions | |
intend | -0.429 |
Compton | -0.425 |
percentile | -0.424 |
totality | -0.407 |
adelphia | -0.392 |
Token | Richie |
Token ID | 49209 |
Feature activation | -2.53e+00 |
Pos logit contributions | |
Adds | +2.518 |
Breach | +2.240 |
oa | +2.073 |
letters | +2.054 |
IER | +2.034 |
Neg logit contributions | |
intend | -2.286 |
percentile | -2.258 |
Compton | -2.252 |
totality | -2.172 |
adelphia | -2.082 |
Token | Inc |
Token ID | 3457 |
Feature activation | -1.33e+01 |
Pos logit contributions | |
intend | +1.402 |
Compton | +1.380 |
percentile | +1.363 |
totality | +1.274 |
adelphia | +1.260 |
Neg logit contributions | |
Adds | -2.206 |
Breach | -1.981 |
letters | -1.853 |
oa | -1.843 |
artisan | -1.840 |
Token | ogn |
Token ID | 2360 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
intend | +2.420 |
Compton | +2.076 |
percentile | +1.988 |
totality | +1.645 |
weak | +1.493 |
Neg logit contributions | |
Adds | -15.438 |
Breach | -14.778 |
artisan | -13.982 |
Newsletter | -13.724 |
arrivals | -13.714 |
Token | ito |
Token ID | 10094 |
Feature activation | -2.87e-01 |
Pos logit contributions | |
Adds | +0.166 |
Breach | +0.148 |
letters | +0.135 |
Newsletter | +0.135 |
̶ | +0.134 |
Neg logit contributions | |
intend | -0.142 |
percentile | -0.140 |
Compton | -0.139 |
totality | -0.131 |
adelphia | -0.128 |
Token |
|
Token ID | 198 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
intend | +0.190 |
Compton | +0.188 |
percentile | +0.188 |
totality | +0.180 |
adelphia | +0.173 |
Neg logit contributions | |
Adds | -0.217 |
Breach | -0.193 |
letters | -0.177 |
oa | -0.177 |
artisan | -0.175 |
Token |
|
Token ID | 198 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
Adds | +0.002 |
Breach | +0.002 |
oa | +0.002 |
letters | +0.002 |
Newsletter | +0.002 |
Neg logit contributions | |
intend | -0.002 |
Compton | -0.001 |
percentile | -0.001 |
totality | -0.001 |
adelphia | -0.001 |
Token | Contract |
Token ID | 45845 |
Feature activation | +3.59e-01 |
Pos logit contributions | |
intend | +0.216 |
Compton | +0.213 |
percentile | +0.210 |
totality | +0.200 |
adelphia | +0.195 |
Neg logit contributions | |
Adds | -0.247 |
Breach | -0.225 |
oa | -0.204 |
letters | -0.204 |
artisan | -0.203 |
Token | other |
Token ID | 584 |
Feature activation | -3.79e+00 |
Pos logit contributions | |
Compton | +2.286 |
intend | +2.281 |
percentile | +2.272 |
totality | +2.184 |
adelphia | +2.084 |
Neg logit contributions | |
Adds | -2.723 |
Breach | -2.378 |
artisan | -2.238 |
IER | -2.236 |
letters | -2.229 |
Token | team |
Token ID | 1074 |
Feature activation | -3.05e+00 |
Pos logit contributions | |
intend | +2.515 |
percentile | +2.494 |
Compton | +2.478 |
totality | +2.365 |
disgr | +2.261 |
Neg logit contributions | |
Adds | -2.831 |
Breach | -2.459 |
artisan | -2.307 |
IER | -2.306 |
letters | -2.301 |
Token | such |
Token ID | 884 |
Feature activation | -2.44e+00 |
Pos logit contributions | |
intend | +2.092 |
Compton | +2.045 |
percentile | +2.037 |
totality | +1.965 |
adelphia | +1.900 |
Neg logit contributions | |
Adds | -2.227 |
Breach | -1.947 |
oa | -1.797 |
artisan | -1.797 |
IER | -1.788 |
Token | as |
Token ID | 355 |
Feature activation | -2.33e+00 |
Pos logit contributions | |
intend | +1.605 |
percentile | +1.588 |
Compton | +1.581 |
totality | +1.523 |
adelphia | +1.456 |
Neg logit contributions | |
Adds | -1.851 |
Breach | -1.619 |
Newsletter | -1.526 |
oa | -1.498 |
artisan | -1.494 |
Token | sc |
Token ID | 629 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
intend | +1.562 |
Compton | +1.550 |
percentile | +1.538 |
totality | +1.476 |
adelphia | +1.425 |
Neg logit contributions | |
Adds | -1.745 |
Breach | -1.517 |
letters | -1.408 |
oa | -1.405 |
Newsletter | -1.398 |
Token | a |
Token ID | 64 |
Feature activation | -1.28e+01 |
Pos logit contributions | |
Adds | +1.460 |
Breach | +1.292 |
letters | +1.192 |
oa | +1.191 |
̶ | +1.159 |
Neg logit contributions | |
percentile | -1.532 |
intend | -1.531 |
Compton | -1.527 |
totality | -1.486 |
adelphia | -1.410 |
Token | . |
Token ID | 13 |
Feature activation | -3.74e+00 |
Pos logit contributions | |
intend | +8.171 |
percentile | +8.127 |
Compton | +7.902 |
adelphia | +7.830 |
totality | +7.404 |
Neg logit contributions | |
Adds | -8.923 |
Breach | -7.749 |
artisan | -7.607 |
Newsletter | -7.133 |
letters | -7.042 |
Token | If |
Token ID | 1002 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
intend | +2.439 |
Compton | +2.381 |
percentile | +2.366 |
totality | +2.261 |
adelphia | +2.199 |
Neg logit contributions | |
Adds | -2.842 |
Breach | -2.498 |
Newsletter | -2.309 |
oa | -2.303 |
letters | -2.295 |
Token | it |
Token ID | 340 |
Feature activation | -4.29e+00 |
Pos logit contributions | |
intend | +1.590 |
Compton | +1.586 |
percentile | +1.578 |
totality | +1.518 |
adelphia | +1.443 |
Neg logit contributions | |
Adds | -1.857 |
Breach | -1.640 |
letters | -1.518 |
Newsletter | -1.511 |
oa | -1.509 |
Token | worked |
Token ID | 3111 |
Feature activation | +3.79e+00 |
Pos logit contributions | |
Compton | +1.931 |
percentile | +1.913 |
intend | +1.888 |
totality | +1.769 |
disgr | +1.636 |
Neg logit contributions | |
Adds | -4.161 |
Breach | -3.800 |
letters | -3.568 |
Newsletter | -3.547 |
IER | -3.534 |
Token | out |
Token ID | 503 |
Feature activation | +1.77e+00 |
Pos logit contributions | |
Adds | +2.873 |
Breach | +2.585 |
oa | +2.405 |
letters | +2.333 |
̶ | +2.324 |
Neg logit contributions | |
intend | -2.428 |
Compton | -2.388 |
percentile | -2.318 |
totality | -2.276 |
adelphia | -2.256 |
Token | iment |
Token ID | 3681 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
intend | +0.157 |
Compton | +0.154 |
percentile | +0.154 |
totality | +0.146 |
adelphia | +0.141 |
Neg logit contributions | |
Adds | -0.213 |
Breach | -0.191 |
letters | -0.176 |
Newsletter | -0.176 |
oa | -0.176 |
Token | is |
Token ID | 318 |
Feature activation | -7.72e-01 |
Pos logit contributions | |
intend | +0.994 |
Compton | +0.988 |
percentile | +0.985 |
totality | +0.947 |
adelphia | +0.902 |
Neg logit contributions | |
Adds | -1.107 |
Breach | -0.984 |
oa | -0.903 |
letters | -0.900 |
artisan | -0.892 |
Token | fragmented |
Token ID | 41630 |
Feature activation | -2.43e+00 |
Pos logit contributions | |
intend | +0.501 |
Compton | +0.497 |
percentile | +0.495 |
totality | +0.475 |
adelphia | +0.454 |
Neg logit contributions | |
Adds | -0.592 |
Breach | -0.527 |
oa | -0.486 |
letters | -0.485 |
artisan | -0.479 |
Token | , |
Token ID | 11 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
Compton | +1.536 |
percentile | +1.534 |
intend | +1.533 |
totality | +1.476 |
adelphia | +1.387 |
Neg logit contributions | |
Adds | -1.883 |
Breach | -1.678 |
letters | -1.551 |
oa | -1.546 |
artisan | -1.534 |
Token | st |
Token ID | 336 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
Compton | +0.912 |
intend | +0.910 |
percentile | +0.906 |
totality | +0.868 |
adelphia | +0.824 |
Neg logit contributions | |
Adds | -1.089 |
Breach | -0.970 |
oa | -0.897 |
letters | -0.892 |
IER | -0.885 |
Token | acc |
Token ID | 4134 |
Feature activation | -1.26e+01 |
Pos logit contributions | |
Adds | +1.454 |
Breach | +1.266 |
oa | +1.159 |
letters | +1.151 |
̶ | +1.135 |
Neg logit contributions | |
intend | -1.666 |
Compton | -1.648 |
percentile | -1.648 |
totality | -1.599 |
adelphia | -1.526 |
Token | ato |
Token ID | 5549 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
percentile | +6.638 |
Compton | +6.621 |
intend | +6.466 |
laim | +6.289 |
totality | +6.116 |
Neg logit contributions | |
Adds | -9.437 |
Breach | -8.698 |
letters | -8.249 |
Newsletter | -8.198 |
装 | -7.962 |
Token | chords |
Token ID | 34211 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
Adds | +0.937 |
Breach | +0.830 |
oa | +0.762 |
letters | +0.759 |
̶ | +0.749 |
Neg logit contributions | |
intend | -0.866 |
Compton | -0.855 |
percentile | -0.853 |
totality | -0.819 |
adelphia | -0.788 |
Token | in |
Token ID | 287 |
Feature activation | -4.27e-01 |
Pos logit contributions | |
intend | +0.192 |
Compton | +0.190 |
percentile | +0.190 |
totality | +0.182 |
adelphia | +0.175 |
Neg logit contributions | |
Adds | -0.213 |
Breach | -0.188 |
oa | -0.173 |
letters | -0.173 |
IER | -0.170 |
Token | unpredictable |
Token ID | 22900 |
Feature activation | -3.89e+00 |
Pos logit contributions | |
intend | +0.285 |
Compton | +0.284 |
percentile | +0.282 |
totality | +0.272 |
adelphia | +0.259 |
Neg logit contributions | |
Adds | -0.320 |
Breach | -0.284 |
oa | -0.261 |
letters | -0.260 |
IER | -0.257 |
Token | places |
Token ID | 4113 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
percentile | +2.597 |
Compton | +2.588 |
intend | +2.539 |
totality | +2.516 |
indication | +2.335 |
Neg logit contributions | |
Adds | -2.904 |
Breach | -2.573 |
artisan | -2.384 |
oa | -2.371 |
̶ | -2.342 |
Token | | |
Token ID | 930 |
Feature activation | +1.66e+00 |
Pos logit contributions | |
percentile | +2.179 |
intend | +2.175 |
Compton | +2.173 |
totality | +2.078 |
adelphia | +1.998 |
Neg logit contributions | |
Adds | -1.885 |
Breach | -1.656 |
oa | -1.489 |
letters | -1.483 |
artisan | -1.479 |
Token | ISI |
Token ID | 22048 |
Feature activation | -5.14e+00 |
Pos logit contributions | |
Adds | +1.170 |
Breach | +1.030 |
oa | +0.937 |
letters | +0.930 |
Newsletter | +0.923 |
Neg logit contributions | |
intend | -1.196 |
Compton | -1.167 |
percentile | -1.158 |
totality | -1.137 |
adelphia | -1.104 |
Token |
|
Token ID | 198 |
Feature activation | +7.44e-01 |
Pos logit contributions | |
Compton | +2.679 |
intend | +2.653 |
percentile | +2.636 |
totality | +2.380 |
adelphia | +2.303 |
Neg logit contributions | |
Adds | -4.492 |
Breach | -4.089 |
artisan | -3.868 |
oa | -3.838 |
IER | -3.800 |
Token |
|
Token ID | 198 |
Feature activation | +9.37e-03 |
Pos logit contributions | |
Adds | +0.584 |
Breach | +0.518 |
letters | +0.480 |
oa | +0.478 |
Newsletter | +0.472 |
Neg logit contributions | |
intend | -0.475 |
percentile | -0.464 |
Compton | -0.463 |
totality | -0.455 |
adelphia | -0.433 |
Token | Sh |
Token ID | 2484 |
Feature activation | -2.65e+00 |
Pos logit contributions | |
Adds | +0.007 |
Breach | +0.006 |
oa | +0.006 |
letters | +0.006 |
̶ | +0.006 |
Neg logit contributions | |
intend | -0.006 |
Compton | -0.006 |
percentile | -0.006 |
totality | -0.006 |
adelphia | -0.006 |
Token | ak |
Token ID | 461 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
intend | +1.876 |
percentile | +1.821 |
Compton | +1.819 |
adelphia | +1.705 |
totality | +1.698 |
Neg logit contributions | |
Adds | -1.912 |
Breach | -1.678 |
IER | -1.515 |
Newsletter | -1.514 |
letters | -1.498 |
Token | oor |
Token ID | 2675 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
intend | +8.756 |
Compton | +8.467 |
percentile | +8.390 |
lé | +8.059 |
adelphia | +7.924 |
Neg logit contributions | |
Adds | -8.260 |
Breach | -7.217 |
̶ | -6.572 |
Newsletter | -6.542 |
arrivals | -6.423 |
Token | , |
Token ID | 11 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
intend | +1.872 |
Compton | +1.847 |
percentile | +1.816 |
totality | +1.729 |
lé | +1.691 |
Neg logit contributions | |
Adds | -2.055 |
Breach | -1.805 |
̶ | -1.666 |
letters | -1.657 |
Newsletter | -1.649 |
Token | S |
Token ID | 311 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Compton | +1.763 |
percentile | +1.731 |
intend | +1.729 |
totality | +1.635 |
adelphia | +1.564 |
Neg logit contributions | |
Adds | -2.049 |
Breach | -1.795 |
artisan | -1.685 |
letters | -1.674 |
oa | -1.673 |
Token | ., |
Token ID | 1539 |
Feature activation | -9.41e-01 |
Pos logit contributions | |
intend | +0.680 |
Compton | +0.671 |
percentile | +0.668 |
totality | +0.633 |
adelphia | +0.613 |
Neg logit contributions | |
Adds | -0.962 |
Breach | -0.867 |
letters | -0.799 |
oa | -0.795 |
artisan | -0.789 |
Token | J |
Token ID | 449 |
Feature activation | -3.78e+00 |
Pos logit contributions | |
Compton | +0.647 |
intend | +0.644 |
percentile | +0.635 |
totality | +0.607 |
adelphia | +0.585 |
Neg logit contributions | |
Adds | -0.690 |
Breach | -0.602 |
oa | -0.557 |
letters | -0.557 |
artisan | -0.554 |
Token | � |
Token ID | 126 |
Feature activation | +3.99e+00 |
Pos logit contributions | |
intend | +0.111 |
Compton | +0.110 |
percentile | +0.109 |
totality | +0.105 |
adelphia | +0.101 |
Neg logit contributions | |
Adds | -0.125 |
Breach | -0.111 |
oa | -0.102 |
letters | -0.102 |
IER | -0.100 |
Token | � |
Token ID | 222 |
Feature activation | +2.64e+00 |
Pos logit contributions | |
Adds | +2.977 |
Breach | +2.650 |
̶ | +2.439 |
letters | +2.426 |
oa | +2.417 |
Neg logit contributions | |
intend | -2.646 |
Compton | -2.621 |
percentile | -2.615 |
totality | -2.506 |
adelphia | -2.404 |
Token | � |
Token ID | 126 |
Feature activation | +4.56e+00 |
Pos logit contributions | |
Adds | +1.977 |
Breach | +1.764 |
oa | +1.626 |
letters | +1.614 |
̶ | +1.606 |
Neg logit contributions | |
intend | -1.756 |
Compton | -1.735 |
percentile | -1.733 |
totality | -1.663 |
adelphia | -1.601 |
Token | � |
Token ID | 242 |
Feature activation | +2.25e+00 |
Pos logit contributions | |
Adds | +2.926 |
Breach | +2.554 |
oa | +2.314 |
letters | +2.311 |
̶ | +2.299 |
Neg logit contributions | |
intend | -3.481 |
Compton | -3.464 |
percentile | -3.453 |
totality | -3.329 |
adelphia | -3.225 |
Token | Richie |
Token ID | 49209 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Adds | +1.679 |
Breach | +1.496 |
oa | +1.380 |
letters | +1.370 |
̶ | +1.361 |
Neg logit contributions | |
intend | -1.504 |
Compton | -1.485 |
percentile | -1.484 |
totality | -1.424 |
adelphia | -1.372 |
Token | Inc |
Token ID | 3457 |
Feature activation | -1.24e+01 |
Pos logit contributions | |
intend | +0.908 |
Compton | +0.900 |
percentile | +0.884 |
totality | +0.841 |
adelphia | +0.823 |
Neg logit contributions | |
Adds | -1.157 |
Breach | -1.019 |
letters | -0.951 |
oa | -0.943 |
artisan | -0.940 |
Token | ogn |
Token ID | 2360 |
Feature activation | +9.81e-01 |
Pos logit contributions | |
intend | +3.843 |
Compton | +3.692 |
percentile | +3.603 |
totality | +3.310 |
lé | +3.031 |
Neg logit contributions | |
Adds | -12.669 |
Breach | -11.553 |
Newsletter | -11.000 |
artisan | -10.970 |
IER | -10.869 |
Token | ito |
Token ID | 10094 |
Feature activation | +7.97e-01 |
Pos logit contributions | |
Adds | +0.719 |
Breach | +0.635 |
letters | +0.580 |
Newsletter | +0.573 |
̶ | +0.572 |
Neg logit contributions | |
intend | -0.679 |
Compton | -0.667 |
percentile | -0.667 |
totality | -0.637 |
adelphia | -0.617 |
Token | (@ |
Token ID | 4275 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
Adds | +0.591 |
Breach | +0.524 |
oa | +0.482 |
letters | +0.480 |
IER | +0.473 |
Neg logit contributions | |
intend | -0.539 |
Compton | -0.532 |
percentile | -0.530 |
totality | -0.509 |
adelphia | -0.490 |
Token | 68 |
Token ID | 3104 |
Feature activation | +8.80e-01 |
Pos logit contributions | |
intend | +1.214 |
Compton | +1.178 |
percentile | +1.169 |
totality | +1.115 |
adelphia | +1.095 |
Neg logit contributions | |
Adds | -1.298 |
Breach | -1.165 |
letters | -1.049 |
oa | -1.042 |
̶ | -1.039 |
Token | INC |
Token ID | 30158 |
Feature activation | -7.97e+00 |
Pos logit contributions | |
Adds | +0.648 |
Breach | +0.575 |
oa | +0.527 |
letters | +0.525 |
̶ | +0.518 |
Neg logit contributions | |
intend | -0.599 |
Compton | -0.591 |
percentile | -0.590 |
totality | -0.566 |
adelphia | -0.545 |
Token | Star |
Token ID | 2907 |
Feature activation | -4.16e+00 |
Pos logit contributions | |
intend | +1.056 |
percentile | +1.048 |
Compton | +1.048 |
totality | +0.999 |
adelphia | +0.955 |
Neg logit contributions | |
Adds | -1.268 |
Breach | -1.127 |
oa | -1.043 |
letters | -1.039 |
artisan | -1.031 |
Token | Trek |
Token ID | 12338 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
intend | +1.803 |
Compton | +1.764 |
percentile | +1.757 |
totality | +1.643 |
adelphia | +1.547 |
Neg logit contributions | |
Adds | -4.042 |
Breach | -3.643 |
oa | -3.487 |
artisan | -3.452 |
IER | -3.443 |
Token |
|
Token ID | 198 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
percentile | +1.595 |
intend | +1.580 |
Compton | +1.579 |
totality | +1.506 |
adelphia | +1.430 |
Neg logit contributions | |
Adds | -1.930 |
Breach | -1.721 |
oa | -1.608 |
artisan | -1.591 |
IER | -1.590 |
Token |
|
Token ID | 198 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
Adds | +0.098 |
Breach | +0.087 |
letters | +0.081 |
oa | +0.081 |
Newsletter | +0.080 |
Neg logit contributions | |
intend | -0.076 |
Compton | -0.075 |
percentile | -0.074 |
totality | -0.072 |
adelphia | -0.069 |
Token | The |
Token ID | 464 |
Feature activation | -1.77e+00 |
Pos logit contributions | |
intend | +0.203 |
Compton | +0.200 |
percentile | +0.199 |
totality | +0.190 |
adelphia | +0.183 |
Neg logit contributions | |
Adds | -0.253 |
Breach | -0.228 |
oa | -0.210 |
letters | -0.209 |
IER | -0.207 |
Token | Next |
Token ID | 7406 |
Feature activation | -1.23e+01 |
Pos logit contributions | |
intend | +1.161 |
Compton | +1.161 |
percentile | +1.158 |
totality | +1.112 |
adelphia | +1.058 |
Neg logit contributions | |
Adds | -1.344 |
Breach | -1.176 |
oa | -1.096 |
letters | -1.091 |
IER | -1.081 |
Token | Generation |
Token ID | 16588 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
percentile | +5.132 |
Compton | +4.937 |
intend | +4.734 |
adelphia | +4.456 |
totality | +4.437 |
Neg logit contributions | |
Adds | -11.816 |
artisan | -10.069 |
Breach | -10.021 |
letters | -9.895 |
IER | -9.787 |
Token |
|
Token ID | 198 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
percentile | +2.944 |
Compton | +2.929 |
intend | +2.862 |
totality | +2.775 |
adelphia | +2.589 |
Neg logit contributions | |
Adds | -3.985 |
Breach | -3.512 |
artisan | -3.342 |
IER | -3.340 |
oa | -3.320 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Adds | +0.085 |
Breach | +0.076 |
letters | +0.070 |
oa | +0.070 |
Newsletter | +0.069 |
Neg logit contributions | |
intend | -0.066 |
Compton | -0.065 |
percentile | -0.065 |
totality | -0.063 |
adelphia | -0.060 |
Token | Please |
Token ID | 5492 |
Feature activation | +9.91e-01 |
Pos logit contributions | |
intend | +1.081 |
Compton | +1.061 |
percentile | +1.050 |
totality | +1.001 |
adelphia | +0.969 |
Neg logit contributions | |
Adds | -1.345 |
Breach | -1.218 |
oa | -1.122 |
artisan | -1.109 |
letters | -1.107 |
Token | enter |
Token ID | 3802 |
Feature activation | -2.99e+00 |
Pos logit contributions | |
Adds | +0.774 |
Breach | +0.692 |
oa | +0.636 |
letters | +0.634 |
̶ | +0.627 |
Neg logit contributions | |
intend | -0.633 |
Compton | -0.622 |
percentile | -0.618 |
totality | -0.595 |
adelphia | -0.573 |
Token | looked |
Token ID | 3114 |
Feature activation | +3.13e+00 |
Pos logit contributions | |
Adds | +2.219 |
Breach | +1.966 |
oa | +1.810 |
letters | +1.792 |
̶ | +1.781 |
Neg logit contributions | |
intend | -2.181 |
percentile | -2.141 |
Compton | -2.127 |
totality | -2.060 |
adelphia | -1.999 |
Token | like |
Token ID | 588 |
Feature activation | -2.75e+00 |
Pos logit contributions | |
Adds | +2.121 |
Breach | +1.865 |
oa | +1.710 |
̶ | +1.694 |
letters | +1.687 |
Neg logit contributions | |
intend | -2.292 |
Compton | -2.245 |
percentile | -2.242 |
totality | -2.165 |
adelphia | -2.123 |
Token | he |
Token ID | 339 |
Feature activation | +7.54e-01 |
Pos logit contributions | |
Compton | +1.925 |
intend | +1.903 |
percentile | +1.897 |
totality | +1.828 |
adelphia | +1.737 |
Neg logit contributions | |
Adds | -1.996 |
Breach | -1.726 |
oa | -1.587 |
letters | -1.580 |
artisan | -1.567 |
Token | was |
Token ID | 373 |
Feature activation | +9.81e-01 |
Pos logit contributions | |
Adds | +0.550 |
Breach | +0.486 |
oa | +0.449 |
letters | +0.445 |
̶ | +0.441 |
Neg logit contributions | |
intend | -0.518 |
Compton | -0.512 |
percentile | -0.510 |
totality | -0.492 |
adelphia | -0.473 |
Token | Will |
Token ID | 2561 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
Adds | +0.736 |
Breach | +0.655 |
oa | +0.604 |
letters | +0.600 |
̶ | +0.593 |
Neg logit contributions | |
intend | -0.653 |
Compton | -0.643 |
percentile | -0.642 |
totality | -0.616 |
adelphia | -0.593 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
Adds | +1.225 |
Breach | +1.075 |
oa | +0.981 |
letters | +0.974 |
̶ | +0.961 |
Neg logit contributions | |
intend | -1.330 |
percentile | -1.312 |
Compton | -1.309 |
totality | -1.265 |
adelphia | -1.221 |
Token | atter |
Token ID | 1436 |
Feature activation | -9.96e+00 |
Pos logit contributions | |
intend | +8.352 |
percentile | +7.988 |
Compton | +7.879 |
laim | +7.747 |
lé | +7.561 |
Neg logit contributions | |
Adds | -8.415 |
Breach | -7.175 |
arrivals | -6.698 |
IER | -6.559 |
Newsletter | -6.503 |
Token | gone |
Token ID | 3750 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
Compton | +5.910 |
intend | +5.816 |
percentile | +5.759 |
lé | +5.390 |
totality | +5.321 |
Neg logit contributions | |
Adds | -7.834 |
Breach | -6.857 |
Newsletter | -6.466 |
IER | -6.296 |
oa | -6.202 |
Token | through |
Token ID | 832 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
Adds | +0.807 |
Breach | +0.713 |
oa | +0.653 |
letters | +0.652 |
Newsletter | +0.643 |
Neg logit contributions | |
intend | -0.771 |
Compton | -0.762 |
percentile | -0.759 |
totality | -0.730 |
adelphia | -0.703 |
Token | the |
Token ID | 262 |
Feature activation | +7.84e-02 |
Pos logit contributions | |
Compton | +1.458 |
percentile | +1.410 |
intend | +1.393 |
totality | +1.373 |
adelphia | +1.291 |
Neg logit contributions | |
Adds | -1.690 |
Breach | -1.473 |
Newsletter | -1.370 |
letters | -1.368 |
oa | -1.363 |
Token | washing |
Token ID | 20518 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
Adds | +0.060 |
Breach | +0.053 |
oa | +0.049 |
letters | +0.049 |
IER | +0.048 |
Neg logit contributions | |
intend | -0.052 |
Compton | -0.051 |
percentile | -0.051 |
totality | -0.049 |
adelphia | -0.047 |
Token | was |
Token ID | 373 |
Feature activation | -6.26e+00 |
Pos logit contributions | |
Adds | +1.076 |
Breach | +0.947 |
oa | +0.866 |
letters | +0.861 |
̶ | +0.850 |
Neg logit contributions | |
intend | -1.107 |
Compton | -1.094 |
percentile | -1.091 |
totality | -1.050 |
adelphia | -1.013 |
Token | a |
Token ID | 257 |
Feature activation | -4.13e+00 |
Pos logit contributions | |
Compton | +3.846 |
percentile | +3.795 |
totality | +3.778 |
intend | +3.742 |
indication | +3.567 |
Neg logit contributions | |
Adds | -4.860 |
Breach | -4.240 |
letters | -4.001 |
artisan | -3.995 |
IER | -3.982 |
Token | lot |
Token ID | 1256 |
Feature activation | -9.55e+00 |
Pos logit contributions | |
percentile | +2.662 |
Compton | +2.662 |
intend | +2.637 |
totality | +2.582 |
disgr | +2.406 |
Neg logit contributions | |
Adds | -3.143 |
Breach | -2.721 |
letters | -2.608 |
Newsletter | -2.567 |
oa | -2.559 |
Token | of |
Token ID | 286 |
Feature activation | -8.79e+00 |
Pos logit contributions | |
Compton | +4.873 |
percentile | +4.835 |
intend | +4.688 |
totality | +4.646 |
indication | +4.486 |
Neg logit contributions | |
Adds | -8.005 |
Breach | -7.144 |
artisan | -6.815 |
Newsletter | -6.793 |
̶ | -6.695 |
Token | back |
Token ID | 736 |
Feature activation | -9.66e-01 |
Pos logit contributions | |
Compton | +5.328 |
totality | +5.271 |
percentile | +5.200 |
indication | +5.028 |
intend | +5.004 |
Neg logit contributions | |
Adds | -6.744 |
Breach | -5.865 |
IER | -5.661 |
Newsletter | -5.657 |
̶ | -5.618 |
Token | and |
Token ID | 290 |
Feature activation | -1.22e+01 |
Pos logit contributions | |
intend | +0.621 |
Compton | +0.617 |
percentile | +0.613 |
totality | +0.587 |
adelphia | +0.562 |
Neg logit contributions | |
Adds | -0.747 |
Breach | -0.664 |
oa | -0.608 |
letters | -0.607 |
̶ | -0.605 |
Token | forth |
Token ID | 6071 |
Feature activation | -1.08e+01 |
Pos logit contributions | |
percentile | +3.490 |
Compton | +3.446 |
intend | +3.162 |
totality | +3.120 |
background | +3.021 |
Neg logit contributions | |
Adds | -12.372 |
artisan | -11.475 |
Breach | -11.373 |
IER | -11.209 |
letters | -11.100 |
Token | , |
Token ID | 11 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
percentile | +5.814 |
Compton | +5.740 |
intend | +5.651 |
totality | +5.574 |
indication | +5.379 |
Neg logit contributions | |
Adds | -8.570 |
Breach | -7.582 |
artisan | -7.287 |
IER | -7.285 |
Newsletter | -7.001 |
Token | but |
Token ID | 475 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
Compton | +1.750 |
percentile | +1.747 |
intend | +1.731 |
totality | +1.675 |
indication | +1.564 |
Neg logit contributions | |
Adds | -2.291 |
Breach | -2.032 |
IER | -1.888 |
oa | -1.884 |
artisan | -1.883 |
Token | eventually |
Token ID | 4191 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Compton | +0.726 |
intend | +0.725 |
percentile | +0.722 |
totality | +0.700 |
adelphia | +0.660 |
Neg logit contributions | |
Adds | -0.804 |
Breach | -0.707 |
letters | -0.653 |
oa | -0.651 |
artisan | -0.646 |
Token | she |
Token ID | 673 |
Feature activation | +9.79e-02 |
Pos logit contributions | |
Adds | +0.137 |
Breach | +0.121 |
letters | +0.111 |
oa | +0.111 |
artisan | +0.109 |
Neg logit contributions | |
intend | -0.129 |
Compton | -0.128 |
percentile | -0.127 |
totality | -0.123 |
adelphia | -0.118 |
Token | I |
Token ID | 314 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
Compton | +1.630 |
intend | +1.620 |
percentile | +1.609 |
totality | +1.559 |
adelphia | +1.484 |
Neg logit contributions | |
Adds | -1.867 |
Breach | -1.640 |
artisan | -1.527 |
oa | -1.515 |
letters | -1.512 |
Token | was |
Token ID | 373 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
intend | +1.406 |
Compton | +1.389 |
percentile | +1.386 |
totality | +1.323 |
adelphia | +1.267 |
Neg logit contributions | |
Adds | -1.672 |
Breach | -1.485 |
letters | -1.370 |
oa | -1.365 |
artisan | -1.358 |
Token | h |
Token ID | 289 |
Feature activation | +2.78e+00 |
Pos logit contributions | |
Compton | +2.350 |
intend | +2.339 |
percentile | +2.324 |
totality | +2.247 |
disgr | +2.149 |
Neg logit contributions | |
Adds | -2.424 |
Breach | -2.135 |
artisan | -1.952 |
letters | -1.943 |
oa | -1.938 |
Token | uff |
Token ID | 1648 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
Adds | +2.503 |
Breach | +2.259 |
oa | +2.149 |
̶ | +2.133 |
letters | +2.124 |
Neg logit contributions | |
intend | -1.414 |
percentile | -1.401 |
Compton | -1.382 |
totality | -1.341 |
adelphia | -1.239 |
Token | ing |
Token ID | 278 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
intend | +0.751 |
Compton | +0.744 |
percentile | +0.726 |
totality | +0.644 |
lé | +0.599 |
Neg logit contributions | |
Adds | -2.730 |
Breach | -2.520 |
oa | -2.372 |
letters | -2.357 |
Newsletter | -2.356 |
Token | and |
Token ID | 290 |
Feature activation | -1.20e+01 |
Pos logit contributions | |
Adds | +0.097 |
Breach | +0.086 |
oa | +0.079 |
letters | +0.078 |
artisan | +0.078 |
Neg logit contributions | |
Compton | -0.082 |
intend | -0.081 |
percentile | -0.081 |
totality | -0.077 |
adelphia | -0.074 |
Token | puff |
Token ID | 33679 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
percentile | +2.831 |
Compton | +2.696 |
intend | +2.658 |
totality | +2.347 |
disgr | +2.340 |
Neg logit contributions | |
Adds | -13.288 |
Breach | -12.351 |
artisan | -11.701 |
IER | -11.615 |
装 | -11.547 |
Token | ing |
Token ID | 278 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
intend | +0.867 |
Compton | +0.855 |
percentile | +0.853 |
totality | +0.741 |
lé | +0.689 |
Neg logit contributions | |
Adds | -3.222 |
Breach | -2.973 |
oa | -2.782 |
letters | -2.768 |
artisan | -2.759 |
Token | and |
Token ID | 290 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
intend | +0.430 |
Compton | +0.429 |
percentile | +0.429 |
totality | +0.409 |
adelphia | +0.389 |
Neg logit contributions | |
Adds | -0.495 |
Breach | -0.439 |
oa | -0.403 |
letters | -0.402 |
artisan | -0.398 |
Token | crying |
Token ID | 13774 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
Compton | +2.998 |
percentile | +2.945 |
intend | +2.931 |
totality | +2.842 |
disgr | +2.701 |
Neg logit contributions | |
Adds | -3.367 |
Breach | -2.949 |
artisan | -2.737 |
letters | -2.701 |
IER | -2.695 |
Token | and |
Token ID | 290 |
Feature activation | -2.87e+00 |
Pos logit contributions | |
Adds | +0.397 |
Breach | +0.352 |
oa | +0.323 |
letters | +0.322 |
artisan | +0.318 |
Neg logit contributions | |
intend | -0.356 |
Compton | -0.353 |
percentile | -0.352 |
totality | -0.338 |
adelphia | -0.323 |
Token | it |
Token ID | 340 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
Adds | +0.438 |
Breach | +0.390 |
oa | +0.360 |
letters | +0.359 |
̶ | +0.354 |
Neg logit contributions | |
intend | -0.364 |
Compton | -0.359 |
percentile | -0.358 |
totality | -0.343 |
adelphia | -0.329 |
Token | 's |
Token ID | 338 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
Adds | +0.394 |
Breach | +0.344 |
oa | +0.315 |
letters | +0.312 |
̶ | +0.308 |
Neg logit contributions | |
intend | -0.428 |
Compton | -0.422 |
percentile | -0.421 |
totality | -0.406 |
adelphia | -0.392 |
Token | actually |
Token ID | 1682 |
Feature activation | -7.99e-01 |
Pos logit contributions | |
Adds | +0.144 |
Breach | +0.127 |
oa | +0.117 |
letters | +0.117 |
Newsletter | +0.115 |
Neg logit contributions | |
intend | -0.138 |
Compton | -0.137 |
percentile | -0.137 |
totality | -0.132 |
adelphia | -0.126 |
Token | pop |
Token ID | 1461 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
intend | +0.545 |
percentile | +0.543 |
Compton | +0.543 |
totality | +0.522 |
adelphia | +0.495 |
Neg logit contributions | |
Adds | -0.584 |
Breach | -0.516 |
letters | -0.474 |
oa | -0.473 |
artisan | -0.469 |
Token | / |
Token ID | 14 |
Feature activation | -5.15e+00 |
Pos logit contributions | |
intend | +1.079 |
Compton | +1.068 |
percentile | +1.066 |
totality | +1.013 |
adelphia | +0.959 |
Neg logit contributions | |
Adds | -1.662 |
Breach | -1.516 |
letters | -1.397 |
oa | -1.395 |
artisan | -1.387 |
Token | pop |
Token ID | 12924 |
Feature activation | -1.18e+01 |
Pos logit contributions | |
intend | +2.778 |
percentile | +2.611 |
Compton | +2.593 |
totality | +2.414 |
lé | +2.398 |
Neg logit contributions | |
Adds | -4.432 |
Breach | -4.126 |
IER | -3.798 |
Newsletter | -3.743 |
̶ | -3.731 |
Token | / |
Token ID | 14 |
Feature activation | -4.47e+00 |
Pos logit contributions | |
percentile | +5.467 |
intend | +5.228 |
Compton | +5.123 |
totality | +5.051 |
indication | +4.843 |
Neg logit contributions | |
Adds | -9.906 |
Breach | -9.338 |
artisan | -8.594 |
Newsletter | -8.529 |
letters | -8.511 |
Token | pop |
Token ID | 12924 |
Feature activation | -1.07e+01 |
Pos logit contributions | |
intend | +2.277 |
Compton | +2.150 |
percentile | +2.145 |
totality | +2.012 |
lé | +1.941 |
Neg logit contributions | |
Adds | -4.000 |
Breach | -3.696 |
IER | -3.389 |
̶ | -3.370 |
Newsletter | -3.357 |
Token | / |
Token ID | 14 |
Feature activation | -4.36e+00 |
Pos logit contributions | |
percentile | +5.701 |
intend | +5.654 |
Compton | +5.481 |
totality | +5.368 |
indication | +5.127 |
Neg logit contributions | |
Adds | -8.428 |
Breach | -7.894 |
artisan | -7.204 |
letters | -7.106 |
Newsletter | -7.048 |
Token | ret |
Token ID | 1186 |
Feature activation | -3.08e+00 |
Pos logit contributions | |
intend | +2.310 |
percentile | +2.196 |
Compton | +2.193 |
totality | +2.067 |
lé | +1.978 |
Neg logit contributions | |
Adds | -3.816 |
Breach | -3.521 |
IER | -3.218 |
̶ | -3.209 |
letters | -3.195 |
Token | , |
Token ID | 837 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
intend | +1.877 |
percentile | +1.865 |
Compton | +1.862 |
totality | +1.785 |
adelphia | +1.685 |
Neg logit contributions | |
Adds | -2.435 |
Breach | -2.210 |
letters | -2.021 |
artisan | -2.020 |
oa | -2.016 |
Token | ils |
Token ID | 4487 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
intend | +1.315 |
Compton | +1.302 |
percentile | +1.287 |
totality | +1.229 |
adelphia | +1.204 |
Neg logit contributions | |
Adds | -1.365 |
Breach | -1.203 |
letters | -1.097 |
oa | -1.089 |
Newsletter | -1.088 |
Token | a |
Token ID | 64 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Adds | +1.147 |
Breach | +1.027 |
oa | +0.957 |
letters | +0.939 |
Newsletter | +0.914 |
Neg logit contributions | |
percentile | -1.095 |
intend | -1.093 |
Compton | -1.082 |
totality | -1.043 |
adelphia | -1.001 |
Token | Craig |
Token ID | 13854 |
Feature activation | +7.17e-01 |
Pos logit contributions | |
Adds | +0.088 |
Breach | +0.077 |
letters | +0.071 |
oa | +0.071 |
Newsletter | +0.070 |
Neg logit contributions | |
intend | -0.078 |
Compton | -0.077 |
percentile | -0.077 |
totality | -0.074 |
adelphia | -0.071 |
Token | , |
Token ID | 11 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
Adds | +0.532 |
Breach | +0.471 |
oa | +0.432 |
letters | +0.432 |
̶ | +0.426 |
Neg logit contributions | |
intend | -0.486 |
Compton | -0.480 |
percentile | -0.478 |
totality | -0.459 |
adelphia | -0.442 |
Token | St |
Token ID | 520 |
Feature activation | -3.72e+00 |
Pos logit contributions | |
Compton | +1.167 |
intend | +1.159 |
percentile | +1.139 |
totality | +1.106 |
adelphia | +1.052 |
Neg logit contributions | |
Adds | -1.251 |
Breach | -1.096 |
letters | -1.022 |
oa | -1.014 |
artisan | -1.013 |
Token | K |
Token ID | 509 |
Feature activation | -1.16e+01 |
Pos logit contributions | |
Compton | +2.483 |
intend | +2.479 |
percentile | +2.422 |
totality | +2.328 |
adelphia | +2.269 |
Neg logit contributions | |
Adds | -2.792 |
Breach | -2.417 |
letters | -2.270 |
Newsletter | -2.253 |
IER | -2.232 |
Token | ilda |
Token ID | 27281 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
intend | +8.391 |
Compton | +8.046 |
percentile | +7.763 |
lé | +7.756 |
weak | +7.622 |
Neg logit contributions | |
Adds | -7.275 |
Breach | -6.299 |
Newsletter | -6.063 |
HCR | -5.764 |
artisan | -5.697 |
Token | and |
Token ID | 290 |
Feature activation | -3.32e+00 |
Pos logit contributions | |
Adds | +0.556 |
Breach | +0.492 |
oa | +0.452 |
letters | +0.451 |
̶ | +0.445 |
Neg logit contributions | |
intend | -0.507 |
Compton | -0.501 |
percentile | -0.499 |
totality | -0.480 |
adelphia | -0.461 |
Token | the |
Token ID | 262 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
Compton | +2.274 |
intend | +2.219 |
percentile | +2.192 |
totality | +2.140 |
adelphia | +2.009 |
Neg logit contributions | |
Adds | -2.444 |
Breach | -2.117 |
artisan | -2.000 |
letters | -2.000 |
Newsletter | -1.977 |
Token | Bass |
Token ID | 19829 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Compton | +1.480 |
intend | +1.467 |
percentile | +1.451 |
totality | +1.408 |
adelphia | +1.327 |
Neg logit contributions | |
Adds | -1.738 |
Breach | -1.522 |
letters | -1.437 |
oa | -1.433 |
artisan | -1.422 |
Token | Rock |
Token ID | 4631 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
intend | +1.253 |
Compton | +1.237 |
percentile | +1.230 |
totality | +1.185 |
adelphia | +1.137 |
Neg logit contributions | |
Adds | -1.281 |
Breach | -1.123 |
letters | -1.028 |
̶ | -1.021 |
Newsletter | -1.021 |
Token | was |
Token ID | 373 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
Adds | +0.352 |
Breach | +0.312 |
oa | +0.287 |
letters | +0.285 |
Newsletter | +0.281 |
Neg logit contributions | |
intend | -0.328 |
Compton | -0.324 |
percentile | -0.323 |
totality | -0.310 |
adelphia | -0.299 |
Token | not |
Token ID | 407 |
Feature activation | +5.52e-02 |
Pos logit contributions | |
Adds | +0.493 |
Breach | +0.437 |
oa | +0.401 |
letters | +0.400 |
̶ | +0.395 |
Neg logit contributions | |
intend | -0.453 |
Compton | -0.447 |
percentile | -0.446 |
totality | -0.428 |
adelphia | -0.412 |
Token | prone |
Token ID | 17592 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
Adds | +0.040 |
Breach | +0.035 |
oa | +0.032 |
letters | +0.032 |
̶ | +0.032 |
Neg logit contributions | |
intend | -0.038 |
Compton | -0.038 |
percentile | -0.038 |
totality | -0.036 |
adelphia | -0.035 |
Token | to |
Token ID | 284 |
Feature activation | -5.87e-01 |
Pos logit contributions | |
intend | +1.169 |
percentile | +1.152 |
Compton | +1.150 |
totality | +1.107 |
adelphia | +1.059 |
Neg logit contributions | |
Adds | -1.359 |
Breach | -1.217 |
letters | -1.115 |
oa | -1.112 |
artisan | -1.096 |
Token | divide |
Token ID | 14083 |
Feature activation | -4.57e+00 |
Pos logit contributions | |
intend | +0.386 |
percentile | +0.382 |
Compton | +0.382 |
totality | +0.367 |
adelphia | +0.349 |
Neg logit contributions | |
Adds | -0.446 |
Breach | -0.397 |
oa | -0.366 |
letters | -0.365 |
̶ | -0.361 |
Token | and |
Token ID | 290 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
intend | +2.932 |
percentile | +2.909 |
Compton | +2.889 |
totality | +2.805 |
adelphia | +2.670 |
Neg logit contributions | |
Adds | -3.500 |
Breach | -3.098 |
̶ | -2.850 |
IER | -2.838 |
oa | -2.837 |
Token | name |
Token ID | 1438 |
Feature activation | -3.83e+00 |
Pos logit contributions | |
percentile | +5.873 |
totality | +5.701 |
Compton | +5.673 |
intend | +5.502 |
disgr | +5.341 |
Neg logit contributions | |
Adds | -9.656 |
Breach | -8.701 |
Newsletter | -8.347 |
letters | -8.218 |
artisan | -8.190 |
Token | - |
Token ID | 12 |
Feature activation | +7.69e-01 |
Pos logit contributions | |
intend | +2.459 |
Compton | +2.458 |
percentile | +2.455 |
totality | +2.365 |
disgr | +2.228 |
Neg logit contributions | |
Adds | -2.922 |
Breach | -2.596 |
IER | -2.400 |
oa | -2.396 |
̶ | -2.376 |
Token | call |
Token ID | 13345 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
Adds | +0.592 |
Breach | +0.527 |
oa | +0.487 |
letters | +0.485 |
̶ | +0.478 |
Neg logit contributions | |
intend | -0.499 |
Compton | -0.493 |
percentile | -0.492 |
totality | -0.471 |
adelphia | -0.452 |
Token | in |
Token ID | 287 |
Feature activation | +2.43e+00 |
Pos logit contributions | |
Adds | +0.351 |
Breach | +0.312 |
oa | +0.287 |
letters | +0.286 |
Newsletter | +0.281 |
Neg logit contributions | |
intend | -0.320 |
Compton | -0.315 |
percentile | -0.314 |
totality | -0.300 |
adelphia | -0.291 |
Token | the |
Token ID | 262 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
Adds | +1.743 |
Breach | +1.538 |
letters | +1.410 |
oa | +1.409 |
Newsletter | +1.388 |
Neg logit contributions | |
intend | -1.700 |
percentile | -1.662 |
Compton | -1.660 |
totality | -1.584 |
adelphia | -1.556 |
Token | infeld |
Token ID | 47187 |
Feature activation | -7.51e+00 |
Pos logit contributions | |
intend | +2.128 |
Compton | +2.082 |
percentile | +2.058 |
totality | +1.874 |
adelphia | +1.859 |
Neg logit contributions | |
Adds | -4.239 |
Breach | -3.857 |
IER | -3.597 |
oa | -3.576 |
̶ | -3.563 |
Token |
|
Token ID | 198 |
Feature activation | -1.79e+00 |
Pos logit contributions | |
Compton | +3.994 |
percentile | +3.911 |
intend | +3.889 |
totality | +3.620 |
lé | +3.435 |
Neg logit contributions | |
Adds | -6.466 |
Breach | -5.797 |
̶ | -5.492 |
artisan | -5.443 |
IER | -5.371 |
Token |
|
Token ID | 198 |
Feature activation | -8.58e-01 |
Pos logit contributions | |
intend | +1.047 |
Compton | +1.033 |
percentile | +1.030 |
totality | +0.978 |
adelphia | +0.936 |
Neg logit contributions | |
Adds | -1.484 |
Breach | -1.336 |
oa | -1.240 |
letters | -1.235 |
artisan | -1.223 |
Token | 1993 |
Token ID | 24465 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
intend | +0.652 |
Compton | +0.646 |
percentile | +0.640 |
totality | +0.615 |
adelphia | +0.597 |
Neg logit contributions | |
Adds | -0.564 |
Breach | -0.496 |
oa | -0.447 |
letters | -0.442 |
̶ | -0.441 |
Token | Garry |
Token ID | 45354 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
intend | +0.680 |
Compton | +0.677 |
percentile | +0.672 |
totality | +0.643 |
adelphia | +0.616 |
Neg logit contributions | |
Adds | -0.819 |
Breach | -0.726 |
oa | -0.672 |
letters | -0.670 |
̶ | -0.664 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.14e+01 |
Pos logit contributions | |
Adds | +1.160 |
Breach | +1.040 |
oa | +0.951 |
letters | +0.946 |
Newsletter | +0.936 |
Neg logit contributions | |
intend | -1.076 |
percentile | -1.059 |
Compton | -1.048 |
totality | -1.023 |
adelphia | -0.982 |
Token | and |
Token ID | 392 |
Feature activation | -7.22e+00 |
Pos logit contributions | |
intend | +5.257 |
percentile | +4.771 |
Compton | +4.272 |
dry | +4.237 |
adelphia | +4.235 |
Neg logit contributions | |
Adds | -10.935 |
Breach | -9.922 |
arrivals | -9.423 |
IER | -9.239 |
Newsletter | -9.235 |
Token | ling |
Token ID | 1359 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
intend | +2.575 |
Compton | +2.570 |
percentile | +2.501 |
totality | +2.243 |
lé | +2.239 |
Neg logit contributions | |
Adds | -7.569 |
Breach | -6.826 |
̶ | -6.602 |
Newsletter | -6.519 |
artisan | -6.426 |
Token | 1994 |
Token ID | 9162 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
Adds | +1.465 |
Breach | +1.312 |
oa | +1.215 |
letters | +1.208 |
IER | +1.190 |
Neg logit contributions | |
intend | -1.174 |
percentile | -1.152 |
Compton | -1.146 |
totality | -1.104 |
adelphia | -1.063 |
Token | Kel |
Token ID | 15150 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
intend | +0.304 |
Compton | +0.301 |
percentile | +0.299 |
totality | +0.287 |
adelphia | +0.275 |
Neg logit contributions | |
Adds | -0.366 |
Breach | -0.325 |
oa | -0.300 |
letters | -0.299 |
̶ | -0.296 |
Token | sey |
Token ID | 4397 |
Feature activation | +3.05e+00 |
Pos logit contributions | |
Adds | +0.621 |
Breach | +0.486 |
oa | +0.409 |
letters | +0.401 |
IER | +0.383 |
Neg logit contributions | |
intend | -1.738 |
percentile | -1.725 |
Compton | -1.717 |
totality | -1.692 |
adelphia | -1.636 |
Token | � |
Token ID | 447 |
Feature activation | +3.19e+00 |
Pos logit contributions | |
Adds | +2.267 |
Breach | +2.022 |
̶ | +1.866 |
oa | +1.856 |
Newsletter | +1.829 |
Neg logit contributions | |
intend | -2.128 |
percentile | -2.103 |
Compton | -2.091 |
totality | -2.036 |
adelphia | -1.958 |
Token | � |
Token ID | 251 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
Adds | +2.669 |
Breach | +2.408 |
letters | +2.229 |
oa | +2.228 |
̶ | +2.204 |
Neg logit contributions | |
intend | -1.838 |
percentile | -1.797 |
Compton | -1.796 |
totality | -1.722 |
adelphia | -1.640 |
Token | said |
Token ID | 531 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Adds | +1.118 |
Breach | +0.985 |
oa | +0.901 |
letters | +0.895 |
̶ | +0.884 |
Neg logit contributions | |
intend | -1.144 |
percentile | -1.127 |
Compton | -1.123 |
totality | -1.084 |
adelphia | -1.048 |
Token | Ed |
Token ID | 1717 |
Feature activation | +8.93e-01 |
Pos logit contributions | |
Adds | +0.764 |
Breach | +0.676 |
oa | +0.619 |
letters | +0.617 |
̶ | +0.608 |
Neg logit contributions | |
intend | -0.732 |
Compton | -0.722 |
percentile | -0.721 |
totality | -0.693 |
adelphia | -0.668 |
Token | Sc |
Token ID | 1446 |
Feature activation | -3.45e+00 |
Pos logit contributions | |
Adds | +0.663 |
Breach | +0.588 |
oa | +0.541 |
letters | +0.539 |
̶ | +0.531 |
Neg logit contributions | |
intend | -0.604 |
Compton | -0.595 |
percentile | -0.595 |
totality | -0.571 |
adelphia | -0.549 |
Token | r |
Token ID | 81 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
intend | +2.340 |
Compton | +2.262 |
percentile | +2.245 |
totality | +2.113 |
adelphia | +2.111 |
Neg logit contributions | |
Adds | -2.585 |
Breach | -2.266 |
IER | -2.083 |
Newsletter | -2.070 |
letters | -2.064 |
Token | utch |
Token ID | 7140 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
intend | +6.223 |
percentile | +5.647 |
Compton | +5.522 |
adelphia | +5.231 |
lé | +5.179 |
Neg logit contributions | |
Adds | -9.855 |
Breach | -8.697 |
arrivals | -8.334 |
IER | -8.014 |
ン | -8.006 |
Token | ins |
Token ID | 1040 |
Feature activation | +2.13e+00 |
Pos logit contributions | |
intend | +1.742 |
Compton | +1.722 |
percentile | +1.712 |
totality | +1.629 |
adelphia | +1.574 |
Neg logit contributions | |
Adds | -1.766 |
Breach | -1.554 |
oa | -1.411 |
letters | -1.406 |
̶ | -1.404 |
Token | , |
Token ID | 11 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
Adds | +1.513 |
Breach | +1.334 |
oa | +1.227 |
letters | +1.216 |
̶ | +1.203 |
Neg logit contributions | |
intend | -1.506 |
percentile | -1.486 |
Compton | -1.483 |
totality | -1.430 |
adelphia | -1.379 |
Token | the |
Token ID | 262 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Adds | +1.169 |
Breach | +1.038 |
oa | +0.951 |
letters | +0.946 |
̶ | +0.936 |
Neg logit contributions | |
intend | -1.095 |
Compton | -1.077 |
percentile | -1.076 |
totality | -1.035 |
adelphia | -1.001 |
Token | Toledo |
Token ID | 36026 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
intend | +0.818 |
Compton | +0.812 |
percentile | +0.805 |
totality | +0.772 |
adelphia | +0.728 |
Neg logit contributions | |
Adds | -1.121 |
Breach | -1.000 |
oa | -0.932 |
letters | -0.932 |
̶ | -0.920 |
Token | --+ |
Token ID | 44785 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
Adds | +0.080 |
Breach | +0.069 |
oa | +0.062 |
letters | +0.062 |
̶ | +0.061 |
Neg logit contributions | |
intend | -0.102 |
Compton | -0.101 |
percentile | -0.101 |
totality | -0.097 |
adelphia | -0.094 |
Token | < |
Token ID | 1279 |
Feature activation | -4.95e+00 |
Pos logit contributions | |
intend | +0.670 |
Compton | +0.666 |
percentile | +0.665 |
totality | +0.640 |
adelphia | +0.617 |
Neg logit contributions | |
Adds | -0.520 |
Breach | -0.449 |
oa | -0.406 |
letters | -0.403 |
̶ | -0.398 |
Token | -- |
Token ID | 438 |
Feature activation | +1.95e-01 |
Pos logit contributions | |
intend | +3.584 |
percentile | +3.502 |
Compton | +3.496 |
totality | +3.235 |
adelphia | +3.171 |
Neg logit contributions | |
Adds | -3.344 |
Breach | -3.033 |
oa | -2.744 |
IER | -2.703 |
artisan | -2.697 |
Token | pop |
Token ID | 1461 |
Feature activation | -4.61e+00 |
Pos logit contributions | |
Adds | +0.178 |
Breach | +0.162 |
oa | +0.152 |
letters | +0.152 |
̶ | +0.150 |
Neg logit contributions | |
intend | -0.098 |
percentile | -0.097 |
Compton | -0.096 |
totality | -0.091 |
adelphia | -0.086 |
Token | / |
Token ID | 14 |
Feature activation | -3.14e+00 |
Pos logit contributions | |
intend | +2.095 |
percentile | +2.093 |
Compton | +2.072 |
totality | +1.891 |
adelphia | +1.815 |
Neg logit contributions | |
Adds | -4.312 |
Breach | -3.992 |
IER | -3.716 |
artisan | -3.713 |
oa | -3.708 |
Token | pop |
Token ID | 12924 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
intend | +1.671 |
percentile | +1.605 |
Compton | +1.601 |
totality | +1.483 |
adelphia | +1.449 |
Neg logit contributions | |
Adds | -2.769 |
Breach | -2.550 |
IER | -2.363 |
̶ | -2.340 |
Newsletter | -2.332 |
Token | / |
Token ID | 14 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
percentile | +4.002 |
intend | +3.812 |
Compton | +3.760 |
totality | +3.193 |
background | +3.133 |
Neg logit contributions | |
Adds | -10.984 |
Breach | -10.333 |
IER | -9.885 |
artisan | -9.869 |
Newsletter | -9.683 |
Token | pop |
Token ID | 12924 |
Feature activation | -8.48e+00 |
Pos logit contributions | |
intend | +2.231 |
percentile | +2.112 |
Compton | +2.105 |
totality | +1.944 |
adelphia | +1.903 |
Neg logit contributions | |
Adds | -3.628 |
Breach | -3.346 |
IER | -3.095 |
̶ | -3.074 |
Newsletter | -3.048 |
Token | / |
Token ID | 14 |
Feature activation | -2.13e+00 |
Pos logit contributions | |
percentile | +3.431 |
intend | +3.360 |
Compton | +3.253 |
totality | +2.976 |
indication | +2.771 |
Neg logit contributions | |
Adds | -8.126 |
Breach | -7.581 |
IER | -7.137 |
artisan | -7.116 |
Newsletter | -7.049 |
Token | ret |
Token ID | 1186 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
intend | +1.064 |
Compton | +1.028 |
percentile | +1.027 |
totality | +0.962 |
adelphia | +0.919 |
Neg logit contributions | |
Adds | -1.955 |
Breach | -1.786 |
oa | -1.657 |
letters | -1.654 |
IER | -1.651 |
Token | 's |
Token ID | 338 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
Adds | +0.630 |
Breach | +0.544 |
oa | +0.487 |
letters | +0.485 |
̶ | +0.478 |
Neg logit contributions | |
intend | -0.854 |
percentile | -0.846 |
Compton | -0.846 |
totality | -0.817 |
adelphia | -0.790 |
Token | center |
Token ID | 3641 |
Feature activation | +1.67e+00 |
Pos logit contributions | |
Adds | +0.568 |
Breach | +0.499 |
oa | +0.454 |
letters | +0.451 |
IER | +0.444 |
Neg logit contributions | |
intend | -0.624 |
Compton | -0.612 |
percentile | -0.612 |
totality | -0.589 |
adelphia | -0.572 |
Token | , |
Token ID | 11 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
Adds | +1.180 |
Breach | +1.040 |
oa | +0.951 |
letters | +0.948 |
IER | +0.934 |
Neg logit contributions | |
intend | -1.187 |
Compton | -1.169 |
percentile | -1.167 |
totality | -1.122 |
adelphia | -1.084 |
Token | greet |
Token ID | 12589 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
intend | +0.839 |
Compton | +0.830 |
percentile | +0.829 |
totality | +0.795 |
adelphia | +0.761 |
Neg logit contributions | |
Adds | -0.950 |
Breach | -0.840 |
oa | -0.775 |
letters | -0.774 |
̶ | -0.766 |
Token | moderator |
Token ID | 31847 |
Feature activation | +4.05e+00 |
Pos logit contributions | |
Adds | +1.034 |
Breach | +0.908 |
oa | +0.827 |
letters | +0.824 |
̶ | +0.814 |
Neg logit contributions | |
intend | -1.105 |
Compton | -1.092 |
percentile | -1.089 |
totality | -1.050 |
adelphia | -1.013 |
Token | Randy |
Token ID | 21248 |
Feature activation | +6.73e-01 |
Pos logit contributions | |
Adds | +2.850 |
Breach | +2.581 |
oa | +2.319 |
letters | +2.302 |
IER | +2.253 |
Neg logit contributions | |
intend | -2.851 |
percentile | -2.793 |
Compton | -2.722 |
totality | -2.654 |
adelphia | -2.606 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.13e+01 |
Pos logit contributions | |
Adds | +0.486 |
Breach | +0.434 |
oa | +0.395 |
letters | +0.394 |
Newsletter | +0.387 |
Neg logit contributions | |
intend | -0.468 |
percentile | -0.460 |
Compton | -0.457 |
totality | -0.444 |
adelphia | -0.427 |
Token | and |
Token ID | 392 |
Feature activation | -6.38e+00 |
Pos logit contributions | |
intend | +7.660 |
percentile | +7.235 |
adelphia | +6.886 |
Compton | +6.839 |
laim | +6.831 |
Neg logit contributions | |
Adds | -8.243 |
Breach | -7.210 |
arrivals | -6.631 |
Newsletter | -6.583 |
IER | -6.481 |
Token | obil |
Token ID | 25898 |
Feature activation | +2.04e+00 |
Pos logit contributions | |
intend | +3.441 |
Compton | +3.430 |
percentile | +3.379 |
totality | +3.189 |
lé | +3.133 |
Neg logit contributions | |
Adds | -5.518 |
Breach | -4.885 |
̶ | -4.683 |
Newsletter | -4.568 |
letters | -4.525 |
Token | , |
Token ID | 11 |
Feature activation | +2.86e+00 |
Pos logit contributions | |
Adds | +1.508 |
Breach | +1.338 |
oa | +1.235 |
letters | +1.225 |
IER | +1.210 |
Neg logit contributions | |
intend | -1.384 |
percentile | -1.362 |
Compton | -1.361 |
totality | -1.307 |
adelphia | -1.259 |
Token | right |
Token ID | 826 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
Adds | +2.012 |
Breach | +1.783 |
oa | +1.626 |
letters | +1.615 |
IER | +1.589 |
Neg logit contributions | |
intend | -2.043 |
percentile | -1.967 |
Compton | -1.953 |
totality | -1.891 |
adelphia | -1.850 |
Token | , |
Token ID | 11 |
Feature activation | +9.97e-01 |
Pos logit contributions | |
Adds | +3.514 |
Breach | +3.059 |
oa | +2.810 |
letters | +2.774 |
IER | +2.744 |
Neg logit contributions | |
intend | -3.920 |
percentile | -3.836 |
Compton | -3.825 |
totality | -3.684 |
adelphia | -3.578 |
Token | Y |
Token ID | 56 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
intend | +0.387 |
Compton | +0.386 |
percentile | +0.384 |
totality | +0.370 |
adelphia | +0.354 |
Neg logit contributions | |
Adds | -0.430 |
Breach | -0.383 |
oa | -0.350 |
letters | -0.349 |
̶ | -0.346 |
Token | BE |
Token ID | 9348 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
Adds | +1.011 |
Breach | +0.897 |
oa | +0.826 |
letters | +0.823 |
̶ | +0.812 |
Neg logit contributions | |
intend | -0.895 |
Compton | -0.883 |
percentile | -0.881 |
totality | -0.845 |
adelphia | -0.812 |
Token | AR |
Token ID | 1503 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
Adds | +0.253 |
Breach | +0.222 |
oa | +0.203 |
letters | +0.201 |
̶ | +0.198 |
Neg logit contributions | |
intend | -0.270 |
Compton | -0.267 |
percentile | -0.266 |
totality | -0.256 |
adelphia | -0.247 |
Token | and |
Token ID | 290 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
intend | +0.373 |
Compton | +0.370 |
percentile | +0.368 |
totality | +0.352 |
adelphia | +0.338 |
Neg logit contributions | |
Adds | -0.437 |
Breach | -0.385 |
oa | -0.357 |
letters | -0.355 |
Newsletter | -0.352 |
Token | F |
Token ID | 376 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Adds | +0.897 |
Breach | +0.801 |
oa | +0.739 |
letters | +0.736 |
̶ | +0.726 |
Neg logit contributions | |
intend | -0.746 |
Compton | -0.735 |
percentile | -0.733 |
totality | -0.703 |
adelphia | -0.675 |
Token | ANC |
Token ID | 20940 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
intend | +0.695 |
Compton | +0.686 |
percentile | +0.680 |
totality | +0.649 |
adelphia | +0.632 |
Neg logit contributions | |
Adds | -0.771 |
Breach | -0.691 |
letters | -0.630 |
oa | -0.624 |
Newsletter | -0.621 |
Token | Y |
Token ID | 56 |
Feature activation | -3.38e+00 |
Pos logit contributions | |
percentile | +6.483 |
Compton | +6.359 |
intend | +6.052 |
adelphia | +5.822 |
totality | +5.797 |
Neg logit contributions | |
Adds | -8.366 |
Breach | -7.434 |
oa | -7.046 |
artisan | -6.977 |
ン | -6.891 |
Token | BE |
Token ID | 9348 |
Feature activation | -2.05e+00 |
Pos logit contributions | |
Compton | +2.162 |
intend | +2.147 |
percentile | +2.137 |
totality | +2.038 |
adelphia | +1.958 |
Neg logit contributions | |
Adds | -2.608 |
Breach | -2.270 |
artisan | -2.131 |
oa | -2.123 |
letters | -2.113 |
Token | AR |
Token ID | 1503 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
Compton | +1.348 |
intend | +1.342 |
percentile | +1.333 |
totality | +1.254 |
adelphia | +1.226 |
Neg logit contributions | |
Adds | -1.538 |
Breach | -1.358 |
oa | -1.267 |
artisan | -1.256 |
letters | -1.246 |
Token | for |
Token ID | 329 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
intend | +1.015 |
Compton | +1.005 |
percentile | +1.001 |
totality | +0.958 |
adelphia | +0.919 |
Neg logit contributions | |
Adds | -1.165 |
Breach | -1.023 |
oa | -0.942 |
letters | -0.937 |
artisan | -0.935 |
Token | the |
Token ID | 262 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
Compton | +0.076 |
intend | +0.076 |
percentile | +0.076 |
totality | +0.073 |
adelphia | +0.070 |
Neg logit contributions | |
Adds | -0.082 |
Breach | -0.071 |
letters | -0.066 |
oa | -0.066 |
Newsletter | -0.066 |
Token | Ass |
Token ID | 8021 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
intend | +0.526 |
Compton | +0.518 |
percentile | +0.514 |
totality | +0.488 |
adelphia | +0.478 |
Neg logit contributions | |
Adds | -0.571 |
Breach | -0.516 |
oa | -0.469 |
letters | -0.466 |
artisan | -0.465 |
Token | ists |
Token ID | 1023 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
Adds | +0.980 |
Breach | +0.843 |
oa | +0.754 |
letters | +0.754 |
̶ | +0.748 |
Neg logit contributions | |
intend | -1.289 |
percentile | -1.273 |
Compton | -1.272 |
totality | -1.223 |
adelphia | -1.188 |
Token |
|
Token ID | 198 |
Feature activation | +7.85e-01 |
Pos logit contributions | |
intend | +0.165 |
percentile | +0.164 |
Compton | +0.164 |
totality | +0.155 |
adelphia | +0.148 |
Neg logit contributions | |
Adds | -0.242 |
Breach | -0.218 |
oa | -0.203 |
letters | -0.202 |
artisan | -0.201 |
Token |
|
Token ID | 198 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
Adds | +0.627 |
Breach | +0.558 |
oa | +0.517 |
letters | +0.517 |
̶ | +0.508 |
Neg logit contributions | |
intend | -0.491 |
Compton | -0.481 |
percentile | -0.480 |
totality | -0.468 |
adelphia | -0.445 |
Token | Matt |
Token ID | 13448 |
Feature activation | +6.69e+00 |
Pos logit contributions | |
Adds | +0.323 |
Breach | +0.288 |
oa | +0.263 |
letters | +0.262 |
artisan | +0.259 |
Neg logit contributions | |
intend | -0.299 |
Compton | -0.295 |
percentile | -0.294 |
totality | -0.280 |
adelphia | -0.272 |
Token | N |
Token ID | 399 |
Feature activation | -1.12e+01 |
Pos logit contributions | |
Adds | +4.519 |
Breach | +4.094 |
oa | +3.790 |
letters | +3.634 |
̶ | +3.623 |
Neg logit contributions | |
percentile | -4.741 |
intend | -4.734 |
totality | -4.610 |
Compton | -4.605 |
adelphia | -4.415 |
Token | isk |
Token ID | 1984 |
Feature activation | +2.91e+00 |
Pos logit contributions | |
intend | +4.583 |
percentile | +4.140 |
Compton | +3.820 |
ocl | +3.406 |
laim | +3.380 |
Neg logit contributions | |
Adds | -11.371 |
Breach | -10.197 |
Newsletter | -9.925 |
HCR | -9.852 |
神 | -9.604 |
Token | an |
Token ID | 272 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
Adds | +0.921 |
Breach | +0.682 |
oa | +0.541 |
letters | +0.526 |
̶ | +0.502 |
Neg logit contributions | |
intend | -3.191 |
percentile | -3.160 |
Compton | -3.148 |
totality | -3.088 |
adelphia | -3.020 |
Token | en |
Token ID | 268 |
Feature activation | +5.15e+00 |
Pos logit contributions | |
Adds | +1.150 |
Breach | +0.917 |
oa | +0.766 |
letters | +0.765 |
Newsletter | +0.744 |
Neg logit contributions | |
intend | -2.772 |
Compton | -2.751 |
percentile | -2.744 |
totality | -2.672 |
adelphia | -2.600 |
Token | ( |
Token ID | 357 |
Feature activation | +2.37e+00 |
Pos logit contributions | |
Adds | +3.957 |
Breach | +3.538 |
oa | +3.287 |
letters | +3.235 |
̶ | +3.235 |
Neg logit contributions | |
intend | -3.302 |
Compton | -3.219 |
percentile | -3.205 |
totality | -3.107 |
adelphia | -2.973 |
Token | 2 |
Token ID | 17 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
Adds | +1.780 |
Breach | +1.567 |
oa | +1.457 |
letters | +1.445 |
̶ | +1.426 |
Neg logit contributions | |
intend | -1.583 |
percentile | -1.572 |
Compton | -1.570 |
totality | -1.515 |
adelphia | -1.447 |
Token | the |
Token ID | 262 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
Adds | +0.117 |
Breach | +0.103 |
oa | +0.095 |
letters | +0.095 |
IER | +0.093 |
Neg logit contributions | |
intend | -0.110 |
Compton | -0.109 |
percentile | -0.109 |
totality | -0.105 |
adelphia | -0.101 |
Token | pitches |
Token ID | 22421 |
Feature activation | -2.66e+00 |
Pos logit contributions | |
Adds | +1.332 |
Breach | +1.187 |
oa | +1.092 |
letters | +1.086 |
̶ | +1.072 |
Neg logit contributions | |
intend | -1.136 |
Compton | -1.117 |
percentile | -1.115 |
totality | -1.060 |
adelphia | -1.035 |
Token | you |
Token ID | 345 |
Feature activation | -4.83e+00 |
Pos logit contributions | |
Compton | +1.792 |
intend | +1.788 |
percentile | +1.762 |
totality | +1.707 |
adelphia | +1.618 |
Neg logit contributions | |
Adds | -1.973 |
Breach | -1.732 |
artisan | -1.599 |
oa | -1.596 |
letters | -1.587 |
Token | got |
Token ID | 1392 |
Feature activation | -4.03e+00 |
Pos logit contributions | |
intend | +3.181 |
Compton | +3.092 |
percentile | +3.079 |
totality | +2.916 |
adelphia | +2.819 |
Neg logit contributions | |
Adds | -3.687 |
Breach | -3.256 |
letters | -3.020 |
artisan | -3.012 |
IER | -3.003 |
Token | a |
Token ID | 257 |
Feature activation | -6.36e+00 |
Pos logit contributions | |
intend | +2.577 |
Compton | +2.571 |
percentile | +2.549 |
totality | +2.437 |
disgr | +2.296 |
Neg logit contributions | |
Adds | -3.126 |
Breach | -2.771 |
artisan | -2.580 |
letters | -2.565 |
oa | -2.551 |
Token | hit |
Token ID | 2277 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
intend | +3.846 |
percentile | +3.767 |
Compton | +3.748 |
totality | +3.596 |
adelphia | +3.381 |
Neg logit contributions | |
Adds | -5.054 |
Breach | -4.517 |
artisan | -4.280 |
letters | -4.273 |
IER | -4.158 |
Token | on |
Token ID | 319 |
Feature activation | -6.37e+00 |
Pos logit contributions | |
intend | +6.322 |
Compton | +6.208 |
percentile | +6.172 |
totality | +5.695 |
indication | +5.637 |
Neg logit contributions | |
Adds | -8.717 |
Breach | -7.838 |
artisan | -7.322 |
Newsletter | -7.192 |
oa | -6.988 |
Token | that |
Token ID | 326 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
intend | +3.881 |
Compton | +3.827 |
percentile | +3.781 |
totality | +3.653 |
adelphia | +3.443 |
Neg logit contributions | |
Adds | -5.025 |
Breach | -4.530 |
artisan | -4.193 |
letters | -4.185 |
oa | -4.143 |
Token | you |
Token ID | 345 |
Feature activation | -3.87e+00 |
Pos logit contributions | |
intend | +1.598 |
Compton | +1.574 |
percentile | +1.553 |
totality | +1.511 |
adelphia | +1.421 |
Neg logit contributions | |
Adds | -1.902 |
Breach | -1.693 |
letters | -1.572 |
oa | -1.563 |
artisan | -1.561 |
Token | did |
Token ID | 750 |
Feature activation | -2.88e+00 |
Pos logit contributions | |
intend | +2.620 |
Compton | +2.560 |
percentile | +2.549 |
totality | +2.419 |
adelphia | +2.345 |
Neg logit contributions | |
Adds | -2.884 |
Breach | -2.549 |
letters | -2.343 |
oa | -2.326 |
artisan | -2.326 |
Token | swing |
Token ID | 9628 |
Feature activation | -2.70e+00 |
Pos logit contributions | |
intend | +1.859 |
percentile | +1.825 |
Compton | +1.820 |
totality | +1.738 |
adelphia | +1.677 |
Neg logit contributions | |
Adds | -2.230 |
Breach | -1.983 |
letters | -1.823 |
artisan | -1.817 |
oa | -1.816 |
Token | shift |
Token ID | 6482 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
Adds | +0.613 |
Breach | +0.543 |
oa | +0.502 |
letters | +0.500 |
IER | +0.494 |
Neg logit contributions | |
intend | -0.534 |
Compton | -0.529 |
percentile | -0.527 |
totality | -0.507 |
adelphia | -0.484 |
Token | in |
Token ID | 287 |
Feature activation | +2.95e-01 |
Pos logit contributions | |
percentile | +2.185 |
intend | +2.180 |
Compton | +2.154 |
totality | +2.074 |
adelphia | +1.979 |
Neg logit contributions | |
Adds | -2.669 |
Breach | -2.361 |
oa | -2.170 |
letters | -2.156 |
Newsletter | -2.130 |
Token | demand |
Token ID | 3512 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
Adds | +0.224 |
Breach | +0.199 |
oa | +0.183 |
letters | +0.183 |
̶ | +0.180 |
Neg logit contributions | |
intend | -0.194 |
Compton | -0.192 |
percentile | -0.192 |
totality | -0.184 |
adelphia | -0.176 |
Token | for |
Token ID | 329 |
Feature activation | -9.36e-01 |
Pos logit contributions | |
Adds | +0.954 |
Breach | +0.837 |
oa | +0.768 |
letters | +0.767 |
IER | +0.756 |
Neg logit contributions | |
intend | -0.968 |
Compton | -0.956 |
percentile | -0.948 |
totality | -0.914 |
adelphia | -0.887 |
Token | cleaner |
Token ID | 21723 |
Feature activation | -4.83e+00 |
Pos logit contributions | |
intend | +0.648 |
percentile | +0.646 |
Compton | +0.644 |
totality | +0.624 |
adelphia | +0.589 |
Neg logit contributions | |
Adds | -0.676 |
Breach | -0.596 |
oa | -0.545 |
letters | -0.544 |
̶ | -0.540 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e+01 |
Pos logit contributions | |
Compton | +3.275 |
percentile | +3.269 |
intend | +3.247 |
totality | +3.160 |
adelphia | +2.987 |
Neg logit contributions | |
Adds | -3.541 |
Breach | -3.104 |
letters | -2.842 |
oa | -2.833 |
IER | -2.811 |
Token | cheaper |
Token ID | 11721 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
percentile | +5.856 |
Compton | +5.719 |
totality | +5.530 |
intend | +5.379 |
disgr | +5.300 |
Neg logit contributions | |
Adds | -9.263 |
Breach | -8.371 |
Newsletter | -7.752 |
letters | -7.698 |
oa | -7.628 |
Token | energy |
Token ID | 2568 |
Feature activation | -7.06e+00 |
Pos logit contributions | |
Compton | +2.006 |
percentile | +2.003 |
intend | +1.987 |
totality | +1.936 |
adelphia | +1.825 |
Neg logit contributions | |
Adds | -2.009 |
Breach | -1.771 |
letters | -1.607 |
oa | -1.598 |
artisan | -1.596 |
Token | , |
Token ID | 11 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
percentile | +4.142 |
intend | +4.043 |
Compton | +4.034 |
totality | +3.969 |
indication | +3.693 |
Neg logit contributions | |
Adds | -5.602 |
Breach | -5.143 |
oa | -4.676 |
artisan | -4.667 |
letters | -4.641 |
Token | corporations |
Token ID | 10225 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
percentile | +1.861 |
Compton | +1.856 |
intend | +1.846 |
totality | +1.802 |
adelphia | +1.674 |
Neg logit contributions | |
Adds | -2.242 |
Breach | -1.983 |
oa | -1.841 |
letters | -1.828 |
̶ | -1.809 |
Token | that |
Token ID | 326 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
intend | +1.466 |
percentile | +1.454 |
Compton | +1.447 |
totality | +1.392 |
disgr | +1.323 |
Neg logit contributions | |
Adds | -1.635 |
Breach | -1.437 |
oa | -1.329 |
letters | -1.325 |
artisan | -1.310 |
Token | Islamist |
Token ID | 17780 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
Adds | +1.363 |
Breach | +1.213 |
oa | +1.114 |
letters | +1.104 |
IER | +1.092 |
Neg logit contributions | |
intend | -1.285 |
Compton | -1.254 |
percentile | -1.252 |
totality | -1.202 |
adelphia | -1.168 |
Token | militants |
Token ID | 13162 |
Feature activation | +6.98e-01 |
Pos logit contributions | |
Adds | +0.376 |
Breach | +0.323 |
oa | +0.291 |
letters | +0.289 |
̶ | +0.284 |
Neg logit contributions | |
intend | -0.506 |
Compton | -0.500 |
percentile | -0.499 |
totality | -0.483 |
adelphia | -0.468 |
Token | , |
Token ID | 11 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
Adds | +0.509 |
Breach | +0.451 |
oa | +0.414 |
letters | +0.410 |
̶ | +0.406 |
Neg logit contributions | |
intend | -0.481 |
Compton | -0.473 |
percentile | -0.473 |
totality | -0.454 |
adelphia | -0.439 |
Token | a |
Token ID | 257 |
Feature activation | +4.45e-01 |
Pos logit contributions | |
Adds | +0.927 |
Breach | +0.820 |
oa | +0.751 |
letters | +0.748 |
̶ | +0.738 |
Neg logit contributions | |
intend | -0.892 |
Compton | -0.880 |
percentile | -0.878 |
totality | -0.844 |
adelphia | -0.814 |
Token | Human |
Token ID | 5524 |
Feature activation | +5.87e+00 |
Pos logit contributions | |
Adds | +0.325 |
Breach | +0.287 |
oa | +0.263 |
letters | +0.262 |
̶ | +0.259 |
Neg logit contributions | |
intend | -0.307 |
Compton | -0.303 |
percentile | -0.302 |
totality | -0.291 |
adelphia | -0.280 |
Token | Rights |
Token ID | 6923 |
Feature activation | +8.12e+00 |
Pos logit contributions | |
Adds | +3.240 |
Breach | +2.823 |
oa | +2.526 |
letters | +2.447 |
̶ | +2.411 |
Neg logit contributions | |
percentile | -4.908 |
Compton | -4.902 |
intend | -4.869 |
totality | -4.799 |
adelphia | -4.623 |
Token | Watch |
Token ID | 6305 |
Feature activation | +3.30e+00 |
Pos logit contributions | |
Adds | +6.473 |
Breach | +5.929 |
letters | +5.310 |
oa | +5.252 |
IER | +5.198 |
Neg logit contributions | |
intend | -4.750 |
percentile | -4.684 |
Compton | -4.611 |
totality | -4.592 |
adelphia | -4.481 |
Token | ( |
Token ID | 357 |
Feature activation | +6.19e-01 |
Pos logit contributions | |
Adds | +2.333 |
Breach | +2.045 |
oa | +1.853 |
letters | +1.829 |
IER | +1.824 |
Neg logit contributions | |
intend | -2.356 |
percentile | -2.304 |
Compton | -2.301 |
totality | -2.248 |
adelphia | -2.162 |
Token | HR |
Token ID | 17184 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
Adds | +0.398 |
Breach | +0.357 |
oa | +0.321 |
letters | +0.315 |
artisan | +0.314 |
Neg logit contributions | |
intend | -0.469 |
Compton | -0.460 |
percentile | -0.459 |
totality | -0.441 |
adelphia | -0.428 |
Token | W |
Token ID | 54 |
Feature activation | +3.57e+00 |
Pos logit contributions | |
Adds | +0.419 |
Breach | +0.388 |
oa | +0.365 |
letters | +0.365 |
Newsletter | +0.363 |
Neg logit contributions | |
intend | -0.146 |
Compton | -0.143 |
percentile | -0.142 |
totality | -0.134 |
adelphia | -0.123 |
Token | ) |
Token ID | 8 |
Feature activation | +3.37e+00 |
Pos logit contributions | |
Adds | +2.740 |
Breach | +2.457 |
oa | +2.267 |
letters | +2.252 |
IER | +2.233 |
Neg logit contributions | |
intend | -2.293 |
percentile | -2.264 |
Compton | -2.263 |
totality | -2.185 |
adelphia | -2.113 |
Token | the |
Token ID | 262 |
Feature activation | +3.35e+00 |
Pos logit contributions | |
Adds | +1.875 |
Breach | +1.669 |
oa | +1.518 |
letters | +1.508 |
̶ | +1.500 |
Neg logit contributions | |
intend | -2.040 |
percentile | -1.985 |
Compton | -1.981 |
totality | -1.911 |
adelphia | -1.867 |
Token | Amazon |
Token ID | 6186 |
Feature activation | -2.76e+00 |
Pos logit contributions | |
Adds | +2.330 |
Breach | +2.080 |
oa | +1.889 |
letters | +1.876 |
̶ | +1.864 |
Neg logit contributions | |
intend | -2.396 |
percentile | -2.329 |
Compton | -2.329 |
totality | -2.237 |
adelphia | -2.203 |
Token | store |
Token ID | 3650 |
Feature activation | +4.21e-02 |
Pos logit contributions | |
percentile | +2.103 |
intend | +2.102 |
Compton | +2.092 |
totality | +2.003 |
adelphia | +1.932 |
Neg logit contributions | |
Adds | -1.764 |
Breach | -1.530 |
letters | -1.392 |
oa | -1.388 |
artisan | -1.383 |
Token | , |
Token ID | 11 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
Adds | +0.031 |
Breach | +0.028 |
oa | +0.026 |
letters | +0.025 |
artisan | +0.025 |
Neg logit contributions | |
intend | -0.028 |
Compton | -0.028 |
percentile | -0.028 |
totality | -0.027 |
adelphia | -0.026 |
Token | only |
Token ID | 691 |
Feature activation | +2.71e+00 |
Pos logit contributions | |
Adds | +0.116 |
Breach | +0.103 |
oa | +0.094 |
letters | +0.094 |
IER | +0.093 |
Neg logit contributions | |
intend | -0.102 |
Compton | -0.101 |
percentile | -0.101 |
totality | -0.097 |
adelphia | -0.093 |
Token | free |
Token ID | 1479 |
Feature activation | +7.57e+00 |
Pos logit contributions | |
Adds | +1.970 |
Breach | +1.747 |
oa | +1.605 |
letters | +1.594 |
̶ | +1.579 |
Neg logit contributions | |
intend | -1.882 |
Compton | -1.841 |
percentile | -1.837 |
totality | -1.765 |
adelphia | -1.708 |
Token | ! |
Token ID | 0 |
Feature activation | -3.93e-01 |
Pos logit contributions | |
Adds | +5.302 |
Breach | +4.548 |
oa | +4.281 |
letters | +4.270 |
̶ | +4.209 |
Neg logit contributions | |
intend | -5.397 |
Compton | -5.286 |
percentile | -5.229 |
totality | -5.049 |
adelphia | -4.903 |
Token |
|
Token ID | 198 |
Feature activation | +6.08e-01 |
Pos logit contributions | |
intend | +0.236 |
Compton | +0.234 |
percentile | +0.232 |
totality | +0.221 |
adelphia | +0.211 |
Neg logit contributions | |
Adds | -0.319 |
Breach | -0.286 |
oa | -0.266 |
letters | -0.265 |
artisan | -0.263 |
Token |
|
Token ID | 198 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
Adds | +0.486 |
Breach | +0.432 |
oa | +0.400 |
letters | +0.399 |
̶ | +0.394 |
Neg logit contributions | |
intend | -0.380 |
Compton | -0.374 |
percentile | -0.373 |
totality | -0.364 |
adelphia | -0.346 |
Token | A |
Token ID | 32 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
Adds | +1.043 |
Breach | +0.933 |
oa | +0.858 |
letters | +0.855 |
IER | +0.844 |
Neg logit contributions | |
intend | -0.874 |
Compton | -0.861 |
percentile | -0.858 |
totality | -0.821 |
adelphia | -0.791 |
Token | lot |
Token ID | 1256 |
Feature activation | -3.33e-01 |
Pos logit contributions | |
Adds | +0.034 |
Breach | +0.030 |
oa | +0.028 |
letters | +0.028 |
IER | +0.027 |
Neg logit contributions | |
intend | -0.030 |
Compton | -0.029 |
percentile | -0.029 |
totality | -0.028 |
adelphia | -0.027 |
Token | IMAGES |
Token ID | 45325 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Compton | +0.636 |
intend | +0.631 |
percentile | +0.631 |
totality | +0.609 |
adelphia | +0.583 |
Neg logit contributions | |
Adds | -0.587 |
Breach | -0.515 |
artisan | -0.473 |
̶ | -0.467 |
oa | -0.463 |
Token | OF |
Token ID | 3963 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
Adds | +1.617 |
Breach | +1.447 |
oa | +1.344 |
letters | +1.341 |
IER | +1.324 |
Neg logit contributions | |
intend | -1.218 |
Compton | -1.193 |
percentile | -1.189 |
totality | -1.139 |
adelphia | -1.090 |
Token | THE |
Token ID | 3336 |
Feature activation | +2.96e+00 |
Pos logit contributions | |
Adds | +0.243 |
Breach | +0.218 |
oa | +0.202 |
letters | +0.202 |
Newsletter | +0.200 |
Neg logit contributions | |
intend | -0.177 |
Compton | -0.175 |
percentile | -0.175 |
totality | -0.166 |
adelphia | -0.159 |
Token | DAY |
Token ID | 24644 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
Adds | +2.063 |
Breach | +1.856 |
oa | +1.683 |
IER | +1.678 |
letters | +1.664 |
Neg logit contributions | |
intend | -2.112 |
percentile | -2.052 |
Compton | -2.047 |
totality | -1.990 |
adelphia | -1.933 |
Token | ) |
Token ID | 8 |
Feature activation | +3.69e+00 |
Pos logit contributions | |
Adds | +1.305 |
Breach | +1.160 |
oa | +1.068 |
letters | +1.065 |
IER | +1.051 |
Neg logit contributions | |
intend | -1.148 |
Compton | -1.128 |
percentile | -1.126 |
totality | -1.081 |
adelphia | -1.041 |
Token | Chris |
Token ID | 5180 |
Feature activation | +8.10e+00 |
Pos logit contributions | |
Adds | +2.603 |
Breach | +2.321 |
oa | +2.091 |
letters | +2.089 |
IER | +2.081 |
Neg logit contributions | |
intend | -2.624 |
percentile | -2.550 |
Compton | -2.509 |
totality | -2.454 |
adelphia | -2.375 |
Token | Christie |
Token ID | 16929 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
Adds | +4.410 |
Breach | +3.756 |
oa | +3.389 |
arrivals | +3.359 |
artisan | +3.334 |
Neg logit contributions | |
intend | -6.703 |
percentile | -6.646 |
totality | -6.453 |
Compton | -6.317 |
�� | -6.296 |
Token | Gov |
Token ID | 10964 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
Adds | +0.982 |
Breach | +0.867 |
oa | +0.795 |
letters | +0.792 |
̶ | +0.781 |
Neg logit contributions | |
intend | -0.946 |
Compton | -0.935 |
percentile | -0.932 |
totality | -0.896 |
adelphia | -0.863 |
Token | . |
Token ID | 13 |
Feature activation | -2.04e+00 |
Pos logit contributions | |
Adds | +0.238 |
Breach | +0.212 |
oa | +0.195 |
letters | +0.194 |
̶ | +0.192 |
Neg logit contributions | |
intend | -0.210 |
Compton | -0.207 |
percentile | -0.206 |
totality | -0.198 |
adelphia | -0.191 |
Token | Chris |
Token ID | 5180 |
Feature activation | +5.05e+00 |
Pos logit contributions | |
intend | +1.380 |
Compton | +1.363 |
percentile | +1.358 |
totality | +1.300 |
adelphia | +1.245 |
Neg logit contributions | |
Adds | -1.484 |
Breach | -1.313 |
artisan | -1.266 |
oa | -1.217 |
IER | -1.211 |
Token | Christie |
Token ID | 16929 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
Adds | +2.968 |
Breach | +2.527 |
oa | +2.273 |
Newsletter | +2.267 |
letters | +2.253 |
Neg logit contributions | |
intend | -4.139 |
percentile | -4.109 |
Compton | -4.016 |
totality | -3.981 |
�� | -3.852 |
Token | be |
Token ID | 307 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
Adds | +0.730 |
Breach | +0.640 |
oa | +0.583 |
letters | +0.580 |
̶ | +0.570 |
Neg logit contributions | |
intend | -0.789 |
Compton | -0.781 |
percentile | -0.773 |
totality | -0.748 |
adelphia | -0.725 |
Token | click |
Token ID | 3904 |
Feature activation | +1.93e+00 |
Pos logit contributions | |
Adds | +0.716 |
Breach | +0.634 |
oa | +0.583 |
letters | +0.580 |
IER | +0.572 |
Neg logit contributions | |
intend | -0.672 |
Compton | -0.662 |
percentile | -0.659 |
totality | -0.634 |
adelphia | -0.612 |
Token | able |
Token ID | 540 |
Feature activation | +2.33e+00 |
Pos logit contributions | |
Adds | +1.371 |
Breach | +1.207 |
oa | +1.109 |
letters | +1.103 |
IER | +1.088 |
Neg logit contributions | |
intend | -1.364 |
Compton | -1.349 |
percentile | -1.343 |
totality | -1.293 |
adelphia | -1.247 |
Token | — |
Token ID | 960 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
Adds | +1.710 |
Breach | +1.507 |
oa | +1.391 |
letters | +1.386 |
̶ | +1.363 |
Neg logit contributions | |
intend | -1.592 |
Compton | -1.571 |
percentile | -1.560 |
totality | -1.498 |
adelphia | -1.454 |
Token | that |
Token ID | 5562 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
Adds | +0.227 |
Breach | +0.206 |
oa | +0.192 |
letters | +0.190 |
̶ | +0.190 |
Neg logit contributions | |
intend | -0.139 |
Compton | -0.136 |
percentile | -0.136 |
totality | -0.129 |
adelphia | -0.122 |
Token | is |
Token ID | 318 |
Feature activation | +7.87e+00 |
Pos logit contributions | |
Adds | +2.347 |
Breach | +2.041 |
oa | +1.864 |
letters | +1.840 |
̶ | +1.813 |
Neg logit contributions | |
intend | -2.610 |
Compton | -2.564 |
percentile | -2.545 |
totality | -2.456 |
adelphia | -2.400 |
Token | no |
Token ID | 645 |
Feature activation | +5.42e+00 |
Pos logit contributions | |
Adds | +4.987 |
Breach | +4.314 |
oa | +3.976 |
letters | +3.971 |
IER | +3.897 |
Neg logit contributions | |
intend | -5.979 |
Compton | -5.900 |
percentile | -5.792 |
totality | -5.626 |
adelphia | -5.543 |
Token | longer |
Token ID | 2392 |
Feature activation | +2.44e+00 |
Pos logit contributions | |
Adds | +2.166 |
Breach | +1.786 |
oa | +1.488 |
letters | +1.448 |
̶ | +1.444 |
Neg logit contributions | |
intend | -5.418 |
Compton | -5.344 |
percentile | -5.314 |
totality | -5.183 |
adelphia | -5.108 |
Token | the |
Token ID | 262 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
Adds | +1.773 |
Breach | +1.573 |
oa | +1.447 |
letters | +1.435 |
̶ | +1.415 |
Neg logit contributions | |
intend | -1.688 |
Compton | -1.653 |
percentile | -1.648 |
totality | -1.581 |
adelphia | -1.534 |
Token | case |
Token ID | 1339 |
Feature activation | +7.62e-01 |
Pos logit contributions | |
Adds | +0.160 |
Breach | +0.142 |
oa | +0.130 |
letters | +0.130 |
̶ | +0.128 |
Neg logit contributions | |
intend | -0.146 |
percentile | -0.145 |
Compton | -0.145 |
totality | -0.139 |
adelphia | -0.133 |
Token | . |
Token ID | 13 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
Adds | +0.567 |
Breach | +0.503 |
oa | +0.461 |
letters | +0.460 |
IER | +0.454 |
Neg logit contributions | |
intend | -0.514 |
Compton | -0.508 |
percentile | -0.507 |
totality | -0.485 |
adelphia | -0.467 |
Token | our |
Token ID | 674 |
Feature activation | +6.08e+00 |
Pos logit contributions | |
Adds | +0.575 |
Breach | +0.501 |
oa | +0.454 |
letters | +0.452 |
̶ | +0.445 |
Neg logit contributions | |
intend | -0.679 |
Compton | -0.671 |
percentile | -0.670 |
totality | -0.646 |
adelphia | -0.625 |
Token | Wine |
Token ID | 20447 |
Feature activation | +8.33e+00 |
Pos logit contributions | |
Adds | +3.896 |
Breach | +3.498 |
letters | +3.187 |
oa | +3.127 |
Newsletter | +3.024 |
Neg logit contributions | |
intend | -4.671 |
percentile | -4.537 |
Compton | -4.426 |
totality | -4.389 |
adelphia | -4.204 |
Token | Club |
Token ID | 6289 |
Feature activation | +6.86e+00 |
Pos logit contributions | |
Adds | +4.244 |
Breach | +3.584 |
letters | +3.248 |
arrivals | +3.078 |
oa | +3.022 |
Neg logit contributions | |
intend | -7.622 |
Compton | -7.316 |
percentile | -7.315 |
totality | -7.173 |
�� | -6.905 |
Token | today |
Token ID | 1909 |
Feature activation | +2.83e+00 |
Pos logit contributions | |
Adds | +3.651 |
Breach | +3.078 |
letters | +2.989 |
Newsletter | +2.729 |
arrivals | +2.705 |
Neg logit contributions | |
intend | -6.102 |
percentile | -5.893 |
Compton | -5.829 |
totality | -5.682 |
adelphia | -5.529 |
Token | . |
Token ID | 13 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Adds | +1.935 |
Breach | +1.688 |
letters | +1.554 |
oa | +1.539 |
̶ | +1.527 |
Neg logit contributions | |
intend | -2.094 |
percentile | -2.040 |
Compton | -2.033 |
totality | -1.998 |
adelphia | -1.910 |
Token | Did |
Token ID | 7731 |
Feature activation | +7.44e+00 |
Pos logit contributions | |
Adds | +0.966 |
Breach | +0.879 |
oa | +0.810 |
letters | +0.809 |
IER | +0.797 |
Neg logit contributions | |
intend | -0.632 |
percentile | -0.614 |
Compton | -0.612 |
totality | -0.595 |
adelphia | -0.560 |
Token | you |
Token ID | 345 |
Feature activation | +4.87e+00 |
Pos logit contributions | |
Adds | +4.143 |
Breach | +3.618 |
oa | +3.363 |
IER | +3.179 |
artisan | +3.178 |
Neg logit contributions | |
intend | -6.304 |
percentile | -5.854 |
totality | -5.839 |
adelphia | -5.789 |
Compton | -5.780 |
Token | know |
Token ID | 760 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
Adds | +2.779 |
Breach | +2.318 |
arrivals | +2.073 |
fters | +2.068 |
oa | +2.028 |
Neg logit contributions | |
totality | -3.956 |
intend | -3.941 |
Compton | -3.933 |
percentile | -3.876 |
adelphia | -3.789 |
Token | you |
Token ID | 345 |
Feature activation | +5.42e+00 |
Pos logit contributions | |
Adds | +0.080 |
Breach | +0.070 |
oa | +0.063 |
letters | +0.063 |
artisan | +0.062 |
Neg logit contributions | |
intend | -0.093 |
percentile | -0.090 |
Compton | -0.090 |
totality | -0.088 |
adelphia | -0.085 |
Token | can |
Token ID | 460 |
Feature activation | +3.25e+00 |
Pos logit contributions | |
Adds | +2.647 |
Breach | +2.422 |
oa | +2.232 |
fters | +2.077 |
arrivals | +2.010 |
Neg logit contributions | |
intend | -4.771 |
Compton | -4.721 |
totality | -4.693 |
percentile | -4.678 |
adelphia | -4.540 |
Token | support |
Token ID | 1104 |
Feature activation | -2.77e+00 |
Pos logit contributions | |
Adds | +2.707 |
Breach | +2.437 |
oa | +2.273 |
letters | +2.250 |
Newsletter | +2.216 |
Neg logit contributions | |
intend | -1.934 |
percentile | -1.872 |
Compton | -1.869 |
totality | -1.809 |
adelphia | -1.707 |
Token | the |
Token ID | 262 |
Feature activation | +9.15e-01 |
Pos logit contributions | |
intend | +0.032 |
Compton | +0.032 |
percentile | +0.032 |
totality | +0.031 |
adelphia | +0.029 |
Neg logit contributions | |
Adds | -0.034 |
Breach | -0.030 |
oa | -0.028 |
letters | -0.028 |
̶ | -0.027 |
Token | Occupy |
Token ID | 25551 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
Adds | +0.706 |
Breach | +0.632 |
oa | +0.581 |
letters | +0.578 |
̶ | +0.571 |
Neg logit contributions | |
intend | -0.590 |
percentile | -0.579 |
Compton | -0.578 |
totality | -0.553 |
adelphia | -0.535 |
Token | Wall |
Token ID | 5007 |
Feature activation | -2.03e+00 |
Pos logit contributions | |
Adds | +2.133 |
Breach | +1.936 |
oa | +1.803 |
letters | +1.797 |
̶ | +1.780 |
Neg logit contributions | |
intend | -1.351 |
Compton | -1.318 |
percentile | -1.316 |
totality | -1.255 |
adelphia | -1.194 |
Token | Street |
Token ID | 3530 |
Feature activation | +6.40e-01 |
Pos logit contributions | |
intend | +1.432 |
Compton | +1.415 |
percentile | +1.411 |
totality | +1.357 |
adelphia | +1.308 |
Neg logit contributions | |
Adds | -1.440 |
Breach | -1.269 |
oa | -1.162 |
letters | -1.157 |
̶ | -1.141 |
Token | protests |
Token ID | 8536 |
Feature activation | +8.95e-01 |
Pos logit contributions | |
Adds | +0.505 |
Breach | +0.451 |
oa | +0.417 |
letters | +0.416 |
̶ | +0.410 |
Neg logit contributions | |
intend | -0.403 |
Compton | -0.397 |
percentile | -0.396 |
totality | -0.379 |
adelphia | -0.363 |
Token | in |
Token ID | 287 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Adds | +0.657 |
Breach | +0.582 |
oa | +0.534 |
letters | +0.532 |
̶ | +0.525 |
Neg logit contributions | |
intend | -0.612 |
Compton | -0.603 |
percentile | -0.601 |
totality | -0.577 |
adelphia | -0.557 |
Token | Wednesday |
Token ID | 3583 |
Feature activation | -2.95e+00 |
Pos logit contributions | |
Adds | +0.832 |
Breach | +0.739 |
oa | +0.677 |
letters | +0.675 |
̶ | +0.666 |
Neg logit contributions | |
intend | -0.762 |
percentile | -0.749 |
Compton | -0.748 |
totality | -0.717 |
adelphia | -0.693 |
Token | night |
Token ID | 1755 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Compton | +2.168 |
intend | +2.164 |
percentile | +2.152 |
totality | +2.082 |
adelphia | +1.982 |
Neg logit contributions | |
Adds | -1.992 |
Breach | -1.763 |
letters | -1.609 |
oa | -1.604 |
artisan | -1.581 |
Token | 's |
Token ID | 338 |
Feature activation | +4.33e-01 |
Pos logit contributions | |
Adds | +0.688 |
Breach | +0.590 |
oa | +0.529 |
letters | +0.526 |
̶ | +0.517 |
Neg logit contributions | |
intend | -0.957 |
Compton | -0.947 |
percentile | -0.945 |
totality | -0.914 |
adelphia | -0.886 |
Token | episode |
Token ID | 4471 |
Feature activation | -2.47e+00 |
Pos logit contributions | |
Adds | +0.326 |
Breach | +0.289 |
oa | +0.267 |
letters | +0.266 |
IER | +0.263 |
Neg logit contributions | |
intend | -0.287 |
Compton | -0.284 |
percentile | -0.283 |
totality | -0.272 |
adelphia | -0.261 |
Token | , |
Token ID | 11 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
Compton | +1.517 |
intend | +1.510 |
percentile | +1.504 |
totality | +1.444 |
adelphia | +1.374 |
Neg logit contributions | |
Adds | -1.966 |
Breach | -1.754 |
letters | -1.635 |
oa | -1.633 |
artisan | -1.629 |
Token | April |
Token ID | 3035 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
Compton | +1.340 |
intend | +1.327 |
percentile | +1.314 |
totality | +1.274 |
adelphia | +1.202 |
Neg logit contributions | |
Adds | -1.479 |
Breach | -1.289 |
oa | -1.190 |
letters | -1.184 |
̶ | -1.184 |
Token | 16 |
Token ID | 1467 |
Feature activation | +1.65e+00 |
Pos logit contributions | |
Adds | +0.623 |
Breach | +0.550 |
oa | +0.502 |
letters | +0.500 |
IER | +0.492 |
Neg logit contributions | |
intend | -0.634 |
Compton | -0.625 |
percentile | -0.624 |
totality | -0.601 |
adelphia | -0.580 |
Token | 25 |
Token ID | 1495 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
Adds | +1.213 |
Breach | +1.075 |
oa | +0.987 |
letters | +0.985 |
Newsletter | +0.970 |
Neg logit contributions | |
intend | -1.130 |
Compton | -1.113 |
percentile | -1.111 |
totality | -1.068 |
adelphia | -1.029 |
Token | , |
Token ID | 11 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
Adds | +0.100 |
Breach | +0.089 |
oa | +0.082 |
letters | +0.082 |
̶ | +0.081 |
Neg logit contributions | |
intend | -0.086 |
Compton | -0.085 |
percentile | -0.085 |
totality | -0.081 |
adelphia | -0.078 |
Token | when |
Token ID | 618 |
Feature activation | -4.71e-01 |
Pos logit contributions | |
Adds | +0.300 |
Breach | +0.265 |
oa | +0.244 |
letters | +0.243 |
̶ | +0.240 |
Neg logit contributions | |
intend | -0.272 |
Compton | -0.269 |
percentile | -0.268 |
totality | -0.257 |
adelphia | -0.247 |
Token | d |
Token ID | 288 |
Feature activation | +4.12e+00 |
Pos logit contributions | |
intend | +0.327 |
Compton | +0.326 |
percentile | +0.322 |
totality | +0.311 |
adelphia | +0.297 |
Neg logit contributions | |
Adds | -0.340 |
Breach | -0.298 |
oa | -0.274 |
letters | -0.273 |
̶ | -0.270 |
Token | ' |
Token ID | 6 |
Feature activation | -2.91e+00 |
Pos logit contributions | |
Adds | +3.054 |
Breach | +2.718 |
oa | +2.533 |
letters | +2.516 |
̶ | +2.482 |
Neg logit contributions | |
Compton | -2.692 |
percentile | -2.690 |
intend | -2.688 |
totality | -2.616 |
adelphia | -2.462 |
Token | Art |
Token ID | 8001 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
intend | +2.228 |
Compton | +2.186 |
percentile | +2.137 |
totality | +2.079 |
lé | +2.035 |
Neg logit contributions | |
Adds | -1.847 |
Breach | -1.636 |
letters | -1.447 |
oa | -1.440 |
̶ | -1.439 |
Token | agn |
Token ID | 4660 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
Adds | +1.337 |
Breach | +1.132 |
oa | +1.015 |
letters | +1.010 |
IER | +0.978 |
Neg logit contributions | |
intend | -2.214 |
Compton | -2.193 |
percentile | -2.185 |
totality | -2.135 |
adelphia | -2.057 |
Token | an |
Token ID | 272 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
Adds | +0.518 |
Breach | +0.386 |
letters | +0.316 |
oa | +0.310 |
Newsletter | +0.306 |
Neg logit contributions | |
intend | -1.463 |
Compton | -1.449 |
percentile | -1.444 |
totality | -1.401 |
adelphia | -1.373 |
Token | , |
Token ID | 11 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
Adds | +0.176 |
Breach | +0.155 |
oa | +0.142 |
letters | +0.142 |
IER | +0.140 |
Neg logit contributions | |
intend | -0.165 |
Compton | -0.163 |
percentile | -0.163 |
totality | -0.156 |
adelphia | -0.150 |
Token | from |
Token ID | 422 |
Feature activation | -1.36e+00 |
Pos logit contributions | |
Adds | +0.195 |
Breach | +0.172 |
oa | +0.158 |
letters | +0.157 |
̶ | +0.154 |
Neg logit contributions | |
intend | -0.193 |
Compton | -0.190 |
percentile | -0.189 |
totality | -0.182 |
adelphia | -0.177 |
Token | ash |
Token ID | 12530 |
Feature activation | -1.96e+00 |
Pos logit contributions | |
intend | +0.891 |
Compton | +0.885 |
percentile | +0.880 |
totality | +0.846 |
adelphia | +0.807 |
Neg logit contributions | |
Adds | -1.037 |
Breach | -0.920 |
letters | -0.849 |
oa | -0.849 |
IER | -0.840 |
Token | ponds |
Token ID | 47339 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
intend | +1.318 |
Compton | +1.304 |
percentile | +1.298 |
totality | +1.248 |
adelphia | +1.196 |
Neg logit contributions | |
Adds | -1.458 |
Breach | -1.293 |
oa | -1.185 |
letters | -1.183 |
Newsletter | -1.174 |
Token | at |
Token ID | 379 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
intend | +0.411 |
Compton | +0.406 |
percentile | +0.405 |
totality | +0.389 |
adelphia | +0.373 |
Neg logit contributions | |
Adds | -0.465 |
Breach | -0.413 |
oa | -0.380 |
letters | -0.379 |
IER | -0.375 |
Token | all |
Token ID | 477 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
intend | +0.368 |
Compton | +0.364 |
percentile | +0.363 |
totality | +0.348 |
adelphia | +0.333 |
Neg logit contributions | |
Adds | -0.437 |
Breach | -0.389 |
oa | -0.359 |
letters | -0.358 |
̶ | -0.354 |
Token | retired |
Token ID | 9880 |
Feature activation | +3.94e+00 |
Pos logit contributions | |
intend | +1.000 |
Compton | +0.988 |
percentile | +0.986 |
totality | +0.942 |
adelphia | +0.899 |
Neg logit contributions | |
Adds | -1.281 |
Breach | -1.143 |
oa | -1.056 |
letters | -1.055 |
Newsletter | -1.044 |
Token | coal |
Token ID | 5655 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
Adds | +3.037 |
Breach | +2.730 |
oa | +2.557 |
letters | +2.491 |
arrivals | +2.457 |
Neg logit contributions | |
intend | -2.487 |
Compton | -2.404 |
percentile | -2.397 |
totality | -2.296 |
adelphia | -2.254 |
Token | plants |
Token ID | 6134 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
Adds | +0.118 |
Breach | +0.105 |
oa | +0.097 |
letters | +0.097 |
IER | +0.095 |
Neg logit contributions | |
intend | -0.099 |
Compton | -0.098 |
percentile | -0.098 |
totality | -0.094 |
adelphia | -0.090 |
Token | . |
Token ID | 13 |
Feature activation | +2.06e+00 |
Pos logit contributions | |
Adds | +0.435 |
Breach | +0.386 |
oa | +0.355 |
letters | +0.354 |
̶ | +0.349 |
Neg logit contributions | |
intend | -0.391 |
Compton | -0.386 |
percentile | -0.385 |
totality | -0.370 |
adelphia | -0.356 |
Token |
|
Token ID | 198 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
Adds | +1.658 |
Breach | +1.485 |
oa | +1.372 |
letters | +1.367 |
̶ | +1.350 |
Neg logit contributions | |
intend | -1.270 |
percentile | -1.247 |
Compton | -1.243 |
totality | -1.193 |
adelphia | -1.144 |
Token |
|
Token ID | 198 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
intend | +0.436 |
Compton | +0.429 |
percentile | +0.428 |
totality | +0.410 |
adelphia | +0.392 |
Neg logit contributions | |
Adds | -0.598 |
Breach | -0.536 |
oa | -0.497 |
letters | -0.496 |
̶ | -0.490 |
Token | of |
Token ID | 286 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
Adds | +3.742 |
Breach | +3.299 |
oa | +3.025 |
letters | +3.003 |
Newsletter | +2.976 |
Neg logit contributions | |
intend | -3.920 |
Compton | -3.811 |
percentile | -3.755 |
totality | -3.720 |
adelphia | -3.594 |
Token | Defense |
Token ID | 5947 |
Feature activation | +2.79e+00 |
Pos logit contributions | |
Adds | +1.129 |
Breach | +0.970 |
oa | +0.870 |
letters | +0.866 |
̶ | +0.851 |
Neg logit contributions | |
intend | -1.543 |
Compton | -1.527 |
percentile | -1.523 |
totality | -1.473 |
adelphia | -1.428 |
Token | has |
Token ID | 468 |
Feature activation | +2.99e+00 |
Pos logit contributions | |
Adds | +1.946 |
Breach | +1.710 |
oa | +1.564 |
letters | +1.555 |
Newsletter | +1.536 |
Neg logit contributions | |
intend | -2.006 |
Compton | -1.979 |
percentile | -1.974 |
totality | -1.902 |
adelphia | -1.840 |
Token | acknowledged |
Token ID | 10810 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
Adds | +2.104 |
Breach | +1.862 |
oa | +1.704 |
letters | +1.689 |
̶ | +1.674 |
Neg logit contributions | |
intend | -2.120 |
Compton | -2.085 |
percentile | -2.077 |
totality | -2.000 |
adelphia | -1.939 |
Token | sending |
Token ID | 7216 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
Adds | +1.148 |
Breach | +1.020 |
oa | +0.939 |
letters | +0.936 |
̶ | +0.924 |
Neg logit contributions | |
intend | -1.009 |
Compton | -0.995 |
percentile | -0.993 |
totality | -0.952 |
adelphia | -0.916 |
Token | at |
Token ID | 379 |
Feature activation | +4.76e+00 |
Pos logit contributions | |
Adds | +1.138 |
Breach | +1.011 |
oa | +0.929 |
letters | +0.926 |
̶ | +0.913 |
Neg logit contributions | |
intend | -1.022 |
Compton | -1.008 |
percentile | -1.005 |
totality | -0.965 |
adelphia | -0.928 |
Token | least |
Token ID | 1551 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Adds | +4.116 |
Breach | +3.754 |
oa | +3.533 |
letters | +3.479 |
̶ | +3.461 |
Neg logit contributions | |
intend | -2.558 |
Compton | -2.509 |
percentile | -2.476 |
totality | -2.299 |
adelphia | -2.263 |
Token | 500 |
Token ID | 5323 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
percentile | +0.681 |
Compton | +0.679 |
intend | +0.677 |
totality | +0.650 |
adelphia | +0.615 |
Neg logit contributions | |
Adds | -0.798 |
Breach | -0.705 |
oa | -0.652 |
letters | -0.649 |
̶ | -0.646 |
Token | Special |
Token ID | 6093 |
Feature activation | +6.38e+00 |
Pos logit contributions | |
intend | +0.664 |
Compton | +0.661 |
percentile | +0.660 |
totality | +0.632 |
adelphia | +0.602 |
Neg logit contributions | |
Adds | -0.769 |
Breach | -0.682 |
oa | -0.631 |
letters | -0.628 |
̶ | -0.620 |
Token | Forces |
Token ID | 12700 |
Feature activation | +8.93e-01 |
Pos logit contributions | |
Adds | +3.621 |
Breach | +3.211 |
letters | +2.811 |
oa | +2.804 |
artisan | +2.700 |
Neg logit contributions | |
intend | -5.218 |
percentile | -5.202 |
Compton | -5.134 |
totality | -5.120 |
�� | -4.919 |
Token | into |
Token ID | 656 |
Feature activation | -8.77e-01 |
Pos logit contributions | |
Adds | +0.662 |
Breach | +0.587 |
oa | +0.539 |
letters | +0.537 |
IER | +0.530 |
Neg logit contributions | |
intend | -0.605 |
Compton | -0.597 |
percentile | -0.595 |
totality | -0.572 |
adelphia | -0.551 |
Token | of |
Token ID | 286 |
Feature activation | +9.97e-01 |
Pos logit contributions | |
Adds | +3.039 |
Breach | +2.691 |
oa | +2.484 |
letters | +2.448 |
arrivals | +2.409 |
Neg logit contributions | |
intend | -2.856 |
Compton | -2.805 |
percentile | -2.798 |
totality | -2.665 |
adelphia | -2.609 |
Token | bamboo |
Token ID | 37252 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
Adds | +0.759 |
Breach | +0.675 |
oa | +0.622 |
letters | +0.619 |
̶ | +0.612 |
Neg logit contributions | |
intend | -0.655 |
Compton | -0.647 |
percentile | -0.645 |
totality | -0.618 |
adelphia | -0.594 |
Token | objects |
Token ID | 5563 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
intend | +0.276 |
percentile | +0.273 |
Compton | +0.273 |
totality | +0.264 |
adelphia | +0.254 |
Neg logit contributions | |
Adds | -0.223 |
Breach | -0.194 |
oa | -0.175 |
letters | -0.173 |
IER | -0.172 |
Token | , |
Token ID | 11 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
intend | +0.378 |
Compton | +0.374 |
percentile | +0.372 |
totality | +0.359 |
adelphia | +0.341 |
Neg logit contributions | |
Adds | -0.414 |
Breach | -0.369 |
letters | -0.339 |
oa | -0.338 |
IER | -0.335 |
Token | including |
Token ID | 1390 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
Adds | +0.753 |
Breach | +0.666 |
oa | +0.611 |
letters | +0.609 |
̶ | +0.599 |
Neg logit contributions | |
intend | -0.718 |
Compton | -0.707 |
percentile | -0.706 |
totality | -0.678 |
adelphia | -0.655 |
Token | handmade |
Token ID | 40973 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
Adds | +0.971 |
Breach | +0.859 |
oa | +0.788 |
letters | +0.785 |
̶ | +0.773 |
Neg logit contributions | |
intend | -0.924 |
Compton | -0.912 |
percentile | -0.909 |
totality | -0.873 |
adelphia | -0.842 |
Token | chop |
Token ID | 30506 |
Feature activation | +2.26e+00 |
Pos logit contributions | |
Adds | +1.357 |
Breach | +1.200 |
oa | +1.099 |
letters | +1.095 |
Newsletter | +1.076 |
Neg logit contributions | |
intend | -1.355 |
Compton | -1.333 |
percentile | -1.328 |
totality | -1.276 |
adelphia | -1.242 |
Token | sticks |
Token ID | 34810 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
Adds | +1.242 |
Breach | +1.051 |
oa | +0.937 |
letters | +0.931 |
̶ | +0.909 |
Neg logit contributions | |
intend | -1.961 |
Compton | -1.948 |
percentile | -1.939 |
totality | -1.880 |
adelphia | -1.825 |
Token | , |
Token ID | 11 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
Adds | +2.322 |
Breach | +2.038 |
oa | +1.877 |
letters | +1.864 |
̶ | +1.842 |
Neg logit contributions | |
intend | -2.292 |
Compton | -2.263 |
percentile | -2.259 |
totality | -2.169 |
adelphia | -2.112 |
Token | the |
Token ID | 262 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
Adds | +0.830 |
Breach | +0.734 |
oa | +0.673 |
letters | +0.671 |
̶ | +0.662 |
Neg logit contributions | |
intend | -0.787 |
Compton | -0.778 |
percentile | -0.776 |
totality | -0.745 |
adelphia | -0.717 |
Token | film |
Token ID | 2646 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
Adds | +0.937 |
Breach | +0.832 |
oa | +0.763 |
letters | +0.760 |
̶ | +0.749 |
Neg logit contributions | |
intend | -0.867 |
Compton | -0.852 |
percentile | -0.851 |
totality | -0.815 |
adelphia | -0.790 |
Token | to |
Token ID | 284 |
Feature activation | +3.16e+00 |
Pos logit contributions | |
Adds | +1.101 |
Breach | +0.976 |
oa | +0.895 |
letters | +0.892 |
Newsletter | +0.879 |
Neg logit contributions | |
intend | -1.032 |
Compton | -1.020 |
percentile | -1.018 |
totality | -0.977 |
adelphia | -0.940 |
Token | a |
Token ID | 257 |
Feature activation | +2.21e+00 |
Pos logit contributions | |
Adds | +2.303 |
Breach | +2.040 |
oa | +1.880 |
letters | +1.861 |
̶ | +1.856 |
Neg logit contributions | |
intend | -2.174 |
Compton | -2.122 |
percentile | -2.102 |
totality | -2.028 |
adelphia | -1.975 |
Token | value |
Token ID | 1988 |
Feature activation | +4.04e+00 |
Pos logit contributions | |
Adds | +1.699 |
Breach | +1.513 |
oa | +1.399 |
letters | +1.390 |
̶ | +1.379 |
Neg logit contributions | |
intend | -1.428 |
Compton | -1.405 |
percentile | -1.396 |
totality | -1.340 |
adelphia | -1.294 |
Token | value |
Token ID | 1988 |
Feature activation | +2.59e+00 |
Pos logit contributions | |
Adds | +3.042 |
Breach | +2.685 |
oa | +2.516 |
letters | +2.487 |
̶ | +2.472 |
Neg logit contributions | |
intend | -2.673 |
Compton | -2.609 |
percentile | -2.581 |
totality | -2.480 |
adelphia | -2.426 |
Token | called |
Token ID | 1444 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
Adds | +1.935 |
Breach | +1.712 |
oa | +1.585 |
letters | +1.576 |
̶ | +1.561 |
Neg logit contributions | |
intend | -1.739 |
Compton | -1.709 |
percentile | -1.698 |
totality | -1.632 |
adelphia | -1.577 |
Token | _ |
Token ID | 4808 |
Feature activation | -4.49e+00 |
Pos logit contributions | |
percentile | +0.283 |
intend | +0.282 |
Compton | +0.282 |
totality | +0.270 |
adelphia | +0.257 |
Neg logit contributions | |
Adds | -0.317 |
Breach | -0.281 |
letters | -0.258 |
oa | -0.257 |
artisan | -0.254 |
Token | P |
Token ID | 47 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
intend | +2.970 |
Compton | +2.947 |
percentile | +2.946 |
totality | +2.796 |
weak | +2.686 |
Neg logit contributions | |
Adds | -3.284 |
Breach | -2.958 |
letters | -2.656 |
artisan | -2.645 |
Newsletter | -2.635 |
Token | ulse |
Token ID | 9615 |
Feature activation | -4.78e+00 |
Pos logit contributions | |
intend | +1.103 |
Compton | +1.099 |
percentile | +1.092 |
totality | +1.054 |
adelphia | +1.006 |
Neg logit contributions | |
Adds | -1.226 |
Breach | -1.097 |
letters | -1.004 |
oa | -0.994 |
artisan | -0.984 |
Token | Amount |
Token ID | 31264 |
Feature activation | +6.73e-01 |
Pos logit contributions | |
Compton | +3.265 |
percentile | +3.248 |
intend | +3.219 |
totality | +3.094 |
adelphia | +2.954 |
Neg logit contributions | |
Adds | -3.393 |
Breach | -3.047 |
artisan | -2.770 |
letters | -2.757 |
oa | -2.751 |
Token | , |
Token ID | 11 |
Feature activation | -5.94e-01 |
Pos logit contributions | |
Adds | +0.494 |
Breach | +0.438 |
oa | +0.401 |
letters | +0.400 |
artisan | +0.395 |
Neg logit contributions | |
intend | -0.460 |
Compton | -0.455 |
percentile | -0.454 |
totality | -0.435 |
adelphia | -0.418 |
Token | completing |
Token ID | 14339 |
Feature activation | -8.92e-02 |
Pos logit contributions | |
intend | +0.395 |
percentile | +0.394 |
Compton | +0.394 |
totality | +0.376 |
adelphia | +0.359 |
Neg logit contributions | |
Adds | -0.444 |
Breach | -0.396 |
oa | -0.363 |
letters | -0.362 |
Newsletter | -0.358 |
Token | energy |
Token ID | 2568 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
Adds | +1.939 |
Breach | +1.697 |
oa | +1.556 |
letters | +1.546 |
IER | +1.524 |
Neg logit contributions | |
intend | -2.003 |
Compton | -1.981 |
percentile | -1.973 |
totality | -1.896 |
adelphia | -1.843 |
Token | company |
Token ID | 1664 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
intend | +1.310 |
percentile | +1.299 |
Compton | +1.277 |
totality | +1.233 |
lé | +1.134 |
Neg logit contributions | |
Adds | -2.109 |
Breach | -1.939 |
̶ | -1.809 |
letters | -1.808 |
oa | -1.805 |
Token | Gaz |
Token ID | 21347 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
intend | +2.079 |
Compton | +2.076 |
percentile | +2.059 |
totality | +2.001 |
disgr | +1.894 |
Neg logit contributions | |
Adds | -1.908 |
Breach | -1.675 |
artisan | -1.541 |
letters | -1.540 |
̶ | -1.532 |
Token | prom |
Token ID | 16963 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
intend | +0.774 |
percentile | +0.757 |
Compton | +0.753 |
totality | +0.723 |
adelphia | +0.687 |
Neg logit contributions | |
Adds | -1.063 |
Breach | -0.954 |
letters | -0.882 |
oa | -0.882 |
̶ | -0.872 |
Token | has |
Token ID | 468 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
intend | +1.531 |
Compton | +1.511 |
percentile | +1.506 |
totality | +1.450 |
lé | +1.385 |
Neg logit contributions | |
Adds | -1.631 |
Breach | -1.435 |
artisan | -1.326 |
letters | -1.318 |
oa | -1.313 |
Token | resumed |
Token ID | 28291 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Adds | +0.020 |
Breach | +0.018 |
letters | +0.016 |
oa | +0.016 |
artisan | +0.016 |
Neg logit contributions | |
intend | -0.019 |
Compton | -0.019 |
percentile | -0.019 |
totality | -0.018 |
adelphia | -0.018 |
Token | some |
Token ID | 617 |
Feature activation | -2.42e+00 |
Pos logit contributions | |
percentile | +1.508 |
Compton | +1.502 |
intend | +1.495 |
totality | +1.471 |
indication | +1.387 |
Neg logit contributions | |
Adds | -1.502 |
Breach | -1.322 |
artisan | -1.222 |
letters | -1.205 |
̶ | -1.197 |
Token | gas |
Token ID | 3623 |
Feature activation | +5.59e-01 |
Pos logit contributions | |
percentile | +1.755 |
Compton | +1.747 |
intend | +1.743 |
totality | +1.699 |
indication | +1.621 |
Neg logit contributions | |
Adds | -1.649 |
Breach | -1.440 |
artisan | -1.317 |
letters | -1.316 |
IER | -1.301 |
Token | supplies |
Token ID | 9416 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
Adds | +0.330 |
Breach | +0.283 |
oa | +0.253 |
letters | +0.252 |
̶ | +0.248 |
Neg logit contributions | |
intend | -0.462 |
Compton | -0.457 |
percentile | -0.456 |
totality | -0.442 |
adelphia | -0.427 |
Token | through |
Token ID | 832 |
Feature activation | +5.11e-01 |
Pos logit contributions | |
intend | +1.208 |
Compton | +1.198 |
percentile | +1.190 |
totality | +1.147 |
adelphia | +1.083 |
Neg logit contributions | |
Adds | -1.369 |
Breach | -1.223 |
letters | -1.119 |
oa | -1.118 |
Newsletter | -1.108 |
Token | Ukraine |
Token ID | 7049 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
Adds | +0.351 |
Breach | +0.308 |
oa | +0.281 |
letters | +0.280 |
̶ | +0.276 |
Neg logit contributions | |
intend | -0.373 |
Compton | -0.369 |
percentile | -0.368 |
totality | -0.355 |
adelphia | -0.342 |
Token | � |
Token ID | 447 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
intend | +0.239 |
Compton | +0.237 |
percentile | +0.236 |
totality | +0.226 |
adelphia | +0.219 |
Neg logit contributions | |
Adds | -0.254 |
Breach | -0.224 |
oa | -0.206 |
letters | -0.205 |
IER | -0.203 |
Token | � |
Token ID | 247 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
intend | +0.839 |
percentile | +0.835 |
Compton | +0.828 |
totality | +0.786 |
adelphia | +0.751 |
Neg logit contributions | |
Adds | -1.310 |
Breach | -1.182 |
oa | -1.104 |
letters | -1.094 |
IER | -1.082 |
Token | Bible |
Token ID | 9111 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
Adds | +0.170 |
Breach | +0.149 |
oa | +0.135 |
letters | +0.135 |
IER | +0.133 |
Neg logit contributions | |
intend | -0.189 |
Compton | -0.186 |
percentile | -0.185 |
totality | -0.179 |
adelphia | -0.173 |
Token | study |
Token ID | 2050 |
Feature activation | +5.00e+00 |
Pos logit contributions | |
Adds | +1.355 |
Breach | +1.223 |
letters | +1.136 |
oa | +1.135 |
̶ | +1.124 |
Neg logit contributions | |
intend | -0.895 |
Compton | -0.881 |
percentile | -0.879 |
totality | -0.837 |
adelphia | -0.797 |
Token | , |
Token ID | 11 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Adds | +3.592 |
Breach | +3.191 |
letters | +2.941 |
oa | +2.920 |
̶ | +2.918 |
Neg logit contributions | |
intend | -3.411 |
Compton | -3.375 |
percentile | -3.342 |
totality | -3.249 |
adelphia | -3.125 |
Token | which |
Token ID | 543 |
Feature activation | +4.70e-01 |
Pos logit contributions | |
Adds | +0.297 |
Breach | +0.264 |
oa | +0.243 |
letters | +0.242 |
IER | +0.239 |
Neg logit contributions | |
intend | -0.262 |
Compton | -0.258 |
percentile | -0.257 |
totality | -0.247 |
adelphia | -0.237 |
Token | draws |
Token ID | 14293 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
Adds | +0.341 |
Breach | +0.302 |
oa | +0.276 |
letters | +0.276 |
artisan | +0.272 |
Neg logit contributions | |
intend | -0.326 |
Compton | -0.323 |
percentile | -0.322 |
totality | -0.309 |
adelphia | -0.297 |
Token | on |
Token ID | 319 |
Feature activation | +8.33e-01 |
Pos logit contributions | |
Adds | +1.422 |
Breach | +1.260 |
oa | +1.158 |
letters | +1.153 |
̶ | +1.136 |
Neg logit contributions | |
intend | -1.349 |
Compton | -1.324 |
percentile | -1.320 |
totality | -1.268 |
adelphia | -1.232 |
Token | his |
Token ID | 465 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
Adds | +0.605 |
Breach | +0.535 |
oa | +0.491 |
letters | +0.489 |
̶ | +0.482 |
Neg logit contributions | |
intend | -0.576 |
Compton | -0.569 |
percentile | -0.567 |
totality | -0.545 |
adelphia | -0.525 |
Token | Mississippi |
Token ID | 13797 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
intend | +0.096 |
Compton | +0.095 |
percentile | +0.095 |
totality | +0.091 |
adelphia | +0.087 |
Neg logit contributions | |
Adds | -0.115 |
Breach | -0.102 |
oa | -0.095 |
letters | -0.094 |
IER | -0.093 |
Token | roots |
Token ID | 11135 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
intend | +1.012 |
Compton | +1.007 |
percentile | +1.003 |
totality | +0.959 |
adelphia | +0.921 |
Neg logit contributions | |
Adds | -1.219 |
Breach | -1.078 |
letters | -1.000 |
oa | -0.995 |
IER | -0.987 |
Token | MD |
Token ID | 12740 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
Adds | +0.225 |
Breach | +0.203 |
oa | +0.191 |
letters | +0.191 |
̶ | +0.189 |
Neg logit contributions | |
intend | -0.124 |
Compton | -0.122 |
percentile | -0.122 |
totality | -0.117 |
adelphia | -0.110 |
Token | , |
Token ID | 11 |
Feature activation | -1.09e+00 |
Pos logit contributions | |
Adds | +1.322 |
Breach | +1.166 |
oa | +1.068 |
letters | +1.063 |
̶ | +1.048 |
Neg logit contributions | |
intend | -1.309 |
Compton | -1.293 |
percentile | -1.290 |
totality | -1.241 |
adelphia | -1.196 |
Token | Pruitt |
Token ID | 39637 |
Feature activation | -2.06e+00 |
Pos logit contributions | |
intend | +0.788 |
Compton | +0.788 |
percentile | +0.781 |
totality | +0.755 |
disgr | +0.717 |
Neg logit contributions | |
Adds | -0.764 |
Breach | -0.659 |
oa | -0.607 |
letters | -0.604 |
Newsletter | -0.602 |
Token | sent |
Token ID | 1908 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
intend | +1.429 |
Compton | +1.414 |
percentile | +1.409 |
totality | +1.342 |
lé | +1.296 |
Neg logit contributions | |
Adds | -1.505 |
Breach | -1.301 |
oa | -1.192 |
letters | -1.192 |
IER | -1.189 |
Token | an |
Token ID | 281 |
Feature activation | +4.53e+00 |
Pos logit contributions | |
Compton | +0.662 |
percentile | +0.662 |
intend | +0.659 |
totality | +0.636 |
disgr | +0.611 |
Neg logit contributions | |
Adds | -0.531 |
Breach | -0.448 |
oa | -0.409 |
Newsletter | -0.402 |
̶ | -0.401 |
Token | email |
Token ID | 3053 |
Feature activation | -1.71e+00 |
Pos logit contributions | |
Adds | +2.631 |
Breach | +2.258 |
letters | +2.032 |
oa | +2.027 |
IER | +1.979 |
Neg logit contributions | |
intend | -3.773 |
Compton | -3.709 |
percentile | -3.705 |
totality | -3.591 |
adelphia | -3.486 |
Token | to |
Token ID | 284 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
percentile | +1.147 |
intend | +1.146 |
Compton | +1.145 |
totality | +1.092 |
adelphia | +1.043 |
Neg logit contributions | |
Adds | -1.265 |
Breach | -1.106 |
oa | -1.024 |
artisan | -1.011 |
̶ | -1.010 |
Token | supporters |
Token ID | 5941 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
intend | +0.959 |
Compton | +0.957 |
percentile | +0.952 |
totality | +0.918 |
disgr | +0.875 |
Neg logit contributions | |
Adds | -0.953 |
Breach | -0.828 |
oa | -0.762 |
letters | -0.755 |
̶ | -0.751 |
Token | of |
Token ID | 286 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
Adds | +0.261 |
Breach | +0.228 |
oa | +0.208 |
letters | +0.207 |
IER | +0.205 |
Neg logit contributions | |
intend | -0.281 |
Compton | -0.278 |
percentile | -0.277 |
totality | -0.267 |
adelphia | -0.257 |
Token | one |
Token ID | 530 |
Feature activation | +5.35e-01 |
Pos logit contributions | |
Compton | +0.966 |
intend | +0.966 |
percentile | +0.955 |
totality | +0.925 |
disgr | +0.882 |
Neg logit contributions | |
Adds | -1.080 |
Breach | -0.953 |
oa | -0.878 |
letters | -0.877 |
̶ | -0.867 |
Token | federal |
Token ID | 2717 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
Adds | +0.420 |
Breach | +0.374 |
oa | +0.345 |
letters | +0.345 |
̶ | +0.340 |
Neg logit contributions | |
intend | -0.340 |
Compton | -0.337 |
percentile | -0.336 |
totality | -0.322 |
adelphia | -0.306 |
Token | � |
Token ID | 447 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
Adds | +2.516 |
Breach | +2.295 |
oa | +2.092 |
letters | +2.058 |
̶ | +2.058 |
Neg logit contributions | |
intend | -2.672 |
percentile | -2.652 |
Compton | -2.638 |
totality | -2.569 |
adelphia | -2.523 |
Token | � |
Token ID | 247 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
Adds | +0.287 |
Breach | +0.258 |
oa | +0.239 |
letters | +0.238 |
̶ | +0.236 |
Neg logit contributions | |
intend | -0.217 |
Compton | -0.214 |
percentile | -0.212 |
totality | -0.204 |
adelphia | -0.195 |
Token | re |
Token ID | 260 |
Feature activation | +5.35e+00 |
Pos logit contributions | |
intend | +1.132 |
Compton | +1.103 |
percentile | +1.098 |
totality | +1.052 |
adelphia | +1.005 |
Neg logit contributions | |
Adds | -1.359 |
Breach | -1.203 |
letters | -1.108 |
oa | -1.100 |
Newsletter | -1.096 |
Token | going |
Token ID | 1016 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Adds | +3.704 |
Breach | +3.336 |
oa | +3.069 |
̶ | +3.033 |
letters | +3.017 |
Neg logit contributions | |
intend | -3.722 |
percentile | -3.660 |
Compton | -3.616 |
totality | -3.546 |
adelphia | -3.463 |
Token | to |
Token ID | 284 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
Adds | +0.849 |
Breach | +0.751 |
oa | +0.689 |
letters | +0.688 |
Newsletter | +0.678 |
Neg logit contributions | |
intend | -0.785 |
Compton | -0.775 |
percentile | -0.772 |
totality | -0.742 |
adelphia | -0.713 |
Token | have |
Token ID | 423 |
Feature activation | -8.47e-01 |
Pos logit contributions | |
Adds | +0.864 |
Breach | +0.772 |
oa | +0.709 |
letters | +0.706 |
̶ | +0.700 |
Neg logit contributions | |
intend | -0.753 |
percentile | -0.741 |
Compton | -0.740 |
totality | -0.710 |
adelphia | -0.684 |
Token | to |
Token ID | 284 |
Feature activation | -4.68e-01 |
Pos logit contributions | |
intend | +0.564 |
Compton | +0.562 |
percentile | +0.559 |
totality | +0.537 |
adelphia | +0.512 |
Neg logit contributions | |
Adds | -0.637 |
Breach | -0.561 |
oa | -0.515 |
letters | -0.514 |
Newsletter | -0.512 |
Token | leave |
Token ID | 2666 |
Feature activation | +2.66e+00 |
Pos logit contributions | |
intend | +0.302 |
Compton | +0.298 |
percentile | +0.297 |
totality | +0.285 |
adelphia | +0.272 |
Neg logit contributions | |
Adds | -0.363 |
Breach | -0.322 |
letters | -0.298 |
oa | -0.297 |
Newsletter | -0.294 |
Token | . |
Token ID | 13 |
Feature activation | +1.54e+00 |
Pos logit contributions | |
Adds | +1.821 |
Breach | +1.607 |
oa | +1.468 |
letters | +1.458 |
IER | +1.440 |
Neg logit contributions | |
intend | -1.942 |
percentile | -1.909 |
Compton | -1.895 |
totality | -1.823 |
adelphia | -1.772 |
Token | � |
Token ID | 447 |
Feature activation | +6.17e-01 |
Pos logit contributions | |
Adds | +1.138 |
Breach | +1.012 |
oa | +0.928 |
letters | +0.924 |
̶ | +0.915 |
Neg logit contributions | |
intend | -1.045 |
percentile | -1.029 |
Compton | -1.029 |
totality | -0.989 |
adelphia | -0.953 |
Token | � |
Token ID | 251 |
Feature activation | -9.05e-03 |
Pos logit contributions | |
Adds | +0.546 |
Breach | +0.494 |
oa | +0.461 |
letters | +0.460 |
̶ | +0.455 |
Neg logit contributions | |
intend | -0.329 |
Compton | -0.324 |
percentile | -0.323 |
totality | -0.306 |
adelphia | -0.291 |
Token | to |
Token ID | 284 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
Adds | +0.047 |
Breach | +0.042 |
oa | +0.038 |
letters | +0.038 |
̶ | +0.038 |
Neg logit contributions | |
intend | -0.044 |
Compton | -0.044 |
percentile | -0.044 |
totality | -0.042 |
adelphia | -0.040 |
Token | allocate |
Token ID | 31935 |
Feature activation | -3.21e+00 |
Pos logit contributions | |
Adds | +0.656 |
Breach | +0.583 |
oa | +0.532 |
letters | +0.526 |
Newsletter | +0.519 |
Neg logit contributions | |
intend | -0.630 |
Compton | -0.622 |
percentile | -0.616 |
totality | -0.593 |
adelphia | -0.578 |
Token | more |
Token ID | 517 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
percentile | +2.214 |
Compton | +2.202 |
intend | +2.162 |
totality | +2.136 |
disgr | +1.986 |
Neg logit contributions | |
Adds | -2.342 |
Breach | -2.048 |
oa | -1.886 |
letters | -1.880 |
artisan | -1.876 |
Token | time |
Token ID | 640 |
Feature activation | -7.52e-02 |
Pos logit contributions | |
intend | +0.310 |
Compton | +0.307 |
percentile | +0.307 |
totality | +0.294 |
adelphia | +0.280 |
Neg logit contributions | |
Adds | -0.388 |
Breach | -0.346 |
oa | -0.320 |
letters | -0.319 |
IER | -0.315 |
Token | to |
Token ID | 284 |
Feature activation | -4.14e+00 |
Pos logit contributions | |
intend | +0.051 |
Compton | +0.051 |
percentile | +0.051 |
totality | +0.049 |
adelphia | +0.047 |
Neg logit contributions | |
Adds | -0.055 |
Breach | -0.049 |
oa | -0.045 |
letters | -0.045 |
̶ | -0.044 |
Token | dating |
Token ID | 10691 |
Feature activation | -7.04e+00 |
Pos logit contributions | |
Compton | +2.793 |
intend | +2.756 |
percentile | +2.751 |
totality | +2.696 |
disgr | +2.511 |
Neg logit contributions | |
Adds | -3.034 |
Breach | -2.701 |
oa | -2.490 |
̶ | -2.462 |
artisan | -2.461 |
Token | ." |
Token ID | 526 |
Feature activation | -3.15e+00 |
Pos logit contributions | |
Compton | +4.468 |
percentile | +4.376 |
intend | +4.311 |
totality | +4.183 |
disgr | +4.001 |
Neg logit contributions | |
Adds | -5.397 |
Breach | -4.748 |
artisan | -4.434 |
̶ | -4.421 |
oa | -4.390 |
Token | But |
Token ID | 887 |
Feature activation | -3.52e+00 |
Pos logit contributions | |
Compton | +1.981 |
percentile | +1.916 |
intend | +1.911 |
totality | +1.800 |
adelphia | +1.719 |
Neg logit contributions | |
Adds | -2.464 |
Breach | -2.186 |
oa | -2.076 |
artisan | -2.074 |
̶ | -2.027 |
Token | he |
Token ID | 339 |
Feature activation | -7.55e-01 |
Pos logit contributions | |
Compton | +2.371 |
percentile | +2.335 |
intend | +2.296 |
totality | +2.262 |
disgr | +2.129 |
Neg logit contributions | |
Adds | -2.606 |
Breach | -2.306 |
oa | -2.128 |
artisan | -2.123 |
̶ | -2.105 |
Token | brings |
Token ID | 6774 |
Feature activation | +1.85e+00 |
Pos logit contributions | |
intend | +0.539 |
Compton | +0.533 |
percentile | +0.532 |
totality | +0.511 |
adelphia | +0.492 |
Neg logit contributions | |
Adds | -0.531 |
Breach | -0.469 |
oa | -0.427 |
letters | -0.427 |
IER | -0.422 |
Token | Tal |
Token ID | 7193 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
Adds | +1.263 |
Breach | +1.110 |
oa | +1.010 |
letters | +1.008 |
̶ | +0.989 |
Neg logit contributions | |
intend | -1.364 |
percentile | -1.333 |
Compton | -1.330 |
totality | -1.281 |
adelphia | -1.249 |
Token | with |
Token ID | 351 |
Feature activation | +2.51e+00 |
Pos logit contributions | |
Compton | +1.183 |
intend | +1.183 |
percentile | +1.164 |
totality | +1.125 |
adelphia | +1.069 |
Neg logit contributions | |
Adds | -1.271 |
Breach | -1.121 |
oa | -1.029 |
letters | -1.022 |
IER | -1.018 |
Token | his |
Token ID | 465 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
Adds | +1.796 |
Breach | +1.591 |
oa | +1.451 |
letters | +1.445 |
̶ | +1.419 |
Neg logit contributions | |
intend | -1.762 |
percentile | -1.730 |
Compton | -1.713 |
totality | -1.652 |
adelphia | -1.618 |
Token | en |
Token ID | 551 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
intend | +0.451 |
Compton | +0.446 |
percentile | +0.444 |
totality | +0.425 |
adelphia | +0.405 |
Neg logit contributions | |
Adds | -0.593 |
Breach | -0.530 |
oa | -0.491 |
letters | -0.490 |
̶ | -0.484 |
Token | am |
Token ID | 321 |
Feature activation | -7.72e-01 |
Pos logit contributions | |
intend | +2.163 |
Compton | +2.119 |
percentile | +2.072 |
totality | +2.012 |
lé | +1.940 |
Neg logit contributions | |
Adds | -2.285 |
Breach | -2.040 |
oa | -1.832 |
letters | -1.831 |
IER | -1.827 |
Token | ored |
Token ID | 1850 |
Feature activation | -2.02e+00 |
Pos logit contributions | |
intend | +0.593 |
Compton | +0.586 |
percentile | +0.584 |
totality | +0.563 |
adelphia | +0.546 |
Neg logit contributions | |
Adds | -0.503 |
Breach | -0.436 |
oa | -0.393 |
letters | -0.391 |
IER | -0.388 |
Token | relationship |
Token ID | 2776 |
Feature activation | -9.19e+00 |
Pos logit contributions | |
intend | +1.211 |
Compton | +1.206 |
percentile | +1.193 |
totality | +1.140 |
adelphia | +1.078 |
Neg logit contributions | |
Adds | -1.659 |
Breach | -1.485 |
letters | -1.373 |
oa | -1.368 |
̶ | -1.367 |
Token | with |
Token ID | 351 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
Compton | +5.075 |
percentile | +4.925 |
intend | +4.764 |
totality | +4.654 |
disgr | +4.448 |
Neg logit contributions | |
Adds | -7.526 |
Breach | -6.881 |
artisan | -6.525 |
̶ | -6.303 |
letters | -6.302 |
Token | Love |
Token ID | 5896 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
Compton | +0.782 |
intend | +0.778 |
percentile | +0.768 |
totality | +0.741 |
adelphia | +0.708 |
Neg logit contributions | |
Adds | -0.814 |
Breach | -0.714 |
letters | -0.656 |
oa | -0.655 |
̶ | -0.650 |
Token | conveyed |
Token ID | 33348 |
Feature activation | -2.29e+00 |
Pos logit contributions | |
intend | +0.503 |
Compton | +0.498 |
percentile | +0.493 |
totality | +0.473 |
adelphia | +0.455 |
Neg logit contributions | |
Adds | -0.602 |
Breach | -0.537 |
oa | -0.494 |
letters | -0.492 |
IER | -0.488 |
Token | through |
Token ID | 832 |
Feature activation | +2.24e+00 |
Pos logit contributions | |
Compton | +1.545 |
intend | +1.533 |
percentile | +1.526 |
totality | +1.477 |
lé | +1.382 |
Neg logit contributions | |
Adds | -1.692 |
Breach | -1.495 |
oa | -1.378 |
letters | -1.371 |
Newsletter | -1.366 |
Token | lyr |
Token ID | 47188 |
Feature activation | +4.42e+00 |
Pos logit contributions | |
Adds | +1.552 |
Breach | +1.371 |
letters | +1.248 |
oa | +1.246 |
Newsletter | +1.219 |
Neg logit contributions | |
intend | -1.621 |
percentile | -1.591 |
Compton | -1.581 |
totality | -1.525 |
adelphia | -1.485 |
Token | down |
Token ID | 866 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
intend | +0.258 |
Compton | +0.257 |
percentile | +0.254 |
totality | +0.243 |
adelphia | +0.234 |
Neg logit contributions | |
Adds | -0.348 |
Breach | -0.309 |
oa | -0.287 |
letters | -0.286 |
Newsletter | -0.282 |
Token | by |
Token ID | 416 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
Adds | +0.121 |
Breach | +0.107 |
oa | +0.098 |
letters | +0.098 |
artisan | +0.096 |
Neg logit contributions | |
intend | -0.110 |
Compton | -0.109 |
percentile | -0.109 |
totality | -0.105 |
adelphia | -0.101 |
Token | two |
Token ID | 734 |
Feature activation | -2.32e+00 |
Pos logit contributions | |
intend | +0.140 |
Compton | +0.139 |
percentile | +0.138 |
totality | +0.133 |
adelphia | +0.128 |
Neg logit contributions | |
Adds | -0.157 |
Breach | -0.139 |
oa | -0.128 |
letters | -0.128 |
̶ | -0.126 |
Token | inches |
Token ID | 8331 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
intend | +1.509 |
Compton | +1.503 |
percentile | +1.496 |
totality | +1.438 |
adelphia | +1.360 |
Neg logit contributions | |
Adds | -1.779 |
Breach | -1.566 |
oa | -1.448 |
letters | -1.443 |
artisan | -1.438 |
Token | of |
Token ID | 286 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
intend | +0.789 |
Compton | +0.786 |
percentile | +0.784 |
totality | +0.755 |
adelphia | +0.712 |
Neg logit contributions | |
Adds | -0.991 |
Breach | -0.881 |
letters | -0.817 |
oa | -0.815 |
artisan | -0.807 |
Token | snow |
Token ID | 6729 |
Feature activation | -6.50e+00 |
Pos logit contributions | |
intend | +0.728 |
Compton | +0.728 |
percentile | +0.721 |
totality | +0.699 |
adelphia | +0.655 |
Neg logit contributions | |
Adds | -0.935 |
Breach | -0.828 |
letters | -0.772 |
oa | -0.771 |
Newsletter | -0.763 |
Token | , |
Token ID | 11 |
Feature activation | -3.57e+00 |
Pos logit contributions | |
intend | +4.089 |
Compton | +4.084 |
percentile | +4.038 |
totality | +4.002 |
lé | +3.711 |
Neg logit contributions | |
Adds | -4.943 |
Breach | -4.351 |
oa | -4.022 |
artisan | -4.013 |
Newsletter | -3.970 |
Token | let |
Token ID | 1309 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
Compton | +2.382 |
intend | +2.375 |
percentile | +2.367 |
totality | +2.291 |
adelphia | +2.160 |
Neg logit contributions | |
Adds | -2.666 |
Breach | -2.331 |
letters | -2.162 |
oa | -2.159 |
Newsletter | -2.155 |
Token | � |
Token ID | 447 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
Adds | +0.970 |
Breach | +0.854 |
oa | +0.779 |
letters | +0.776 |
̶ | +0.767 |
Neg logit contributions | |
intend | -1.001 |
Compton | -0.987 |
percentile | -0.985 |
totality | -0.948 |
adelphia | -0.916 |
Token | � |
Token ID | 247 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
intend | +0.579 |
Compton | +0.571 |
percentile | +0.570 |
totality | +0.541 |
adelphia | +0.516 |
Neg logit contributions | |
Adds | -0.882 |
Breach | -0.795 |
oa | -0.741 |
letters | -0.738 |
IER | -0.729 |
Token | s |
Token ID | 82 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
intend | +1.007 |
Compton | +0.991 |
percentile | +0.991 |
totality | +0.956 |
adelphia | +0.926 |
Neg logit contributions | |
Adds | -0.711 |
Breach | -0.606 |
letters | -0.540 |
artisan | -0.538 |
Newsletter | -0.536 |
Token | exact |
Token ID | 2748 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
Adds | +0.318 |
Breach | +0.285 |
oa | +0.264 |
letters | +0.264 |
IER | +0.261 |
Neg logit contributions | |
intend | -0.237 |
Compton | -0.234 |
percentile | -0.234 |
totality | -0.224 |
adelphia | -0.213 |
Token | attitude |
Token ID | 9408 |
Feature activation | -3.08e+00 |
Pos logit contributions | |
Compton | +1.779 |
percentile | +1.770 |
intend | +1.759 |
totality | +1.718 |
adelphia | +1.622 |
Neg logit contributions | |
Adds | -1.840 |
Breach | -1.609 |
oa | -1.484 |
artisan | -1.468 |
letters | -1.467 |
Token | a |
Token ID | 257 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
Compton | +2.037 |
percentile | +2.011 |
intend | +1.983 |
totality | +1.943 |
adelphia | +1.817 |
Neg logit contributions | |
Adds | -2.344 |
Breach | -2.049 |
artisan | -1.937 |
oa | -1.902 |
letters | -1.894 |
Token | cornerback |
Token ID | 26683 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
intend | +0.663 |
Compton | +0.660 |
percentile | +0.656 |
totality | +0.629 |
adelphia | +0.599 |
Neg logit contributions | |
Adds | -0.827 |
Breach | -0.736 |
letters | -0.683 |
oa | -0.682 |
artisan | -0.675 |
Token | should |
Token ID | 815 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
intend | +0.745 |
Compton | +0.738 |
percentile | +0.736 |
totality | +0.706 |
adelphia | +0.676 |
Neg logit contributions | |
Adds | -0.821 |
Breach | -0.727 |
oa | -0.669 |
letters | -0.668 |
artisan | -0.663 |
Token | have |
Token ID | 423 |
Feature activation | -7.66e+00 |
Pos logit contributions | |
intend | +3.249 |
percentile | +3.183 |
Compton | +3.093 |
totality | +2.954 |
adelphia | +2.846 |
Neg logit contributions | |
Adds | -3.851 |
Breach | -3.328 |
artisan | -3.200 |
letters | -3.161 |
Newsletter | -3.141 |
Token | , |
Token ID | 11 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
intend | +4.468 |
percentile | +4.386 |
Compton | +4.265 |
totality | +4.088 |
disgr | +3.983 |
Neg logit contributions | |
Adds | -6.305 |
Breach | -5.573 |
artisan | -5.437 |
letters | -5.282 |
oa | -5.201 |
Token | to |
Token ID | 284 |
Feature activation | +8.35e-01 |
Pos logit contributions | |
intend | +0.222 |
Compton | +0.219 |
percentile | +0.218 |
totality | +0.209 |
adelphia | +0.201 |
Neg logit contributions | |
Adds | -0.260 |
Breach | -0.231 |
oa | -0.213 |
letters | -0.212 |
IER | -0.210 |
Token | be |
Token ID | 307 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
Adds | +0.590 |
Breach | +0.520 |
oa | +0.476 |
letters | +0.474 |
̶ | +0.467 |
Neg logit contributions | |
intend | -0.594 |
Compton | -0.586 |
percentile | -0.585 |
totality | -0.563 |
adelphia | -0.542 |
Token | honest |
Token ID | 5508 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
Compton | +2.228 |
intend | +2.221 |
percentile | +2.196 |
totality | +2.109 |
adelphia | +2.004 |
Neg logit contributions | |
Adds | -2.396 |
Breach | -2.106 |
letters | -1.948 |
oa | -1.948 |
artisan | -1.917 |
Token | . |
Token ID | 13 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
intend | +0.594 |
Compton | +0.592 |
percentile | +0.590 |
totality | +0.566 |
adelphia | +0.539 |
Neg logit contributions | |
Adds | -0.716 |
Breach | -0.637 |
letters | -0.588 |
oa | -0.586 |
artisan | -0.582 |
Token | Canada |
Token ID | 3340 |
Feature activation | -2.31e+00 |
Pos logit contributions | |
intend | +2.253 |
Compton | +2.249 |
percentile | +2.234 |
totality | +2.163 |
adelphia | +2.060 |
Neg logit contributions | |
Adds | -2.957 |
Breach | -2.620 |
letters | -2.449 |
oa | -2.447 |
artisan | -2.430 |
Token | . |
Token ID | 13 |
Feature activation | -1.89e+00 |
Pos logit contributions | |
intend | +1.483 |
percentile | +1.470 |
Compton | +1.462 |
totality | +1.406 |
adelphia | +1.341 |
Neg logit contributions | |
Adds | -1.782 |
Breach | -1.588 |
letters | -1.469 |
oa | -1.459 |
IER | -1.445 |
Token |
|
Token ID | 198 |
Feature activation | -1.29e+00 |
Pos logit contributions | |
Compton | +1.203 |
intend | +1.193 |
percentile | +1.187 |
totality | +1.128 |
adelphia | +1.082 |
Neg logit contributions | |
Adds | -1.461 |
Breach | -1.300 |
oa | -1.213 |
artisan | -1.207 |
letters | -1.200 |
Token |
|
Token ID | 198 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
intend | +0.762 |
Compton | +0.751 |
percentile | +0.749 |
totality | +0.712 |
adelphia | +0.682 |
Neg logit contributions | |
Adds | -1.071 |
Breach | -0.964 |
oa | -0.895 |
letters | -0.891 |
IER | -0.881 |
Token | App |
Token ID | 4677 |
Feature activation | -4.05e+00 |
Pos logit contributions | |
intend | +0.632 |
Compton | +0.622 |
percentile | +0.616 |
totality | +0.584 |
adelphia | +0.570 |
Neg logit contributions | |
Adds | -0.782 |
Breach | -0.714 |
oa | -0.652 |
letters | -0.647 |
artisan | -0.646 |
Token | alach |
Token ID | 33786 |
Feature activation | -8.57e+00 |
Pos logit contributions | |
intend | +2.422 |
percentile | +2.373 |
Compton | +2.356 |
totality | +2.236 |
lé | +2.201 |
Neg logit contributions | |
Adds | -3.278 |
Breach | -2.919 |
letters | -2.698 |
IER | -2.689 |
̶ | -2.685 |
Token | ia |
Token ID | 544 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
intend | +5.493 |
percentile | +5.398 |
Compton | +5.394 |
totality | +5.177 |
adelphia | +5.134 |
Neg logit contributions | |
Adds | -6.415 |
Breach | -5.430 |
Newsletter | -5.162 |
IER | -5.109 |
letters | -5.087 |
Token | and |
Token ID | 290 |
Feature activation | -5.61e-01 |
Pos logit contributions | |
intend | +0.404 |
Compton | +0.401 |
percentile | +0.400 |
totality | +0.383 |
adelphia | +0.369 |
Neg logit contributions | |
Adds | -0.442 |
Breach | -0.389 |
letters | -0.359 |
oa | -0.359 |
artisan | -0.354 |
Token | the |
Token ID | 262 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
intend | +0.371 |
Compton | +0.368 |
percentile | +0.366 |
totality | +0.351 |
adelphia | +0.336 |
Neg logit contributions | |
Adds | -0.425 |
Breach | -0.376 |
oa | -0.347 |
letters | -0.346 |
IER | -0.342 |
Token | U |
Token ID | 471 |
Feature activation | -5.43e+00 |
Pos logit contributions | |
intend | +0.240 |
Compton | +0.239 |
percentile | +0.238 |
totality | +0.228 |
adelphia | +0.218 |
Neg logit contributions | |
Adds | -0.292 |
Breach | -0.259 |
oa | -0.241 |
letters | -0.240 |
IER | -0.237 |
Token | . |
Token ID | 13 |
Feature activation | -4.30e+00 |
Pos logit contributions | |
intend | +3.258 |
percentile | +3.157 |
Compton | +3.114 |
lé | +2.941 |
adelphia | +2.919 |
Neg logit contributions | |
Adds | -4.329 |
Breach | -3.872 |
artisan | -3.607 |
IER | -3.600 |
letters | -3.580 |