Token | would |
Token ID | 561 |
Feature activation | +8.85e-01 |
Pos logit contributions | |
smuggling | +0.757 |
nsic | +0.754 |
Machina | +0.735 |
table | +0.733 |
interrogation | +0.729 |
Neg logit contributions | |
Worcester | -0.977 |
Dartmouth | -0.957 |
heit | -0.887 |
ocene | -0.863 |
Lansing | -0.861 |
Token | be |
Token ID | 307 |
Feature activation | +3.92e-01 |
Pos logit contributions | |
nsic | +0.513 |
smuggling | +0.513 |
Machina | +0.498 |
table | +0.493 |
interrogation | +0.493 |
Neg logit contributions | |
Worcester | -0.776 |
Dartmouth | -0.760 |
heit | -0.710 |
Lansing | -0.691 |
ocene | -0.689 |
Token | ). |
Token ID | 737 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
smuggling | +0.247 |
nsic | +0.246 |
Machina | +0.241 |
table | +0.240 |
interrogation | +0.239 |
Neg logit contributions | |
Worcester | -0.323 |
Dartmouth | -0.316 |
heit | -0.294 |
ocene | -0.286 |
hester | -0.285 |
Token |
|
Token ID | 198 |
Feature activation | -5.62e-02 |
Pos logit contributions | |
nsic | +0.147 |
smuggling | +0.146 |
Machina | +0.145 |
table | +0.144 |
Khe | +0.143 |
Neg logit contributions | |
Worcester | -0.182 |
Dartmouth | -0.178 |
heit | -0.167 |
hester | -0.162 |
ocene | -0.161 |
Token |
|
Token ID | 198 |
Feature activation | -4.07e-01 |
Pos logit contributions | |
Worcester | +0.044 |
Dartmouth | +0.043 |
heit | +0.040 |
ocene | +0.039 |
Lansing | +0.039 |
Neg logit contributions | |
nsic | -0.037 |
smuggling | -0.037 |
Machina | -0.037 |
table | -0.037 |
Khe | -0.036 |
Token | Disclaimer |
Token ID | 19618 |
Feature activation | +6.03e+00 |
Pos logit contributions | |
Worcester | +0.291 |
Dartmouth | +0.284 |
heit | +0.261 |
Lansing | +0.252 |
hester | +0.251 |
Neg logit contributions | |
nsic | -0.302 |
smuggling | -0.300 |
Machina | -0.297 |
table | -0.297 |
interrogation | -0.293 |
Token | : |
Token ID | 25 |
Feature activation | +2.61e+00 |
Pos logit contributions | |
Machina | +3.373 |
nsic | +3.349 |
smuggling | +3.315 |
table | +3.305 |
interrogation | +3.240 |
Neg logit contributions | |
Worcester | -5.160 |
Dartmouth | -5.100 |
heit | -4.787 |
hester | -4.683 |
ocene | -4.631 |
Token | These |
Token ID | 2312 |
Feature activation | +8.88e-01 |
Pos logit contributions | |
smuggling | +1.837 |
nsic | +1.828 |
Machina | +1.799 |
table | +1.794 |
Khe | +1.785 |
Neg logit contributions | |
Worcester | -1.932 |
Dartmouth | -1.880 |
heit | -1.769 |
hester | -1.699 |
ocene | -1.696 |
Token | tips |
Token ID | 9040 |
Feature activation | -4.85e-03 |
Pos logit contributions | |
smuggling | +0.560 |
nsic | +0.558 |
Machina | +0.543 |
interrogation | +0.543 |
table | +0.540 |
Neg logit contributions | |
Worcester | -0.732 |
Dartmouth | -0.716 |
heit | -0.672 |
ocene | -0.649 |
hester | -0.647 |
Token | are |
Token ID | 389 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
Worcester | +0.004 |
Dartmouth | +0.004 |
heit | +0.004 |
Lansing | +0.004 |
ocene | +0.004 |
Neg logit contributions | |
nsic | -0.003 |
smuggling | -0.003 |
Machina | -0.003 |
table | -0.003 |
interrogation | -0.003 |
Token | based |
Token ID | 1912 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
nsic | +0.080 |
smuggling | +0.079 |
Machina | +0.077 |
interrogation | +0.076 |
table | +0.076 |
Neg logit contributions | |
Worcester | -0.115 |
Dartmouth | -0.112 |
heit | -0.105 |
Lansing | -0.102 |
ocene | -0.102 |
Token | confident |
Token ID | 6563 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
Worcester | +0.587 |
Dartmouth | +0.574 |
heit | +0.536 |
ocene | +0.518 |
Lansing | +0.517 |
Neg logit contributions | |
smuggling | -0.474 |
nsic | -0.473 |
Machina | -0.461 |
interrogation | -0.457 |
investig | -0.457 |
Token | investors |
Token ID | 7713 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
Worcester | +1.083 |
Dartmouth | +1.058 |
heit | +0.998 |
ocene | +0.971 |
hester | +0.966 |
Neg logit contributions | |
smuggling | -0.718 |
nsic | -0.718 |
Machina | -0.698 |
table | -0.695 |
investig | -0.694 |
Token | . |
Token ID | 13 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
smuggling | +0.065 |
nsic | +0.065 |
Machina | +0.063 |
table | +0.063 |
interrogation | +0.062 |
Neg logit contributions | |
Worcester | -0.093 |
Dartmouth | -0.091 |
heit | -0.085 |
ocene | -0.083 |
hester | -0.083 |
Token |
|
Token ID | 198 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
Worcester | +0.603 |
Dartmouth | +0.589 |
heit | +0.548 |
ocene | +0.528 |
hester | +0.526 |
Neg logit contributions | |
nsic | -0.565 |
smuggling | -0.565 |
Machina | -0.554 |
table | -0.550 |
interrogation | -0.547 |
Token |
|
Token ID | 198 |
Feature activation | -5.98e-01 |
Pos logit contributions | |
Worcester | +0.083 |
Dartmouth | +0.081 |
heit | +0.075 |
Lansing | +0.073 |
ocene | +0.072 |
Neg logit contributions | |
nsic | -0.073 |
smuggling | -0.072 |
Machina | -0.071 |
table | -0.071 |
interrogation | -0.070 |
Token | Disclaimer |
Token ID | 19618 |
Feature activation | +5.80e+00 |
Pos logit contributions | |
Worcester | +0.424 |
Dartmouth | +0.414 |
heit | +0.380 |
Lansing | +0.367 |
ocene | +0.365 |
Neg logit contributions | |
nsic | -0.447 |
smuggling | -0.446 |
Machina | -0.437 |
table | -0.435 |
interrogation | -0.433 |
Token | : |
Token ID | 25 |
Feature activation | +2.22e+00 |
Pos logit contributions | |
nsic | +3.201 |
smuggling | +3.175 |
Machina | +3.150 |
table | +3.124 |
investig | +3.110 |
Neg logit contributions | |
Worcester | -5.022 |
Dartmouth | -4.941 |
heit | -4.659 |
hester | -4.558 |
ocene | -4.529 |
Token | © |
Token ID | 10673 |
Feature activation | +8.42e-01 |
Pos logit contributions | |
smuggling | +1.511 |
nsic | +1.498 |
Machina | +1.475 |
table | +1.470 |
investig | +1.467 |
Neg logit contributions | |
Worcester | -1.702 |
Dartmouth | -1.658 |
heit | -1.557 |
ocene | -1.509 |
hester | -1.500 |
Token | 2015 |
Token ID | 1853 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
smuggling | +0.579 |
nsic | +0.579 |
Machina | +0.566 |
table | +0.563 |
interrogation | +0.560 |
Neg logit contributions | |
Worcester | -0.643 |
Dartmouth | -0.628 |
heit | -0.583 |
ocene | -0.562 |
Lansing | -0.561 |
Token | Money |
Token ID | 12911 |
Feature activation | -7.58e-01 |
Pos logit contributions | |
smuggling | +0.826 |
nsic | +0.825 |
Machina | +0.809 |
table | +0.801 |
investig | +0.798 |
Neg logit contributions | |
Worcester | -0.987 |
Dartmouth | -0.964 |
heit | -0.900 |
ocene | -0.871 |
hester | -0.870 |
Token | Morning |
Token ID | 14410 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
Worcester | +0.633 |
Dartmouth | +0.621 |
heit | +0.580 |
ocene | +0.561 |
Lansing | +0.560 |
Neg logit contributions | |
smuggling | -0.469 |
nsic | -0.469 |
Machina | -0.457 |
table | -0.453 |
interrogation | -0.452 |
Token | sound |
Token ID | 2128 |
Feature activation | +8.94e-01 |
Pos logit contributions | |
Worcester | +0.426 |
Dartmouth | +0.417 |
heit | +0.386 |
Lansing | +0.377 |
ocene | +0.373 |
Neg logit contributions | |
nsic | -0.345 |
smuggling | -0.342 |
Machina | -0.334 |
xual | -0.331 |
table | -0.331 |
Token | files |
Token ID | 3696 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
nsic | +0.516 |
smuggling | +0.516 |
Machina | +0.501 |
table | +0.499 |
interrogation | +0.496 |
Neg logit contributions | |
Worcester | -0.787 |
Dartmouth | -0.773 |
heit | -0.724 |
Lansing | -0.702 |
hester | -0.702 |
Token | are |
Token ID | 389 |
Feature activation | +4.95e-01 |
Pos logit contributions | |
Worcester | +0.525 |
Dartmouth | +0.514 |
heit | +0.479 |
Lansing | +0.464 |
ocene | +0.463 |
Neg logit contributions | |
nsic | -0.388 |
smuggling | -0.386 |
Machina | -0.376 |
table | -0.373 |
interrogation | -0.373 |
Token | what |
Token ID | 644 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
nsic | +0.317 |
smuggling | +0.316 |
Machina | +0.309 |
interrogation | +0.306 |
table | +0.305 |
Neg logit contributions | |
Worcester | -0.404 |
Dartmouth | -0.395 |
heit | -0.368 |
Lansing | -0.356 |
ocene | -0.356 |
Token | I |
Token ID | 314 |
Feature activation | +4.57e-01 |
Pos logit contributions | |
Worcester | +0.180 |
Dartmouth | +0.176 |
heit | +0.164 |
ocene | +0.159 |
Lansing | +0.159 |
Neg logit contributions | |
smuggling | -0.144 |
nsic | -0.143 |
Machina | -0.140 |
interrogation | -0.139 |
table | -0.139 |
Token | term |
Token ID | 3381 |
Feature activation | +5.74e+00 |
Pos logit contributions | |
nsic | +0.297 |
smuggling | +0.296 |
Machina | +0.289 |
table | +0.286 |
interrogation | +0.286 |
Neg logit contributions | |
Worcester | -0.369 |
Dartmouth | -0.361 |
heit | -0.335 |
Lansing | -0.325 |
ocene | -0.324 |
Token | � |
Token ID | 564 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
smuggling | +3.589 |
nsic | +3.545 |
Machina | +3.541 |
interrogation | +3.503 |
investig | +3.479 |
Neg logit contributions | |
Worcester | -4.663 |
Dartmouth | -4.579 |
heit | -4.218 |
hester | -4.144 |
ocene | -4.113 |
Token | � |
Token ID | 250 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
Worcester | +0.094 |
Dartmouth | +0.093 |
heit | +0.087 |
Lansing | +0.084 |
ocene | +0.084 |
Neg logit contributions | |
nsic | -0.058 |
smuggling | -0.057 |
Machina | -0.056 |
interrogation | -0.055 |
table | -0.055 |
Token | enc |
Token ID | 12685 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
Worcester | +0.460 |
Dartmouth | +0.450 |
heit | +0.417 |
Lansing | +0.403 |
ocene | +0.403 |
Neg logit contributions | |
nsic | -0.404 |
smuggling | -0.403 |
Machina | -0.393 |
interrogation | -0.390 |
table | -0.389 |
Token | oded |
Token ID | 9043 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
nsic | +0.286 |
smuggling | +0.285 |
Machina | +0.277 |
interrogation | +0.275 |
table | +0.274 |
Neg logit contributions | |
Worcester | -0.412 |
Dartmouth | -0.404 |
heit | -0.377 |
Lansing | -0.366 |
ocene | -0.365 |
Token | material |
Token ID | 2587 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
nsic | +0.787 |
smuggling | +0.786 |
Machina | +0.764 |
interrogation | +0.759 |
table | +0.758 |
Neg logit contributions | |
Worcester | -1.050 |
Dartmouth | -1.028 |
heit | -0.958 |
Lansing | -0.928 |
ocene | -0.927 |
Token | struct |
Token ID | 2878 |
Feature activation | +2.49e+00 |
Pos logit contributions | |
smuggling | +1.330 |
nsic | +1.320 |
table | +1.290 |
interrogation | +1.286 |
investig | +1.284 |
Neg logit contributions | |
Worcester | -1.807 |
Dartmouth | -1.773 |
heit | -1.669 |
ocene | -1.616 |
hester | -1.611 |
Token | Own |
Token ID | 11744 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
smuggling | +1.706 |
Machina | +1.690 |
nsic | +1.684 |
table | +1.665 |
Khe | +1.663 |
Neg logit contributions | |
Worcester | -1.878 |
Dartmouth | -1.839 |
heit | -1.727 |
ocene | -1.669 |
hester | -1.666 |
Token | ed |
Token ID | 276 |
Feature activation | -3.28e-01 |
Pos logit contributions | |
Worcester | +1.063 |
Dartmouth | +1.042 |
heit | +0.974 |
Lansing | +0.945 |
ocene | +0.943 |
Neg logit contributions | |
nsic | -0.731 |
smuggling | -0.729 |
Machina | -0.708 |
interrogation | -0.701 |
table | -0.700 |
Token | < |
Token ID | 1279 |
Feature activation | +4.10e+00 |
Pos logit contributions | |
Worcester | +0.218 |
Dartmouth | +0.213 |
heit | +0.195 |
Lansing | +0.187 |
ocene | +0.186 |
Neg logit contributions | |
nsic | -0.259 |
smuggling | -0.259 |
Machina | -0.253 |
table | -0.252 |
interrogation | -0.252 |
Token | T |
Token ID | 309 |
Feature activation | +1.86e+00 |
Pos logit contributions | |
smuggling | +2.578 |
table | +2.550 |
nsic | +2.541 |
interrogation | +2.505 |
investig | +2.495 |
Neg logit contributions | |
Worcester | -3.311 |
Dartmouth | -3.231 |
heit | -3.033 |
hester | -2.949 |
Lansing | -2.943 |
Token | > |
Token ID | 1875 |
Feature activation | +5.48e+00 |
Pos logit contributions | |
smuggling | +1.030 |
nsic | +1.022 |
table | +1.001 |
Machina | +0.996 |
interrogation | +0.986 |
Neg logit contributions | |
Worcester | -1.662 |
Dartmouth | -1.619 |
heit | -1.541 |
ocene | -1.493 |
Lansing | -1.482 |
Token | { |
Token ID | 1391 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
smuggling | +3.831 |
nsic | +3.699 |
table | +3.687 |
investig | +3.665 |
Machina | +3.652 |
Neg logit contributions | |
Worcester | -4.029 |
Dartmouth | -3.974 |
heit | -3.716 |
hester | -3.615 |
ocene | -3.599 |
Token | ... |
Token ID | 2644 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
smuggling | +0.329 |
nsic | +0.325 |
table | +0.318 |
Machina | +0.317 |
interrogation | +0.317 |
Neg logit contributions | |
Worcester | -0.401 |
Dartmouth | -0.392 |
heit | -0.367 |
hester | -0.354 |
ocene | -0.353 |
Token | } |
Token ID | 1782 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
smuggling | +1.152 |
nsic | +1.145 |
Machina | +1.126 |
table | +1.121 |
interrogation | +1.118 |
Neg logit contributions | |
Worcester | -1.027 |
Dartmouth | -1.003 |
heit | -0.931 |
hester | -0.893 |
ocene | -0.892 |
Token | impl |
Token ID | 4114 |
Feature activation | +3.98e+00 |
Pos logit contributions | |
smuggling | +0.847 |
nsic | +0.837 |
Machina | +0.820 |
table | +0.819 |
interrogation | +0.816 |
Neg logit contributions | |
Worcester | -1.011 |
Dartmouth | -0.993 |
heit | -0.930 |
ocene | -0.899 |
hester | -0.897 |
Token | < |
Token ID | 1279 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
smuggling | +2.792 |
nsic | +2.749 |
Machina | +2.726 |
table | +2.717 |
symb | +2.687 |
Neg logit contributions | |
Worcester | -2.926 |
Dartmouth | -2.836 |
heit | -2.713 |
ocene | -2.590 |
hester | -2.584 |
Token | � |
Token ID | 7377 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
smuggling | +0.437 |
nsic | +0.430 |
Machina | +0.423 |
interrogation | +0.422 |
table | +0.419 |
Neg logit contributions | |
Worcester | -0.514 |
Dartmouth | -0.504 |
heit | -0.466 |
ocene | -0.455 |
hester | -0.455 |
Token | � |
Token ID | 119 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
smuggling | +0.870 |
nsic | +0.866 |
table | +0.842 |
Machina | +0.840 |
interrogation | +0.836 |
Neg logit contributions | |
Worcester | -1.257 |
Dartmouth | -1.230 |
heit | -1.149 |
Lansing | -1.119 |
ocene | -1.116 |
Token | 0 |
Token ID | 657 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
smuggling | +0.626 |
nsic | +0.623 |
Machina | +0.607 |
table | +0.603 |
interrogation | +0.602 |
Neg logit contributions | |
Worcester | -0.940 |
Dartmouth | -0.923 |
heit | -0.861 |
ocene | -0.837 |
hester | -0.836 |
Token | and |
Token ID | 290 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
nsic | +0.328 |
smuggling | +0.326 |
Machina | +0.318 |
interrogation | +0.315 |
table | +0.314 |
Neg logit contributions | |
Worcester | -0.439 |
Dartmouth | -0.430 |
heit | -0.400 |
Lansing | -0.389 |
ocene | -0.387 |
Token | the |
Token ID | 262 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
smuggling | +0.267 |
nsic | +0.265 |
Machina | +0.260 |
interrogation | +0.258 |
table | +0.257 |
Neg logit contributions | |
Worcester | -0.329 |
Dartmouth | -0.322 |
heit | -0.299 |
ocene | -0.291 |
hester | -0.291 |
Token | sum |
Token ID | 2160 |
Feature activation | +5.25e+00 |
Pos logit contributions | |
Worcester | +0.132 |
Dartmouth | +0.129 |
heit | +0.121 |
ocene | +0.117 |
hester | +0.117 |
Neg logit contributions | |
smuggling | -0.094 |
nsic | -0.094 |
Machina | -0.091 |
interrogation | -0.091 |
table | -0.090 |
Token | f |
Token ID | 277 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
smuggling | +2.469 |
table | +2.431 |
nsic | +2.428 |
interrogation | +2.401 |
Machina | +2.379 |
Neg logit contributions | |
Worcester | -5.026 |
Dartmouth | -4.950 |
hester | -4.588 |
heit | -4.586 |
ocene | -4.562 |
Token | of |
Token ID | 286 |
Feature activation | +5.12e-01 |
Pos logit contributions | |
nsic | +1.345 |
smuggling | +1.345 |
table | +1.312 |
Machina | +1.307 |
interrogation | +1.304 |
Neg logit contributions | |
Worcester | -1.680 |
Dartmouth | -1.653 |
heit | -1.527 |
hester | -1.485 |
Lansing | -1.484 |
Token | all |
Token ID | 477 |
Feature activation | +6.76e-02 |
Pos logit contributions | |
smuggling | +0.346 |
nsic | +0.341 |
Machina | +0.336 |
interrogation | +0.334 |
table | +0.332 |
Neg logit contributions | |
Worcester | -0.399 |
Dartmouth | -0.391 |
heit | -0.361 |
ocene | -0.353 |
hester | -0.352 |
Token | un |
Token ID | 555 |
Feature activation | +1.84e+00 |
Pos logit contributions | |
smuggling | +0.044 |
nsic | +0.044 |
Machina | +0.043 |
interrogation | +0.043 |
table | +0.043 |
Neg logit contributions | |
Worcester | -0.054 |
Dartmouth | -0.053 |
heit | -0.049 |
ocene | -0.048 |
hester | -0.048 |
Token | am |
Token ID | 321 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
smuggling | +1.068 |
nsic | +1.062 |
table | +1.051 |
Machina | +1.042 |
interrogation | +1.020 |
Neg logit contributions | |
Worcester | -1.600 |
Dartmouth | -1.576 |
heit | -1.458 |
Lansing | -1.435 |
ocene | -1.431 |
Token |
|
Token ID | 198 |
Feature activation | -6.87e-01 |
Pos logit contributions | |
Worcester | +0.287 |
Dartmouth | +0.280 |
heit | +0.260 |
Lansing | +0.251 |
ocene | +0.251 |
Neg logit contributions | |
nsic | -0.252 |
smuggling | -0.252 |
Machina | -0.247 |
table | -0.246 |
interrogation | -0.244 |
Token | Own |
Token ID | 23858 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
Worcester | +0.553 |
Dartmouth | +0.541 |
heit | +0.503 |
Lansing | +0.487 |
ocene | +0.486 |
Neg logit contributions | |
nsic | -0.449 |
smuggling | -0.448 |
Machina | -0.437 |
table | -0.434 |
interrogation | -0.432 |
Token | ed |
Token ID | 276 |
Feature activation | +5.80e-02 |
Pos logit contributions | |
Worcester | +1.085 |
Dartmouth | +1.061 |
heit | +0.985 |
Lansing | +0.954 |
ocene | +0.953 |
Neg logit contributions | |
nsic | -0.911 |
smuggling | -0.906 |
Machina | -0.882 |
interrogation | -0.876 |
Khe | -0.873 |
Token | < |
Token ID | 27 |
Feature activation | +3.60e+00 |
Pos logit contributions | |
smuggling | +0.037 |
nsic | +0.037 |
Machina | +0.036 |
table | +0.036 |
interrogation | +0.036 |
Neg logit contributions | |
Worcester | -0.048 |
Dartmouth | -0.047 |
heit | -0.043 |
Lansing | -0.042 |
ocene | -0.042 |
Token | T |
Token ID | 51 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
smuggling | +2.489 |
nsic | +2.479 |
table | +2.476 |
Machina | +2.419 |
interrogation | +2.418 |
Neg logit contributions | |
Worcester | -2.696 |
Dartmouth | -2.640 |
heit | -2.448 |
hester | -2.365 |
Lansing | -2.357 |
Token | > |
Token ID | 29 |
Feature activation | +5.19e+00 |
Pos logit contributions | |
smuggling | +0.217 |
nsic | +0.217 |
Machina | +0.212 |
table | +0.212 |
interrogation | +0.210 |
Neg logit contributions | |
Worcester | -0.207 |
Dartmouth | -0.201 |
heit | -0.186 |
ocene | -0.179 |
Lansing | -0.178 |
Token | , |
Token ID | 837 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
smuggling | +3.209 |
table | +3.146 |
nsic | +3.136 |
Machina | +3.101 |
investig | +3.073 |
Neg logit contributions | |
Worcester | -4.229 |
Dartmouth | -4.211 |
heit | -3.892 |
ocene | -3.780 |
hester | -3.778 |
Token | akin |
Token ID | 22107 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
smuggling | +0.123 |
nsic | +0.122 |
Machina | +0.120 |
investig | +0.119 |
interrogation | +0.119 |
Neg logit contributions | |
Worcester | -0.155 |
Dartmouth | -0.152 |
heit | -0.142 |
hester | -0.138 |
ocene | -0.137 |
Token | to |
Token ID | 284 |
Feature activation | -9.84e-01 |
Pos logit contributions | |
nsic | +0.045 |
smuggling | +0.045 |
Machina | +0.044 |
table | +0.044 |
interrogation | +0.043 |
Neg logit contributions | |
Worcester | -0.054 |
Dartmouth | -0.053 |
heit | -0.049 |
Lansing | -0.048 |
ocene | -0.048 |
Token | Box |
Token ID | 8315 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
Worcester | +0.779 |
Dartmouth | +0.763 |
heit | +0.709 |
ocene | +0.685 |
Lansing | +0.685 |
Neg logit contributions | |
smuggling | -0.654 |
nsic | -0.652 |
Machina | -0.638 |
interrogation | -0.631 |
table | -0.631 |
Token | < |
Token ID | 27 |
Feature activation | +2.30e+00 |
Pos logit contributions | |
Worcester | +0.070 |
Dartmouth | +0.067 |
heit | +0.058 |
Lansing | +0.054 |
ocene | +0.054 |
Neg logit contributions | |
nsic | -0.162 |
smuggling | -0.162 |
Machina | -0.160 |
table | -0.159 |
interrogation | -0.159 |
Token | was |
Token ID | 373 |
Feature activation | +5.52e-01 |
Pos logit contributions | |
Worcester | +0.682 |
Dartmouth | +0.666 |
heit | +0.616 |
Lansing | +0.597 |
ocene | +0.596 |
Neg logit contributions | |
nsic | -0.616 |
smuggling | -0.615 |
Machina | -0.600 |
table | -0.596 |
interrogation | -0.595 |
Token | optimistic |
Token ID | 16915 |
Feature activation | +7.39e-01 |
Pos logit contributions | |
smuggling | +0.346 |
nsic | +0.340 |
Machina | +0.334 |
interrogation | +0.334 |
table | +0.333 |
Neg logit contributions | |
Worcester | -0.458 |
Dartmouth | -0.449 |
heit | -0.422 |
ocene | -0.413 |
hester | -0.407 |
Token | about |
Token ID | 546 |
Feature activation | +9.04e-01 |
Pos logit contributions | |
smuggling | +0.504 |
nsic | +0.498 |
Machina | +0.494 |
table | +0.490 |
interrogation | +0.488 |
Neg logit contributions | |
Worcester | -0.569 |
Dartmouth | -0.556 |
heit | -0.518 |
ocene | -0.502 |
hester | -0.502 |
Token | what |
Token ID | 644 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
smuggling | +0.605 |
nsic | +0.589 |
Machina | +0.587 |
interrogation | +0.582 |
investig | +0.580 |
Neg logit contributions | |
Worcester | -0.709 |
Dartmouth | -0.697 |
heit | -0.656 |
ocene | -0.635 |
hester | -0.632 |
Token | she |
Token ID | 673 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
Worcester | +0.200 |
Dartmouth | +0.196 |
heit | +0.182 |
ocene | +0.177 |
hester | +0.176 |
Neg logit contributions | |
smuggling | -0.180 |
nsic | -0.178 |
Machina | -0.176 |
interrogation | -0.175 |
investig | -0.174 |
Token | termed |
Token ID | 28569 |
Feature activation | +5.12e+00 |
Pos logit contributions | |
smuggling | +0.393 |
nsic | +0.391 |
Machina | +0.385 |
table | +0.380 |
investig | +0.379 |
Neg logit contributions | |
Worcester | -0.446 |
Dartmouth | -0.437 |
heit | -0.404 |
Lansing | -0.390 |
hester | -0.390 |
Token | NASA |
Token ID | 8884 |
Feature activation | -7.03e-01 |
Pos logit contributions | |
smuggling | +3.357 |
Machina | +3.251 |
procedural | +3.241 |
interrogation | +3.226 |
investig | +3.214 |
Neg logit contributions | |
Worcester | -3.979 |
Dartmouth | -3.922 |
heit | -3.693 |
ocene | -3.595 |
hester | -3.581 |
Token | � |
Token ID | 447 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
Worcester | +0.512 |
Dartmouth | +0.500 |
heit | +0.461 |
Lansing | +0.444 |
ocene | +0.444 |
Neg logit contributions | |
nsic | -0.512 |
smuggling | -0.512 |
Machina | -0.500 |
interrogation | -0.496 |
table | -0.495 |
Token | � |
Token ID | 247 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
nsic | +0.247 |
smuggling | +0.247 |
Machina | +0.237 |
table | +0.234 |
interrogation | +0.233 |
Neg logit contributions | |
Worcester | -0.659 |
Dartmouth | -0.649 |
heit | -0.613 |
Lansing | -0.599 |
hester | -0.598 |
Token | s |
Token ID | 82 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
nsic | +0.048 |
smuggling | +0.048 |
Machina | +0.046 |
interrogation | +0.045 |
table | +0.045 |
Neg logit contributions | |
Worcester | -0.106 |
Dartmouth | -0.104 |
heit | -0.099 |
Lansing | -0.096 |
ocene | -0.096 |
Token | two |
Token ID | 734 |
Feature activation | -5.55e-01 |
Pos logit contributions | |
nsic | +0.245 |
smuggling | +0.245 |
Machina | +0.237 |
interrogation | +0.235 |
table | +0.235 |
Neg logit contributions | |
Worcester | -0.400 |
Dartmouth | -0.393 |
heit | -0.369 |
Lansing | -0.358 |
ocene | -0.358 |
Token | According |
Token ID | 4784 |
Feature activation | -6.98e-01 |
Pos logit contributions | |
Worcester | +0.062 |
Dartmouth | +0.061 |
heit | +0.057 |
ocene | +0.056 |
hester | +0.055 |
Neg logit contributions | |
smuggling | -0.048 |
nsic | -0.048 |
Machina | -0.047 |
Khe | -0.046 |
interrogation | -0.046 |
Token | to |
Token ID | 284 |
Feature activation | -8.19e-01 |
Pos logit contributions | |
Worcester | +0.558 |
Dartmouth | +0.545 |
heit | +0.507 |
ocene | +0.492 |
Lansing | +0.491 |
Neg logit contributions | |
smuggling | -0.458 |
nsic | -0.458 |
Machina | -0.447 |
table | -0.444 |
interrogation | -0.443 |
Token | Mur |
Token ID | 5921 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
Worcester | +0.648 |
Dartmouth | +0.633 |
heit | +0.590 |
ocene | +0.571 |
Lansing | +0.569 |
Neg logit contributions | |
smuggling | -0.546 |
nsic | -0.545 |
Machina | -0.530 |
interrogation | -0.528 |
table | -0.525 |
Token | ad |
Token ID | 324 |
Feature activation | -9.62e-01 |
Pos logit contributions | |
nsic | +0.102 |
smuggling | +0.102 |
Machina | +0.100 |
interrogation | +0.099 |
table | +0.099 |
Neg logit contributions | |
Worcester | -0.105 |
Dartmouth | -0.102 |
heit | -0.095 |
Lansing | -0.091 |
ocene | -0.091 |
Token | Do |
Token ID | 2141 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
Worcester | +0.796 |
Dartmouth | +0.779 |
heit | +0.726 |
Lansing | +0.704 |
ocene | +0.701 |
Neg logit contributions | |
nsic | -0.607 |
smuggling | -0.605 |
Machina | -0.589 |
table | -0.583 |
interrogation | -0.583 |
Token | ğ |
Token ID | 33133 |
Feature activation | +5.08e+00 |
Pos logit contributions | |
Worcester | +0.219 |
Dartmouth | +0.215 |
heit | +0.202 |
Lansing | +0.197 |
ocene | +0.196 |
Neg logit contributions | |
nsic | -0.113 |
smuggling | -0.113 |
Machina | -0.109 |
table | -0.108 |
interrogation | -0.107 |
Token | uk |
Token ID | 2724 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
nsic | +2.997 |
smuggling | +2.934 |
interrogation | +2.845 |
table | +2.845 |
investig | +2.841 |
Neg logit contributions | |
Worcester | -4.389 |
Dartmouth | -4.284 |
ocene | -4.027 |
Lansing | -3.915 |
heit | -3.903 |
Token | an |
Token ID | 272 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
nsic | +0.335 |
smuggling | +0.334 |
Machina | +0.323 |
table | +0.322 |
interrogation | +0.322 |
Neg logit contributions | |
Worcester | -0.479 |
Dartmouth | -0.469 |
heit | -0.437 |
Lansing | -0.426 |
ocene | -0.425 |
Token | li |
Token ID | 4528 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
smuggling | +0.079 |
nsic | +0.079 |
interrogation | +0.076 |
Machina | +0.076 |
Khe | +0.076 |
Neg logit contributions | |
Worcester | -0.117 |
Dartmouth | -0.114 |
heit | -0.106 |
ocene | -0.104 |
Lansing | -0.104 |
Token | , |
Token ID | 11 |
Feature activation | -7.28e-01 |
Pos logit contributions | |
smuggling | +0.139 |
nsic | +0.139 |
interrogation | +0.134 |
Machina | +0.133 |
Khe | +0.133 |
Neg logit contributions | |
Worcester | -0.211 |
Dartmouth | -0.205 |
heit | -0.191 |
Lansing | -0.187 |
ocene | -0.187 |
Token | writing |
Token ID | 3597 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
Worcester | +0.550 |
Dartmouth | +0.537 |
heit | +0.497 |
Lansing | +0.480 |
ocene | +0.479 |
Neg logit contributions | |
nsic | -0.511 |
smuggling | -0.510 |
Machina | -0.498 |
interrogation | -0.494 |
table | -0.494 |
Token | . |
Token ID | 13 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
smuggling | +1.027 |
nsic | +1.020 |
Machina | +0.997 |
table | +0.989 |
interrogation | +0.985 |
Neg logit contributions | |
Worcester | -1.444 |
Dartmouth | -1.416 |
heit | -1.328 |
ocene | -1.288 |
hester | -1.287 |
Token |
|
Token ID | 198 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
Worcester | +0.146 |
Dartmouth | +0.143 |
heit | +0.133 |
ocene | +0.128 |
Lansing | +0.128 |
Neg logit contributions | |
nsic | -0.122 |
smuggling | -0.122 |
Machina | -0.119 |
table | -0.118 |
interrogation | -0.118 |
Token |
|
Token ID | 198 |
Feature activation | +7.44e-01 |
Pos logit contributions | |
nsic | +0.806 |
smuggling | +0.805 |
table | +0.802 |
Machina | +0.799 |
Khe | +0.781 |
Neg logit contributions | |
Worcester | -0.999 |
Dartmouth | -0.974 |
heit | -0.915 |
ocene | -0.889 |
hester | -0.886 |
Token | 5 |
Token ID | 20 |
Feature activation | +9.10e-01 |
Pos logit contributions | |
nsic | +0.557 |
smuggling | +0.556 |
table | +0.549 |
Machina | +0.546 |
interrogation | +0.539 |
Neg logit contributions | |
Worcester | -0.521 |
Dartmouth | -0.513 |
heit | -0.467 |
Lansing | -0.453 |
hester | -0.451 |
Token | . |
Token ID | 13 |
Feature activation | +3.78e-01 |
Pos logit contributions | |
nsic | +0.545 |
smuggling | +0.544 |
Machina | +0.535 |
table | +0.533 |
interrogation | +0.525 |
Neg logit contributions | |
Worcester | -0.774 |
Dartmouth | -0.758 |
heit | -0.709 |
ocene | -0.689 |
hester | -0.689 |
Token | Heat |
Token ID | 12308 |
Feature activation | +5.04e+00 |
Pos logit contributions | |
smuggling | +0.247 |
nsic | +0.247 |
Machina | +0.242 |
table | +0.239 |
interrogation | +0.239 |
Neg logit contributions | |
Worcester | -0.302 |
Dartmouth | -0.296 |
heit | -0.275 |
ocene | -0.267 |
Lansing | -0.266 |
Token | about |
Token ID | 546 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
smuggling | +3.165 |
Machina | +3.078 |
nsic | +3.074 |
table | +3.072 |
interrogation | +3.072 |
Neg logit contributions | |
Dartmouth | -4.010 |
Worcester | -3.969 |
heit | -3.737 |
hester | -3.644 |
ocene | -3.629 |
Token | an |
Token ID | 281 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
smuggling | +1.356 |
Machina | +1.315 |
interrogation | +1.301 |
nsic | +1.300 |
table | +1.299 |
Neg logit contributions | |
Worcester | -2.259 |
Dartmouth | -2.234 |
heit | -2.108 |
hester | -2.068 |
ocene | -2.067 |
Token | inch |
Token ID | 11111 |
Feature activation | -7.92e-01 |
Pos logit contributions | |
smuggling | +0.691 |
nsic | +0.684 |
Machina | +0.674 |
interrogation | +0.669 |
table | +0.669 |
Neg logit contributions | |
Worcester | -0.954 |
Dartmouth | -0.938 |
heit | -0.873 |
hester | -0.848 |
ocene | -0.847 |
Token | of |
Token ID | 286 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
Worcester | +0.723 |
Dartmouth | +0.709 |
heit | +0.666 |
Lansing | +0.647 |
ocene | +0.646 |
Neg logit contributions | |
nsic | -0.431 |
smuggling | -0.429 |
Machina | -0.416 |
interrogation | -0.412 |
table | -0.412 |
Token | oil |
Token ID | 3056 |
Feature activation | +1.99e+00 |
Pos logit contributions | |
Worcester | +0.164 |
Dartmouth | +0.161 |
heit | +0.151 |
Lansing | +0.147 |
ocene | +0.147 |
Neg logit contributions | |
nsic | -0.097 |
smuggling | -0.097 |
Machina | -0.094 |
interrogation | -0.093 |
table | -0.093 |
Token | the |
Token ID | 262 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Worcester | +0.013 |
Dartmouth | +0.012 |
heit | +0.011 |
ocene | +0.011 |
hester | +0.011 |
Neg logit contributions | |
smuggling | -0.011 |
nsic | -0.011 |
Machina | -0.011 |
interrogation | -0.011 |
table | -0.011 |
Token | dungeon |
Token ID | 18974 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
Worcester | +0.213 |
Dartmouth | +0.209 |
heit | +0.195 |
ocene | +0.188 |
Lansing | +0.188 |
Neg logit contributions | |
smuggling | -0.167 |
nsic | -0.167 |
Machina | -0.163 |
interrogation | -0.161 |
table | -0.161 |
Token | ( |
Token ID | 357 |
Feature activation | +5.99e-02 |
Pos logit contributions | |
nsic | +0.071 |
smuggling | +0.071 |
Machina | +0.069 |
interrogation | +0.068 |
table | +0.068 |
Neg logit contributions | |
Worcester | -0.092 |
Dartmouth | -0.090 |
heit | -0.084 |
Lansing | -0.081 |
ocene | -0.081 |
Token | what |
Token ID | 10919 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
nsic | +0.043 |
smuggling | +0.043 |
Machina | +0.042 |
table | +0.042 |
interrogation | +0.042 |
Neg logit contributions | |
Worcester | -0.044 |
Dartmouth | -0.043 |
heit | -0.039 |
Lansing | -0.038 |
ocene | -0.038 |
Token | we |
Token ID | 356 |
Feature activation | +1.45e+00 |
Pos logit contributions | |
Worcester | +0.015 |
Dartmouth | +0.015 |
heit | +0.014 |
ocene | +0.013 |
Lansing | +0.013 |
Neg logit contributions | |
smuggling | -0.013 |
nsic | -0.013 |
Machina | -0.013 |
table | -0.013 |
interrogation | -0.013 |
Token | call |
Token ID | 869 |
Feature activation | +4.94e+00 |
Pos logit contributions | |
smuggling | +1.012 |
nsic | +1.003 |
Machina | +0.990 |
investig | +0.985 |
table | +0.983 |
Neg logit contributions | |
Worcester | -1.093 |
Dartmouth | -1.069 |
heit | -0.994 |
ocene | -0.961 |
hester | -0.960 |
Token | our |
Token ID | 674 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
smuggling | +3.255 |
Machina | +3.188 |
nsic | +3.178 |
Khe | +3.170 |
interrogation | +3.160 |
Neg logit contributions | |
Worcester | -3.834 |
Dartmouth | -3.777 |
heit | -3.541 |
hester | -3.423 |
ocene | -3.422 |
Token | tv |
Token ID | 31557 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
nsic | +0.175 |
smuggling | +0.174 |
Machina | +0.169 |
interrogation | +0.168 |
table | +0.168 |
Neg logit contributions | |
Worcester | -0.259 |
Dartmouth | -0.254 |
heit | -0.238 |
Lansing | -0.231 |
ocene | -0.230 |
Token | room |
Token ID | 2119 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
nsic | +0.805 |
smuggling | +0.805 |
Machina | +0.779 |
table | +0.776 |
interrogation | +0.776 |
Neg logit contributions | |
Worcester | -1.113 |
Dartmouth | -1.091 |
heit | -1.019 |
Lansing | -0.986 |
ocene | -0.986 |
Token | in |
Token ID | 287 |
Feature activation | +5.10e-01 |
Pos logit contributions | |
nsic | +0.314 |
smuggling | +0.313 |
Machina | +0.305 |
interrogation | +0.303 |
table | +0.303 |
Neg logit contributions | |
Worcester | -0.414 |
Dartmouth | -0.405 |
heit | -0.378 |
Lansing | -0.366 |
ocene | -0.365 |
Token | the |
Token ID | 262 |
Feature activation | -5.76e-01 |
Pos logit contributions | |
smuggling | +0.347 |
nsic | +0.346 |
Machina | +0.339 |
interrogation | +0.336 |
table | +0.336 |
Neg logit contributions | |
Worcester | -0.393 |
Dartmouth | -0.385 |
heit | -0.360 |
ocene | -0.347 |
hester | -0.346 |
Token | fork |
Token ID | 15563 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
smuggling | +0.310 |
nsic | +0.306 |
Machina | +0.300 |
interrogation | +0.297 |
table | +0.297 |
Neg logit contributions | |
Worcester | -0.390 |
Dartmouth | -0.383 |
heit | -0.356 |
ocene | -0.348 |
hester | -0.346 |
Token | - |
Token ID | 12 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
nsic | +0.756 |
smuggling | +0.755 |
Machina | +0.730 |
table | +0.725 |
interrogation | +0.721 |
Neg logit contributions | |
Worcester | -1.458 |
Dartmouth | -1.434 |
heit | -1.345 |
Lansing | -1.315 |
ocene | -1.314 |
Token | t |
Token ID | 83 |
Feature activation | -3.65e-01 |
Pos logit contributions | |
Worcester | +0.183 |
Dartmouth | +0.179 |
heit | +0.167 |
Lansing | +0.162 |
ocene | +0.162 |
Neg logit contributions | |
nsic | -0.139 |
smuggling | -0.139 |
Machina | -0.135 |
table | -0.134 |
interrogation | -0.134 |
Token | ender |
Token ID | 2194 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
Worcester | +0.342 |
Dartmouth | +0.335 |
heit | +0.315 |
Lansing | +0.306 |
ocene | +0.306 |
Neg logit contributions | |
nsic | -0.190 |
smuggling | -0.189 |
Machina | -0.183 |
interrogation | -0.181 |
table | -0.181 |
Token | . |
Token ID | 13 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
smuggling | +0.798 |
nsic | +0.795 |
table | +0.776 |
Machina | +0.774 |
interrogation | +0.767 |
Neg logit contributions | |
Worcester | -1.127 |
Dartmouth | -1.108 |
heit | -1.028 |
hester | -1.008 |
Lansing | -1.006 |
Token | Chop |
Token ID | 40159 |
Feature activation | +4.86e+00 |
Pos logit contributions | |
smuggling | +0.189 |
nsic | +0.189 |
Machina | +0.186 |
table | +0.183 |
Khe | +0.183 |
Neg logit contributions | |
Worcester | -0.224 |
Dartmouth | -0.220 |
heit | -0.205 |
ocene | -0.199 |
hester | -0.198 |
Token | fl |
Token ID | 781 |
Feature activation | +2.55e+00 |
Pos logit contributions | |
smuggling | +3.017 |
Machina | +2.918 |
table | +2.917 |
nsic | +2.903 |
procedural | +2.882 |
Neg logit contributions | |
Worcester | -3.900 |
Dartmouth | -3.863 |
heit | -3.619 |
ocene | -3.586 |
hester | -3.516 |
Token | ore |
Token ID | 382 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
smuggling | +1.491 |
nsic | +1.482 |
Machina | +1.453 |
table | +1.446 |
interrogation | +1.424 |
Neg logit contributions | |
Worcester | -2.198 |
Dartmouth | -2.156 |
heit | -2.005 |
Lansing | -1.966 |
ocene | -1.951 |
Token | ts |
Token ID | 912 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Worcester | +0.286 |
Dartmouth | +0.280 |
heit | +0.265 |
ocene | +0.258 |
Lansing | +0.258 |
Neg logit contributions | |
nsic | -0.139 |
smuggling | -0.139 |
Machina | -0.134 |
interrogation | -0.133 |
investig | -0.132 |
Token | into |
Token ID | 656 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
smuggling | +0.649 |
nsic | +0.647 |
Machina | +0.631 |
table | +0.625 |
interrogation | +0.624 |
Neg logit contributions | |
Worcester | -0.845 |
Dartmouth | -0.828 |
heit | -0.771 |
ocene | -0.751 |
Lansing | -0.748 |
Token | small |
Token ID | 1402 |
Feature activation | +7.66e-01 |
Pos logit contributions | |
smuggling | +0.921 |
nsic | +0.911 |
Machina | +0.894 |
table | +0.884 |
interrogation | +0.882 |
Neg logit contributions | |
Worcester | -1.395 |
Dartmouth | -1.366 |
heit | -1.287 |
ocene | -1.251 |
hester | -1.247 |
Token | : |
Token ID | 25 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
smuggling | +0.521 |
nsic | +0.520 |
Machina | +0.507 |
interrogation | +0.502 |
table | +0.500 |
Neg logit contributions | |
Worcester | -0.688 |
Dartmouth | -0.672 |
heit | -0.630 |
Lansing | -0.609 |
ocene | -0.607 |
Token | Delicious |
Token ID | 39528 |
Feature activation | +3.35e+00 |
Pos logit contributions | |
smuggling | +0.809 |
nsic | +0.797 |
Machina | +0.788 |
Khe | +0.782 |
table | +0.781 |
Neg logit contributions | |
Worcester | -1.443 |
Dartmouth | -1.417 |
heit | -1.354 |
hester | -1.310 |
Lansing | -1.304 |
Token |
|
Token ID | 198 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
smuggling | +2.080 |
table | +2.031 |
nsic | +2.022 |
Khe | +2.007 |
Machina | +2.003 |
Neg logit contributions | |
Worcester | -2.769 |
Dartmouth | -2.662 |
heit | -2.512 |
ocene | -2.473 |
Lansing | -2.453 |
Token |
|
Token ID | 198 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
nsic | +0.738 |
table | +0.734 |
smuggling | +0.732 |
Machina | +0.727 |
Khe | +0.714 |
Neg logit contributions | |
Worcester | -0.924 |
Dartmouth | -0.899 |
heit | -0.841 |
Lansing | -0.820 |
hester | -0.819 |
Token | D |
Token ID | 35 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
nsic | +0.524 |
smuggling | +0.523 |
Machina | +0.512 |
table | +0.510 |
interrogation | +0.509 |
Neg logit contributions | |
Worcester | -0.419 |
Dartmouth | -0.407 |
heit | -0.372 |
Lansing | -0.357 |
ocene | -0.356 |
Token | igg |
Token ID | 6950 |
Feature activation | +4.82e+00 |
Pos logit contributions | |
Worcester | +1.188 |
Dartmouth | +1.167 |
heit | +1.097 |
ocene | +1.063 |
hester | +1.063 |
Neg logit contributions | |
nsic | -0.787 |
smuggling | -0.778 |
xual | -0.759 |
Khe | -0.756 |
Machina | -0.756 |
Token |
|
Token ID | 198 |
Feature activation | +8.27e-01 |
Pos logit contributions | |
smuggling | +2.839 |
table | +2.838 |
Khe | +2.760 |
Machina | +2.745 |
interrogation | +2.741 |
Neg logit contributions | |
Worcester | -3.997 |
Dartmouth | -3.858 |
heit | -3.759 |
ocene | -3.647 |
hester | -3.604 |
Token |
|
Token ID | 198 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
nsic | +0.528 |
table | +0.527 |
smuggling | +0.526 |
Machina | +0.525 |
Khe | +0.512 |
Neg logit contributions | |
Worcester | -0.665 |
Dartmouth | -0.647 |
heit | -0.606 |
hester | -0.591 |
ocene | -0.590 |
Token | reddit |
Token ID | 10748 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
nsic | +0.351 |
smuggling | +0.351 |
Machina | +0.344 |
xual | +0.343 |
interrogation | +0.341 |
Neg logit contributions | |
Worcester | -0.213 |
Dartmouth | -0.208 |
heit | -0.187 |
ocene | -0.176 |
Lansing | -0.175 |
Token |
|
Token ID | 198 |
Feature activation | +4.84e-01 |
Pos logit contributions | |
smuggling | +2.305 |
nsic | +2.286 |
Machina | +2.269 |
table | +2.254 |
interrogation | +2.244 |
Neg logit contributions | |
Worcester | -2.868 |
Dartmouth | -2.797 |
heit | -2.655 |
ocene | -2.560 |
Lansing | -2.540 |
Token |
|
Token ID | 198 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
smuggling | +0.314 |
nsic | +0.314 |
table | +0.312 |
Machina | +0.311 |
Khe | +0.305 |
Neg logit contributions | |
Worcester | -0.385 |
Dartmouth | -0.376 |
heit | -0.352 |
ocene | -0.341 |
hester | -0.341 |
Token |
|
Token ID | 198 |
Feature activation | -7.84e-01 |
Pos logit contributions | |
Worcester | +0.044 |
Dartmouth | +0.043 |
heit | +0.040 |
ocene | +0.039 |
Lansing | +0.039 |
Neg logit contributions | |
nsic | -0.038 |
smuggling | -0.038 |
Machina | -0.037 |
table | -0.037 |
interrogation | -0.037 |
Token | At |
Token ID | 2953 |
Feature activation | -5.38e-01 |
Pos logit contributions | |
Worcester | +0.640 |
Dartmouth | +0.627 |
heit | +0.583 |
Lansing | +0.565 |
ocene | +0.564 |
Neg logit contributions | |
nsic | -0.502 |
smuggling | -0.500 |
Machina | -0.487 |
interrogation | -0.483 |
table | -0.483 |
Token | omic |
Token ID | 10179 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
Worcester | +0.457 |
Dartmouth | +0.448 |
heit | +0.418 |
Lansing | +0.405 |
ocene | +0.404 |
Neg logit contributions | |
nsic | -0.327 |
smuggling | -0.326 |
Machina | -0.317 |
interrogation | -0.314 |
table | -0.314 |
Token | < |
Token ID | 27 |
Feature activation | +3.27e+00 |
Pos logit contributions | |
smuggling | +1.244 |
nsic | +1.231 |
table | +1.222 |
Machina | +1.219 |
interrogation | +1.212 |
Neg logit contributions | |
Worcester | -0.540 |
Dartmouth | -0.524 |
heit | -0.458 |
ocene | -0.423 |
Lansing | -0.423 |
Token | T |
Token ID | 51 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
nsic | +2.351 |
table | +2.348 |
smuggling | +2.347 |
Machina | +2.294 |
interrogation | +2.264 |
Neg logit contributions | |
Worcester | -2.364 |
Dartmouth | -2.306 |
heit | -2.120 |
Lansing | -2.065 |
hester | -2.053 |
Token | > |
Token ID | 29 |
Feature activation | +4.81e+00 |
Pos logit contributions | |
smuggling | +0.840 |
nsic | +0.839 |
Machina | +0.824 |
table | +0.822 |
interrogation | +0.813 |
Neg logit contributions | |
Worcester | -0.831 |
Dartmouth | -0.805 |
heit | -0.746 |
ocene | -0.723 |
Lansing | -0.715 |
Token | , |
Token ID | 837 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
smuggling | +2.410 |
nsic | +2.376 |
Machina | +2.342 |
table | +2.319 |
interrogation | +2.281 |
Neg logit contributions | |
Worcester | -4.556 |
Dartmouth | -4.489 |
heit | -4.176 |
ocene | -4.122 |
Lansing | -4.053 |
Token | akin |
Token ID | 22107 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
smuggling | +0.332 |
nsic | +0.332 |
Machina | +0.321 |
interrogation | +0.317 |
investig | +0.316 |
Neg logit contributions | |
Worcester | -0.683 |
Dartmouth | -0.671 |
heit | -0.632 |
ocene | -0.616 |
Lansing | -0.616 |
Token | to |
Token ID | 284 |
Feature activation | -8.42e-01 |
Pos logit contributions | |
nsic | +0.301 |
smuggling | +0.300 |
Machina | +0.294 |
table | +0.293 |
interrogation | +0.290 |
Neg logit contributions | |
Worcester | -0.378 |
Dartmouth | -0.370 |
heit | -0.343 |
Lansing | -0.334 |
ocene | -0.334 |
Token | std |
Token ID | 14367 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
Worcester | +0.624 |
Dartmouth | +0.609 |
heit | +0.564 |
Lansing | +0.543 |
ocene | +0.543 |
Neg logit contributions | |
nsic | -0.602 |
smuggling | -0.602 |
Machina | -0.588 |
table | -0.583 |
interrogation | -0.582 |
Token | :: |
Token ID | 3712 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
smuggling | +0.922 |
nsic | +0.921 |
table | +0.896 |
Machina | +0.891 |
interrogation | +0.878 |
Neg logit contributions | |
Worcester | -1.719 |
Dartmouth | -1.694 |
heit | -1.596 |
hester | -1.550 |
ocene | -1.545 |
Token | easy |
Token ID | 2562 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Worcester | +0.962 |
Dartmouth | +0.946 |
heit | +0.882 |
Lansing | +0.859 |
hester | +0.841 |
Neg logit contributions | |
nsic | -0.646 |
smuggling | -0.632 |
xual | -0.620 |
Machina | -0.616 |
table | -0.607 |
Token | : |
Token ID | 25 |
Feature activation | -4.98e-01 |
Pos logit contributions | |
nsic | +0.169 |
smuggling | +0.168 |
Machina | +0.163 |
interrogation | +0.162 |
table | +0.162 |
Neg logit contributions | |
Worcester | -0.220 |
Dartmouth | -0.216 |
heit | -0.201 |
Lansing | -0.195 |
ocene | -0.194 |
Token |
|
Token ID | 198 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
Worcester | +0.379 |
Dartmouth | +0.371 |
heit | +0.343 |
Lansing | +0.332 |
ocene | +0.330 |
Neg logit contributions | |
nsic | -0.347 |
smuggling | -0.345 |
Machina | -0.337 |
table | -0.334 |
interrogation | -0.334 |
Token |
|
Token ID | 198 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
nsic | +0.134 |
smuggling | +0.134 |
Machina | +0.131 |
table | +0.131 |
interrogation | +0.130 |
Neg logit contributions | |
Worcester | -0.154 |
Dartmouth | -0.150 |
heit | -0.140 |
Lansing | -0.135 |
ocene | -0.135 |
Token | + |
Token ID | 10 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Worcester | +0.278 |
Dartmouth | +0.272 |
heit | +0.252 |
Lansing | +0.243 |
ocene | +0.243 |
Neg logit contributions | |
nsic | -0.249 |
smuggling | -0.249 |
Machina | -0.243 |
interrogation | -0.241 |
investig | -0.240 |
Token | -------------------- |
Token ID | 19351 |
Feature activation | +4.81e+00 |
Pos logit contributions | |
nsic | +1.050 |
smuggling | +1.050 |
table | +1.021 |
Machina | +1.018 |
interrogation | +1.016 |
Neg logit contributions | |
Worcester | -1.299 |
Dartmouth | -1.269 |
heit | -1.187 |
ocene | -1.145 |
hester | -1.143 |
Token | --+ |
Token ID | 44785 |
Feature activation | +2.75e+00 |
Pos logit contributions | |
nsic | +2.087 |
smuggling | +2.073 |
table | +2.050 |
Machina | +2.037 |
interrogation | +2.020 |
Neg logit contributions | |
Worcester | -4.844 |
Dartmouth | -4.728 |
heit | -4.545 |
ocene | -4.433 |
hester | -4.386 |
Token | | |
Token ID | 930 |
Feature activation | +6.79e-01 |
Pos logit contributions | |
smuggling | +1.831 |
nsic | +1.830 |
table | +1.791 |
interrogation | +1.783 |
Machina | +1.781 |
Neg logit contributions | |
Worcester | -2.164 |
Dartmouth | -2.102 |
heit | -1.982 |
ocene | -1.916 |
hester | -1.893 |
Token | ... |
Token ID | 2644 |
Feature activation | +1.92e+00 |
Pos logit contributions | |
nsic | +0.435 |
smuggling | +0.434 |
Machina | +0.422 |
table | +0.420 |
interrogation | +0.420 |
Neg logit contributions | |
Worcester | -0.554 |
Dartmouth | -0.542 |
heit | -0.505 |
Lansing | -0.489 |
ocene | -0.488 |
Token | | |
Token ID | 930 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
nsic | +1.482 |
smuggling | +1.479 |
Machina | +1.446 |
table | +1.445 |
interrogation | +1.442 |
Neg logit contributions | |
Worcester | -1.310 |
Dartmouth | -1.271 |
heit | -1.177 |
ocene | -1.123 |
Lansing | -1.121 |
Token | - |
Token ID | 532 |
Feature activation | +1.64e+00 |
Pos logit contributions | |
nsic | +0.138 |
smuggling | +0.137 |
Machina | +0.134 |
interrogation | +0.133 |
table | +0.133 |
Neg logit contributions | |
Worcester | -0.168 |
Dartmouth | -0.164 |
heit | -0.153 |
Lansing | -0.148 |
ocene | -0.147 |
Token | paste |
Token ID | 17008 |
Feature activation | +8.10e-01 |
Pos logit contributions | |
smuggling | +0.558 |
nsic | +0.551 |
Machina | +0.536 |
interrogation | +0.533 |
table | +0.532 |
Neg logit contributions | |
Worcester | -1.015 |
Dartmouth | -1.000 |
heit | -0.939 |
ocene | -0.921 |
hester | -0.916 |
Token | and |
Token ID | 290 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
smuggling | +0.509 |
nsic | +0.508 |
Machina | +0.495 |
interrogation | +0.491 |
table | +0.491 |
Neg logit contributions | |
Worcester | -0.670 |
Dartmouth | -0.657 |
heit | -0.612 |
ocene | -0.594 |
Lansing | -0.593 |
Token | mix |
Token ID | 5022 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
Worcester | +0.140 |
Dartmouth | +0.137 |
heit | +0.128 |
Lansing | +0.124 |
ocene | +0.123 |
Neg logit contributions | |
nsic | -0.104 |
smuggling | -0.103 |
Machina | -0.100 |
table | -0.099 |
interrogation | -0.099 |
Token | well |
Token ID | 880 |
Feature activation | +2.12e+00 |
Pos logit contributions | |
smuggling | +1.330 |
nsic | +1.318 |
Machina | +1.300 |
table | +1.293 |
interrogation | +1.287 |
Neg logit contributions | |
Worcester | -1.327 |
Dartmouth | -1.297 |
heit | -1.194 |
ocene | -1.165 |
Lansing | -1.155 |
Token | . |
Token ID | 13 |
Feature activation | +6.90e-02 |
Pos logit contributions | |
smuggling | +1.276 |
nsic | +1.272 |
Machina | +1.246 |
table | +1.236 |
interrogation | +1.227 |
Neg logit contributions | |
Worcester | -1.801 |
Dartmouth | -1.768 |
heit | -1.647 |
ocene | -1.610 |
hester | -1.602 |
Token | Season |
Token ID | 7369 |
Feature activation | +4.73e+00 |
Pos logit contributions | |
nsic | +0.046 |
smuggling | +0.046 |
Machina | +0.045 |
table | +0.044 |
interrogation | +0.044 |
Neg logit contributions | |
Worcester | -0.054 |
Dartmouth | -0.053 |
heit | -0.049 |
Lansing | -0.048 |
ocene | -0.048 |
Token | with |
Token ID | 351 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
smuggling | +2.952 |
nsic | +2.850 |
Machina | +2.846 |
table | +2.829 |
interrogation | +2.823 |
Neg logit contributions | |
Worcester | -3.874 |
Dartmouth | -3.829 |
heit | -3.510 |
ocene | -3.495 |
hester | -3.493 |
Token | salt |
Token ID | 8268 |
Feature activation | +2.05e+00 |
Pos logit contributions | |
smuggling | +1.472 |
nsic | +1.468 |
Machina | +1.439 |
interrogation | +1.429 |
table | +1.428 |
Neg logit contributions | |
Worcester | -1.304 |
Dartmouth | -1.273 |
heit | -1.173 |
ocene | -1.126 |
hester | -1.125 |
Token | , |
Token ID | 11 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
smuggling | +1.269 |
nsic | +1.269 |
Machina | +1.235 |
table | +1.228 |
interrogation | +1.225 |
Neg logit contributions | |
Worcester | -1.703 |
Dartmouth | -1.670 |
heit | -1.560 |
ocene | -1.515 |
Lansing | -1.509 |
Token | pepper |
Token ID | 13385 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
nsic | +0.537 |
smuggling | +0.531 |
Machina | +0.512 |
interrogation | +0.505 |
table | +0.504 |
Neg logit contributions | |
Worcester | -1.139 |
Dartmouth | -1.117 |
heit | -1.053 |
Lansing | -1.027 |
ocene | -1.023 |
Token | and |
Token ID | 290 |
Feature activation | +6.15e-01 |
Pos logit contributions | |
smuggling | +1.111 |
nsic | +1.109 |
Machina | +1.079 |
table | +1.070 |
interrogation | +1.069 |
Neg logit contributions | |
Worcester | -1.509 |
Dartmouth | -1.482 |
heit | -1.380 |
Lansing | -1.338 |
ocene | -1.338 |
Token | : |
Token ID | 25 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
smuggling | +0.480 |
nsic | +0.480 |
Machina | +0.467 |
interrogation | +0.462 |
Khe | +0.461 |
Neg logit contributions | |
Worcester | -0.640 |
Dartmouth | -0.625 |
heit | -0.587 |
Lansing | -0.568 |
ocene | -0.565 |
Token | Delicious |
Token ID | 39528 |
Feature activation | +3.43e+00 |
Pos logit contributions | |
smuggling | +0.802 |
nsic | +0.788 |
Machina | +0.781 |
Khe | +0.778 |
table | +0.777 |
Neg logit contributions | |
Worcester | -1.470 |
Dartmouth | -1.446 |
heit | -1.385 |
hester | -1.333 |
Lansing | -1.327 |
Token |
|
Token ID | 198 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
smuggling | +2.161 |
nsic | +2.110 |
table | +2.108 |
Khe | +2.083 |
investig | +2.081 |
Neg logit contributions | |
Worcester | -2.821 |
Dartmouth | -2.719 |
heit | -2.559 |
ocene | -2.510 |
Lansing | -2.490 |
Token |
|
Token ID | 198 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
nsic | +0.712 |
table | +0.708 |
smuggling | +0.707 |
Machina | +0.702 |
Khe | +0.689 |
Neg logit contributions | |
Worcester | -0.888 |
Dartmouth | -0.865 |
heit | -0.809 |
Lansing | -0.788 |
hester | -0.787 |
Token | D |
Token ID | 35 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
nsic | +0.480 |
smuggling | +0.479 |
Machina | +0.470 |
interrogation | +0.466 |
table | +0.466 |
Neg logit contributions | |
Worcester | -0.372 |
Dartmouth | -0.362 |
heit | -0.329 |
Lansing | -0.316 |
ocene | -0.314 |
Token | igg |
Token ID | 6950 |
Feature activation | +4.72e+00 |
Pos logit contributions | |
Worcester | +1.444 |
Dartmouth | +1.418 |
heit | +1.338 |
hester | +1.299 |
ocene | +1.295 |
Neg logit contributions | |
nsic | -1.030 |
smuggling | -1.014 |
xual | -1.012 |
Khe | -0.999 |
Machina | -0.993 |
Token |
|
Token ID | 198 |
Feature activation | +6.63e-01 |
Pos logit contributions | |
smuggling | +2.805 |
table | +2.800 |
Khe | +2.717 |
nsic | +2.709 |
interrogation | +2.704 |
Neg logit contributions | |
Worcester | -3.905 |
Dartmouth | -3.773 |
heit | -3.654 |
ocene | -3.550 |
Lansing | -3.526 |
Token |
|
Token ID | 198 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
nsic | +0.425 |
table | +0.424 |
smuggling | +0.423 |
Machina | +0.421 |
Khe | +0.411 |
Neg logit contributions | |
Worcester | -0.533 |
Dartmouth | -0.519 |
heit | -0.485 |
Lansing | -0.473 |
hester | -0.473 |
Token | reddit |
Token ID | 10748 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
nsic | +0.186 |
smuggling | +0.186 |
Machina | +0.183 |
xual | +0.181 |
interrogation | +0.181 |
Neg logit contributions | |
Worcester | -0.115 |
Dartmouth | -0.112 |
heit | -0.101 |
ocene | -0.095 |
Lansing | -0.095 |
Token |
|
Token ID | 198 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
smuggling | +2.328 |
nsic | +2.311 |
Machina | +2.288 |
table | +2.277 |
interrogation | +2.265 |
Neg logit contributions | |
Worcester | -2.853 |
Dartmouth | -2.782 |
heit | -2.635 |
ocene | -2.543 |
Lansing | -2.524 |
Token |
|
Token ID | 198 |
Feature activation | +6.94e-02 |
Pos logit contributions | |
smuggling | +0.242 |
nsic | +0.242 |
table | +0.240 |
Machina | +0.240 |
Khe | +0.235 |
Neg logit contributions | |
Worcester | -0.296 |
Dartmouth | -0.289 |
heit | -0.270 |
ocene | -0.262 |
hester | -0.262 |
Token | follows |
Token ID | 5679 |
Feature activation | +5.92e-01 |
Pos logit contributions | |
Worcester | +0.723 |
Dartmouth | +0.707 |
heit | +0.655 |
Lansing | +0.634 |
ocene | +0.632 |
Neg logit contributions | |
nsic | -0.634 |
smuggling | -0.632 |
Machina | -0.617 |
interrogation | -0.612 |
table | -0.611 |
Token | . |
Token ID | 13 |
Feature activation | -5.62e-01 |
Pos logit contributions | |
nsic | +0.366 |
smuggling | +0.365 |
Machina | +0.356 |
interrogation | +0.354 |
table | +0.353 |
Neg logit contributions | |
Worcester | -0.497 |
Dartmouth | -0.487 |
heit | -0.453 |
Lansing | -0.442 |
hester | -0.440 |
Token |
|
Token ID | 198 |
Feature activation | +2.36e-02 |
Pos logit contributions | |
Worcester | +0.429 |
Dartmouth | +0.419 |
heit | +0.388 |
Lansing | +0.375 |
ocene | +0.374 |
Neg logit contributions | |
nsic | -0.390 |
smuggling | -0.389 |
Machina | -0.380 |
interrogation | -0.376 |
table | -0.376 |
Token |
|
Token ID | 198 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
nsic | +0.016 |
smuggling | +0.016 |
Machina | +0.016 |
table | +0.016 |
interrogation | +0.015 |
Neg logit contributions | |
Worcester | -0.018 |
Dartmouth | -0.018 |
heit | -0.017 |
Lansing | -0.016 |
ocene | -0.016 |
Token | # |
Token ID | 2 |
Feature activation | +2.67e+00 |
Pos logit contributions | |
Worcester | +0.268 |
Dartmouth | +0.262 |
heit | +0.244 |
Lansing | +0.237 |
ocene | +0.236 |
Neg logit contributions | |
nsic | -0.208 |
smuggling | -0.207 |
Machina | -0.202 |
interrogation | -0.200 |
table | -0.199 |
Token | !/ |
Token ID | 48443 |
Feature activation | +4.71e+00 |
Pos logit contributions | |
smuggling | +1.738 |
nsic | +1.731 |
table | +1.702 |
interrogation | +1.683 |
Machina | +1.682 |
Neg logit contributions | |
Worcester | -2.127 |
Dartmouth | -2.090 |
heit | -1.948 |
Lansing | -1.885 |
ocene | -1.883 |
Token | bin |
Token ID | 8800 |
Feature activation | +4.11e+00 |
Pos logit contributions | |
nsic | +0.963 |
smuggling | +0.938 |
table | +0.857 |
interrogation | +0.816 |
Khe | +0.808 |
Neg logit contributions | |
Worcester | -5.866 |
Dartmouth | -5.787 |
heit | -5.558 |
Lansing | -5.482 |
ocene | -5.465 |
Token | / |
Token ID | 14 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
nsic | +1.745 |
table | +1.729 |
smuggling | +1.729 |
Machina | +1.658 |
procedural | +1.636 |
Neg logit contributions | |
Worcester | -4.173 |
Dartmouth | -4.075 |
heit | -3.862 |
ocene | -3.838 |
hester | -3.836 |
Token | sh |
Token ID | 1477 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
nsic | +1.167 |
smuggling | +1.163 |
table | +1.135 |
interrogation | +1.121 |
Machina | +1.121 |
Neg logit contributions | |
Worcester | -1.694 |
Dartmouth | -1.666 |
heit | -1.552 |
Lansing | -1.511 |
ocene | -1.507 |
Token | / |
Token ID | 1220 |
Feature activation | +2.81e+00 |
Pos logit contributions | |
smuggling | +1.323 |
nsic | +1.314 |
table | +1.280 |
interrogation | +1.276 |
Machina | +1.276 |
Neg logit contributions | |
Worcester | -1.530 |
Dartmouth | -1.505 |
heit | -1.406 |
ocene | -1.358 |
hester | -1.354 |
Token | s |
Token ID | 82 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
nsic | +1.947 |
smuggling | +1.946 |
table | +1.895 |
Machina | +1.878 |
interrogation | +1.876 |
Neg logit contributions | |
Worcester | -2.133 |
Dartmouth | -2.091 |
heit | -1.953 |
Lansing | -1.881 |
ocene | -1.873 |
Token | off |
Token ID | 572 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
smuggling | +1.015 |
nsic | +1.014 |
table | +0.994 |
Machina | +0.983 |
interrogation | +0.980 |
Neg logit contributions | |
Worcester | -1.217 |
Dartmouth | -1.194 |
heit | -1.109 |
ocene | -1.077 |
hester | -1.071 |
Token |
|
Token ID | 198 |
Feature activation | +8.30e-01 |
Pos logit contributions | |
smuggling | +1.133 |
nsic | +1.129 |
Machina | +1.105 |
table | +1.100 |
investig | +1.096 |
Neg logit contributions | |
Worcester | -1.317 |
Dartmouth | -1.289 |
heit | -1.201 |
ocene | -1.165 |
hester | -1.157 |
Token |
|
Token ID | 198 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
nsic | +0.546 |
smuggling | +0.545 |
table | +0.539 |
Machina | +0.538 |
Khe | +0.527 |
Neg logit contributions | |
Worcester | -0.658 |
Dartmouth | -0.641 |
heit | -0.599 |
ocene | -0.581 |
Lansing | -0.580 |
Token | Then |
Token ID | 6423 |
Feature activation | +5.48e-01 |
Pos logit contributions | |
nsic | +0.234 |
smuggling | +0.234 |
Machina | +0.229 |
table | +0.228 |
interrogation | +0.227 |
Neg logit contributions | |
Worcester | -0.211 |
Dartmouth | -0.206 |
heit | -0.189 |
Lansing | -0.182 |
ocene | -0.181 |
Token | we |
Token ID | 356 |
Feature activation | +8.07e-01 |
Pos logit contributions | |
smuggling | +0.366 |
nsic | +0.365 |
Machina | +0.357 |
interrogation | +0.354 |
table | +0.353 |
Neg logit contributions | |
Worcester | -0.431 |
Dartmouth | -0.422 |
heit | -0.392 |
ocene | -0.380 |
Lansing | -0.379 |
Token | run |
Token ID | 1057 |
Feature activation | +4.65e+00 |
Pos logit contributions | |
smuggling | +0.533 |
nsic | +0.532 |
Machina | +0.522 |
investig | +0.517 |
table | +0.516 |
Neg logit contributions | |
Worcester | -0.642 |
Dartmouth | -0.629 |
heit | -0.582 |
Lansing | -0.566 |
ocene | -0.565 |
Token | i |
Token ID | 1312 |
Feature activation | +6.54e-01 |
Pos logit contributions | |
smuggling | +2.966 |
Machina | +2.922 |
nsic | +2.898 |
investig | +2.898 |
interrogation | +2.873 |
Neg logit contributions | |
Worcester | -3.728 |
Dartmouth | -3.670 |
heit | -3.435 |
hester | -3.353 |
ocene | -3.348 |
Token | w |
Token ID | 86 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
nsic | +0.506 |
smuggling | +0.504 |
Machina | +0.493 |
table | +0.491 |
interrogation | +0.489 |
Neg logit contributions | |
Worcester | -0.447 |
Dartmouth | -0.437 |
heit | -0.399 |
Lansing | -0.385 |
ocene | -0.383 |
Token | config |
Token ID | 11250 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Worcester | +0.168 |
Dartmouth | +0.165 |
heit | +0.153 |
Lansing | +0.148 |
ocene | +0.148 |
Neg logit contributions | |
nsic | -0.139 |
smuggling | -0.139 |
Machina | -0.136 |
interrogation | -0.134 |
table | -0.134 |
Token | again |
Token ID | 757 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
nsic | +0.080 |
smuggling | +0.080 |
Machina | +0.078 |
interrogation | +0.077 |
table | +0.077 |
Neg logit contributions | |
Worcester | -0.101 |
Dartmouth | -0.099 |
heit | -0.092 |
Lansing | -0.089 |
ocene | -0.089 |
Token | . |
Token ID | 13 |
Feature activation | -3.45e-01 |
Pos logit contributions | |
smuggling | +0.168 |
nsic | +0.168 |
Machina | +0.163 |
table | +0.162 |
interrogation | +0.162 |
Neg logit contributions | |
Worcester | -0.219 |
Dartmouth | -0.215 |
heit | -0.200 |
ocene | -0.194 |
Lansing | -0.194 |
Token | iger |
Token ID | 8254 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Worcester | +0.928 |
Dartmouth | +0.910 |
heit | +0.859 |
Lansing | +0.843 |
ocene | +0.840 |
Neg logit contributions | |
smuggling | -0.390 |
nsic | -0.390 |
Machina | -0.377 |
interrogation | -0.371 |
table | -0.368 |
Token | goal |
Token ID | 3061 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
Worcester | +2.011 |
Dartmouth | +1.970 |
heit | +1.839 |
Lansing | +1.774 |
ocene | +1.771 |
Neg logit contributions | |
nsic | -1.637 |
smuggling | -1.618 |
Machina | -1.575 |
xual | -1.564 |
table | -1.556 |
Token |
|
Token ID | 198 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
Worcester | +1.798 |
Dartmouth | +1.758 |
heit | +1.633 |
Lansing | +1.578 |
ocene | +1.575 |
Neg logit contributions | |
nsic | -1.476 |
smuggling | -1.465 |
Machina | -1.423 |
interrogation | -1.416 |
xual | -1.413 |
Token |
|
Token ID | 198 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
nsic | +0.292 |
smuggling | +0.292 |
table | +0.288 |
Machina | +0.288 |
Khe | +0.283 |
Neg logit contributions | |
Worcester | -0.350 |
Dartmouth | -0.342 |
heit | -0.319 |
ocene | -0.310 |
Lansing | -0.309 |
Token | Hon |
Token ID | 29478 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Worcester | +0.189 |
Dartmouth | +0.184 |
heit | +0.169 |
Lansing | +0.163 |
ocene | +0.162 |
Neg logit contributions | |
nsic | -0.205 |
smuggling | -0.204 |
Machina | -0.200 |
table | -0.200 |
interrogation | -0.198 |
Token | ours |
Token ID | 4662 |
Feature activation | +4.59e+00 |
Pos logit contributions | |
nsic | +0.450 |
smuggling | +0.447 |
Machina | +0.440 |
table | +0.437 |
interrogation | +0.434 |
Neg logit contributions | |
Worcester | -0.410 |
Dartmouth | -0.400 |
heit | -0.367 |
ocene | -0.355 |
Lansing | -0.354 |
Token |
|
Token ID | 198 |
Feature activation | +7.15e-01 |
Pos logit contributions | |
smuggling | +2.948 |
table | +2.941 |
Machina | +2.924 |
nsic | +2.902 |
Khe | +2.838 |
Neg logit contributions | |
Worcester | -3.620 |
Dartmouth | -3.534 |
heit | -3.305 |
hester | -3.256 |
ocene | -3.244 |
Token |
|
Token ID | 198 |
Feature activation | +3.36e-01 |
Pos logit contributions | |
nsic | +0.466 |
smuggling | +0.465 |
table | +0.462 |
Machina | +0.462 |
Khe | +0.452 |
Neg logit contributions | |
Worcester | -0.568 |
Dartmouth | -0.553 |
heit | -0.519 |
ocene | -0.504 |
hester | -0.502 |
Token | Club |
Token ID | 42350 |
Feature activation | +9.62e-02 |
Pos logit contributions | |
nsic | +0.258 |
smuggling | +0.257 |
Machina | +0.253 |
table | +0.252 |
interrogation | +0.249 |
Neg logit contributions | |
Worcester | -0.231 |
Dartmouth | -0.225 |
heit | -0.206 |
Lansing | -0.199 |
ocene | -0.198 |
Token |
|
Token ID | 198 |
Feature activation | +7.86e-01 |
Pos logit contributions | |
nsic | +0.066 |
smuggling | +0.066 |
Machina | +0.065 |
table | +0.065 |
interrogation | +0.064 |
Neg logit contributions | |
Worcester | -0.073 |
Dartmouth | -0.072 |
heit | -0.067 |
ocene | -0.064 |
Lansing | -0.064 |
Token |
|
Token ID | 198 |
Feature activation | +4.69e-01 |
Pos logit contributions | |
nsic | +0.512 |
smuggling | +0.511 |
table | +0.508 |
Machina | +0.507 |
Khe | +0.497 |
Neg logit contributions | |
Worcester | -0.624 |
Dartmouth | -0.608 |
heit | -0.571 |
ocene | -0.554 |
hester | -0.552 |
Token | s |
Token ID | 82 |
Feature activation | +2.99e-02 |
Pos logit contributions | |
Worcester | +0.247 |
Dartmouth | +0.243 |
heit | +0.229 |
Lansing | +0.224 |
ocene | +0.223 |
Neg logit contributions | |
nsic | -0.110 |
smuggling | -0.109 |
Machina | -0.105 |
table | -0.104 |
interrogation | -0.104 |
Token | O |
Token ID | 440 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
smuggling | +0.019 |
nsic | +0.019 |
Machina | +0.019 |
interrogation | +0.018 |
table | +0.018 |
Neg logit contributions | |
Worcester | -0.024 |
Dartmouth | -0.024 |
heit | -0.022 |
Lansing | -0.022 |
ocene | -0.022 |
Token | lic |
Token ID | 677 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
Worcester | +0.323 |
Dartmouth | +0.316 |
heit | +0.295 |
Lansing | +0.286 |
ocene | +0.286 |
Neg logit contributions | |
nsic | -0.229 |
smuggling | -0.229 |
Machina | -0.222 |
table | -0.220 |
interrogation | -0.220 |
Token | ity |
Token ID | 414 |
Feature activation | -9.15e-01 |
Pos logit contributions | |
smuggling | +0.173 |
nsic | +0.171 |
Machina | +0.169 |
interrogation | +0.168 |
table | +0.168 |
Neg logit contributions | |
Worcester | -0.170 |
Dartmouth | -0.167 |
heit | -0.154 |
Lansing | -0.148 |
ocene | -0.148 |
Token | . |
Token ID | 13 |
Feature activation | -4.81e-03 |
Pos logit contributions | |
Worcester | +0.733 |
Dartmouth | +0.717 |
heit | +0.666 |
Lansing | +0.645 |
ocene | +0.643 |
Neg logit contributions | |
nsic | -0.600 |
smuggling | -0.600 |
Machina | -0.584 |
interrogation | -0.579 |
table | -0.579 |
Token | Oliver |
Token ID | 15416 |
Feature activation | +4.54e+00 |
Pos logit contributions | |
Worcester | +0.004 |
Dartmouth | +0.004 |
heit | +0.003 |
ocene | +0.003 |
hester | +0.003 |
Neg logit contributions | |
nsic | -0.003 |
smuggling | -0.003 |
Machina | -0.003 |
table | -0.003 |
Khe | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +3.49e-01 |
Pos logit contributions | |
smuggling | +2.914 |
nsic | +2.808 |
interrogation | +2.780 |
Machina | +2.776 |
investig | +2.760 |
Neg logit contributions | |
Worcester | -3.660 |
Dartmouth | -3.592 |
heit | -3.423 |
ocene | -3.287 |
hester | -3.242 |
Token | Fel |
Token ID | 13937 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
nsic | +0.221 |
smuggling | +0.220 |
Machina | +0.215 |
interrogation | +0.213 |
table | +0.212 |
Neg logit contributions | |
Worcester | -0.288 |
Dartmouth | -0.282 |
heit | -0.262 |
Lansing | -0.254 |
ocene | -0.254 |
Token | icity |
Token ID | 8467 |
Feature activation | +9.85e-01 |
Pos logit contributions | |
nsic | +1.039 |
smuggling | +1.036 |
Machina | +1.010 |
interrogation | +1.001 |
table | +1.000 |
Neg logit contributions | |
Worcester | -1.258 |
Dartmouth | -1.231 |
heit | -1.143 |
Lansing | -1.108 |
ocene | -1.105 |
Token | may |
Token ID | 743 |
Feature activation | +4.28e-01 |
Pos logit contributions | |
smuggling | +0.625 |
nsic | +0.617 |
Machina | +0.607 |
interrogation | +0.602 |
table | +0.599 |
Neg logit contributions | |
Worcester | -0.811 |
Dartmouth | -0.797 |
heit | -0.744 |
hester | -0.722 |
ocene | -0.720 |
Token | have |
Token ID | 423 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
nsic | +0.255 |
smuggling | +0.255 |
Machina | +0.247 |
interrogation | +0.245 |
table | +0.245 |
Neg logit contributions | |
Worcester | -0.368 |
Dartmouth | -0.361 |
heit | -0.337 |
Lansing | -0.327 |
ocene | -0.327 |
Token | search |
Token ID | 2989 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
nsic | +0.203 |
smuggling | +0.202 |
Machina | +0.196 |
table | +0.194 |
interrogation | +0.194 |
Neg logit contributions | |
Worcester | -0.338 |
Dartmouth | -0.332 |
heit | -0.311 |
Lansing | -0.303 |
ocene | -0.302 |
Token | Space |
Token ID | 14106 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
Worcester | +0.123 |
Dartmouth | +0.120 |
heit | +0.112 |
Lansing | +0.109 |
ocene | +0.109 |
Neg logit contributions | |
nsic | -0.089 |
smuggling | -0.089 |
Machina | -0.087 |
table | -0.086 |
interrogation | -0.086 |
Token | ; |
Token ID | 2162 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
Worcester | +1.675 |
Dartmouth | +1.641 |
heit | +1.523 |
Lansing | +1.478 |
ocene | +1.474 |
Neg logit contributions | |
nsic | -1.362 |
smuggling | -1.355 |
Machina | -1.316 |
xual | -1.304 |
interrogation | -1.303 |
Token | an |
Token ID | 281 |
Feature activation | +1.86e-01 |
Pos logit contributions | |
smuggling | +0.282 |
nsic | +0.280 |
Machina | +0.274 |
table | +0.273 |
interrogation | +0.272 |
Neg logit contributions | |
Worcester | -0.332 |
Dartmouth | -0.325 |
heit | -0.303 |
ocene | -0.294 |
Lansing | -0.293 |
Token | association |
Token ID | 8112 |
Feature activation | -2.45e+00 |
Pos logit contributions | |
nsic | +0.114 |
smuggling | +0.114 |
Machina | +0.111 |
interrogation | +0.111 |
table | +0.111 |
Neg logit contributions | |
Worcester | -0.157 |
Dartmouth | -0.154 |
heit | -0.143 |
ocene | -0.139 |
Lansing | -0.139 |
Token | between |
Token ID | 1022 |
Feature activation | -5.59e+00 |
Pos logit contributions | |
Worcester | +2.084 |
Dartmouth | +2.036 |
heit | +1.910 |
Lansing | +1.850 |
ocene | +1.842 |
Neg logit contributions | |
nsic | -1.483 |
smuggling | -1.468 |
Machina | -1.426 |
Khe | -1.414 |
xual | -1.409 |
Token | the |
Token ID | 262 |
Feature activation | -8.78e-01 |
Pos logit contributions | |
Worcester | +4.198 |
Dartmouth | +4.090 |
heit | +3.757 |
Lansing | +3.667 |
ocene | +3.567 |
Neg logit contributions | |
nsic | -3.940 |
smuggling | -3.838 |
xual | -3.778 |
Machina | -3.738 |
table | -3.719 |
Token | tiles |
Token ID | 19867 |
Feature activation | -8.73e-01 |
Pos logit contributions | |
Worcester | +0.726 |
Dartmouth | +0.711 |
heit | +0.663 |
ocene | +0.642 |
Lansing | +0.641 |
Neg logit contributions | |
smuggling | -0.553 |
nsic | -0.552 |
Machina | -0.538 |
interrogation | -0.534 |
table | -0.533 |
Token | location |
Token ID | 4067 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Worcester | +0.716 |
Dartmouth | +0.700 |
heit | +0.652 |
Lansing | +0.632 |
ocene | +0.630 |
Neg logit contributions | |
nsic | -0.557 |
smuggling | -0.555 |
Machina | -0.541 |
interrogation | -0.536 |
table | -0.536 |
Token | and |
Token ID | 290 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
Worcester | +1.723 |
Dartmouth | +1.685 |
heit | +1.565 |
Lansing | +1.515 |
ocene | +1.512 |
Neg logit contributions | |
nsic | -1.406 |
smuggling | -1.399 |
Machina | -1.362 |
interrogation | -1.347 |
table | -1.345 |
Token | its |
Token ID | 663 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
smuggling | +0.216 |
nsic | +0.214 |
Machina | +0.210 |
interrogation | +0.210 |
table | +0.209 |
Neg logit contributions | |
Worcester | -0.249 |
Dartmouth | -0.243 |
heit | -0.227 |
ocene | -0.220 |
hester | -0.219 |
Token | provide |
Token ID | 2148 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
Worcester | +0.735 |
Dartmouth | +0.722 |
heit | +0.672 |
Lansing | +0.656 |
ocene | +0.649 |
Neg logit contributions | |
nsic | -0.464 |
smuggling | -0.460 |
Machina | -0.449 |
table | -0.442 |
Khe | -0.442 |
Token | evidence |
Token ID | 2370 |
Feature activation | -8.08e-01 |
Pos logit contributions | |
nsic | +0.134 |
smuggling | +0.134 |
Machina | +0.130 |
interrogation | +0.129 |
table | +0.129 |
Neg logit contributions | |
Worcester | -0.180 |
Dartmouth | -0.177 |
heit | -0.165 |
ocene | -0.160 |
Lansing | -0.160 |
Token | that |
Token ID | 326 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
Worcester | +0.611 |
Dartmouth | +0.597 |
heit | +0.550 |
Lansing | +0.533 |
ocene | +0.530 |
Neg logit contributions | |
nsic | -0.567 |
smuggling | -0.564 |
Machina | -0.552 |
table | -0.547 |
interrogation | -0.547 |
Token | the |
Token ID | 262 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
Worcester | +0.043 |
Dartmouth | +0.042 |
heit | +0.039 |
ocene | +0.038 |
hester | +0.038 |
Neg logit contributions | |
smuggling | -0.042 |
nsic | -0.042 |
Machina | -0.041 |
interrogation | -0.041 |
investig | -0.041 |
Token | connection |
Token ID | 4637 |
Feature activation | -2.22e+00 |
Pos logit contributions | |
Worcester | +0.323 |
Dartmouth | +0.316 |
heit | +0.296 |
ocene | +0.285 |
hester | +0.284 |
Neg logit contributions | |
smuggling | -0.263 |
nsic | -0.262 |
Machina | -0.254 |
interrogation | -0.254 |
investig | -0.253 |
Token | between |
Token ID | 1022 |
Feature activation | -5.07e+00 |
Pos logit contributions | |
Worcester | +1.731 |
Dartmouth | +1.694 |
heit | +1.560 |
Lansing | +1.518 |
ocene | +1.506 |
Neg logit contributions | |
nsic | -1.505 |
smuggling | -1.491 |
Machina | -1.462 |
interrogation | -1.446 |
table | -1.445 |
Token | Russian |
Token ID | 3394 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
Worcester | +3.507 |
Dartmouth | +3.440 |
heit | +3.075 |
Lansing | +3.053 |
hester | +2.983 |
Neg logit contributions | |
nsic | -3.825 |
smuggling | -3.769 |
xual | -3.727 |
Machina | -3.712 |
table | -3.696 |
Token | hackers |
Token ID | 17110 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
Worcester | +0.796 |
Dartmouth | +0.772 |
heit | +0.705 |
ocene | +0.674 |
Lansing | +0.672 |
Neg logit contributions | |
smuggling | -1.043 |
nsic | -1.041 |
Machina | -1.016 |
interrogation | -1.015 |
investig | -1.011 |
Token | and |
Token ID | 290 |
Feature activation | +2.36e-01 |
Pos logit contributions | |
Worcester | +1.274 |
Dartmouth | +1.246 |
heit | +1.160 |
Lansing | +1.123 |
ocene | +1.121 |
Neg logit contributions | |
nsic | -1.013 |
smuggling | -1.011 |
Machina | -0.984 |
interrogation | -0.975 |
table | -0.975 |
Token | the |
Token ID | 262 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
smuggling | +0.166 |
nsic | +0.165 |
Machina | +0.161 |
interrogation | +0.160 |
table | +0.160 |
Neg logit contributions | |
Worcester | -0.179 |
Dartmouth | -0.174 |
heit | -0.162 |
ocene | -0.156 |
hester | -0.155 |
Token | DNC |
Token ID | 17824 |
Feature activation | +6.03e-03 |
Pos logit contributions | |
Worcester | +0.213 |
Dartmouth | +0.208 |
heit | +0.195 |
ocene | +0.187 |
Lansing | +0.187 |
Neg logit contributions | |
smuggling | -0.174 |
nsic | -0.174 |
Machina | -0.169 |
interrogation | -0.168 |
table | -0.168 |
Token | reports |
Token ID | 3136 |
Feature activation | -8.77e-01 |
Pos logit contributions | |
Worcester | +0.327 |
Dartmouth | +0.321 |
heit | +0.299 |
Lansing | +0.290 |
ocene | +0.289 |
Neg logit contributions | |
nsic | -0.236 |
smuggling | -0.235 |
Machina | -0.229 |
table | -0.227 |
interrogation | -0.227 |
Token | to |
Token ID | 284 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
Worcester | +0.696 |
Dartmouth | +0.681 |
heit | +0.631 |
Lansing | +0.612 |
ocene | +0.608 |
Neg logit contributions | |
nsic | -0.582 |
smuggling | -0.579 |
Machina | -0.566 |
interrogation | -0.560 |
table | -0.560 |
Token | make |
Token ID | 787 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Worcester | +1.181 |
Dartmouth | +1.160 |
heit | +1.078 |
Lansing | +1.060 |
hester | +1.040 |
Neg logit contributions | |
nsic | -0.728 |
smuggling | -0.715 |
Machina | -0.703 |
xual | -0.693 |
table | -0.691 |
Token | the |
Token ID | 262 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
Worcester | +1.089 |
Dartmouth | +1.065 |
heit | +0.983 |
Lansing | +0.955 |
hester | +0.946 |
Neg logit contributions | |
nsic | -0.963 |
smuggling | -0.956 |
Machina | -0.938 |
table | -0.929 |
interrogation | -0.924 |
Token | connection |
Token ID | 4637 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
smuggling | +0.103 |
nsic | +0.102 |
interrogation | +0.099 |
Machina | +0.099 |
investig | +0.098 |
Neg logit contributions | |
Worcester | -0.194 |
Dartmouth | -0.190 |
heit | -0.180 |
ocene | -0.175 |
hester | -0.174 |
Token | between |
Token ID | 1022 |
Feature activation | -4.96e+00 |
Pos logit contributions | |
Worcester | +1.533 |
Dartmouth | +1.501 |
heit | +1.382 |
Lansing | +1.346 |
ocene | +1.336 |
Neg logit contributions | |
nsic | -1.303 |
smuggling | -1.292 |
Machina | -1.268 |
table | -1.251 |
interrogation | -1.251 |
Token | Russian |
Token ID | 3394 |
Feature activation | -1.18e+00 |
Pos logit contributions | |
Worcester | +3.482 |
Dartmouth | +3.417 |
heit | +3.080 |
Lansing | +3.027 |
hester | +2.988 |
Neg logit contributions | |
nsic | -3.717 |
smuggling | -3.654 |
xual | -3.623 |
Machina | -3.602 |
table | -3.578 |
Token | hackers |
Token ID | 17110 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Worcester | +0.999 |
Dartmouth | +0.978 |
heit | +0.915 |
Lansing | +0.884 |
ocene | +0.884 |
Neg logit contributions | |
smuggling | -0.727 |
nsic | -0.726 |
Machina | -0.704 |
interrogation | -0.700 |
table | -0.698 |
Token | and |
Token ID | 290 |
Feature activation | +5.19e-01 |
Pos logit contributions | |
Worcester | +1.228 |
Dartmouth | +1.199 |
heit | +1.125 |
ocene | +1.088 |
Lansing | +1.085 |
Neg logit contributions | |
smuggling | -0.934 |
nsic | -0.930 |
Machina | -0.899 |
interrogation | -0.895 |
table | -0.895 |
Token | the |
Token ID | 262 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
smuggling | +0.358 |
nsic | +0.354 |
Machina | +0.347 |
table | +0.345 |
interrogation | +0.345 |
Neg logit contributions | |
Worcester | -0.397 |
Dartmouth | -0.388 |
heit | -0.363 |
ocene | -0.350 |
hester | -0.347 |
Token | Democratic |
Token ID | 4390 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
Worcester | +0.152 |
Dartmouth | +0.149 |
heit | +0.140 |
ocene | +0.135 |
hester | +0.135 |
Neg logit contributions | |
smuggling | -0.120 |
nsic | -0.119 |
Machina | -0.116 |
interrogation | -0.115 |
investig | -0.115 |
Token | provide |
Token ID | 2148 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
nsic | +0.296 |
smuggling | +0.295 |
Machina | +0.286 |
interrogation | +0.283 |
table | +0.283 |
Neg logit contributions | |
Worcester | -0.505 |
Dartmouth | -0.495 |
heit | -0.465 |
Lansing | -0.452 |
ocene | -0.451 |
Token | data |
Token ID | 1366 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
nsic | +0.624 |
smuggling | +0.622 |
Machina | +0.605 |
interrogation | +0.600 |
table | +0.600 |
Neg logit contributions | |
Worcester | -0.851 |
Dartmouth | -0.834 |
heit | -0.778 |
Lansing | -0.754 |
ocene | -0.753 |
Token | on |
Token ID | 319 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
nsic | +0.187 |
smuggling | +0.186 |
Machina | +0.182 |
interrogation | +0.180 |
table | +0.179 |
Neg logit contributions | |
Worcester | -0.249 |
Dartmouth | -0.244 |
heit | -0.227 |
Lansing | -0.220 |
ocene | -0.219 |
Token | the |
Token ID | 262 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
smuggling | +0.239 |
nsic | +0.238 |
Machina | +0.232 |
interrogation | +0.231 |
investig | +0.230 |
Neg logit contributions | |
Worcester | -0.303 |
Dartmouth | -0.296 |
heit | -0.277 |
ocene | -0.269 |
Lansing | -0.267 |
Token | relationship |
Token ID | 2776 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
smuggling | +0.088 |
nsic | +0.087 |
Machina | +0.085 |
interrogation | +0.084 |
investig | +0.084 |
Neg logit contributions | |
Worcester | -0.139 |
Dartmouth | -0.136 |
heit | -0.128 |
ocene | -0.124 |
Lansing | -0.124 |
Token | between |
Token ID | 1022 |
Feature activation | -4.92e+00 |
Pos logit contributions | |
Worcester | +1.260 |
Dartmouth | +1.236 |
heit | +1.142 |
ocene | +1.106 |
Lansing | +1.104 |
Neg logit contributions | |
nsic | -1.085 |
smuggling | -1.074 |
Machina | -1.058 |
table | -1.036 |
investig | -1.035 |
Token | the |
Token ID | 262 |
Feature activation | -5.60e-01 |
Pos logit contributions | |
Worcester | +4.205 |
Dartmouth | +4.159 |
heit | +3.811 |
Lansing | +3.729 |
hester | +3.652 |
Neg logit contributions | |
nsic | -2.952 |
smuggling | -2.829 |
Machina | -2.811 |
xual | -2.790 |
table | -2.777 |
Token | source |
Token ID | 2723 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
Worcester | +0.491 |
Dartmouth | +0.480 |
heit | +0.450 |
ocene | +0.437 |
Lansing | +0.437 |
Neg logit contributions | |
smuggling | -0.326 |
nsic | -0.325 |
Machina | -0.315 |
interrogation | -0.313 |
table | -0.312 |
Token | of |
Token ID | 286 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
smuggling | +0.068 |
nsic | +0.068 |
Machina | +0.065 |
interrogation | +0.065 |
table | +0.065 |
Neg logit contributions | |
Worcester | -0.114 |
Dartmouth | -0.111 |
heit | -0.105 |
Lansing | -0.102 |
ocene | -0.102 |
Token | research |
Token ID | 2267 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
Worcester | +0.169 |
Dartmouth | +0.165 |
heit | +0.153 |
Lansing | +0.149 |
ocene | +0.148 |
Neg logit contributions | |
nsic | -0.138 |
smuggling | -0.137 |
Machina | -0.134 |
table | -0.132 |
interrogation | -0.132 |
Token | funding |
Token ID | 4918 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
nsic | +0.147 |
smuggling | +0.146 |
Machina | +0.143 |
table | +0.141 |
interrogation | +0.141 |
Neg logit contributions | |
Worcester | -0.203 |
Dartmouth | -0.199 |
heit | -0.185 |
Lansing | -0.180 |
ocene | -0.179 |
Token | requests |
Token ID | 7007 |
Feature activation | +2.16e+00 |
Pos logit contributions | |
smuggling | +0.677 |
nsic | +0.671 |
Machina | +0.653 |
interrogation | +0.646 |
investig | +0.645 |
Neg logit contributions | |
Worcester | -1.151 |
Dartmouth | -1.129 |
heit | -1.062 |
hester | -1.033 |
ocene | -1.033 |
Token | seeking |
Token ID | 6095 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
smuggling | +1.324 |
nsic | +1.312 |
Machina | +1.289 |
interrogation | +1.273 |
table | +1.270 |
Neg logit contributions | |
Worcester | -1.822 |
Dartmouth | -1.785 |
heit | -1.678 |
ocene | -1.634 |
hester | -1.630 |
Token | information |
Token ID | 1321 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
smuggling | +0.446 |
nsic | +0.444 |
Machina | +0.434 |
interrogation | +0.434 |
investig | +0.432 |
Neg logit contributions | |
Worcester | -0.568 |
Dartmouth | -0.556 |
heit | -0.521 |
hester | -0.504 |
ocene | -0.503 |
Token | about |
Token ID | 546 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
Worcester | +1.725 |
Dartmouth | +1.689 |
heit | +1.562 |
Lansing | +1.530 |
ocene | +1.508 |
Neg logit contributions | |
nsic | -1.317 |
smuggling | -1.299 |
Machina | -1.271 |
xual | -1.264 |
table | -1.260 |
Token | communications |
Token ID | 8062 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
Worcester | +0.119 |
Dartmouth | +0.116 |
heit | +0.108 |
ocene | +0.105 |
hester | +0.105 |
Neg logit contributions | |
smuggling | -0.096 |
nsic | -0.095 |
Machina | -0.093 |
interrogation | -0.092 |
table | -0.092 |
Token | between |
Token ID | 1022 |
Feature activation | -4.90e+00 |
Pos logit contributions | |
Worcester | +0.474 |
Dartmouth | +0.465 |
heit | +0.429 |
Lansing | +0.419 |
ocene | +0.415 |
Neg logit contributions | |
nsic | -0.367 |
smuggling | -0.362 |
Machina | -0.353 |
table | -0.350 |
xual | -0.350 |
Token | Pruitt |
Token ID | 39637 |
Feature activation | +4.09e-01 |
Pos logit contributions | |
Worcester | +3.978 |
Dartmouth | +3.921 |
heit | +3.552 |
Lansing | +3.535 |
ocene | +3.400 |
Neg logit contributions | |
nsic | -3.201 |
smuggling | -3.095 |
xual | -3.076 |
Machina | -3.028 |
table | -3.023 |
Token | � |
Token ID | 447 |
Feature activation | +7.14e-01 |
Pos logit contributions | |
smuggling | +0.254 |
nsic | +0.252 |
Machina | +0.247 |
interrogation | +0.245 |
table | +0.245 |
Neg logit contributions | |
Worcester | -0.342 |
Dartmouth | -0.334 |
heit | -0.312 |
hester | -0.304 |
ocene | -0.302 |
Token | � |
Token ID | 247 |
Feature activation | +6.31e-01 |
Pos logit contributions | |
nsic | +0.387 |
smuggling | +0.387 |
Machina | +0.375 |
table | +0.372 |
interrogation | +0.370 |
Neg logit contributions | |
Worcester | -0.654 |
Dartmouth | -0.639 |
heit | -0.598 |
Lansing | -0.584 |
hester | -0.583 |
Token | s |
Token ID | 82 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
nsic | +0.413 |
smuggling | +0.411 |
Machina | +0.402 |
table | +0.400 |
interrogation | +0.399 |
Neg logit contributions | |
Worcester | -0.507 |
Dartmouth | -0.495 |
heit | -0.460 |
hester | -0.445 |
Lansing | -0.445 |
Token | office |
Token ID | 2607 |
Feature activation | -9.31e-01 |
Pos logit contributions | |
smuggling | +0.236 |
nsic | +0.235 |
interrogation | +0.228 |
Machina | +0.228 |
investig | +0.228 |
Neg logit contributions | |
Worcester | -0.367 |
Dartmouth | -0.359 |
heit | -0.338 |
ocene | -0.328 |
hester | -0.328 |
Token | takes |
Token ID | 2753 |
Feature activation | +9.83e-03 |
Pos logit contributions | |
Worcester | +0.052 |
Dartmouth | +0.051 |
heit | +0.047 |
ocene | +0.045 |
Lansing | +0.045 |
Neg logit contributions | |
smuggling | -0.045 |
nsic | -0.045 |
Machina | -0.044 |
interrogation | -0.043 |
table | -0.043 |
Token | a |
Token ID | 257 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
nsic | +0.006 |
smuggling | +0.006 |
Machina | +0.006 |
interrogation | +0.006 |
table | +0.006 |
Neg logit contributions | |
Worcester | -0.008 |
Dartmouth | -0.008 |
heit | -0.007 |
Lansing | -0.007 |
ocene | -0.007 |
Token | somewhat |
Token ID | 6454 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
Worcester | +0.146 |
Dartmouth | +0.143 |
heit | +0.132 |
Lansing | +0.128 |
ocene | +0.128 |
Neg logit contributions | |
nsic | -0.122 |
smuggling | -0.122 |
Machina | -0.119 |
interrogation | -0.118 |
table | -0.118 |
Token | limited |
Token ID | 3614 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
smuggling | +0.203 |
nsic | +0.203 |
Machina | +0.198 |
interrogation | +0.197 |
table | +0.197 |
Neg logit contributions | |
Worcester | -0.168 |
Dartmouth | -0.163 |
heit | -0.149 |
ocene | -0.143 |
Lansing | -0.143 |
Token | connection |
Token ID | 4637 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
smuggling | +0.424 |
nsic | +0.424 |
Machina | +0.412 |
interrogation | +0.411 |
table | +0.409 |
Neg logit contributions | |
Worcester | -0.498 |
Dartmouth | -0.487 |
heit | -0.454 |
ocene | -0.439 |
Lansing | -0.437 |
Token | between |
Token ID | 1022 |
Feature activation | -4.89e+00 |
Pos logit contributions | |
Worcester | +1.275 |
Dartmouth | +1.248 |
heit | +1.156 |
Lansing | +1.121 |
ocene | +1.110 |
Neg logit contributions | |
nsic | -1.095 |
smuggling | -1.086 |
Machina | -1.064 |
Khe | -1.048 |
interrogation | -1.048 |
Token | the |
Token ID | 262 |
Feature activation | -5.74e-01 |
Pos logit contributions | |
Worcester | +4.095 |
Dartmouth | +4.017 |
heit | +3.732 |
Lansing | +3.616 |
hester | +3.526 |
Neg logit contributions | |
nsic | -3.047 |
smuggling | -2.894 |
Machina | -2.874 |
Khe | -2.859 |
table | -2.835 |
Token | testing |
Token ID | 4856 |
Feature activation | -8.80e-01 |
Pos logit contributions | |
Worcester | +0.523 |
Dartmouth | +0.513 |
heit | +0.480 |
Lansing | +0.468 |
ocene | +0.465 |
Neg logit contributions | |
nsic | -0.315 |
smuggling | -0.312 |
Machina | -0.303 |
table | -0.300 |
interrogation | -0.299 |
Token | company |
Token ID | 1664 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
Worcester | +0.827 |
Dartmouth | +0.812 |
heit | +0.760 |
Lansing | +0.742 |
ocene | +0.737 |
Neg logit contributions | |
nsic | -0.459 |
smuggling | -0.453 |
Machina | -0.440 |
Khe | -0.432 |
table | -0.432 |
Token | and |
Token ID | 290 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
Worcester | +0.138 |
Dartmouth | +0.135 |
heit | +0.126 |
Lansing | +0.122 |
ocene | +0.122 |
Neg logit contributions | |
nsic | -0.111 |
smuggling | -0.111 |
Machina | -0.108 |
interrogation | -0.107 |
table | -0.107 |
Token | gay |
Token ID | 5650 |
Feature activation | +9.69e-01 |
Pos logit contributions | |
smuggling | +0.828 |
nsic | +0.820 |
Machina | +0.803 |
interrogation | +0.799 |
investig | +0.798 |
Neg logit contributions | |
Worcester | -0.977 |
Dartmouth | -0.955 |
heit | -0.887 |
ocene | -0.868 |
hester | -0.861 |
Token | : |
Token ID | 25 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
smuggling | +1.125 |
nsic | +1.114 |
Machina | +1.104 |
table | +1.096 |
interrogation | +1.086 |
Neg logit contributions | |
Worcester | -1.524 |
Dartmouth | -1.487 |
heit | -1.399 |
ocene | -1.359 |
hester | -1.355 |
Token |
|
Token ID | 198 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
Worcester | +0.188 |
Dartmouth | +0.184 |
heit | +0.171 |
ocene | +0.166 |
hester | +0.165 |
Neg logit contributions | |
smuggling | -0.163 |
nsic | -0.162 |
Machina | -0.160 |
interrogation | -0.158 |
investig | -0.157 |
Token |
|
Token ID | 198 |
Feature activation | -4.92e-01 |
Pos logit contributions | |
Worcester | +0.115 |
Dartmouth | +0.112 |
heit | +0.105 |
ocene | +0.101 |
Lansing | +0.101 |
Neg logit contributions | |
nsic | -0.102 |
smuggling | -0.101 |
Machina | -0.100 |
table | -0.099 |
interrogation | -0.098 |
Token | Decre |
Token ID | 43198 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Worcester | +0.376 |
Dartmouth | +0.367 |
heit | +0.339 |
ocene | +0.329 |
Lansing | +0.329 |
Neg logit contributions | |
nsic | -0.339 |
smuggling | -0.339 |
Machina | -0.335 |
table | -0.332 |
interrogation | -0.329 |
Token | ases |
Token ID | 1386 |
Feature activation | -8.90e-01 |
Pos logit contributions | |
Worcester | +1.439 |
Dartmouth | +1.416 |
heit | +1.343 |
hester | +1.306 |
Lansing | +1.305 |
Neg logit contributions | |
smuggling | -0.614 |
nsic | -0.613 |
Machina | -0.588 |
interrogation | -0.581 |
Khe | -0.581 |
Token | blood |
Token ID | 2910 |
Feature activation | -4.87e+00 |
Pos logit contributions | |
Worcester | +0.708 |
Dartmouth | +0.693 |
heit | +0.644 |
Lansing | +0.623 |
ocene | +0.621 |
Neg logit contributions | |
nsic | -0.589 |
smuggling | -0.587 |
Machina | -0.572 |
table | -0.567 |
interrogation | -0.567 |
Token | glucose |
Token ID | 15701 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Worcester | +4.107 |
Dartmouth | +3.996 |
heit | +3.734 |
Lansing | +3.622 |
ocene | +3.562 |
Neg logit contributions | |
nsic | -2.994 |
smuggling | -2.898 |
xual | -2.875 |
Machina | -2.871 |
Khe | -2.842 |
Token | . |
Token ID | 13 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
Worcester | +1.667 |
Dartmouth | +1.636 |
heit | +1.516 |
Lansing | +1.475 |
ocene | +1.463 |
Neg logit contributions | |
nsic | -1.263 |
smuggling | -1.241 |
Machina | -1.211 |
interrogation | -1.199 |
table | -1.198 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
Worcester | +0.215 |
Dartmouth | +0.209 |
heit | +0.196 |
ocene | +0.190 |
hester | +0.189 |
Neg logit contributions | |
smuggling | -0.188 |
nsic | -0.188 |
Machina | -0.185 |
table | -0.183 |
Khe | -0.182 |
Token |
|
Token ID | 198 |
Feature activation | -4.82e-01 |
Pos logit contributions | |
Worcester | +0.114 |
Dartmouth | +0.111 |
heit | +0.103 |
Lansing | +0.100 |
ocene | +0.100 |
Neg logit contributions | |
nsic | -0.102 |
smuggling | -0.101 |
Machina | -0.099 |
table | -0.099 |
interrogation | -0.098 |
Token | Decre |
Token ID | 43198 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
Worcester | +0.405 |
Dartmouth | +0.396 |
heit | +0.369 |
ocene | +0.358 |
Lansing | +0.358 |
Neg logit contributions | |
nsic | -0.296 |
smuggling | -0.295 |
Machina | -0.290 |
table | -0.287 |
interrogation | -0.285 |
Token | because |
Token ID | 780 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
smuggling | +1.051 |
nsic | +1.048 |
Machina | +1.025 |
table | +1.016 |
Khe | +1.014 |
Neg logit contributions | |
Worcester | -1.496 |
Dartmouth | -1.465 |
heit | -1.369 |
ocene | -1.336 |
Lansing | -1.334 |
Token | it |
Token ID | 340 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
Worcester | +0.358 |
Dartmouth | +0.350 |
heit | +0.325 |
Lansing | +0.314 |
ocene | +0.313 |
Neg logit contributions | |
nsic | -0.313 |
smuggling | -0.312 |
Machina | -0.304 |
interrogation | -0.302 |
table | -0.302 |
Token | concerns |
Token ID | 4786 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
Worcester | +0.099 |
Dartmouth | +0.097 |
heit | +0.091 |
Lansing | +0.088 |
ocene | +0.087 |
Neg logit contributions | |
nsic | -0.074 |
smuggling | -0.074 |
Machina | -0.072 |
table | -0.071 |
interrogation | -0.071 |
Token | the |
Token ID | 262 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
smuggling | +0.743 |
nsic | +0.739 |
Machina | +0.723 |
interrogation | +0.719 |
table | +0.714 |
Neg logit contributions | |
Worcester | -0.977 |
Dartmouth | -0.955 |
heit | -0.896 |
ocene | -0.869 |
hester | -0.865 |
Token | connections |
Token ID | 8787 |
Feature activation | -1.61e+00 |
Pos logit contributions | |
smuggling | +0.152 |
nsic | +0.152 |
Machina | +0.147 |
interrogation | +0.146 |
table | +0.146 |
Neg logit contributions | |
Worcester | -0.235 |
Dartmouth | -0.230 |
heit | -0.216 |
Lansing | -0.210 |
ocene | -0.209 |
Token | between |
Token ID | 1022 |
Feature activation | -4.77e+00 |
Pos logit contributions | |
Worcester | +1.280 |
Dartmouth | +1.253 |
heit | +1.157 |
Lansing | +1.122 |
hester | +1.115 |
Neg logit contributions | |
nsic | -1.073 |
smuggling | -1.060 |
Machina | -1.033 |
table | -1.024 |
interrogation | -1.023 |
Token | judgments |
Token ID | 24195 |
Feature activation | -5.11e-01 |
Pos logit contributions | |
Worcester | +4.080 |
Dartmouth | +4.014 |
heit | +3.640 |
Lansing | +3.605 |
hester | +3.494 |
Neg logit contributions | |
nsic | -2.919 |
smuggling | -2.793 |
table | -2.745 |
xual | -2.708 |
Machina | -2.694 |
Token | about |
Token ID | 546 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
Worcester | +0.432 |
Dartmouth | +0.423 |
heit | +0.394 |
Lansing | +0.382 |
ocene | +0.381 |
Neg logit contributions | |
nsic | -0.313 |
smuggling | -0.310 |
Machina | -0.302 |
table | -0.299 |
interrogation | -0.299 |
Token | justice |
Token ID | 5316 |
Feature activation | -4.32e-01 |
Pos logit contributions | |
Worcester | +0.225 |
Dartmouth | +0.220 |
heit | +0.206 |
Lansing | +0.199 |
ocene | +0.199 |
Neg logit contributions | |
nsic | -0.161 |
smuggling | -0.160 |
Machina | -0.156 |
interrogation | -0.154 |
table | -0.154 |
Token | in |
Token ID | 287 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
Worcester | +0.351 |
Dartmouth | +0.343 |
heit | +0.319 |
Lansing | +0.309 |
ocene | +0.308 |
Neg logit contributions | |
nsic | -0.279 |
smuggling | -0.277 |
Machina | -0.270 |
table | -0.267 |
interrogation | -0.267 |
Token | any |
Token ID | 597 |
Feature activation | +2.32e-02 |
Pos logit contributions | |
Worcester | +0.323 |
Dartmouth | +0.316 |
heit | +0.296 |
Lansing | +0.286 |
ocene | +0.286 |
Neg logit contributions | |
smuggling | -0.238 |
nsic | -0.237 |
Machina | -0.231 |
interrogation | -0.230 |
table | -0.229 |
Token | morning |
Token ID | 3329 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
Worcester | +0.473 |
Dartmouth | +0.463 |
heit | +0.431 |
Lansing | +0.417 |
ocene | +0.417 |
Neg logit contributions | |
smuggling | -0.377 |
nsic | -0.375 |
Machina | -0.366 |
table | -0.363 |
interrogation | -0.363 |
Token | sunshine |
Token ID | 34488 |
Feature activation | -4.12e+00 |
Pos logit contributions | |
Worcester | +0.457 |
Dartmouth | +0.447 |
heit | +0.416 |
ocene | +0.403 |
Lansing | +0.403 |
Neg logit contributions | |
smuggling | -0.371 |
nsic | -0.370 |
Machina | -0.361 |
interrogation | -0.358 |
table | -0.358 |
Token | for |
Token ID | 329 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Worcester | +3.303 |
Dartmouth | +3.215 |
heit | +2.965 |
Lansing | +2.893 |
hester | +2.849 |
Neg logit contributions | |
nsic | -2.726 |
smuggling | -2.655 |
Machina | -2.599 |
interrogation | -2.584 |
xual | -2.569 |
Token | those |
Token ID | 883 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Worcester | +0.378 |
Dartmouth | +0.369 |
heit | +0.344 |
ocene | +0.332 |
Lansing | +0.331 |
Neg logit contributions | |
smuggling | -0.341 |
nsic | -0.338 |
Machina | -0.332 |
interrogation | -0.330 |
table | -0.329 |
Token | " |
Token ID | 366 |
Feature activation | -4.99e-01 |
Pos logit contributions | |
Worcester | +1.604 |
Dartmouth | +1.569 |
heit | +1.442 |
Lansing | +1.411 |
hester | +1.391 |
Neg logit contributions | |
nsic | -1.340 |
smuggling | -1.313 |
Machina | -1.291 |
table | -1.278 |
interrogation | -1.275 |
Token | cold |
Token ID | 36673 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
Worcester | +0.396 |
Dartmouth | +0.387 |
heit | +0.360 |
Lansing | +0.348 |
ocene | +0.347 |
Neg logit contributions | |
nsic | -0.332 |
smuggling | -0.331 |
Machina | -0.323 |
table | -0.321 |
interrogation | -0.319 |
Token | " |
Token ID | 1 |
Feature activation | +7.46e-01 |
Pos logit contributions | |
Worcester | +3.764 |
Dartmouth | +3.673 |
heit | +3.409 |
Lansing | +3.308 |
ocene | +3.288 |
Neg logit contributions | |
nsic | -3.037 |
smuggling | -3.004 |
Machina | -2.969 |
xual | -2.921 |
investig | -2.906 |
Token | AM |
Token ID | 3001 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
smuggling | +0.496 |
nsic | +0.492 |
Machina | +0.481 |
interrogation | +0.479 |
table | +0.478 |
Neg logit contributions | |
Worcester | -0.589 |
Dartmouth | -0.576 |
heit | -0.537 |
ocene | -0.519 |
hester | -0.519 |
Token | hours |
Token ID | 2250 |
Feature activation | -2.20e+00 |
Pos logit contributions | |
Worcester | +0.968 |
Dartmouth | +0.948 |
heit | +0.882 |
Lansing | +0.855 |
ocene | +0.853 |
Neg logit contributions | |
nsic | -0.760 |
smuggling | -0.759 |
Machina | -0.738 |
interrogation | -0.732 |
table | -0.732 |
Token | . |
Token ID | 13 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
Worcester | +1.789 |
Dartmouth | +1.749 |
heit | +1.624 |
Lansing | +1.575 |
ocene | +1.565 |
Neg logit contributions | |
nsic | -1.419 |
smuggling | -1.406 |
Machina | -1.374 |
interrogation | -1.360 |
table | -1.358 |
Token | I |
Token ID | 314 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Worcester | +1.057 |
Dartmouth | +1.033 |
heit | +0.959 |
Lansing | +0.925 |
ocene | +0.924 |
Neg logit contributions | |
nsic | -0.950 |
smuggling | -0.949 |
Machina | -0.929 |
table | -0.920 |
interrogation | -0.919 |
Token | The |
Token ID | 383 |
Feature activation | +4.57e-01 |
Pos logit contributions | |
Worcester | +0.002 |
Dartmouth | +0.002 |
heit | +0.002 |
ocene | +0.001 |
hester | +0.001 |
Neg logit contributions | |
smuggling | -0.002 |
nsic | -0.002 |
Machina | -0.001 |
table | -0.001 |
Khe | -0.001 |
Token | exact |
Token ID | 2748 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
smuggling | +0.287 |
nsic | +0.284 |
Machina | +0.280 |
interrogation | +0.277 |
table | +0.276 |
Neg logit contributions | |
Worcester | -0.377 |
Dartmouth | -0.370 |
heit | -0.347 |
ocene | -0.336 |
hester | -0.335 |
Token | description |
Token ID | 6764 |
Feature activation | -4.44e-01 |
Pos logit contributions | |
Worcester | +0.979 |
Dartmouth | +0.958 |
heit | +0.891 |
Lansing | +0.863 |
ocene | +0.861 |
Neg logit contributions | |
nsic | -0.782 |
smuggling | -0.780 |
Machina | -0.760 |
interrogation | -0.753 |
table | -0.753 |
Token | that |
Token ID | 326 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
Worcester | +0.364 |
Dartmouth | +0.357 |
heit | +0.333 |
ocene | +0.322 |
Lansing | +0.322 |
Neg logit contributions | |
smuggling | -0.282 |
nsic | -0.282 |
Machina | -0.275 |
interrogation | -0.273 |
table | -0.272 |
Token | went |
Token ID | 1816 |
Feature activation | -8.09e-02 |
Pos logit contributions | |
Worcester | +0.173 |
Dartmouth | +0.169 |
heit | +0.158 |
ocene | +0.152 |
hester | +0.151 |
Neg logit contributions | |
smuggling | -0.163 |
nsic | -0.162 |
Machina | -0.160 |
interrogation | -0.158 |
table | -0.158 |
Token | through |
Token ID | 832 |
Feature activation | -4.69e+00 |
Pos logit contributions | |
Worcester | +0.067 |
Dartmouth | +0.066 |
heit | +0.062 |
ocene | +0.060 |
Lansing | +0.060 |
Neg logit contributions | |
smuggling | -0.050 |
nsic | -0.050 |
Machina | -0.049 |
table | -0.048 |
interrogation | -0.048 |
Token | my |
Token ID | 616 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
Worcester | +3.097 |
Dartmouth | +3.012 |
heit | +2.679 |
Lansing | +2.647 |
ocene | +2.585 |
Neg logit contributions | |
nsic | -3.723 |
smuggling | -3.679 |
Machina | -3.572 |
table | -3.561 |
xual | -3.547 |
Token | brain |
Token ID | 3632 |
Feature activation | -1.70e+00 |
Pos logit contributions | |
Worcester | +0.668 |
Dartmouth | +0.654 |
heit | +0.607 |
Lansing | +0.594 |
hester | +0.588 |
Neg logit contributions | |
nsic | -0.460 |
smuggling | -0.455 |
Machina | -0.441 |
table | -0.439 |
xual | -0.437 |
Token | during |
Token ID | 1141 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
Worcester | +1.316 |
Dartmouth | +1.287 |
heit | +1.194 |
Lansing | +1.154 |
ocene | +1.149 |
Neg logit contributions | |
nsic | -1.157 |
smuggling | -1.154 |
Machina | -1.125 |
interrogation | -1.115 |
table | -1.115 |
Token | my |
Token ID | 616 |
Feature activation | -8.63e-02 |
Pos logit contributions | |
smuggling | +0.158 |
nsic | +0.157 |
Machina | +0.154 |
interrogation | +0.153 |
table | +0.153 |
Neg logit contributions | |
Worcester | -0.169 |
Dartmouth | -0.165 |
heit | -0.154 |
ocene | -0.148 |
hester | -0.148 |
Token | first |
Token ID | 717 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
Worcester | +0.072 |
Dartmouth | +0.070 |
heit | +0.065 |
Lansing | +0.064 |
ocene | +0.063 |
Neg logit contributions | |
nsic | -0.054 |
smuggling | -0.054 |
Machina | -0.052 |
table | -0.052 |
interrogation | -0.052 |
Token | al |
Token ID | 282 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
nsic | +1.069 |
smuggling | +1.055 |
Machina | +1.043 |
table | +1.038 |
interrogation | +1.014 |
Neg logit contributions | |
Worcester | -1.601 |
Dartmouth | -1.559 |
heit | -1.446 |
Lansing | -1.417 |
ocene | -1.414 |
Token | on |
Token ID | 319 |
Feature activation | -9.43e-01 |
Pos logit contributions | |
Worcester | +0.219 |
Dartmouth | +0.213 |
heit | +0.197 |
ocene | +0.190 |
Lansing | +0.190 |
Neg logit contributions | |
nsic | -0.209 |
smuggling | -0.209 |
Machina | -0.204 |
table | -0.203 |
interrogation | -0.203 |
Token | the |
Token ID | 262 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
Worcester | +0.744 |
Dartmouth | +0.728 |
heit | +0.676 |
Lansing | +0.654 |
ocene | +0.653 |
Neg logit contributions | |
nsic | -0.629 |
smuggling | -0.628 |
Machina | -0.612 |
interrogation | -0.607 |
table | -0.607 |
Token | claimed |
Token ID | 4752 |
Feature activation | -7.12e-01 |
Pos logit contributions | |
nsic | +0.087 |
smuggling | +0.087 |
Machina | +0.084 |
interrogation | +0.084 |
table | +0.084 |
Neg logit contributions | |
Worcester | -0.133 |
Dartmouth | -0.131 |
heit | -0.122 |
Lansing | -0.119 |
ocene | -0.118 |
Token | parallels |
Token ID | 30614 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
Worcester | +0.649 |
Dartmouth | +0.638 |
heit | +0.594 |
Lansing | +0.581 |
ocene | +0.576 |
Neg logit contributions | |
nsic | -0.391 |
smuggling | -0.386 |
Machina | -0.375 |
table | -0.371 |
interrogation | -0.370 |
Token | between |
Token ID | 1022 |
Feature activation | -4.62e+00 |
Pos logit contributions | |
smuggling | +0.313 |
nsic | +0.311 |
Machina | +0.304 |
table | +0.302 |
interrogation | +0.300 |
Neg logit contributions | |
Worcester | -0.407 |
Dartmouth | -0.398 |
heit | -0.373 |
ocene | -0.361 |
Lansing | -0.360 |
Token | her |
Token ID | 607 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
Worcester | +3.932 |
Dartmouth | +3.861 |
heit | +3.501 |
Lansing | +3.485 |
ocene | +3.381 |
Neg logit contributions | |
nsic | -2.835 |
smuggling | -2.735 |
Machina | -2.665 |
table | -2.654 |
xual | -2.650 |
Token | identity |
Token ID | 5369 |
Feature activation | -2.17e+00 |
Pos logit contributions | |
Worcester | +1.167 |
Dartmouth | +1.146 |
heit | +1.061 |
Lansing | +1.037 |
ocene | +1.028 |
Neg logit contributions | |
nsic | -0.810 |
smuggling | -0.797 |
Machina | -0.778 |
table | -0.771 |
Khe | -0.768 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
Worcester | +1.720 |
Dartmouth | +1.688 |
heit | +1.550 |
ocene | +1.502 |
Lansing | +1.501 |
Neg logit contributions | |
nsic | -1.444 |
smuggling | -1.413 |
Machina | -1.378 |
table | -1.374 |
xual | -1.371 |
Token | transgender |
Token ID | 10637 |
Feature activation | +5.15e-01 |
Pos logit contributions | |
smuggling | +0.693 |
nsic | +0.686 |
Machina | +0.673 |
table | +0.666 |
interrogation | +0.666 |
Neg logit contributions | |
Worcester | -0.903 |
Dartmouth | -0.883 |
heit | -0.835 |
ocene | -0.809 |
hester | -0.805 |
Token | identity |
Token ID | 5369 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
smuggling | +0.268 |
nsic | +0.268 |
Machina | +0.259 |
interrogation | +0.256 |
table | +0.256 |
Neg logit contributions | |
Worcester | -0.481 |
Dartmouth | -0.472 |
heit | -0.445 |
Lansing | -0.433 |
ocene | -0.432 |
Token | However |
Token ID | 2102 |
Feature activation | +8.76e-02 |
Pos logit contributions | |
Worcester | +0.283 |
Dartmouth | +0.277 |
heit | +0.260 |
ocene | +0.250 |
hester | +0.250 |
Neg logit contributions | |
nsic | -0.246 |
smuggling | -0.245 |
Machina | -0.241 |
table | -0.240 |
Khe | -0.239 |
Token | , |
Token ID | 11 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
smuggling | +0.052 |
nsic | +0.052 |
Machina | +0.051 |
table | +0.050 |
interrogation | +0.050 |
Neg logit contributions | |
Worcester | -0.075 |
Dartmouth | -0.074 |
heit | -0.069 |
ocene | -0.067 |
Lansing | -0.067 |
Token | if |
Token ID | 611 |
Feature activation | -8.43e-01 |
Pos logit contributions | |
Worcester | +0.872 |
Dartmouth | +0.853 |
heit | +0.790 |
Lansing | +0.764 |
ocene | +0.761 |
Neg logit contributions | |
nsic | -0.767 |
smuggling | -0.764 |
Machina | -0.746 |
interrogation | -0.739 |
table | -0.739 |
Token | Jordan |
Token ID | 8078 |
Feature activation | +1.16e+00 |
Pos logit contributions | |
Worcester | +0.616 |
Dartmouth | +0.602 |
heit | +0.555 |
Lansing | +0.535 |
ocene | +0.534 |
Neg logit contributions | |
nsic | -0.612 |
smuggling | -0.610 |
Machina | -0.596 |
interrogation | -0.591 |
table | -0.591 |
Token | go |
Token ID | 467 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
smuggling | +0.704 |
nsic | +0.698 |
Machina | +0.686 |
interrogation | +0.676 |
table | +0.676 |
Neg logit contributions | |
Worcester | -0.989 |
Dartmouth | -0.970 |
heit | -0.909 |
hester | -0.881 |
ocene | -0.880 |
Token | through |
Token ID | 832 |
Feature activation | -4.60e+00 |
Pos logit contributions | |
smuggling | +0.075 |
nsic | +0.075 |
Machina | +0.073 |
table | +0.073 |
interrogation | +0.072 |
Neg logit contributions | |
Worcester | -0.102 |
Dartmouth | -0.100 |
heit | -0.094 |
ocene | -0.091 |
Lansing | -0.091 |
Token | , |
Token ID | 11 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
Worcester | +3.585 |
Dartmouth | +3.480 |
heit | +3.175 |
Lansing | +3.115 |
ocene | +3.038 |
Neg logit contributions | |
nsic | -3.155 |
smuggling | -3.057 |
xual | -3.018 |
Machina | -3.004 |
investig | -2.967 |
Token | at |
Token ID | 379 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
Worcester | +0.237 |
Dartmouth | +0.231 |
heit | +0.214 |
ocene | +0.207 |
Lansing | +0.207 |
Neg logit contributions | |
smuggling | -0.225 |
nsic | -0.225 |
Machina | -0.219 |
interrogation | -0.218 |
table | -0.218 |
Token | least |
Token ID | 1551 |
Feature activation | +9.25e-01 |
Pos logit contributions | |
Worcester | +0.142 |
Dartmouth | +0.139 |
heit | +0.130 |
ocene | +0.126 |
Lansing | +0.126 |
Neg logit contributions | |
smuggling | -0.102 |
nsic | -0.102 |
Machina | -0.099 |
table | -0.099 |
interrogation | -0.099 |
Token | one |
Token ID | 530 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
smuggling | +0.633 |
nsic | +0.624 |
Machina | +0.615 |
Khe | +0.612 |
interrogation | +0.610 |
Neg logit contributions | |
Worcester | -0.711 |
Dartmouth | -0.697 |
heit | -0.650 |
ocene | -0.633 |
hester | -0.628 |
Token | of |
Token ID | 286 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
smuggling | +0.863 |
nsic | +0.846 |
interrogation | +0.831 |
Machina | +0.830 |
table | +0.827 |
Neg logit contributions | |
Worcester | -1.327 |
Dartmouth | -1.306 |
heit | -1.237 |
hester | -1.202 |
ocene | -1.200 |
Token | says |
Token ID | 1139 |
Feature activation | +9.91e-02 |
Pos logit contributions | |
Worcester | +0.190 |
Dartmouth | +0.185 |
heit | +0.172 |
ocene | +0.167 |
Lansing | +0.166 |
Neg logit contributions | |
smuggling | -0.164 |
nsic | -0.163 |
Machina | -0.159 |
interrogation | -0.158 |
table | -0.158 |
Token | there |
Token ID | 612 |
Feature activation | +4.86e-01 |
Pos logit contributions | |
smuggling | +0.070 |
nsic | +0.069 |
Machina | +0.068 |
interrogation | +0.067 |
table | +0.067 |
Neg logit contributions | |
Worcester | -0.075 |
Dartmouth | -0.073 |
heit | -0.068 |
ocene | -0.065 |
Lansing | -0.065 |
Token | 's |
Token ID | 338 |
Feature activation | -2.34e+00 |
Pos logit contributions | |
nsic | +0.319 |
smuggling | +0.318 |
Machina | +0.308 |
interrogation | +0.308 |
table | +0.307 |
Neg logit contributions | |
Worcester | -0.391 |
Dartmouth | -0.381 |
heit | -0.354 |
ocene | -0.343 |
hester | -0.343 |
Token | no |
Token ID | 645 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
Worcester | +1.720 |
Dartmouth | +1.689 |
heit | +1.540 |
Lansing | +1.507 |
ocene | +1.473 |
Neg logit contributions | |
nsic | -1.684 |
smuggling | -1.660 |
Machina | -1.636 |
table | -1.618 |
xual | -1.617 |
Token | connection |
Token ID | 4637 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
Worcester | +1.591 |
Dartmouth | +1.563 |
heit | +1.446 |
Lansing | +1.416 |
ocene | +1.391 |
Neg logit contributions | |
nsic | -1.101 |
smuggling | -1.068 |
Machina | -1.056 |
xual | -1.048 |
table | -1.048 |
Token | between |
Token ID | 1022 |
Feature activation | -4.58e+00 |
Pos logit contributions | |
Worcester | +1.321 |
Dartmouth | +1.293 |
heit | +1.195 |
Lansing | +1.160 |
ocene | +1.146 |
Neg logit contributions | |
nsic | -1.136 |
smuggling | -1.121 |
Machina | -1.097 |
interrogation | -1.087 |
table | -1.083 |
Token | the |
Token ID | 262 |
Feature activation | -4.94e-01 |
Pos logit contributions | |
Worcester | +3.491 |
Dartmouth | +3.406 |
heit | +3.103 |
Lansing | +3.063 |
hester | +2.976 |
Neg logit contributions | |
nsic | -3.216 |
smuggling | -3.096 |
Machina | -3.081 |
xual | -3.056 |
table | -3.053 |
Token | lawsuit |
Token ID | 8087 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
Worcester | +0.420 |
Dartmouth | +0.411 |
heit | +0.383 |
Lansing | +0.373 |
ocene | +0.370 |
Neg logit contributions | |
nsic | -0.301 |
smuggling | -0.298 |
Machina | -0.291 |
table | -0.288 |
interrogation | -0.288 |
Token | and |
Token ID | 290 |
Feature activation | +7.66e-01 |
Pos logit contributions | |
Worcester | +0.193 |
Dartmouth | +0.189 |
heit | +0.177 |
ocene | +0.171 |
Lansing | +0.171 |
Neg logit contributions | |
smuggling | -0.151 |
nsic | -0.151 |
Machina | -0.147 |
interrogation | -0.146 |
table | -0.146 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
smuggling | +0.508 |
nsic | +0.502 |
interrogation | +0.490 |
Machina | +0.490 |
table | +0.487 |
Neg logit contributions | |
Worcester | -0.607 |
Dartmouth | -0.595 |
heit | -0.556 |
ocene | -0.541 |
hester | -0.536 |
Token | decision |
Token ID | 2551 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
smuggling | +0.074 |
nsic | +0.074 |
Machina | +0.072 |
interrogation | +0.071 |
table | +0.071 |
Neg logit contributions | |
Worcester | -0.106 |
Dartmouth | -0.104 |
heit | -0.097 |
ocene | -0.094 |
Lansing | -0.094 |
Token | to |
Token ID | 284 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
Worcester | +0.008 |
Dartmouth | +0.007 |
heit | +0.007 |
Lansing | +0.007 |
ocene | +0.007 |
Neg logit contributions | |
nsic | -0.006 |
smuggling | -0.006 |
Machina | -0.006 |
interrogation | -0.006 |
table | -0.006 |
Token | check |
Token ID | 2198 |
Feature activation | -1.51e+00 |
Pos logit contributions | |
smuggling | +0.668 |
nsic | +0.663 |
Machina | +0.643 |
interrogation | +0.642 |
investig | +0.639 |
Neg logit contributions | |
Worcester | -1.032 |
Dartmouth | -1.012 |
heit | -0.951 |
ocene | -0.923 |
hester | -0.921 |
Token | references |
Token ID | 10288 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
Worcester | +1.198 |
Dartmouth | +1.172 |
heit | +1.087 |
Lansing | +1.053 |
ocene | +1.048 |
Neg logit contributions | |
nsic | -1.001 |
smuggling | -0.997 |
Machina | -0.973 |
interrogation | -0.964 |
table | -0.963 |
Token | and |
Token ID | 290 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
smuggling | +0.701 |
nsic | +0.693 |
Machina | +0.677 |
interrogation | +0.671 |
table | +0.671 |
Neg logit contributions | |
Worcester | -0.916 |
Dartmouth | -0.895 |
heit | -0.840 |
ocene | -0.816 |
hester | -0.812 |
Token | go |
Token ID | 467 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
Worcester | +0.493 |
Dartmouth | +0.483 |
heit | +0.451 |
ocene | +0.437 |
Lansing | +0.437 |
Neg logit contributions | |
smuggling | -0.356 |
nsic | -0.356 |
Machina | -0.346 |
interrogation | -0.343 |
table | -0.343 |
Token | through |
Token ID | 832 |
Feature activation | -4.53e+00 |
Pos logit contributions | |
Worcester | +0.228 |
Dartmouth | +0.223 |
heit | +0.207 |
ocene | +0.201 |
Lansing | +0.200 |
Neg logit contributions | |
nsic | -0.182 |
smuggling | -0.181 |
Machina | -0.175 |
table | -0.175 |
interrogation | -0.174 |
Token | the |
Token ID | 262 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
Worcester | +3.587 |
Dartmouth | +3.506 |
heit | +3.207 |
Lansing | +3.159 |
hester | +3.082 |
Neg logit contributions | |
nsic | -2.991 |
smuggling | -2.944 |
Machina | -2.911 |
xual | -2.898 |
Khe | -2.885 |
Token | Better |
Token ID | 11625 |
Feature activation | -2.69e-01 |
Pos logit contributions | |
Worcester | +0.196 |
Dartmouth | +0.192 |
heit | +0.180 |
ocene | +0.174 |
Lansing | +0.174 |
Neg logit contributions | |
smuggling | -0.146 |
nsic | -0.145 |
Machina | -0.141 |
interrogation | -0.140 |
table | -0.140 |
Token | Business |
Token ID | 7320 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
Worcester | +0.223 |
Dartmouth | +0.220 |
heit | +0.205 |
ocene | +0.199 |
hester | +0.198 |
Neg logit contributions | |
smuggling | -0.167 |
nsic | -0.166 |
Machina | -0.162 |
interrogation | -0.160 |
investig | -0.159 |
Token | Bureau |
Token ID | 9840 |
Feature activation | +9.71e-01 |
Pos logit contributions | |
Worcester | +0.538 |
Dartmouth | +0.523 |
heit | +0.478 |
Lansing | +0.461 |
ocene | +0.459 |
Neg logit contributions | |
nsic | -0.638 |
smuggling | -0.636 |
Machina | -0.622 |
interrogation | -0.618 |
table | -0.617 |
Token | . |
Token ID | 13 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
smuggling | +0.639 |
nsic | +0.634 |
interrogation | +0.618 |
Machina | +0.617 |
investig | +0.614 |
Neg logit contributions | |
Worcester | -0.776 |
Dartmouth | -0.759 |
heit | -0.707 |
ocene | -0.688 |
hester | -0.684 |
Token | data |
Token ID | 1366 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
nsic | +0.171 |
smuggling | +0.170 |
Machina | +0.165 |
table | +0.164 |
interrogation | +0.164 |
Neg logit contributions | |
Worcester | -0.283 |
Dartmouth | -0.277 |
heit | -0.260 |
Lansing | -0.253 |
ocene | -0.252 |
Token | in |
Token ID | 287 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
nsic | +0.086 |
smuggling | +0.086 |
Machina | +0.083 |
table | +0.083 |
interrogation | +0.083 |
Neg logit contributions | |
Worcester | -0.115 |
Dartmouth | -0.113 |
heit | -0.105 |
Lansing | -0.102 |
ocene | -0.102 |
Token | instead |
Token ID | 2427 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
nsic | +0.083 |
smuggling | +0.083 |
Machina | +0.081 |
interrogation | +0.080 |
table | +0.080 |
Neg logit contributions | |
Worcester | -0.098 |
Dartmouth | -0.096 |
heit | -0.089 |
Lansing | -0.086 |
ocene | -0.086 |
Token | of |
Token ID | 286 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
Worcester | +0.267 |
Dartmouth | +0.261 |
heit | +0.245 |
Lansing | +0.238 |
ocene | +0.238 |
Neg logit contributions | |
nsic | -0.166 |
smuggling | -0.166 |
Machina | -0.161 |
interrogation | -0.159 |
table | -0.158 |
Token | going |
Token ID | 1016 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
Worcester | +0.944 |
Dartmouth | +0.925 |
heit | +0.859 |
Lansing | +0.834 |
ocene | +0.827 |
Neg logit contributions | |
nsic | -0.764 |
smuggling | -0.758 |
Machina | -0.739 |
interrogation | -0.734 |
table | -0.732 |
Token | through |
Token ID | 832 |
Feature activation | -4.47e+00 |
Pos logit contributions | |
nsic | +0.270 |
smuggling | +0.270 |
Machina | +0.263 |
table | +0.262 |
interrogation | +0.260 |
Neg logit contributions | |
Worcester | -0.333 |
Dartmouth | -0.326 |
heit | -0.303 |
ocene | -0.293 |
Lansing | -0.293 |
Token | std |
Token ID | 14367 |
Feature activation | +1.96e+00 |
Pos logit contributions | |
Worcester | +3.202 |
Dartmouth | +3.162 |
heit | +2.917 |
Lansing | +2.827 |
hester | +2.783 |
Neg logit contributions | |
smuggling | -3.192 |
nsic | -3.187 |
Machina | -3.095 |
investig | -3.094 |
xual | -3.078 |
Token | :: |
Token ID | 3712 |
Feature activation | +2.77e+00 |
Pos logit contributions | |
nsic | +1.275 |
smuggling | +1.269 |
table | +1.241 |
Machina | +1.234 |
interrogation | +1.227 |
Neg logit contributions | |
Worcester | -1.593 |
Dartmouth | -1.561 |
heit | -1.451 |
Lansing | -1.401 |
hester | -1.401 |
Token | ist |
Token ID | 396 |
Feature activation | +1.95e+00 |
Pos logit contributions | |
nsic | +1.768 |
table | +1.735 |
smuggling | +1.728 |
Machina | +1.685 |
interrogation | +1.671 |
Neg logit contributions | |
Worcester | -2.296 |
Dartmouth | -2.249 |
heit | -2.081 |
Lansing | -2.019 |
hester | -2.007 |
Token | ream |
Token ID | 1476 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
nsic | +1.261 |
smuggling | +1.259 |
Machina | +1.225 |
table | +1.223 |
interrogation | +1.215 |
Neg logit contributions | |
Worcester | -1.584 |
Dartmouth | -1.547 |
heit | -1.441 |
Lansing | -1.391 |
hester | -1.387 |
Token | . |
Token ID | 13 |
Feature activation | -2.57e-01 |
Pos logit contributions | |
nsic | +0.901 |
smuggling | +0.899 |
Machina | +0.874 |
table | +0.873 |
interrogation | +0.868 |
Neg logit contributions | |
Worcester | -1.165 |
Dartmouth | -1.141 |
heit | -1.059 |
Lansing | -1.025 |
ocene | -1.024 |
Token | , |
Token ID | 11 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
nsic | +0.315 |
smuggling | +0.314 |
Machina | +0.306 |
interrogation | +0.303 |
table | +0.303 |
Neg logit contributions | |
Worcester | -0.422 |
Dartmouth | -0.413 |
heit | -0.386 |
Lansing | -0.374 |
ocene | -0.373 |
Token | and |
Token ID | 290 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
nsic | +0.374 |
smuggling | +0.373 |
Machina | +0.363 |
interrogation | +0.360 |
table | +0.359 |
Neg logit contributions | |
Worcester | -0.477 |
Dartmouth | -0.467 |
heit | -0.435 |
Lansing | -0.421 |
ocene | -0.420 |
Token | the |
Token ID | 262 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
nsic | +0.232 |
smuggling | +0.232 |
Machina | +0.226 |
interrogation | +0.224 |
table | +0.224 |
Neg logit contributions | |
Worcester | -0.293 |
Dartmouth | -0.287 |
heit | -0.267 |
Lansing | -0.258 |
ocene | -0.258 |
Token | close |
Token ID | 1969 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
nsic | +0.078 |
smuggling | +0.077 |
Machina | +0.075 |
table | +0.074 |
interrogation | +0.074 |
Neg logit contributions | |
Worcester | -0.125 |
Dartmouth | -0.122 |
heit | -0.115 |
Lansing | -0.111 |
ocene | -0.111 |
Token | relationship |
Token ID | 2776 |
Feature activation | -1.81e+00 |
Pos logit contributions | |
nsic | +0.491 |
smuggling | +0.488 |
Machina | +0.469 |
table | +0.461 |
interrogation | +0.461 |
Neg logit contributions | |
Worcester | -1.278 |
Dartmouth | -1.257 |
heit | -1.189 |
Lansing | -1.161 |
ocene | -1.159 |
Token | between |
Token ID | 1022 |
Feature activation | -4.47e+00 |
Pos logit contributions | |
Worcester | +1.438 |
Dartmouth | +1.414 |
heit | +1.304 |
Lansing | +1.263 |
ocene | +1.259 |
Neg logit contributions | |
nsic | -1.203 |
smuggling | -1.187 |
Machina | -1.163 |
table | -1.147 |
interrogation | -1.147 |
Token | academic |
Token ID | 8233 |
Feature activation | +1.89e-01 |
Pos logit contributions | |
Worcester | +4.126 |
Dartmouth | +4.095 |
heit | +3.743 |
Lansing | +3.671 |
hester | +3.616 |
Neg logit contributions | |
nsic | -2.396 |
smuggling | -2.276 |
xual | -2.260 |
Machina | -2.250 |
table | -2.247 |
Token | researchers |
Token ID | 4837 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
nsic | +0.104 |
smuggling | +0.103 |
Machina | +0.100 |
table | +0.099 |
Khe | +0.099 |
Neg logit contributions | |
Worcester | -0.172 |
Dartmouth | -0.169 |
heit | -0.158 |
Lansing | -0.154 |
ocene | -0.153 |
Token | and |
Token ID | 290 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
nsic | +0.139 |
smuggling | +0.139 |
Machina | +0.135 |
interrogation | +0.134 |
table | +0.134 |
Neg logit contributions | |
Worcester | -0.179 |
Dartmouth | -0.175 |
heit | -0.163 |
Lansing | -0.158 |
ocene | -0.158 |
Token | the |
Token ID | 262 |
Feature activation | -6.50e-03 |
Pos logit contributions | |
nsic | +0.124 |
smuggling | +0.124 |
Machina | +0.121 |
table | +0.120 |
interrogation | +0.119 |
Neg logit contributions | |
Worcester | -0.166 |
Dartmouth | -0.163 |
heit | -0.152 |
Lansing | -0.147 |
ocene | -0.146 |
Token | pharmaceutical |
Token ID | 18423 |
Feature activation | -8.55e-01 |
Pos logit contributions | |
Worcester | +0.006 |
Dartmouth | +0.006 |
heit | +0.006 |
Lansing | +0.005 |
ocene | +0.005 |
Neg logit contributions | |
nsic | -0.003 |
smuggling | -0.003 |
Machina | -0.003 |
table | -0.003 |
interrogation | -0.003 |
Token | - |
Token ID | 12 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
smuggling | +0.415 |
nsic | +0.408 |
table | +0.396 |
Machina | +0.394 |
interrogation | +0.394 |
Neg logit contributions | |
Worcester | -0.696 |
Dartmouth | -0.682 |
heit | -0.643 |
hester | -0.627 |
ocene | -0.626 |
Token | on |
Token ID | 261 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
Worcester | +0.143 |
Dartmouth | +0.140 |
heit | +0.130 |
Lansing | +0.126 |
ocene | +0.126 |
Neg logit contributions | |
nsic | -0.106 |
smuggling | -0.106 |
Machina | -0.103 |
interrogation | -0.102 |
table | -0.102 |
Token | baggage |
Token ID | 30466 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
Worcester | +0.271 |
Dartmouth | +0.266 |
heit | +0.250 |
Lansing | +0.243 |
ocene | +0.242 |
Neg logit contributions | |
nsic | -0.150 |
smuggling | -0.149 |
Machina | -0.144 |
table | -0.142 |
interrogation | -0.142 |
Token | when |
Token ID | 618 |
Feature activation | -4.19e-01 |
Pos logit contributions | |
smuggling | +0.268 |
nsic | +0.267 |
Machina | +0.259 |
interrogation | +0.258 |
table | +0.257 |
Neg logit contributions | |
Worcester | -0.336 |
Dartmouth | -0.328 |
heit | -0.306 |
ocene | -0.297 |
Lansing | -0.297 |
Token | going |
Token ID | 1016 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
Worcester | +0.313 |
Dartmouth | +0.305 |
heit | +0.282 |
Lansing | +0.272 |
ocene | +0.270 |
Neg logit contributions | |
nsic | -0.298 |
smuggling | -0.296 |
Machina | -0.291 |
table | -0.288 |
interrogation | -0.287 |
Token | through |
Token ID | 832 |
Feature activation | -4.46e+00 |
Pos logit contributions | |
Worcester | +0.339 |
Dartmouth | +0.332 |
heit | +0.309 |
ocene | +0.299 |
Lansing | +0.298 |
Neg logit contributions | |
smuggling | -0.287 |
nsic | -0.286 |
Machina | -0.278 |
interrogation | -0.277 |
table | -0.277 |
Token | airline |
Token ID | 18091 |
Feature activation | -8.05e-01 |
Pos logit contributions | |
Worcester | +4.074 |
Dartmouth | +3.995 |
heit | +3.743 |
Lansing | +3.634 |
hester | +3.524 |
Neg logit contributions | |
nsic | -2.412 |
Machina | -2.350 |
xual | -2.342 |
smuggling | -2.286 |
table | -2.277 |
Token | security |
Token ID | 2324 |
Feature activation | -6.14e-01 |
Pos logit contributions | |
Worcester | +0.805 |
Dartmouth | +0.792 |
heit | +0.748 |
Lansing | +0.729 |
hester | +0.719 |
Neg logit contributions | |
nsic | -0.370 |
smuggling | -0.355 |
Machina | -0.353 |
xual | -0.351 |
table | -0.346 |
Token | . |
Token ID | 13 |
Feature activation | +8.39e-01 |
Pos logit contributions | |
Worcester | +0.608 |
Dartmouth | +0.597 |
heit | +0.560 |
Lansing | +0.549 |
ocene | +0.544 |
Neg logit contributions | |
nsic | -0.287 |
smuggling | -0.283 |
Machina | -0.275 |
table | -0.271 |
xual | -0.271 |
Token | Given |
Token ID | 11259 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
nsic | +0.559 |
smuggling | +0.557 |
Machina | +0.548 |
table | +0.545 |
Khe | +0.544 |
Neg logit contributions | |
Worcester | -0.653 |
Dartmouth | -0.639 |
heit | -0.599 |
ocene | -0.583 |
hester | -0.580 |
Token | the |
Token ID | 262 |
Feature activation | +4.13e-01 |
Pos logit contributions | |
Worcester | +0.738 |
Dartmouth | +0.721 |
heit | +0.666 |
Lansing | +0.643 |
ocene | +0.641 |
Neg logit contributions | |
nsic | -0.703 |
smuggling | -0.701 |
Machina | -0.685 |
interrogation | -0.679 |
table | -0.679 |
Token | or |
Token ID | 393 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
Worcester | +0.521 |
Dartmouth | +0.511 |
heit | +0.472 |
Lansing | +0.457 |
ocene | +0.456 |
Neg logit contributions | |
nsic | -0.434 |
smuggling | -0.428 |
Machina | -0.418 |
table | -0.415 |
xual | -0.413 |
Token | tribe |
Token ID | 14893 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
nsic | +0.020 |
smuggling | +0.019 |
Machina | +0.019 |
table | +0.019 |
interrogation | +0.019 |
Neg logit contributions | |
Worcester | -0.031 |
Dartmouth | -0.031 |
heit | -0.029 |
Lansing | -0.028 |
ocene | -0.028 |
Token | respecting |
Token ID | 30796 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
Worcester | +1.032 |
Dartmouth | +1.011 |
heit | +0.935 |
Lansing | +0.911 |
ocene | +0.902 |
Neg logit contributions | |
nsic | -0.764 |
smuggling | -0.747 |
Machina | -0.731 |
table | -0.727 |
xual | -0.727 |
Token | a |
Token ID | 257 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
nsic | +0.185 |
smuggling | +0.182 |
Machina | +0.179 |
table | +0.177 |
Khe | +0.177 |
Neg logit contributions | |
Worcester | -0.217 |
Dartmouth | -0.213 |
heit | -0.196 |
Lansing | -0.190 |
ocene | -0.188 |
Token | relationship |
Token ID | 2776 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
nsic | +0.012 |
smuggling | +0.012 |
Machina | +0.012 |
table | +0.012 |
interrogation | +0.012 |
Neg logit contributions | |
Worcester | -0.023 |
Dartmouth | -0.023 |
heit | -0.021 |
Lansing | -0.021 |
ocene | -0.021 |
Token | between |
Token ID | 1022 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
Worcester | +0.941 |
Dartmouth | +0.919 |
heit | +0.853 |
Lansing | +0.821 |
ocene | +0.820 |
Neg logit contributions | |
nsic | -0.741 |
smuggling | -0.726 |
Machina | -0.710 |
interrogation | -0.704 |
table | -0.703 |
Token | persons |
Token ID | 6506 |
Feature activation | -7.01e-01 |
Pos logit contributions | |
Worcester | +3.218 |
Dartmouth | +3.142 |
heit | +2.828 |
Lansing | +2.784 |
hester | +2.669 |
Neg logit contributions | |
nsic | -3.286 |
smuggling | -3.149 |
Machina | -3.108 |
table | -3.105 |
interrogation | -3.085 |
Token | of |
Token ID | 286 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
Worcester | +0.605 |
Dartmouth | +0.589 |
heit | +0.543 |
Lansing | +0.534 |
hester | +0.517 |
Neg logit contributions | |
nsic | -0.427 |
smuggling | -0.408 |
xual | -0.406 |
Machina | -0.405 |
table | -0.403 |
Token | the |
Token ID | 262 |
Feature activation | -6.24e-01 |
Pos logit contributions | |
Worcester | +0.973 |
Dartmouth | +0.949 |
heit | +0.871 |
Lansing | +0.842 |
ocene | +0.830 |
Neg logit contributions | |
nsic | -1.000 |
smuggling | -0.985 |
Machina | -0.965 |
table | -0.961 |
interrogation | -0.957 |
Token | same |
Token ID | 976 |
Feature activation | -9.24e-01 |
Pos logit contributions | |
Worcester | +0.478 |
Dartmouth | +0.466 |
heit | +0.430 |
Lansing | +0.416 |
ocene | +0.413 |
Neg logit contributions | |
nsic | -0.436 |
smuggling | -0.431 |
Machina | -0.421 |
table | -0.418 |
interrogation | -0.417 |
Token | sex |
Token ID | 1714 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
Worcester | +0.893 |
Dartmouth | +0.874 |
heit | +0.822 |
Lansing | +0.800 |
ocene | +0.793 |
Neg logit contributions | |
nsic | -0.465 |
smuggling | -0.452 |
Machina | -0.440 |
table | -0.435 |
Khe | -0.432 |
Token | 2 |
Token ID | 362 |
Feature activation | -7.69e-01 |
Pos logit contributions | |
nsic | +0.007 |
smuggling | +0.007 |
Machina | +0.007 |
interrogation | +0.007 |
table | +0.007 |
Neg logit contributions | |
Worcester | -0.013 |
Dartmouth | -0.013 |
heit | -0.012 |
Lansing | -0.012 |
ocene | -0.012 |
Token | lifetime |
Token ID | 10869 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
Worcester | +0.608 |
Dartmouth | +0.595 |
heit | +0.553 |
Lansing | +0.535 |
ocene | +0.533 |
Neg logit contributions | |
smuggling | -0.512 |
nsic | -0.512 |
Machina | -0.498 |
interrogation | -0.495 |
table | -0.494 |
Token | then |
Token ID | 788 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
smuggling | +0.383 |
nsic | +0.382 |
Machina | +0.372 |
interrogation | +0.370 |
table | +0.370 |
Neg logit contributions | |
Worcester | -0.522 |
Dartmouth | -0.511 |
heit | -0.477 |
Lansing | -0.463 |
hester | -0.463 |
Token | involves |
Token ID | 9018 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
smuggling | +0.224 |
nsic | +0.224 |
Machina | +0.218 |
table | +0.216 |
interrogation | +0.216 |
Neg logit contributions | |
Worcester | -0.322 |
Dartmouth | -0.315 |
heit | -0.295 |
ocene | -0.286 |
Lansing | -0.286 |
Token | exchanges |
Token ID | 14525 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
Worcester | +1.254 |
Dartmouth | +1.226 |
heit | +1.136 |
Lansing | +1.099 |
ocene | +1.095 |
Neg logit contributions | |
nsic | -1.106 |
smuggling | -1.102 |
Machina | -1.076 |
table | -1.066 |
interrogation | -1.066 |
Token | between |
Token ID | 1022 |
Feature activation | -4.41e+00 |
Pos logit contributions | |
Worcester | +0.402 |
Dartmouth | +0.394 |
heit | +0.369 |
Lansing | +0.358 |
ocene | +0.357 |
Neg logit contributions | |
nsic | -0.271 |
smuggling | -0.270 |
Machina | -0.263 |
table | -0.260 |
interrogation | -0.260 |
Token | surface |
Token ID | 4417 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
Worcester | +3.430 |
Dartmouth | +3.361 |
heit | +3.080 |
Lansing | +3.010 |
ocene | +2.984 |
Neg logit contributions | |
nsic | -2.990 |
smuggling | -2.926 |
Machina | -2.863 |
xual | -2.853 |
table | -2.848 |
Token | ocean |
Token ID | 9151 |
Feature activation | +7.39e-01 |
Pos logit contributions | |
Worcester | +0.152 |
Dartmouth | +0.148 |
heit | +0.138 |
Lansing | +0.134 |
hester | +0.134 |
Neg logit contributions | |
nsic | -0.115 |
smuggling | -0.115 |
Machina | -0.111 |
interrogation | -0.111 |
table | -0.110 |
Token | and |
Token ID | 290 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
smuggling | +0.448 |
nsic | +0.448 |
Machina | +0.434 |
interrogation | +0.434 |
table | +0.433 |
Neg logit contributions | |
Worcester | -0.626 |
Dartmouth | -0.614 |
heit | -0.574 |
hester | -0.557 |
Lansing | -0.555 |
Token | deep |
Token ID | 2769 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
smuggling | +0.758 |
nsic | +0.755 |
Machina | +0.739 |
interrogation | +0.734 |
table | +0.732 |
Neg logit contributions | |
Worcester | -0.954 |
Dartmouth | -0.933 |
heit | -0.875 |
hester | -0.848 |
Lansing | -0.842 |
Token | oceans |
Token ID | 23744 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
nsic | +0.226 |
smuggling | +0.226 |
Machina | +0.219 |
interrogation | +0.218 |
table | +0.218 |
Neg logit contributions | |
Worcester | -0.326 |
Dartmouth | -0.320 |
heit | -0.299 |
Lansing | -0.290 |
hester | -0.290 |
Token | , |
Token ID | 11 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
Worcester | +0.994 |
Dartmouth | +0.974 |
heit | +0.912 |
ocene | +0.882 |
Lansing | +0.881 |
Neg logit contributions | |
nsic | -0.730 |
smuggling | -0.729 |
Machina | -0.711 |
table | -0.706 |
interrogation | -0.703 |
Token | but |
Token ID | 475 |
Feature activation | -3.00e-02 |
Pos logit contributions | |
Worcester | +0.012 |
Dartmouth | +0.012 |
heit | +0.011 |
ocene | +0.011 |
hester | +0.011 |
Neg logit contributions | |
smuggling | -0.009 |
nsic | -0.009 |
Machina | -0.009 |
interrogation | -0.009 |
Khe | -0.009 |
Token | if |
Token ID | 611 |
Feature activation | -6.43e-01 |
Pos logit contributions | |
Worcester | +0.023 |
Dartmouth | +0.022 |
heit | +0.021 |
ocene | +0.020 |
hester | +0.020 |
Neg logit contributions | |
smuggling | -0.021 |
nsic | -0.021 |
Machina | -0.020 |
table | -0.020 |
interrogation | -0.020 |
Token | the |
Token ID | 262 |
Feature activation | -7.71e-01 |
Pos logit contributions | |
Worcester | +0.473 |
Dartmouth | +0.462 |
heit | +0.428 |
ocene | +0.413 |
Lansing | +0.412 |
Neg logit contributions | |
smuggling | -0.462 |
nsic | -0.462 |
Machina | -0.452 |
table | -0.448 |
interrogation | -0.447 |
Token | offline |
Token ID | 18043 |
Feature activation | -2.15e+00 |
Pos logit contributions | |
Worcester | +0.626 |
Dartmouth | +0.612 |
heit | +0.568 |
Lansing | +0.551 |
ocene | +0.548 |
Neg logit contributions | |
nsic | -0.500 |
smuggling | -0.497 |
Machina | -0.484 |
interrogation | -0.480 |
table | -0.480 |
Token | qualifier |
Token ID | 39265 |
Feature activation | -4.35e+00 |
Pos logit contributions | |
Worcester | +1.680 |
Dartmouth | +1.640 |
heit | +1.514 |
Lansing | +1.477 |
hester | +1.457 |
Neg logit contributions | |
nsic | -1.459 |
smuggling | -1.446 |
Machina | -1.410 |
xual | -1.398 |
interrogation | -1.395 |
Token | where |
Token ID | 810 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
Worcester | +3.414 |
Dartmouth | +3.323 |
heit | +3.045 |
Lansing | +2.990 |
hester | +2.916 |
Neg logit contributions | |
nsic | -2.971 |
smuggling | -2.883 |
xual | -2.815 |
Machina | -2.800 |
interrogation | -2.788 |
Token | they |
Token ID | 484 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
Worcester | +0.275 |
Dartmouth | +0.269 |
heit | +0.250 |
ocene | +0.242 |
Lansing | +0.241 |
Neg logit contributions | |
smuggling | -0.247 |
nsic | -0.246 |
Machina | -0.241 |
table | -0.239 |
interrogation | -0.238 |
Token | secured |
Token ID | 13659 |
Feature activation | -7.22e-01 |
Pos logit contributions | |
Worcester | +0.420 |
Dartmouth | +0.411 |
heit | +0.383 |
Lansing | +0.371 |
ocene | +0.370 |
Neg logit contributions | |
smuggling | -0.340 |
nsic | -0.339 |
Machina | -0.331 |
table | -0.329 |
interrogation | -0.328 |
Token | their |
Token ID | 511 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
Worcester | +0.544 |
Dartmouth | +0.533 |
heit | +0.498 |
ocene | +0.481 |
hester | +0.480 |
Neg logit contributions | |
smuggling | -0.504 |
nsic | -0.498 |
Machina | -0.492 |
table | -0.488 |
interrogation | -0.487 |
Token | spot |
Token ID | 4136 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
Worcester | +0.089 |
Dartmouth | +0.087 |
heit | +0.081 |
ocene | +0.078 |
hester | +0.078 |
Neg logit contributions | |
smuggling | -0.079 |
nsic | -0.078 |
Machina | -0.077 |
interrogation | -0.076 |
table | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
smuggling | +1.334 |
nsic | +1.322 |
Machina | +1.316 |
table | +1.302 |
interrogation | +1.288 |
Neg logit contributions | |
Worcester | -1.941 |
Dartmouth | -1.910 |
heit | -1.784 |
hester | -1.737 |
ocene | -1.735 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.60e-01 |
Pos logit contributions | |
Worcester | +0.270 |
Dartmouth | +0.264 |
heit | +0.248 |
ocene | +0.239 |
hester | +0.238 |
Neg logit contributions | |
nsic | -0.223 |
smuggling | -0.223 |
Machina | -0.220 |
table | -0.218 |
Khe | -0.216 |
Token | What |
Token ID | 2061 |
Feature activation | -9.96e-01 |
Pos logit contributions | |
Worcester | +0.328 |
Dartmouth | +0.320 |
heit | +0.294 |
Lansing | +0.284 |
ocene | +0.283 |
Neg logit contributions | |
nsic | -0.342 |
smuggling | -0.341 |
Machina | -0.335 |
table | -0.333 |
interrogation | -0.332 |
Token | do |
Token ID | 466 |
Feature activation | +9.97e-01 |
Pos logit contributions | |
Worcester | +0.795 |
Dartmouth | +0.776 |
heit | +0.723 |
ocene | +0.699 |
Lansing | +0.699 |
Neg logit contributions | |
smuggling | -0.656 |
nsic | -0.655 |
Machina | -0.639 |
interrogation | -0.633 |
table | -0.633 |
Token | you |
Token ID | 345 |
Feature activation | +2.50e+00 |
Pos logit contributions | |
smuggling | +0.684 |
nsic | +0.677 |
Machina | +0.665 |
interrogation | +0.661 |
table | +0.658 |
Neg logit contributions | |
Worcester | -0.767 |
Dartmouth | -0.748 |
heit | -0.702 |
ocene | -0.677 |
hester | -0.673 |
Token | call |
Token ID | 869 |
Feature activation | +3.91e+00 |
Pos logit contributions | |
smuggling | +1.542 |
nsic | +1.498 |
Machina | +1.483 |
interrogation | +1.474 |
table | +1.470 |
Neg logit contributions | |
Worcester | -2.097 |
Dartmouth | -2.055 |
heit | -1.938 |
ocene | -1.874 |
hester | -1.864 |
Token | a |
Token ID | 257 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
smuggling | +2.675 |
Machina | +2.604 |
nsic | +2.602 |
interrogation | +2.574 |
Khe | +2.566 |
Neg logit contributions | |
Worcester | -2.973 |
Dartmouth | -2.903 |
heit | -2.744 |
hester | -2.655 |
ocene | -2.653 |
Token | guy |
Token ID | 3516 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
Worcester | +0.273 |
Dartmouth | +0.268 |
heit | +0.250 |
Lansing | +0.243 |
ocene | +0.242 |
Neg logit contributions | |
nsic | -0.196 |
smuggling | -0.196 |
Machina | -0.190 |
interrogation | -0.189 |
table | -0.188 |
Token | who |
Token ID | 508 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
Worcester | +1.262 |
Dartmouth | +1.234 |
heit | +1.144 |
Lansing | +1.108 |
ocene | +1.104 |
Neg logit contributions | |
nsic | -1.069 |
smuggling | -1.064 |
Machina | -1.040 |
interrogation | -1.030 |
table | -1.029 |
Token | smokes |
Token ID | 44589 |
Feature activation | +5.53e-01 |
Pos logit contributions | |
Worcester | +0.308 |
Dartmouth | +0.302 |
heit | +0.281 |
Lansing | +0.272 |
ocene | +0.272 |
Neg logit contributions | |
smuggling | -0.251 |
nsic | -0.251 |
Machina | -0.244 |
interrogation | -0.242 |
table | -0.241 |
Token | meat |
Token ID | 6174 |
Feature activation | +7.35e-01 |
Pos logit contributions | |
nsic | +0.321 |
smuggling | +0.320 |
Machina | +0.311 |
interrogation | +0.308 |
table | +0.308 |
Neg logit contributions | |
Worcester | -0.484 |
Dartmouth | -0.475 |
heit | -0.444 |
Lansing | -0.431 |
ocene | -0.431 |
Token | I |
Token ID | 314 |
Feature activation | -6.41e-01 |
Pos logit contributions | |
smuggling | +0.699 |
nsic | +0.695 |
Machina | +0.678 |
interrogation | +0.676 |
table | +0.675 |
Neg logit contributions | |
Worcester | -0.697 |
Dartmouth | -0.679 |
heit | -0.629 |
ocene | -0.607 |
hester | -0.607 |
Token | have |
Token ID | 423 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Worcester | +0.513 |
Dartmouth | +0.503 |
heit | +0.467 |
Lansing | +0.450 |
ocene | +0.448 |
Neg logit contributions | |
nsic | -0.421 |
smuggling | -0.417 |
Machina | -0.409 |
table | -0.404 |
interrogation | -0.403 |
Token | to |
Token ID | 284 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
nsic | +0.398 |
smuggling | +0.398 |
Machina | +0.387 |
interrogation | +0.385 |
table | +0.384 |
Neg logit contributions | |
Worcester | -0.446 |
Dartmouth | -0.436 |
heit | -0.405 |
Lansing | -0.391 |
ocene | -0.391 |
Token | give |
Token ID | 1577 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
nsic | +0.341 |
smuggling | +0.339 |
Machina | +0.330 |
table | +0.326 |
interrogation | +0.326 |
Neg logit contributions | |
Worcester | -0.501 |
Dartmouth | -0.491 |
heit | -0.459 |
Lansing | -0.445 |
ocene | -0.444 |
Token | you |
Token ID | 345 |
Feature activation | +8.16e-01 |
Pos logit contributions | |
smuggling | +0.237 |
nsic | +0.236 |
Machina | +0.229 |
interrogation | +0.229 |
table | +0.228 |
Neg logit contributions | |
Worcester | -0.260 |
Dartmouth | -0.253 |
heit | -0.236 |
ocene | -0.228 |
Lansing | -0.227 |
Token | caveat |
Token ID | 36531 |
Feature activation | +3.24e+00 |
Pos logit contributions | |
smuggling | +0.604 |
nsic | +0.601 |
Machina | +0.587 |
interrogation | +0.585 |
table | +0.584 |
Neg logit contributions | |
Worcester | -0.584 |
Dartmouth | -0.569 |
heit | -0.527 |
ocene | -0.509 |
hester | -0.507 |
Token | which |
Token ID | 543 |
Feature activation | +3.98e-01 |
Pos logit contributions | |
smuggling | +2.128 |
nsic | +2.120 |
table | +2.074 |
Machina | +2.064 |
interrogation | +2.061 |
Neg logit contributions | |
Worcester | -2.588 |
Dartmouth | -2.520 |
heit | -2.338 |
ocene | -2.281 |
Lansing | -2.270 |
Token | is |
Token ID | 318 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
nsic | +0.262 |
smuggling | +0.261 |
Machina | +0.254 |
interrogation | +0.252 |
table | +0.252 |
Neg logit contributions | |
Worcester | -0.317 |
Dartmouth | -0.310 |
heit | -0.289 |
Lansing | -0.279 |
ocene | -0.279 |
Token | that |
Token ID | 326 |
Feature activation | -3.60e-01 |
Pos logit contributions | |
Worcester | +0.027 |
Dartmouth | +0.026 |
heit | +0.024 |
Lansing | +0.023 |
ocene | +0.023 |
Neg logit contributions | |
smuggling | -0.024 |
nsic | -0.024 |
Machina | -0.023 |
table | -0.023 |
interrogation | -0.023 |
Token | we |
Token ID | 356 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
Worcester | +0.266 |
Dartmouth | +0.259 |
heit | +0.240 |
Lansing | +0.231 |
ocene | +0.231 |
Neg logit contributions | |
nsic | -0.259 |
smuggling | -0.259 |
Machina | -0.253 |
interrogation | -0.251 |
table | -0.251 |
Token | don |
Token ID | 836 |
Feature activation | +9.98e-01 |
Pos logit contributions | |
nsic | +0.249 |
smuggling | +0.249 |
Machina | +0.243 |
interrogation | +0.240 |
table | +0.240 |
Neg logit contributions | |
Worcester | -0.289 |
Dartmouth | -0.283 |
heit | -0.262 |
Lansing | -0.254 |
ocene | -0.253 |
Token | be |
Token ID | 307 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
smuggling | +0.260 |
nsic | +0.259 |
Machina | +0.252 |
table | +0.250 |
interrogation | +0.249 |
Neg logit contributions | |
Worcester | -0.416 |
Dartmouth | -0.408 |
heit | -0.382 |
Lansing | -0.372 |
ocene | -0.372 |
Token | possible |
Token ID | 1744 |
Feature activation | -2.62e+00 |
Pos logit contributions | |
Worcester | +0.205 |
Dartmouth | +0.200 |
heit | +0.186 |
ocene | +0.179 |
Lansing | +0.179 |
Neg logit contributions | |
smuggling | -0.191 |
nsic | -0.190 |
Machina | -0.186 |
table | -0.184 |
interrogation | -0.184 |
Token | due |
Token ID | 2233 |
Feature activation | -1.63e+00 |
Pos logit contributions | |
Worcester | +2.128 |
Dartmouth | +2.083 |
heit | +1.923 |
Lansing | +1.881 |
hester | +1.860 |
Neg logit contributions | |
nsic | -1.704 |
smuggling | -1.674 |
Machina | -1.640 |
xual | -1.624 |
interrogation | -1.623 |
Token | to |
Token ID | 284 |
Feature activation | -2.43e-02 |
Pos logit contributions | |
Worcester | +1.275 |
Dartmouth | +1.247 |
heit | +1.156 |
Lansing | +1.120 |
ocene | +1.115 |
Neg logit contributions | |
nsic | -1.096 |
smuggling | -1.090 |
Machina | -1.064 |
interrogation | -1.055 |
table | -1.054 |
Token | real |
Token ID | 1103 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
Worcester | +0.019 |
Dartmouth | +0.018 |
heit | +0.017 |
ocene | +0.017 |
hester | +0.017 |
Neg logit contributions | |
smuggling | -0.017 |
nsic | -0.016 |
Machina | -0.016 |
interrogation | -0.016 |
table | -0.016 |
Token | life |
Token ID | 1204 |
Feature activation | +3.21e+00 |
Pos logit contributions | |
nsic | +0.159 |
smuggling | +0.159 |
Machina | +0.154 |
interrogation | +0.153 |
table | +0.153 |
Neg logit contributions | |
Worcester | -0.231 |
Dartmouth | -0.226 |
heit | -0.212 |
Lansing | -0.205 |
ocene | -0.205 |
Token | obligations |
Token ID | 13675 |
Feature activation | +6.43e-01 |
Pos logit contributions | |
smuggling | +1.938 |
nsic | +1.869 |
Machina | +1.859 |
interrogation | +1.857 |
table | +1.849 |
Neg logit contributions | |
Worcester | -2.706 |
Dartmouth | -2.667 |
heit | -2.533 |
ocene | -2.455 |
hester | -2.439 |
Token | . |
Token ID | 13 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
smuggling | +0.400 |
nsic | +0.399 |
Machina | +0.389 |
table | +0.385 |
interrogation | +0.385 |
Neg logit contributions | |
Worcester | -0.536 |
Dartmouth | -0.525 |
heit | -0.491 |
ocene | -0.475 |
Lansing | -0.475 |
Token | That |
Token ID | 1320 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
Worcester | +0.249 |
Dartmouth | +0.244 |
heit | +0.228 |
ocene | +0.220 |
hester | +0.219 |
Neg logit contributions | |
nsic | -0.223 |
smuggling | -0.223 |
Machina | -0.219 |
table | -0.217 |
Khe | -0.217 |
Token | will |
Token ID | 481 |
Feature activation | +6.54e-02 |
Pos logit contributions | |
Worcester | +0.242 |
Dartmouth | +0.237 |
heit | +0.221 |
ocene | +0.214 |
Lansing | +0.213 |
Neg logit contributions | |
smuggling | -0.195 |
nsic | -0.194 |
Machina | -0.189 |
table | -0.188 |
interrogation | -0.188 |
Token | stop |
Token ID | 2245 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
nsic | +0.041 |
smuggling | +0.040 |
Machina | +0.039 |
interrogation | +0.039 |
table | +0.039 |
Neg logit contributions | |
Worcester | -0.055 |
Dartmouth | -0.054 |
heit | -0.050 |
Lansing | -0.048 |
ocene | -0.048 |
Token | - |
Token ID | 12 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
Worcester | +0.677 |
Dartmouth | +0.663 |
heit | +0.617 |
Lansing | +0.598 |
ocene | +0.596 |
Neg logit contributions | |
nsic | -0.530 |
smuggling | -0.529 |
Machina | -0.515 |
interrogation | -0.510 |
table | -0.510 |
Token | and |
Token ID | 392 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
Worcester | +0.124 |
Dartmouth | +0.119 |
heit | +0.107 |
hester | +0.102 |
Lansing | +0.101 |
Neg logit contributions | |
nsic | -0.213 |
smuggling | -0.212 |
table | -0.209 |
Machina | -0.208 |
interrogation | -0.208 |
Token | - |
Token ID | 12 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
Worcester | +0.125 |
Dartmouth | +0.123 |
heit | +0.115 |
ocene | +0.112 |
hester | +0.112 |
Neg logit contributions | |
nsic | -0.080 |
smuggling | -0.080 |
Machina | -0.077 |
interrogation | -0.077 |
table | -0.077 |
Token | a |
Token ID | 64 |
Feature activation | -3.43e-01 |
Pos logit contributions | |
nsic | +0.203 |
smuggling | +0.202 |
table | +0.199 |
Machina | +0.196 |
interrogation | +0.196 |
Neg logit contributions | |
Worcester | -0.258 |
Dartmouth | -0.254 |
heit | -0.234 |
ocene | -0.228 |
Lansing | -0.227 |
Token | - |
Token ID | 12 |
Feature activation | +7.06e-01 |
Pos logit contributions | |
Worcester | +0.312 |
Dartmouth | +0.306 |
heit | +0.287 |
ocene | +0.279 |
Lansing | +0.279 |
Neg logit contributions | |
nsic | -0.188 |
smuggling | -0.188 |
Machina | -0.182 |
table | -0.181 |
interrogation | -0.180 |
Token | half |
Token ID | 13959 |
Feature activation | +3.23e+00 |
Pos logit contributions | |
nsic | +0.339 |
table | +0.336 |
smuggling | +0.335 |
Machina | +0.322 |
interrogation | +0.317 |
Neg logit contributions | |
Worcester | -0.694 |
Dartmouth | -0.684 |
heit | -0.635 |
Lansing | -0.629 |
ocene | -0.627 |
Token | , |
Token ID | 11 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
nsic | +1.862 |
smuggling | +1.836 |
table | +1.798 |
interrogation | +1.787 |
Machina | +1.774 |
Neg logit contributions | |
Worcester | -2.819 |
Dartmouth | -2.778 |
heit | -2.574 |
hester | -2.555 |
ocene | -2.515 |
Token | in |
Token ID | 287 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
Worcester | +0.080 |
Dartmouth | +0.078 |
heit | +0.072 |
ocene | +0.069 |
hester | +0.069 |
Neg logit contributions | |
smuggling | -0.089 |
nsic | -0.089 |
Machina | -0.087 |
table | -0.087 |
interrogation | -0.086 |
Token | 2018 |
Token ID | 2864 |
Feature activation | -6.27e-01 |
Pos logit contributions | |
smuggling | +0.098 |
nsic | +0.098 |
Machina | +0.096 |
interrogation | +0.096 |
investig | +0.095 |
Neg logit contributions | |
Worcester | -0.112 |
Dartmouth | -0.110 |
heit | -0.102 |
ocene | -0.099 |
hester | -0.099 |
Token | there |
Token ID | 612 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
Worcester | +0.519 |
Dartmouth | +0.509 |
heit | +0.474 |
hester | +0.459 |
ocene | +0.458 |
Neg logit contributions | |
nsic | -0.396 |
smuggling | -0.394 |
Machina | -0.383 |
table | -0.381 |
interrogation | -0.381 |
Token | � |
Token ID | 447 |
Feature activation | -1.00e+00 |
Pos logit contributions | |
nsic | +0.458 |
smuggling | +0.454 |
table | +0.445 |
Machina | +0.444 |
interrogation | +0.441 |
Neg logit contributions | |
Worcester | -0.489 |
Dartmouth | -0.478 |
heit | -0.439 |
Lansing | -0.425 |
ocene | -0.425 |
Token | Heath |
Token ID | 25846 |
Feature activation | +9.33e-02 |
Pos logit contributions | |
smuggling | +0.805 |
nsic | +0.804 |
Machina | +0.795 |
table | +0.782 |
interrogation | +0.780 |
Neg logit contributions | |
Worcester | -0.992 |
Dartmouth | -0.977 |
heit | -0.906 |
hester | -0.880 |
Lansing | -0.877 |
Token |
|
Token ID | 198 |
Feature activation | +5.76e-01 |
Pos logit contributions | |
nsic | +0.060 |
smuggling | +0.060 |
Machina | +0.058 |
table | +0.058 |
interrogation | +0.058 |
Neg logit contributions | |
Worcester | -0.076 |
Dartmouth | -0.075 |
heit | -0.069 |
Lansing | -0.067 |
ocene | -0.067 |
Token |
|
Token ID | 198 |
Feature activation | +4.61e-02 |
Pos logit contributions | |
nsic | +0.379 |
smuggling | +0.379 |
Machina | +0.375 |
table | +0.374 |
Khe | +0.368 |
Neg logit contributions | |
Worcester | -0.456 |
Dartmouth | -0.444 |
heit | -0.416 |
ocene | -0.403 |
hester | -0.402 |
Token | M |
Token ID | 44 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
nsic | +0.033 |
smuggling | +0.033 |
Machina | +0.032 |
table | +0.032 |
interrogation | +0.032 |
Neg logit contributions | |
Worcester | -0.034 |
Dartmouth | -0.033 |
heit | -0.031 |
Lansing | -0.030 |
ocene | -0.030 |
Token | ire |
Token ID | 557 |
Feature activation | -7.83e-01 |
Pos logit contributions | |
Worcester | +0.282 |
Dartmouth | +0.275 |
heit | +0.256 |
Lansing | +0.248 |
ocene | +0.247 |
Neg logit contributions | |
nsic | -0.233 |
smuggling | -0.232 |
Machina | -0.226 |
table | -0.224 |
interrogation | -0.224 |
Token | Bl |
Token ID | 1086 |
Feature activation | +3.28e+00 |
Pos logit contributions | |
Worcester | +0.652 |
Dartmouth | +0.637 |
heit | +0.593 |
Lansing | +0.577 |
ocene | +0.575 |
Neg logit contributions | |
nsic | -0.488 |
smuggling | -0.488 |
Machina | -0.472 |
interrogation | -0.470 |
investig | -0.469 |
Token | ight |
Token ID | 432 |
Feature activation | -1.49e+00 |
Pos logit contributions | |
nsic | +1.963 |
Machina | +1.927 |
smuggling | +1.927 |
table | +1.899 |
xual | +1.859 |
Neg logit contributions | |
Worcester | -2.796 |
Dartmouth | -2.746 |
heit | -2.517 |
Lansing | -2.492 |
ocene | -2.463 |
Token | vs |
Token ID | 3691 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
Worcester | +1.236 |
Dartmouth | +1.207 |
heit | +1.129 |
Lansing | +1.093 |
ocene | +1.088 |
Neg logit contributions | |
nsic | -0.944 |
smuggling | -0.942 |
Machina | -0.910 |
interrogation | -0.906 |
investig | -0.904 |
Token | Dark |
Token ID | 3801 |
Feature activation | +2.02e+00 |
Pos logit contributions | |
nsic | +0.123 |
smuggling | +0.122 |
Machina | +0.120 |
interrogation | +0.118 |
table | +0.118 |
Neg logit contributions | |
Worcester | -0.158 |
Dartmouth | -0.155 |
heit | -0.145 |
ocene | -0.140 |
Lansing | -0.140 |
Token | Tut |
Token ID | 22792 |
Feature activation | +6.89e-01 |
Pos logit contributions | |
nsic | +1.326 |
smuggling | +1.318 |
Machina | +1.308 |
table | +1.304 |
Khe | +1.293 |
Neg logit contributions | |
Worcester | -1.588 |
Dartmouth | -1.563 |
heit | -1.441 |
Lansing | -1.403 |
ocene | -1.403 |
Token | el |
Token ID | 417 |
Feature activation | +8.36e-01 |
Pos logit contributions | |
nsic | +0.617 |
smuggling | +0.617 |
Machina | +0.608 |
table | +0.603 |
interrogation | +0.602 |
Neg logit contributions | |
Worcester | -0.384 |
Dartmouth | -0.375 |
heit | -0.335 |
Lansing | -0.320 |
hester | -0.319 |
Token | Pil |
Token ID | 12693 |
Feature activation | +8.78e-01 |
Pos logit contributions | |
Worcester | +0.571 |
Dartmouth | +0.559 |
heit | +0.522 |
Lansing | +0.508 |
ocene | +0.506 |
Neg logit contributions | |
nsic | -0.376 |
smuggling | -0.375 |
Machina | -0.363 |
interrogation | -0.360 |
table | -0.360 |
Token | ots |
Token ID | 1747 |
Feature activation | -7.79e-02 |
Pos logit contributions | |
nsic | +0.392 |
smuggling | +0.391 |
Machina | +0.376 |
table | +0.372 |
interrogation | +0.371 |
Neg logit contributions | |
Worcester | -0.886 |
Dartmouth | -0.871 |
heit | -0.822 |
Lansing | -0.802 |
ocene | -0.801 |
Token | . |
Token ID | 13 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
Worcester | +0.067 |
Dartmouth | +0.065 |
heit | +0.061 |
hester | +0.059 |
ocene | +0.059 |
Neg logit contributions | |
smuggling | -0.047 |
nsic | -0.047 |
Machina | -0.045 |
interrogation | -0.045 |
table | -0.045 |
Token | Alexandria |
Token ID | 27872 |
Feature activation | +9.47e-02 |
Pos logit contributions | |
Worcester | +0.291 |
Dartmouth | +0.285 |
heit | +0.268 |
ocene | +0.257 |
hester | +0.257 |
Neg logit contributions | |
smuggling | -0.284 |
nsic | -0.283 |
Machina | -0.281 |
table | -0.278 |
Khe | -0.278 |
Token | , |
Token ID | 11 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
nsic | +0.057 |
smuggling | +0.057 |
Machina | +0.056 |
table | +0.055 |
interrogation | +0.055 |
Neg logit contributions | |
Worcester | -0.081 |
Dartmouth | -0.079 |
heit | -0.074 |
ocene | -0.072 |
hester | -0.071 |
Token | Va |
Token ID | 17668 |
Feature activation | +1.34e+00 |
Pos logit contributions | |
nsic | +0.252 |
smuggling | +0.252 |
Machina | +0.247 |
table | +0.245 |
Khe | +0.245 |
Neg logit contributions | |
Worcester | -0.305 |
Dartmouth | -0.298 |
heit | -0.282 |
ocene | -0.271 |
hester | -0.269 |
Token | .: |
Token ID | 11207 |
Feature activation | +9.78e-01 |
Pos logit contributions | |
nsic | +0.928 |
smuggling | +0.926 |
Machina | +0.914 |
table | +0.914 |
investig | +0.899 |
Neg logit contributions | |
Worcester | -1.003 |
Dartmouth | -0.976 |
heit | -0.910 |
ocene | -0.871 |
hester | -0.871 |
Token | Time |
Token ID | 3862 |
Feature activation | -1.56e+00 |
Pos logit contributions | |
smuggling | +0.675 |
Machina | +0.671 |
nsic | +0.669 |
Khe | +0.667 |
table | +0.664 |
Neg logit contributions | |
Worcester | -0.725 |
Dartmouth | -0.705 |
heit | -0.673 |
ocene | -0.646 |
hester | -0.641 |
Token | - |
Token ID | 12 |
Feature activation | -8.64e-02 |
Pos logit contributions | |
Worcester | +1.181 |
Dartmouth | +1.154 |
heit | +1.067 |
Lansing | +1.031 |
ocene | +1.029 |
Neg logit contributions | |
nsic | -1.096 |
smuggling | -1.094 |
Machina | -1.068 |
table | -1.059 |
interrogation | -1.059 |
Token | Life |
Token ID | 14662 |
Feature activation | +1.76e+00 |
Pos logit contributions | |
Worcester | +0.058 |
Dartmouth | +0.057 |
heit | +0.052 |
Lansing | +0.050 |
ocene | +0.050 |
Neg logit contributions | |
nsic | -0.068 |
smuggling | -0.068 |
Machina | -0.066 |
table | -0.066 |
interrogation | -0.066 |
Token | Books |
Token ID | 13661 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
smuggling | +1.284 |
nsic | +1.266 |
Machina | +1.264 |
table | +1.248 |
Khe | +1.246 |
Neg logit contributions | |
Worcester | -1.257 |
Dartmouth | -1.237 |
heit | -1.151 |
ocene | -1.112 |
hester | -1.105 |
Token | 47 |
Token ID | 2857 |
Feature activation | +8.87e-01 |
Pos logit contributions | |
nsic | +0.076 |
smuggling | +0.076 |
Machina | +0.073 |
table | +0.073 |
interrogation | +0.073 |
Neg logit contributions | |
Worcester | -0.125 |
Dartmouth | -0.123 |
heit | -0.115 |
Lansing | -0.112 |
ocene | -0.112 |
Token | ] |
Token ID | 60 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
nsic | +0.531 |
table | +0.526 |
Machina | +0.526 |
smuggling | +0.525 |
Khe | +0.511 |
Neg logit contributions | |
Worcester | -0.752 |
Dartmouth | -0.732 |
heit | -0.687 |
ocene | -0.672 |
Lansing | -0.671 |
Token | <@ |
Token ID | 32406 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
Worcester | +0.124 |
Dartmouth | +0.121 |
heit | +0.110 |
Lansing | +0.106 |
ocene | +0.105 |
Neg logit contributions | |
nsic | -0.155 |
smuggling | -0.154 |
Machina | -0.151 |
interrogation | -0.150 |
table | -0.150 |
Token | t |
Token ID | 83 |
Feature activation | -4.25e-01 |
Pos logit contributions | |
nsic | +0.742 |
smuggling | +0.735 |
Machina | +0.720 |
table | +0.717 |
interrogation | +0.713 |
Neg logit contributions | |
Worcester | -0.935 |
Dartmouth | -0.915 |
heit | -0.848 |
Lansing | -0.825 |
ocene | -0.820 |
Token | ay |
Token ID | 323 |
Feature activation | +2.70e+00 |
Pos logit contributions | |
Worcester | +0.325 |
Dartmouth | +0.317 |
heit | +0.290 |
Lansing | +0.285 |
ocene | +0.281 |
Neg logit contributions | |
nsic | -0.297 |
smuggling | -0.295 |
Machina | -0.289 |
table | -0.287 |
interrogation | -0.285 |
Token | l |
Token ID | 75 |
Feature activation | +9.06e-01 |
Pos logit contributions | |
nsic | +1.721 |
smuggling | +1.688 |
Machina | +1.670 |
table | +1.670 |
xual | +1.649 |
Neg logit contributions | |
Worcester | -2.229 |
Dartmouth | -2.185 |
heit | -2.006 |
Lansing | -1.972 |
hester | -1.939 |
Token | ort |
Token ID | 419 |
Feature activation | -7.46e-01 |
Pos logit contributions | |
nsic | +0.612 |
smuggling | +0.611 |
Machina | +0.595 |
interrogation | +0.591 |
table | +0.589 |
Neg logit contributions | |
Worcester | -0.708 |
Dartmouth | -0.693 |
heit | -0.644 |
Lansing | -0.621 |
ocene | -0.621 |
Token | ot |
Token ID | 313 |
Feature activation | -2.35e-01 |
Pos logit contributions | |
Worcester | +0.578 |
Dartmouth | +0.565 |
heit | +0.526 |
Lansing | +0.507 |
ocene | +0.507 |
Neg logit contributions | |
nsic | -0.508 |
smuggling | -0.507 |
Machina | -0.494 |
interrogation | -0.491 |
table | -0.489 |
Token | ft |
Token ID | 701 |
Feature activation | +7.89e-01 |
Pos logit contributions | |
Worcester | +0.181 |
Dartmouth | +0.177 |
heit | +0.164 |
Lansing | +0.158 |
ocene | +0.158 |
Neg logit contributions | |
nsic | -0.162 |
smuggling | -0.162 |
Machina | -0.157 |
interrogation | -0.156 |
table | -0.156 |
Token | w |
Token ID | 86 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
nsic | +0.575 |
smuggling | +0.572 |
Machina | +0.560 |
table | +0.560 |
interrogation | +0.555 |
Neg logit contributions | |
Worcester | -0.576 |
Dartmouth | -0.562 |
heit | -0.515 |
Lansing | -0.500 |
ocene | -0.497 |
Token | > |
Token ID | 29 |
Feature activation | +5.09e-01 |
Pos logit contributions | |
Worcester | +0.341 |
Dartmouth | +0.333 |
heit | +0.305 |
Lansing | +0.293 |
ocene | +0.292 |
Neg logit contributions | |
nsic | -0.397 |
smuggling | -0.397 |
Machina | -0.388 |
interrogation | -0.385 |
table | -0.385 |
Token | , |
Token ID | 11 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
nsic | +0.163 |
smuggling | +0.163 |
Machina | +0.159 |
table | +0.157 |
Khe | +0.157 |
Neg logit contributions | |
Worcester | -0.220 |
Dartmouth | -0.215 |
heit | -0.200 |
Lansing | -0.194 |
ocene | -0.194 |
Token | and |
Token ID | 290 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
nsic | +0.181 |
smuggling | +0.181 |
Machina | +0.176 |
interrogation | +0.174 |
table | +0.174 |
Neg logit contributions | |
Worcester | -0.241 |
Dartmouth | -0.236 |
heit | -0.220 |
Lansing | -0.213 |
ocene | -0.213 |
Token | a |
Token ID | 257 |
Feature activation | -5.31e-02 |
Pos logit contributions | |
smuggling | +0.184 |
nsic | +0.184 |
Machina | +0.180 |
interrogation | +0.178 |
table | +0.178 |
Neg logit contributions | |
Worcester | -0.206 |
Dartmouth | -0.201 |
heit | -0.187 |
Lansing | -0.180 |
ocene | -0.180 |
Token | book |
Token ID | 1492 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
Worcester | +0.044 |
Dartmouth | +0.043 |
heit | +0.040 |
Lansing | +0.039 |
ocene | +0.039 |
Neg logit contributions | |
nsic | -0.033 |
smuggling | -0.033 |
Machina | -0.032 |
interrogation | -0.032 |
table | -0.032 |
Token | of |
Token ID | 286 |
Feature activation | +3.65e-01 |
Pos logit contributions | |
Worcester | +0.150 |
Dartmouth | +0.147 |
heit | +0.137 |
Lansing | +0.133 |
ocene | +0.133 |
Neg logit contributions | |
nsic | -0.114 |
smuggling | -0.114 |
Machina | -0.111 |
interrogation | -0.110 |
table | -0.110 |
Token | unused |
Token ID | 21958 |
Feature activation | +5.59e-01 |
Pos logit contributions | |
nsic | +0.220 |
smuggling | +0.220 |
Machina | +0.214 |
interrogation | +0.212 |
table | +0.212 |
Neg logit contributions | |
Worcester | -0.311 |
Dartmouth | -0.304 |
heit | -0.285 |
Lansing | -0.276 |
ocene | -0.275 |
Token | work |
Token ID | 670 |
Feature activation | -3.47e-01 |
Pos logit contributions | |
nsic | +0.318 |
smuggling | +0.318 |
Machina | +0.309 |
interrogation | +0.306 |
table | +0.305 |
Neg logit contributions | |
Worcester | -0.495 |
Dartmouth | -0.485 |
heit | -0.455 |
Lansing | -0.442 |
ocene | -0.441 |
Token | from |
Token ID | 422 |
Feature activation | -6.93e-03 |
Pos logit contributions | |
Worcester | +0.292 |
Dartmouth | +0.286 |
heit | +0.267 |
Lansing | +0.258 |
ocene | +0.258 |
Neg logit contributions | |
nsic | -0.215 |
smuggling | -0.214 |
Machina | -0.207 |
interrogation | -0.206 |
investig | -0.205 |
Token | between |
Token ID | 1022 |
Feature activation | -2.89e+00 |
Pos logit contributions | |
Worcester | +0.005 |
Dartmouth | +0.005 |
heit | +0.005 |
Lansing | +0.005 |
ocene | +0.005 |
Neg logit contributions | |
smuggling | -0.005 |
nsic | -0.005 |
Machina | -0.005 |
interrogation | -0.005 |
table | -0.005 |
Token | 1985 |
Token ID | 12863 |
Feature activation | -6.54e-01 |
Pos logit contributions | |
Worcester | +2.360 |
Dartmouth | +2.316 |
heit | +2.131 |
Lansing | +2.096 |
ocene | +2.064 |
Neg logit contributions | |
nsic | -1.865 |
smuggling | -1.827 |
xual | -1.781 |
Machina | -1.778 |
investig | -1.768 |
Token | and |
Token ID | 290 |
Feature activation | +6.00e-01 |
Pos logit contributions | |
Worcester | +0.533 |
Dartmouth | +0.522 |
heit | +0.485 |
Lansing | +0.470 |
ocene | +0.469 |
Neg logit contributions | |
nsic | -0.420 |
smuggling | -0.419 |
Machina | -0.408 |
interrogation | -0.404 |
table | -0.404 |
Token | to |
Token ID | 284 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
Worcester | +1.200 |
Dartmouth | +1.174 |
heit | +1.092 |
Lansing | +1.059 |
ocene | +1.054 |
Neg logit contributions | |
nsic | -0.965 |
smuggling | -0.961 |
Machina | -0.935 |
interrogation | -0.928 |
table | -0.926 |
Token | have |
Token ID | 423 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
smuggling | +0.366 |
nsic | +0.363 |
Machina | +0.356 |
interrogation | +0.354 |
table | +0.352 |
Neg logit contributions | |
Worcester | -0.506 |
Dartmouth | -0.496 |
heit | -0.464 |
ocene | -0.449 |
hester | -0.449 |
Token | . |
Token ID | 13 |
Feature activation | +3.36e-02 |
Pos logit contributions | |
Worcester | +0.136 |
Dartmouth | +0.133 |
heit | +0.124 |
Lansing | +0.120 |
ocene | +0.119 |
Neg logit contributions | |
nsic | -0.112 |
smuggling | -0.111 |
Machina | -0.108 |
table | -0.107 |
interrogation | -0.107 |
Token | We |
Token ID | 775 |
Feature activation | +6.02e-01 |
Pos logit contributions | |
nsic | +0.023 |
smuggling | +0.023 |
Machina | +0.023 |
table | +0.023 |
Khe | +0.023 |
Neg logit contributions | |
Worcester | -0.025 |
Dartmouth | -0.025 |
heit | -0.023 |
hester | -0.022 |
ocene | -0.022 |
Token | know |
Token ID | 760 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
smuggling | +0.399 |
nsic | +0.398 |
Machina | +0.390 |
interrogation | +0.387 |
table | +0.386 |
Neg logit contributions | |
Worcester | -0.476 |
Dartmouth | -0.468 |
heit | -0.432 |
hester | -0.420 |
ocene | -0.419 |
Token | the |
Token ID | 262 |
Feature activation | +6.94e-01 |
Pos logit contributions | |
smuggling | +0.667 |
nsic | +0.662 |
Machina | +0.652 |
interrogation | +0.646 |
table | +0.646 |
Neg logit contributions | |
Worcester | -0.820 |
Dartmouth | -0.802 |
heit | -0.751 |
ocene | -0.728 |
hester | -0.725 |
Token | type |
Token ID | 2099 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
nsic | +0.418 |
smuggling | +0.417 |
Machina | +0.405 |
table | +0.401 |
interrogation | +0.401 |
Neg logit contributions | |
Worcester | -0.594 |
Dartmouth | -0.582 |
heit | -0.543 |
Lansing | -0.527 |
ocene | -0.526 |
Token | of |
Token ID | 286 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
nsic | +0.126 |
smuggling | +0.126 |
Machina | +0.122 |
table | +0.121 |
interrogation | +0.121 |
Neg logit contributions | |
Worcester | -0.216 |
Dartmouth | -0.212 |
heit | -0.199 |
Lansing | -0.193 |
hester | -0.193 |
Token | player |
Token ID | 2137 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
Worcester | +0.120 |
Dartmouth | +0.118 |
heit | +0.111 |
ocene | +0.107 |
Lansing | +0.107 |
Neg logit contributions | |
smuggling | -0.080 |
nsic | -0.080 |
Machina | -0.078 |
interrogation | -0.077 |
table | -0.077 |
Token | he |
Token ID | 339 |
Feature activation | +8.29e-01 |
Pos logit contributions | |
smuggling | +0.669 |
nsic | +0.666 |
Machina | +0.655 |
table | +0.648 |
interrogation | +0.647 |
Neg logit contributions | |
Worcester | -0.821 |
Dartmouth | -0.802 |
heit | -0.752 |
ocene | -0.727 |
hester | -0.726 |
Token | is |
Token ID | 318 |
Feature activation | +5.52e-01 |
Pos logit contributions | |
smuggling | +0.514 |
nsic | +0.511 |
Machina | +0.500 |
table | +0.498 |
interrogation | +0.494 |
Neg logit contributions | |
Worcester | -0.693 |
Dartmouth | -0.680 |
heit | -0.631 |
ocene | -0.613 |
Lansing | -0.613 |
Token | M |
Token ID | 44 |
Feature activation | -4.17e-01 |
Pos logit contributions | |
table | +0.540 |
Machina | +0.539 |
nsic | +0.538 |
smuggling | +0.534 |
Khe | +0.525 |
Neg logit contributions | |
Worcester | -0.537 |
Dartmouth | -0.527 |
heit | -0.485 |
ocene | -0.468 |
hester | -0.464 |
Token | OR |
Token ID | 1581 |
Feature activation | -8.29e-01 |
Pos logit contributions | |
Worcester | +0.290 |
Dartmouth | +0.283 |
heit | +0.260 |
Lansing | +0.250 |
ocene | +0.249 |
Neg logit contributions | |
nsic | -0.316 |
smuggling | -0.315 |
Machina | -0.309 |
table | -0.309 |
interrogation | -0.307 |
Token | PH |
Token ID | 11909 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
Worcester | +0.589 |
Dartmouth | +0.576 |
heit | +0.528 |
Lansing | +0.512 |
ocene | +0.511 |
Neg logit contributions | |
nsic | -0.616 |
smuggling | -0.612 |
Machina | -0.602 |
table | -0.602 |
interrogation | -0.596 |
Token | _ |
Token ID | 62 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
Worcester | +1.551 |
Dartmouth | +1.520 |
heit | +1.414 |
Lansing | +1.369 |
ocene | +1.363 |
Neg logit contributions | |
nsic | -1.236 |
smuggling | -1.236 |
Machina | -1.197 |
interrogation | -1.190 |
investig | -1.188 |
Token | RECT |
Token ID | 23988 |
Feature activation | -9.97e-01 |
Pos logit contributions | |
Worcester | +0.835 |
Dartmouth | +0.811 |
heit | +0.737 |
Lansing | +0.706 |
ocene | +0.703 |
Neg logit contributions | |
nsic | -1.121 |
smuggling | -1.119 |
Machina | -1.096 |
interrogation | -1.088 |
table | -1.086 |
Token | , |
Token ID | 11 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
Worcester | +0.853 |
Dartmouth | +0.837 |
heit | +0.781 |
Lansing | +0.758 |
ocene | +0.755 |
Neg logit contributions | |
nsic | -0.599 |
smuggling | -0.598 |
Machina | -0.580 |
interrogation | -0.575 |
table | -0.573 |
Token | ( |
Token ID | 357 |
Feature activation | +7.53e-01 |
Pos logit contributions | |
smuggling | +0.169 |
nsic | +0.168 |
Machina | +0.166 |
table | +0.166 |
interrogation | +0.164 |
Neg logit contributions | |
Worcester | -0.220 |
Dartmouth | -0.214 |
heit | -0.201 |
ocene | -0.196 |
hester | -0.195 |
Token | 21 |
Token ID | 2481 |
Feature activation | +8.88e-02 |
Pos logit contributions | |
nsic | +0.410 |
smuggling | +0.408 |
Machina | +0.396 |
table | +0.393 |
interrogation | +0.391 |
Neg logit contributions | |
Worcester | -0.688 |
Dartmouth | -0.675 |
heit | -0.632 |
Lansing | -0.617 |
ocene | -0.614 |
Token | , |
Token ID | 11 |
Feature activation | +3.11e-01 |
Pos logit contributions | |
nsic | +0.052 |
smuggling | +0.051 |
Machina | +0.050 |
table | +0.050 |
interrogation | +0.049 |
Neg logit contributions | |
Worcester | -0.078 |
Dartmouth | -0.076 |
heit | -0.071 |
Lansing | -0.069 |
ocene | -0.069 |
Token | 21 |
Token ID | 2310 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
nsic | +0.102 |
smuggling | +0.102 |
Machina | +0.097 |
interrogation | +0.095 |
table | +0.095 |
Neg logit contributions | |
Worcester | -0.350 |
Dartmouth | -0.345 |
heit | -0.328 |
Lansing | -0.320 |
ocene | -0.320 |
Token | )) |
Token ID | 4008 |
Feature activation | +1.87e+00 |
Pos logit contributions | |
nsic | +0.276 |
smuggling | +0.275 |
Machina | +0.267 |
interrogation | +0.266 |
table | +0.265 |
Neg logit contributions | |
Worcester | -0.342 |
Dartmouth | -0.335 |
heit | -0.312 |
Lansing | -0.302 |
ocene | -0.301 |
Token | would |
Token ID | 561 |
Feature activation | +5.77e-01 |
Pos logit contributions | |
smuggling | +0.265 |
nsic | +0.263 |
Machina | +0.259 |
investig | +0.256 |
interrogation | +0.256 |
Neg logit contributions | |
Worcester | -0.265 |
Dartmouth | -0.260 |
heit | -0.241 |
ocene | -0.233 |
hester | -0.232 |
Token | drive |
Token ID | 3708 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
smuggling | +0.362 |
nsic | +0.359 |
Machina | +0.351 |
interrogation | +0.349 |
table | +0.348 |
Neg logit contributions | |
Worcester | -0.479 |
Dartmouth | -0.470 |
heit | -0.438 |
Lansing | -0.426 |
ocene | -0.425 |
Token | that |
Token ID | 326 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
smuggling | +0.118 |
nsic | +0.118 |
Machina | +0.115 |
interrogation | +0.114 |
table | +0.114 |
Neg logit contributions | |
Worcester | -0.143 |
Dartmouth | -0.140 |
heit | -0.131 |
hester | -0.126 |
ocene | -0.126 |
Token | explosive |
Token ID | 13835 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
Worcester | +0.188 |
Dartmouth | +0.184 |
heit | +0.172 |
hester | +0.167 |
ocene | +0.167 |
Neg logit contributions | |
smuggling | -0.145 |
nsic | -0.143 |
Machina | -0.140 |
interrogation | -0.139 |
investig | -0.138 |
Token | force |
Token ID | 2700 |
Feature activation | -8.34e-01 |
Pos logit contributions | |
Worcester | +1.116 |
Dartmouth | +1.094 |
heit | +1.024 |
ocene | +0.992 |
hester | +0.992 |
Neg logit contributions | |
smuggling | -0.790 |
nsic | -0.785 |
Machina | -0.765 |
interrogation | -0.758 |
table | -0.755 |
Token | , |
Token ID | 11 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
Worcester | +0.669 |
Dartmouth | +0.657 |
heit | +0.611 |
Lansing | +0.591 |
ocene | +0.590 |
Neg logit contributions | |
smuggling | -0.545 |
nsic | -0.544 |
Machina | -0.529 |
table | -0.526 |
interrogation | -0.525 |
Token | � |
Token ID | 447 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
Worcester | +0.128 |
Dartmouth | +0.125 |
heit | +0.114 |
hester | +0.110 |
ocene | +0.109 |
Neg logit contributions | |
nsic | -0.152 |
smuggling | -0.152 |
Machina | -0.149 |
interrogation | -0.147 |
table | -0.147 |
Token | � |
Token ID | 251 |
Feature activation | -2.37e-01 |
Pos logit contributions | |
Worcester | +0.461 |
Dartmouth | +0.453 |
heit | +0.427 |
Lansing | +0.417 |
ocene | +0.417 |
Neg logit contributions | |
nsic | -0.211 |
smuggling | -0.211 |
Machina | -0.203 |
interrogation | -0.201 |
table | -0.200 |
Token | he |
Token ID | 339 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
Worcester | +0.207 |
Dartmouth | +0.204 |
heit | +0.191 |
ocene | +0.186 |
Lansing | +0.185 |
Neg logit contributions | |
nsic | -0.136 |
smuggling | -0.136 |
Machina | -0.133 |
interrogation | -0.131 |
table | -0.131 |
Token | said |
Token ID | 531 |
Feature activation | +6.97e-02 |
Pos logit contributions | |
Worcester | +0.101 |
Dartmouth | +0.099 |
heit | +0.092 |
ocene | +0.089 |
Lansing | +0.089 |
Neg logit contributions | |
nsic | -0.089 |
smuggling | -0.089 |
Machina | -0.087 |
interrogation | -0.086 |
table | -0.086 |
Token | . |
Token ID | 13 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
nsic | +0.043 |
smuggling | +0.043 |
Machina | +0.042 |
interrogation | +0.041 |
table | +0.041 |
Neg logit contributions | |
Worcester | -0.058 |
Dartmouth | -0.057 |
heit | -0.053 |
Lansing | -0.052 |
ocene | -0.052 |
Token | , |
Token ID | 11 |
Feature activation | -9.19e-01 |
Pos logit contributions | |
smuggling | +0.304 |
nsic | +0.303 |
Machina | +0.295 |
table | +0.293 |
interrogation | +0.293 |
Neg logit contributions | |
Worcester | -0.438 |
Dartmouth | -0.429 |
heit | -0.402 |
ocene | -0.389 |
hester | -0.389 |
Token | three |
Token ID | 1115 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
Worcester | +0.757 |
Dartmouth | +0.741 |
heit | +0.693 |
ocene | +0.669 |
Lansing | +0.669 |
Neg logit contributions | |
smuggling | -0.581 |
nsic | -0.581 |
Machina | -0.565 |
interrogation | -0.561 |
table | -0.559 |
Token | , |
Token ID | 11 |
Feature activation | -9.58e-01 |
Pos logit contributions | |
smuggling | +0.275 |
nsic | +0.273 |
Machina | +0.266 |
interrogation | +0.265 |
table | +0.264 |
Neg logit contributions | |
Worcester | -0.378 |
Dartmouth | -0.370 |
heit | -0.347 |
hester | -0.338 |
ocene | -0.338 |
Token | four |
Token ID | 1440 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
Worcester | +0.790 |
Dartmouth | +0.773 |
heit | +0.724 |
ocene | +0.700 |
hester | +0.699 |
Neg logit contributions | |
smuggling | -0.604 |
nsic | -0.603 |
Machina | -0.587 |
interrogation | -0.585 |
table | -0.581 |
Token | . |
Token ID | 13 |
Feature activation | -5.60e-01 |
Pos logit contributions | |
smuggling | +0.240 |
nsic | +0.238 |
Machina | +0.233 |
interrogation | +0.231 |
table | +0.231 |
Neg logit contributions | |
Worcester | -0.326 |
Dartmouth | -0.319 |
heit | -0.299 |
hester | -0.291 |
ocene | -0.291 |
Token |
|
Token ID | 198 |
Feature activation | -9.16e-02 |
Pos logit contributions | |
Worcester | +0.420 |
Dartmouth | +0.410 |
heit | +0.383 |
hester | +0.370 |
ocene | +0.370 |
Neg logit contributions | |
nsic | -0.389 |
smuggling | -0.389 |
Machina | -0.385 |
Khe | -0.380 |
table | -0.380 |
Token |
|
Token ID | 198 |
Feature activation | -5.63e-01 |
Pos logit contributions | |
Worcester | +0.072 |
Dartmouth | +0.070 |
heit | +0.065 |
ocene | +0.063 |
Lansing | +0.063 |
Neg logit contributions | |
nsic | -0.061 |
smuggling | -0.061 |
Machina | -0.060 |
table | -0.060 |
Khe | -0.059 |
Token | RF |
Token ID | 32754 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
Worcester | +0.512 |
Dartmouth | +0.502 |
heit | +0.471 |
Lansing | +0.458 |
ocene | +0.457 |
Neg logit contributions | |
nsic | -0.309 |
smuggling | -0.308 |
Machina | -0.298 |
table | -0.295 |
interrogation | -0.295 |
Token | : |
Token ID | 25 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
nsic | +0.616 |
smuggling | +0.616 |
Machina | +0.610 |
table | +0.606 |
Khe | +0.597 |
Neg logit contributions | |
Worcester | -0.887 |
Dartmouth | -0.867 |
heit | -0.814 |
ocene | -0.794 |
hester | -0.791 |
Token | Five |
Token ID | 10579 |
Feature activation | +7.45e-01 |
Pos logit contributions | |
smuggling | +0.296 |
Machina | +0.296 |
nsic | +0.296 |
Khe | +0.294 |
table | +0.291 |
Neg logit contributions | |
Worcester | -0.298 |
Dartmouth | -0.290 |
heit | -0.272 |
ocene | -0.265 |
hester | -0.264 |
Token | ! |
Token ID | 0 |
Feature activation | -6.28e-01 |
Pos logit contributions | |
smuggling | +0.466 |
nsic | +0.463 |
Machina | +0.453 |
table | +0.451 |
interrogation | +0.449 |
Neg logit contributions | |
Worcester | -0.617 |
Dartmouth | -0.604 |
heit | -0.563 |
ocene | -0.549 |
hester | -0.548 |
Token | full |
Token ID | 1336 |
Feature activation | +5.16e-01 |
Pos logit contributions | |
Worcester | +0.045 |
Dartmouth | +0.044 |
heit | +0.041 |
Lansing | +0.040 |
ocene | +0.039 |
Neg logit contributions | |
smuggling | -0.032 |
nsic | -0.032 |
Machina | -0.031 |
interrogation | -0.031 |
table | -0.031 |
Token | jQuery |
Token ID | 37420 |
Feature activation | -9.51e-01 |
Pos logit contributions | |
smuggling | +0.312 |
nsic | +0.312 |
Machina | +0.301 |
table | +0.301 |
interrogation | +0.300 |
Neg logit contributions | |
Worcester | -0.440 |
Dartmouth | -0.433 |
heit | -0.402 |
ocene | -0.392 |
Lansing | -0.391 |
Token | implementation |
Token ID | 7822 |
Feature activation | -9.89e-01 |
Pos logit contributions | |
Worcester | +0.818 |
Dartmouth | +0.802 |
heit | +0.750 |
Lansing | +0.728 |
ocene | +0.725 |
Neg logit contributions | |
nsic | -0.567 |
smuggling | -0.565 |
Machina | -0.549 |
interrogation | -0.543 |
table | -0.543 |
Token | in |
Token ID | 287 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
Worcester | +0.813 |
Dartmouth | +0.796 |
heit | +0.742 |
Lansing | +0.718 |
ocene | +0.715 |
Neg logit contributions | |
nsic | -0.627 |
smuggling | -0.624 |
Machina | -0.608 |
interrogation | -0.602 |
table | -0.602 |
Token | lieu |
Token ID | 32267 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
Worcester | +0.223 |
Dartmouth | +0.219 |
heit | +0.204 |
ocene | +0.198 |
Lansing | +0.198 |
Neg logit contributions | |
smuggling | -0.163 |
nsic | -0.163 |
Machina | -0.158 |
interrogation | -0.157 |
table | -0.157 |
Token | of |
Token ID | 286 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
Worcester | +0.277 |
Dartmouth | +0.272 |
heit | +0.256 |
Lansing | +0.248 |
ocene | +0.247 |
Neg logit contributions | |
nsic | -0.166 |
smuggling | -0.165 |
Machina | -0.161 |
interrogation | -0.158 |
table | -0.158 |
Token | j |
Token ID | 474 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
Worcester | +1.125 |
Dartmouth | +1.099 |
heit | +1.018 |
Lansing | +0.984 |
ocene | +0.980 |
Neg logit contributions | |
nsic | -1.017 |
smuggling | -1.012 |
Machina | -0.988 |
interrogation | -0.980 |
table | -0.979 |
Token | q |
Token ID | 80 |
Feature activation | -6.60e-01 |
Pos logit contributions | |
Worcester | +0.247 |
Dartmouth | +0.243 |
heit | +0.231 |
Lansing | +0.225 |
ocene | +0.225 |
Neg logit contributions | |
nsic | -0.085 |
smuggling | -0.085 |
Machina | -0.081 |
table | -0.080 |
interrogation | -0.080 |
Token | L |
Token ID | 43 |
Feature activation | -8.23e-01 |
Pos logit contributions | |
Worcester | +0.479 |
Dartmouth | +0.467 |
heit | +0.431 |
Lansing | +0.415 |
ocene | +0.414 |
Neg logit contributions | |
nsic | -0.483 |
smuggling | -0.482 |
Machina | -0.471 |
table | -0.467 |
interrogation | -0.467 |
Token | ite |
Token ID | 578 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
Worcester | +0.618 |
Dartmouth | +0.604 |
heit | +0.557 |
Lansing | +0.542 |
hester | +0.536 |
Neg logit contributions | |
nsic | -0.582 |
smuggling | -0.580 |
Machina | -0.567 |
table | -0.565 |
interrogation | -0.562 |
Token | . |
Token ID | 13 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
Worcester | +1.789 |
Dartmouth | +1.749 |
heit | +1.635 |
Lansing | +1.585 |
ocene | +1.570 |
Neg logit contributions | |
nsic | -1.468 |
smuggling | -1.455 |
Machina | -1.419 |
Khe | -1.408 |
interrogation | -1.407 |
Token | : |
Token ID | 25 |
Feature activation | -4.04e-01 |
Pos logit contributions | |
smuggling | +0.617 |
nsic | +0.617 |
Machina | +0.602 |
table | +0.598 |
interrogation | +0.597 |
Neg logit contributions | |
Worcester | -0.707 |
Dartmouth | -0.692 |
heit | -0.645 |
ocene | -0.624 |
hester | -0.621 |
Token | the |
Token ID | 262 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
Worcester | +0.321 |
Dartmouth | +0.314 |
heit | +0.292 |
Lansing | +0.282 |
ocene | +0.282 |
Neg logit contributions | |
nsic | -0.267 |
smuggling | -0.267 |
Machina | -0.260 |
interrogation | -0.258 |
table | -0.257 |
Token | " |
Token ID | 366 |
Feature activation | -9.89e-02 |
Pos logit contributions | |
nsic | +0.106 |
smuggling | +0.105 |
Machina | +0.102 |
interrogation | +0.101 |
table | +0.101 |
Neg logit contributions | |
Worcester | -0.154 |
Dartmouth | -0.151 |
heit | -0.142 |
Lansing | -0.137 |
ocene | -0.137 |
Token | How |
Token ID | 2437 |
Feature activation | -8.11e-01 |
Pos logit contributions | |
Worcester | +0.083 |
Dartmouth | +0.081 |
heit | +0.076 |
Lansing | +0.074 |
ocene | +0.073 |
Neg logit contributions | |
nsic | -0.061 |
smuggling | -0.061 |
Machina | -0.059 |
table | -0.059 |
interrogation | -0.059 |
Token | To |
Token ID | 1675 |
Feature activation | +3.52e-01 |
Pos logit contributions | |
Worcester | +0.662 |
Dartmouth | +0.647 |
heit | +0.604 |
Lansing | +0.584 |
ocene | +0.583 |
Neg logit contributions | |
nsic | -0.520 |
smuggling | -0.518 |
Machina | -0.504 |
table | -0.500 |
interrogation | -0.500 |
Token | Stop |
Token ID | 13707 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
nsic | +0.229 |
smuggling | +0.229 |
Machina | +0.223 |
interrogation | +0.221 |
table | +0.221 |
Neg logit contributions | |
Worcester | -0.283 |
Dartmouth | -0.277 |
heit | -0.258 |
Lansing | -0.249 |
ocene | -0.249 |
Token | Rape |
Token ID | 35286 |
Feature activation | +5.30e-02 |
Pos logit contributions | |
Worcester | +1.081 |
Dartmouth | +1.057 |
heit | +0.979 |
Lansing | +0.953 |
ocene | +0.943 |
Neg logit contributions | |
nsic | -0.847 |
smuggling | -0.840 |
Machina | -0.817 |
interrogation | -0.813 |
table | -0.810 |
Token | " |
Token ID | 1 |
Feature activation | +8.72e-01 |
Pos logit contributions | |
nsic | +0.034 |
smuggling | +0.034 |
Machina | +0.033 |
interrogation | +0.033 |
table | +0.033 |
Neg logit contributions | |
Worcester | -0.043 |
Dartmouth | -0.042 |
heit | -0.039 |
Lansing | -0.038 |
ocene | -0.038 |
Token | article |
Token ID | 2708 |
Feature activation | -2.68e+00 |
Pos logit contributions | |
smuggling | +0.588 |
nsic | +0.584 |
Machina | +0.574 |
interrogation | +0.571 |
table | +0.568 |
Neg logit contributions | |
Worcester | -0.679 |
Dartmouth | -0.663 |
heit | -0.619 |
ocene | -0.599 |
hester | -0.598 |
Token | was |
Token ID | 373 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
Worcester | +2.124 |
Dartmouth | +2.080 |
heit | +1.922 |
Lansing | +1.867 |
ocene | +1.852 |
Neg logit contributions | |
nsic | -1.785 |
smuggling | -1.769 |
Machina | -1.725 |
table | -1.711 |
interrogation | -1.710 |
Token | satire |
Token ID | 35704 |
Feature activation | -5.46e-01 |
Pos logit contributions | |
Worcester | +0.156 |
Dartmouth | +0.153 |
heit | +0.143 |
ocene | +0.138 |
Lansing | +0.138 |
Neg logit contributions | |
smuggling | -0.126 |
nsic | -0.125 |
Machina | -0.122 |
table | -0.121 |
interrogation | -0.121 |
Token |
|
Token ID | 198 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
nsic | +0.348 |
smuggling | +0.347 |
table | +0.343 |
Machina | +0.342 |
Khe | +0.336 |
Neg logit contributions | |
Worcester | -0.413 |
Dartmouth | -0.403 |
heit | -0.378 |
ocene | -0.365 |
Lansing | -0.364 |
Token | Dec |
Token ID | 10707 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
nsic | +0.012 |
smuggling | +0.012 |
Machina | +0.012 |
table | +0.012 |
interrogation | +0.012 |
Neg logit contributions | |
Worcester | -0.012 |
Dartmouth | -0.011 |
heit | -0.010 |
Lansing | -0.010 |
ocene | -0.010 |
Token | iding |
Token ID | 2530 |
Feature activation | +2.34e+00 |
Pos logit contributions | |
nsic | +0.993 |
smuggling | +0.990 |
Machina | +0.968 |
table | +0.964 |
interrogation | +0.955 |
Neg logit contributions | |
Worcester | -1.297 |
Dartmouth | -1.266 |
heit | -1.182 |
Lansing | -1.143 |
ocene | -1.137 |
Token | to |
Token ID | 284 |
Feature activation | +6.38e-01 |
Pos logit contributions | |
smuggling | +1.459 |
nsic | +1.444 |
Machina | +1.442 |
table | +1.434 |
interrogation | +1.422 |
Neg logit contributions | |
Worcester | -1.890 |
Dartmouth | -1.855 |
heit | -1.756 |
ocene | -1.711 |
hester | -1.694 |
Token | pass |
Token ID | 1208 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
smuggling | +0.373 |
nsic | +0.368 |
Machina | +0.362 |
interrogation | +0.359 |
table | +0.358 |
Neg logit contributions | |
Worcester | -0.554 |
Dartmouth | -0.543 |
heit | -0.513 |
ocene | -0.497 |
hester | -0.496 |
Token | the |
Token ID | 262 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
smuggling | +0.701 |
nsic | +0.697 |
Machina | +0.685 |
interrogation | +0.678 |
table | +0.676 |
Neg logit contributions | |
Worcester | -0.966 |
Dartmouth | -0.946 |
heit | -0.889 |
ocene | -0.863 |
Lansing | -0.860 |
Token | torch |
Token ID | 28034 |
Feature activation | -6.53e-02 |
Pos logit contributions | |
nsic | +0.016 |
smuggling | +0.016 |
Machina | +0.016 |
interrogation | +0.015 |
table | +0.015 |
Neg logit contributions | |
Worcester | -0.010 |
Dartmouth | -0.010 |
heit | -0.009 |
Lansing | -0.008 |
ocene | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | +7.24e-01 |
Pos logit contributions | |
Worcester | +0.053 |
Dartmouth | +0.052 |
heit | +0.048 |
Lansing | +0.047 |
ocene | +0.046 |
Neg logit contributions | |
nsic | -0.042 |
smuggling | -0.042 |
Machina | -0.041 |
table | -0.041 |
interrogation | -0.041 |
Token | leadership |
Token ID | 5531 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
smuggling | +0.459 |
nsic | +0.455 |
Machina | +0.446 |
interrogation | +0.444 |
table | +0.442 |
Neg logit contributions | |
Worcester | -0.592 |
Dartmouth | -0.579 |
heit | -0.546 |
ocene | -0.527 |
hester | -0.524 |
Token | was |
Token ID | 373 |
Feature activation | +5.95e-02 |
Pos logit contributions | |
Worcester | +0.161 |
Dartmouth | +0.157 |
heit | +0.147 |
Lansing | +0.142 |
ocene | +0.142 |
Neg logit contributions | |
smuggling | -0.127 |
nsic | -0.127 |
Machina | -0.124 |
interrogation | -0.123 |
table | -0.123 |
Token | not |
Token ID | 407 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
smuggling | +0.040 |
nsic | +0.040 |
Machina | +0.039 |
interrogation | +0.039 |
table | +0.039 |
Neg logit contributions | |
Worcester | -0.047 |
Dartmouth | -0.046 |
heit | -0.042 |
ocene | -0.041 |
Lansing | -0.041 |
Token | which |
Token ID | 543 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
smuggling | +0.389 |
nsic | +0.386 |
Machina | +0.379 |
interrogation | +0.374 |
table | +0.374 |
Neg logit contributions | |
Worcester | -0.454 |
Dartmouth | -0.446 |
heit | -0.416 |
ocene | -0.405 |
hester | -0.402 |
Token | goes |
Token ID | 2925 |
Feature activation | -3.61e-01 |
Pos logit contributions | |
smuggling | +0.758 |
nsic | +0.751 |
Machina | +0.737 |
interrogation | +0.729 |
investig | +0.728 |
Neg logit contributions | |
Worcester | -0.914 |
Dartmouth | -0.896 |
heit | -0.841 |
ocene | -0.817 |
Lansing | -0.808 |
Token | from |
Token ID | 422 |
Feature activation | -8.06e-01 |
Pos logit contributions | |
Worcester | +0.307 |
Dartmouth | +0.301 |
heit | +0.283 |
ocene | +0.276 |
Lansing | +0.274 |
Neg logit contributions | |
smuggling | -0.218 |
nsic | -0.216 |
Machina | -0.211 |
interrogation | -0.209 |
investig | -0.209 |
Token | September |
Token ID | 2693 |
Feature activation | -9.60e-01 |
Pos logit contributions | |
Worcester | +0.604 |
Dartmouth | +0.588 |
heit | +0.540 |
Lansing | +0.525 |
hester | +0.517 |
Neg logit contributions | |
nsic | -0.579 |
smuggling | -0.571 |
Machina | -0.560 |
xual | -0.555 |
table | -0.554 |
Token | 19 |
Token ID | 678 |
Feature activation | -6.55e-01 |
Pos logit contributions | |
Worcester | +0.861 |
Dartmouth | +0.844 |
heit | +0.791 |
Lansing | +0.769 |
ocene | +0.767 |
Neg logit contributions | |
nsic | -0.538 |
smuggling | -0.536 |
Machina | -0.520 |
interrogation | -0.515 |
table | -0.515 |
Token | through |
Token ID | 832 |
Feature activation | -3.07e+00 |
Pos logit contributions | |
Worcester | +0.535 |
Dartmouth | +0.524 |
heit | +0.487 |
Lansing | +0.472 |
ocene | +0.471 |
Neg logit contributions | |
nsic | -0.420 |
smuggling | -0.418 |
Machina | -0.407 |
table | -0.404 |
interrogation | -0.404 |
Token | to |
Token ID | 284 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
Worcester | +2.559 |
Dartmouth | +2.499 |
heit | +2.282 |
Lansing | +2.250 |
hester | +2.192 |
Neg logit contributions | |
nsic | -1.965 |
smuggling | -1.905 |
xual | -1.871 |
Machina | -1.860 |
table | -1.848 |
Token | October |
Token ID | 3267 |
Feature activation | -4.78e-01 |
Pos logit contributions | |
Worcester | +0.046 |
Dartmouth | +0.045 |
heit | +0.041 |
Lansing | +0.040 |
ocene | +0.040 |
Neg logit contributions | |
nsic | -0.053 |
smuggling | -0.053 |
Machina | -0.051 |
interrogation | -0.051 |
table | -0.051 |
Token | 4 |
Token ID | 604 |
Feature activation | -5.88e-01 |
Pos logit contributions | |
Worcester | +0.445 |
Dartmouth | +0.436 |
heit | +0.409 |
Lansing | +0.399 |
ocene | +0.397 |
Neg logit contributions | |
nsic | -0.253 |
smuggling | -0.251 |
Machina | -0.243 |
interrogation | -0.241 |
table | -0.240 |
Token | - |
Token ID | 532 |
Feature activation | -4.63e-01 |
Pos logit contributions | |
Worcester | +0.492 |
Dartmouth | +0.482 |
heit | +0.450 |
Lansing | +0.436 |
ocene | +0.435 |
Neg logit contributions | |
nsic | -0.365 |
smuggling | -0.364 |
Machina | -0.354 |
table | -0.351 |
interrogation | -0.350 |
Token | the |
Token ID | 262 |
Feature activation | +1.46e-01 |
Pos logit contributions | |
Worcester | +0.358 |
Dartmouth | +0.350 |
heit | +0.325 |
Lansing | +0.314 |
ocene | +0.313 |
Neg logit contributions | |
nsic | -0.317 |
smuggling | -0.316 |
Machina | -0.308 |
interrogation | -0.306 |
table | -0.306 |
Token | result |
Token ID | 1255 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
smuggling | +0.160 |
nsic | +0.159 |
Machina | +0.155 |
interrogation | +0.154 |
investig | +0.153 |
Neg logit contributions | |
Worcester | -0.225 |
Dartmouth | -0.220 |
heit | -0.206 |
Lansing | -0.200 |
ocene | -0.200 |
Token | of |
Token ID | 286 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
Worcester | +0.028 |
Dartmouth | +0.028 |
heit | +0.026 |
Lansing | +0.025 |
ocene | +0.025 |
Neg logit contributions | |
nsic | -0.017 |
smuggling | -0.017 |
Machina | -0.016 |
table | -0.016 |
interrogation | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
smuggling | +0.082 |
nsic | +0.082 |
Machina | +0.080 |
interrogation | +0.079 |
investig | +0.079 |
Neg logit contributions | |
Worcester | -0.096 |
Dartmouth | -0.094 |
heit | -0.088 |
Lansing | -0.085 |
hester | -0.085 |
Token | feedback |
Token ID | 7538 |
Feature activation | +6.30e-01 |
Pos logit contributions | |
Worcester | +0.254 |
Dartmouth | +0.249 |
heit | +0.233 |
Lansing | +0.226 |
ocene | +0.226 |
Neg logit contributions | |
nsic | -0.172 |
smuggling | -0.171 |
Machina | -0.166 |
interrogation | -0.165 |
table | -0.165 |
Token | loop |
Token ID | 9052 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
smuggling | +0.365 |
nsic | +0.364 |
Machina | +0.354 |
interrogation | +0.351 |
table | +0.351 |
Neg logit contributions | |
Worcester | -0.552 |
Dartmouth | -0.542 |
heit | -0.508 |
Lansing | -0.493 |
hester | -0.491 |
Token | between |
Token ID | 1022 |
Feature activation | -3.75e+00 |
Pos logit contributions | |
smuggling | +0.315 |
nsic | +0.314 |
Machina | +0.307 |
interrogation | +0.304 |
table | +0.304 |
Neg logit contributions | |
Worcester | -0.373 |
Dartmouth | -0.365 |
heit | -0.340 |
Lansing | -0.328 |
hester | -0.327 |
Token | acc |
Token ID | 697 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
Worcester | +3.096 |
Dartmouth | +3.034 |
heit | +2.791 |
Lansing | +2.735 |
ocene | +2.710 |
Neg logit contributions | |
nsic | -2.378 |
smuggling | -2.327 |
Machina | -2.273 |
table | -2.270 |
xual | -2.267 |
Token | ru |
Token ID | 622 |
Feature activation | -8.72e-01 |
Pos logit contributions | |
Worcester | +1.970 |
Dartmouth | +1.932 |
heit | +1.797 |
Lansing | +1.733 |
ocene | +1.727 |
Neg logit contributions | |
nsic | -1.734 |
smuggling | -1.729 |
Machina | -1.685 |
interrogation | -1.680 |
Khe | -1.673 |
Token | al |
Token ID | 282 |
Feature activation | -1.32e+00 |
Pos logit contributions | |
Worcester | +0.648 |
Dartmouth | +0.633 |
heit | +0.585 |
Lansing | +0.565 |
ocene | +0.563 |
Neg logit contributions | |
nsic | -0.623 |
smuggling | -0.622 |
Machina | -0.608 |
table | -0.605 |
interrogation | -0.601 |
Token | of |
Token ID | 286 |
Feature activation | -5.55e-01 |
Pos logit contributions | |
Worcester | +1.127 |
Dartmouth | +1.103 |
heit | +1.033 |
ocene | +1.002 |
Lansing | +1.002 |
Neg logit contributions | |
nsic | -0.789 |
smuggling | -0.782 |
Machina | -0.763 |
interrogation | -0.754 |
Khe | -0.753 |
Token | information |
Token ID | 1321 |
Feature activation | -1.31e+00 |
Pos logit contributions | |
Worcester | +0.476 |
Dartmouth | +0.466 |
heit | +0.436 |
Lansing | +0.423 |
ocene | +0.422 |
Neg logit contributions | |
smuggling | -0.332 |
nsic | -0.332 |
Machina | -0.323 |
interrogation | -0.320 |
table | -0.319 |
Token | - |
Token ID | 12 |
Feature activation | +7.84e-01 |
Pos logit contributions | |
smuggling | +1.028 |
nsic | +1.027 |
Machina | +1.011 |
Khe | +1.000 |
table | +0.999 |
Neg logit contributions | |
Worcester | -1.253 |
Dartmouth | -1.229 |
heit | -1.154 |
Lansing | -1.112 |
hester | -1.112 |
Token | 0 |
Token ID | 15 |
Feature activation | +1.59e+00 |
Pos logit contributions | |
nsic | +0.516 |
smuggling | +0.512 |
Machina | +0.504 |
table | +0.504 |
Khe | +0.499 |
Neg logit contributions | |
Worcester | -0.622 |
Dartmouth | -0.610 |
heit | -0.567 |
Lansing | -0.551 |
hester | -0.548 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
nsic | +0.962 |
smuggling | +0.961 |
Machina | +0.936 |
table | +0.925 |
interrogation | +0.924 |
Neg logit contributions | |
Worcester | -1.355 |
Dartmouth | -1.327 |
heit | -1.241 |
Lansing | -1.202 |
hester | -1.199 |
Token | 11 |
Token ID | 1157 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
nsic | +0.720 |
smuggling | +0.716 |
Machina | +0.711 |
table | +0.705 |
Khe | +0.696 |
Neg logit contributions | |
Worcester | -0.893 |
Dartmouth | -0.873 |
heit | -0.816 |
Lansing | -0.789 |
hester | -0.786 |
Token | million |
Token ID | 1510 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
nsic | +0.800 |
smuggling | +0.797 |
Machina | +0.781 |
table | +0.774 |
interrogation | +0.772 |
Neg logit contributions | |
Worcester | -1.005 |
Dartmouth | -0.987 |
heit | -0.926 |
hester | -0.894 |
Lansing | -0.891 |
Token | years |
Token ID | 812 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
Worcester | +0.228 |
Dartmouth | +0.223 |
heit | +0.204 |
Lansing | +0.196 |
hester | +0.195 |
Neg logit contributions | |
nsic | -0.272 |
smuggling | -0.272 |
Machina | -0.266 |
table | -0.265 |
Khe | -0.264 |
Token | . |
Token ID | 13 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
Worcester | +2.518 |
Dartmouth | +2.454 |
heit | +2.288 |
ocene | +2.215 |
Lansing | +2.202 |
Neg logit contributions | |
nsic | -2.029 |
smuggling | -2.024 |
Machina | -1.961 |
interrogation | -1.955 |
investig | -1.943 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
Worcester | +0.328 |
Dartmouth | +0.321 |
heit | +0.300 |
Lansing | +0.289 |
hester | +0.288 |
Neg logit contributions | |
nsic | -0.287 |
smuggling | -0.285 |
Machina | -0.281 |
table | -0.278 |
Khe | -0.277 |
Token | Image |
Token ID | 5159 |
Feature activation | +1.40e+00 |
Pos logit contributions | |
nsic | +0.021 |
smuggling | +0.021 |
Machina | +0.020 |
table | +0.020 |
interrogation | +0.020 |
Neg logit contributions | |
Worcester | -0.020 |
Dartmouth | -0.019 |
heit | -0.018 |
Lansing | -0.017 |
ocene | -0.017 |
Token | copyright |
Token ID | 6634 |
Feature activation | +3.01e+00 |
Pos logit contributions | |
smuggling | +0.647 |
nsic | +0.646 |
Machina | +0.620 |
interrogation | +0.615 |
investig | +0.613 |
Neg logit contributions | |
Worcester | -1.384 |
Dartmouth | -1.363 |
heit | -1.290 |
Lansing | -1.253 |
hester | -1.252 |
Token | AFP |
Token ID | 8916 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
smuggling | +1.784 |
nsic | +1.770 |
Machina | +1.758 |
Khe | +1.744 |
table | +1.723 |
Neg logit contributions | |
Worcester | -2.519 |
Dartmouth | -2.471 |
heit | -2.379 |
ocene | -2.290 |
hester | -2.280 |
Token | . |
Token ID | 13 |
Feature activation | +3.02e-01 |
Pos logit contributions | |
Worcester | +0.222 |
Dartmouth | +0.217 |
heit | +0.203 |
Lansing | +0.198 |
ocene | +0.197 |
Neg logit contributions | |
nsic | -0.155 |
smuggling | -0.154 |
Machina | -0.149 |
interrogation | -0.148 |
table | -0.148 |
Token | 05 |
Token ID | 2713 |
Feature activation | +1.13e+00 |
Pos logit contributions | |
nsic | +0.208 |
smuggling | +0.208 |
Machina | +0.206 |
table | +0.205 |
Khe | +0.203 |
Neg logit contributions | |
Worcester | -0.228 |
Dartmouth | -0.223 |
heit | -0.208 |
ocene | -0.201 |
hester | -0.200 |
Token | MM |
Token ID | 12038 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
smuggling | +0.642 |
nsic | +0.640 |
Machina | +0.624 |
table | +0.617 |
interrogation | +0.617 |
Neg logit contributions | |
Worcester | -0.999 |
Dartmouth | -0.983 |
heit | -0.921 |
Lansing | -0.891 |
ocene | -0.889 |
Token | from |
Token ID | 422 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
nsic | +0.095 |
smuggling | +0.095 |
Machina | +0.092 |
table | +0.092 |
interrogation | +0.092 |
Neg logit contributions | |
Worcester | -0.128 |
Dartmouth | -0.125 |
heit | -0.117 |
Lansing | -0.113 |
ocene | -0.113 |
Token | now |
Token ID | 783 |
Feature activation | -5.72e-01 |
Pos logit contributions | |
smuggling | +0.204 |
nsic | +0.203 |
Machina | +0.199 |
table | +0.197 |
interrogation | +0.197 |
Neg logit contributions | |
Worcester | -0.217 |
Dartmouth | -0.212 |
heit | -0.197 |
ocene | -0.190 |
Lansing | -0.189 |
Token | through |
Token ID | 832 |
Feature activation | -2.86e+00 |
Pos logit contributions | |
Worcester | +0.462 |
Dartmouth | +0.453 |
heit | +0.421 |
ocene | +0.407 |
Lansing | +0.407 |
Neg logit contributions | |
nsic | -0.370 |
smuggling | -0.370 |
Machina | -0.360 |
table | -0.358 |
interrogation | -0.357 |
Token | the |
Token ID | 262 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
Worcester | +2.125 |
Dartmouth | +2.065 |
heit | +1.861 |
Lansing | +1.843 |
ocene | +1.801 |
Neg logit contributions | |
nsic | -2.088 |
smuggling | -2.036 |
xual | -2.013 |
Machina | -1.997 |
interrogation | -1.977 |
Token | end |
Token ID | 886 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
Worcester | +0.230 |
Dartmouth | +0.224 |
heit | +0.205 |
Lansing | +0.201 |
ocene | +0.199 |
Neg logit contributions | |
nsic | -0.204 |
smuggling | -0.201 |
Machina | -0.197 |
xual | -0.195 |
table | -0.195 |
Token | of |
Token ID | 286 |
Feature activation | +1.80e+00 |
Pos logit contributions | |
smuggling | +0.736 |
nsic | +0.734 |
Machina | +0.717 |
table | +0.716 |
interrogation | +0.704 |
Neg logit contributions | |
Worcester | -1.405 |
Dartmouth | -1.380 |
heit | -1.309 |
ocene | -1.269 |
hester | -1.268 |
Token | the |
Token ID | 262 |
Feature activation | -4.37e-02 |
Pos logit contributions | |
smuggling | +1.248 |
nsic | +1.238 |
Machina | +1.217 |
table | +1.206 |
interrogation | +1.206 |
Neg logit contributions | |
Worcester | -1.368 |
Dartmouth | -1.340 |
heit | -1.252 |
ocene | -1.204 |
hester | -1.202 |
Token | 2018 |
Token ID | 2864 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
Worcester | +0.033 |
Dartmouth | +0.032 |
heit | +0.029 |
Lansing | +0.029 |
ocene | +0.028 |
Neg logit contributions | |
nsic | -0.031 |
smuggling | -0.031 |
Machina | -0.030 |
xual | -0.030 |
interrogation | -0.030 |
Token | 1965 |
Token ID | 17672 |
Feature activation | +4.81e-01 |
Pos logit contributions | |
nsic | +0.171 |
smuggling | +0.171 |
Machina | +0.169 |
table | +0.168 |
interrogation | +0.166 |
Neg logit contributions | |
Worcester | -0.160 |
Dartmouth | -0.156 |
heit | -0.145 |
ocene | -0.140 |
hester | -0.139 |
Token | ). |
Token ID | 6739 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
nsic | +0.206 |
smuggling | +0.205 |
Machina | +0.197 |
interrogation | +0.194 |
table | +0.194 |
Neg logit contributions | |
Worcester | -0.495 |
Dartmouth | -0.487 |
heit | -0.459 |
Lansing | -0.449 |
ocene | -0.447 |
Token | Conce |
Token ID | 44530 |
Feature activation | -1.27e+00 |
Pos logit contributions | |
nsic | +0.851 |
smuggling | +0.846 |
Machina | +0.837 |
Khe | +0.829 |
table | +0.827 |
Neg logit contributions | |
Worcester | -0.986 |
Dartmouth | -0.961 |
heit | -0.905 |
ocene | -0.876 |
hester | -0.872 |
Token | iving |
Token ID | 1412 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
Worcester | +1.087 |
Dartmouth | +1.066 |
heit | +0.998 |
ocene | +0.966 |
Lansing | +0.964 |
Neg logit contributions | |
smuggling | -0.750 |
nsic | -0.748 |
Machina | -0.728 |
interrogation | -0.724 |
Khe | -0.722 |
Token | the |
Token ID | 262 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
Worcester | +0.465 |
Dartmouth | +0.455 |
heit | +0.423 |
Lansing | +0.410 |
ocene | +0.409 |
Neg logit contributions | |
nsic | -0.364 |
smuggling | -0.363 |
Machina | -0.354 |
table | -0.350 |
interrogation | -0.350 |
Token | self |
Token ID | 2116 |
Feature activation | -3.12e+00 |
Pos logit contributions | |
Worcester | +0.337 |
Dartmouth | +0.330 |
heit | +0.308 |
Lansing | +0.300 |
ocene | +0.299 |
Neg logit contributions | |
nsic | -0.231 |
smuggling | -0.229 |
Machina | -0.223 |
table | -0.221 |
interrogation | -0.220 |
Token | . |
Token ID | 13 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
Worcester | +2.519 |
Dartmouth | +2.476 |
heit | +2.297 |
ocene | +2.216 |
Lansing | +2.213 |
Neg logit contributions | |
nsic | -2.008 |
smuggling | -1.996 |
Machina | -1.950 |
Khe | -1.923 |
table | -1.922 |
Token | Mal |
Token ID | 4434 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
Worcester | +0.576 |
Dartmouth | +0.561 |
heit | +0.521 |
ocene | +0.500 |
hester | +0.497 |
Neg logit contributions | |
nsic | -0.671 |
smuggling | -0.669 |
Machina | -0.663 |
table | -0.657 |
Khe | -0.656 |
Token | ab |
Token ID | 397 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
nsic | +0.042 |
smuggling | +0.042 |
Machina | +0.041 |
table | +0.041 |
interrogation | +0.041 |
Neg logit contributions | |
Worcester | -0.056 |
Dartmouth | -0.055 |
heit | -0.051 |
Lansing | -0.050 |
ocene | -0.050 |
Token | ar |
Token ID | 283 |
Feature activation | +8.18e-01 |
Pos logit contributions | |
Worcester | +1.646 |
Dartmouth | +1.612 |
heit | +1.500 |
Lansing | +1.455 |
ocene | +1.448 |
Neg logit contributions | |
nsic | -1.281 |
smuggling | -1.279 |
Machina | -1.242 |
interrogation | -1.234 |
investig | -1.230 |
Token | , |
Token ID | 11 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
nsic | +0.494 |
smuggling | +0.489 |
Machina | +0.479 |
table | +0.476 |
interrogation | +0.475 |
Neg logit contributions | |
Worcester | -0.693 |
Dartmouth | -0.679 |
heit | -0.634 |
ocene | -0.620 |
hester | -0.616 |