Token | Pres |
Token ID | 1763 |
Feature activation | -2.17e-03 |
Pos logit contributions | |
�� | +2.106 |
sqor | +2.050 |
capacity | +1.868 |
ゴ | +1.852 |
Sisters | +1.807 |
Neg logit contributions | |
arial | -1.622 |
utton | -1.573 |
nce | -1.571 |
ody | -1.532 |
illery | -1.518 |
Token | ented |
Token ID | 4714 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
arial | +0.009 |
nce | +0.008 |
utton | +0.008 |
ody | +0.008 |
illery | +0.008 |
Neg logit contributions | |
�� | -0.018 |
sqor | -0.017 |
capacity | -0.016 |
ゴ | -0.016 |
ALSE | -0.015 |
Token | at |
Token ID | 379 |
Feature activation | +9.07e-01 |
Pos logit contributions | |
�� | +3.495 |
sqor | +3.373 |
capacity | +3.082 |
ゴ | +3.007 |
ALSE | +2.986 |
Neg logit contributions | |
arial | -2.908 |
utton | -2.849 |
nce | -2.839 |
illery | -2.777 |
ody | -2.758 |
Token | the |
Token ID | 262 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
�� | +5.639 |
sqor | +5.579 |
capacity | +5.119 |
Sisters | +5.010 |
ゴ | +4.996 |
Neg logit contributions | |
arial | -4.856 |
utton | -4.710 |
nce | -4.649 |
illery | -4.581 |
ody | -4.542 |
Token | 57 |
Token ID | 7632 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
�� | +5.475 |
sqor | +5.415 |
capacity | +4.924 |
Sisters | +4.826 |
ゴ | +4.808 |
Neg logit contributions | |
arial | -5.380 |
utton | -5.247 |
nce | -5.155 |
ody | -5.059 |
illery | -5.047 |
Token | th |
Token ID | 400 |
Feature activation | +1.53e+00 |
Pos logit contributions | |
�� | +2.066 |
sqor | +2.010 |
capacity | +1.850 |
ゴ | +1.840 |
ALSE | +1.796 |
Neg logit contributions | |
arial | -1.156 |
utton | -1.108 |
nce | -1.106 |
ody | -1.068 |
illery | -1.061 |
Token | Annual |
Token ID | 16328 |
Feature activation | +8.93e-01 |
Pos logit contributions | |
�� | +6.835 |
sqor | +6.828 |
SIG | +6.223 |
capacity | +6.172 |
Sisters | +6.105 |
Neg logit contributions | |
arial | -10.019 |
utton | -9.916 |
illery | -9.497 |
ody | -9.483 |
nce | -9.473 |
Token | Meeting |
Token ID | 22244 |
Feature activation | +5.14e-01 |
Pos logit contributions | |
�� | +5.043 |
sqor | +4.940 |
capacity | +4.490 |
Sisters | +4.402 |
ゴ | +4.393 |
Neg logit contributions | |
arial | -5.342 |
utton | -5.267 |
nce | -5.175 |
ody | -5.080 |
illery | -5.060 |
Token | of |
Token ID | 286 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
�� | +2.957 |
sqor | +2.878 |
capacity | +2.563 |
ゴ | +2.524 |
Sisters | +2.478 |
Neg logit contributions | |
arial | -3.138 |
utton | -3.058 |
nce | -3.054 |
illery | -2.961 |
ody | -2.956 |
Token | the |
Token ID | 262 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
�� | +5.936 |
sqor | +5.902 |
capacity | +5.485 |
Sisters | +5.477 |
SIG | +5.362 |
Neg logit contributions | |
arial | -5.453 |
utton | -5.321 |
nce | -5.200 |
illery | -5.108 |
ody | -5.027 |
Token | Association |
Token ID | 5396 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
�� | +5.461 |
sqor | +5.399 |
Sisters | +5.002 |
capacity | +4.914 |
SIG | +4.850 |
Neg logit contributions | |
arial | -6.769 |
utton | -6.652 |
nce | -6.523 |
ody | -6.434 |
illery | -6.398 |
Token | 001 |
Token ID | 8298 |
Feature activation | +6.45e-01 |
Pos logit contributions | |
arial | +0.204 |
nce | +0.197 |
utton | +0.196 |
ody | +0.190 |
illery | +0.188 |
Neg logit contributions | |
�� | -0.344 |
sqor | -0.334 |
capacity | -0.307 |
ゴ | -0.305 |
ALSE | -0.298 |
Token | f |
Token ID | 69 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
�� | +4.138 |
sqor | +4.074 |
capacity | +3.818 |
ゴ | +3.710 |
ALSE | +3.525 |
Neg logit contributions | |
arial | -3.364 |
utton | -3.196 |
nce | -3.170 |
ody | -3.107 |
illery | -3.087 |
Token | 1 |
Token ID | 16 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
�� | +4.744 |
sqor | +4.612 |
capacity | +4.344 |
ゴ | +4.227 |
ALSE | +4.143 |
Neg logit contributions | |
arial | -3.442 |
utton | -3.219 |
nce | -3.196 |
illery | -3.156 |
ody | -3.086 |
Token | f |
Token ID | 69 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
sqor | +5.125 |
�� | +5.111 |
capacity | +4.806 |
ゴ | +4.634 |
Sisters | +4.478 |
Neg logit contributions | |
arial | -3.972 |
utton | -3.779 |
nce | -3.749 |
illery | -3.684 |
ody | -3.679 |
Token | 4 |
Token ID | 19 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
�� | +3.759 |
sqor | +3.636 |
capacity | +3.395 |
ALSE | +3.262 |
ゴ | +3.255 |
Neg logit contributions | |
arial | -2.953 |
nce | -2.778 |
utton | -2.769 |
illery | -2.760 |
izer | -2.678 |
Token | b |
Token ID | 65 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
sqor | +6.615 |
�� | +6.375 |
capacity | +6.328 |
ゴ | +5.898 |
jam | +5.788 |
Neg logit contributions | |
arial | -7.779 |
utton | -7.403 |
illery | -7.317 |
nce | -7.260 |
issance | -7.129 |
Token | be |
Token ID | 1350 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
sqor | +4.776 |
capacity | +4.757 |
�� | +4.376 |
jam | +4.041 |
ゴ | +4.036 |
Neg logit contributions | |
arial | -11.737 |
illery | -11.181 |
utton | -11.166 |
nce | -10.982 |
issance | -10.863 |
Token | 66 |
Token ID | 2791 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
�� | +4.394 |
sqor | +4.361 |
capacity | +4.103 |
ゴ | +4.024 |
ALSE | +3.899 |
Neg logit contributions | |
arial | -2.306 |
nce | -2.185 |
utton | -2.169 |
illery | -2.106 |
ody | -2.073 |
Token | . |
Token ID | 13 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
�� | +2.693 |
sqor | +2.624 |
capacity | +2.364 |
ゴ | +2.340 |
ALSE | +2.292 |
Neg logit contributions | |
arial | -2.342 |
nce | -2.260 |
utton | -2.250 |
illery | -2.195 |
ody | -2.191 |
Token | So |
Token ID | 1406 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
arial | +0.114 |
nce | +0.111 |
utton | +0.110 |
ody | +0.106 |
illery | +0.106 |
Neg logit contributions | |
�� | -0.166 |
sqor | -0.160 |
capacity | -0.146 |
ゴ | -0.145 |
ALSE | -0.141 |
Token | pay |
Token ID | 1414 |
Feature activation | +2.41e-02 |
Pos logit contributions | |
�� | +0.117 |
sqor | +0.112 |
capacity | +0.103 |
ゴ | +0.103 |
ALSE | +0.100 |
Neg logit contributions | |
arial | -0.082 |
nce | -0.079 |
utton | -0.079 |
ody | -0.076 |
illery | -0.076 |
Token | Health |
Token ID | 3893 |
Feature activation | +9.40e-02 |
Pos logit contributions | |
�� | +3.558 |
sqor | +3.547 |
capacity | +3.211 |
Sisters | +3.125 |
ゴ | +3.115 |
Neg logit contributions | |
arial | -3.943 |
utton | -3.810 |
nce | -3.803 |
illery | -3.743 |
ody | -3.691 |
Token | Organization |
Token ID | 12275 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
�� | +0.700 |
sqor | +0.681 |
capacity | +0.629 |
ゴ | +0.625 |
Sisters | +0.609 |
Neg logit contributions | |
arial | -0.427 |
nce | -0.413 |
utton | -0.409 |
ody | -0.394 |
illery | -0.394 |
Token | . |
Token ID | 13 |
Feature activation | +6.10e-01 |
Pos logit contributions | |
�� | +3.243 |
sqor | +3.192 |
capacity | +2.869 |
ゴ | +2.832 |
Sisters | +2.780 |
Neg logit contributions | |
arial | -2.933 |
utton | -2.845 |
nce | -2.834 |
ody | -2.756 |
illery | -2.752 |
Token | In |
Token ID | 554 |
Feature activation | +6.49e-01 |
Pos logit contributions | |
�� | +3.576 |
sqor | +3.509 |
capacity | +3.208 |
ゴ | +3.140 |
Sisters | +3.106 |
Neg logit contributions | |
arial | -3.582 |
utton | -3.497 |
nce | -3.465 |
ody | -3.397 |
illery | -3.392 |
Token | juries |
Token ID | 47496 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
�� | +4.186 |
sqor | +4.118 |
capacity | +3.836 |
ゴ | +3.708 |
Sisters | +3.631 |
Neg logit contributions | |
arial | -3.393 |
utton | -3.325 |
nce | -3.295 |
illery | -3.245 |
ody | -3.241 |
Token | and |
Token ID | 290 |
Feature activation | +1.49e+00 |
Pos logit contributions | |
�� | +4.697 |
sqor | +4.669 |
capacity | +4.177 |
ゴ | +4.109 |
Sisters | +4.030 |
Neg logit contributions | |
arial | -4.413 |
utton | -4.308 |
nce | -4.256 |
illery | -4.160 |
ody | -4.136 |
Token | violence |
Token ID | 3685 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
sqor | +7.947 |
�� | +7.908 |
capacity | +7.473 |
Sisters | +7.076 |
SIG | +6.941 |
Neg logit contributions | |
arial | -8.405 |
illery | -7.971 |
utton | -7.970 |
ody | -7.915 |
nce | -7.832 |
Token | : |
Token ID | 25 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
�� | +6.929 |
sqor | +6.909 |
capacity | +6.346 |
ゴ | +6.154 |
Sisters | +5.946 |
Neg logit contributions | |
arial | -7.046 |
utton | -6.973 |
illery | -6.753 |
nce | -6.737 |
ody | -6.612 |
Token | the |
Token ID | 262 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
�� | +2.623 |
sqor | +2.551 |
capacity | +2.324 |
ゴ | +2.293 |
Sisters | +2.223 |
Neg logit contributions | |
arial | -2.195 |
utton | -2.125 |
nce | -2.123 |
ody | -2.066 |
illery | -2.060 |
Token | facts |
Token ID | 6419 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
�� | +0.773 |
sqor | +0.743 |
ゴ | +0.669 |
capacity | +0.667 |
ALSE | +0.652 |
Neg logit contributions | |
arial | -0.655 |
nce | -0.642 |
utton | -0.634 |
ody | -0.619 |
illery | -0.610 |
Token | . |
Token ID | 13 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
arial | +1.243 |
nce | +1.191 |
utton | +1.178 |
ody | +1.162 |
illery | +1.152 |
Neg logit contributions | |
�� | -1.508 |
sqor | -1.449 |
capacity | -1.317 |
ゴ | -1.308 |
ALSE | -1.275 |
Token | so |
Token ID | 523 |
Feature activation | +2.42e-02 |
Pos logit contributions | |
�� | +0.739 |
sqor | +0.711 |
capacity | +0.644 |
ゴ | +0.643 |
ALSE | +0.624 |
Neg logit contributions | |
arial | -0.586 |
nce | -0.567 |
utton | -0.566 |
ody | -0.553 |
illery | -0.547 |
Token | their |
Token ID | 511 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
�� | +0.175 |
sqor | +0.168 |
ゴ | +0.154 |
capacity | +0.153 |
ALSE | +0.148 |
Neg logit contributions | |
arial | -0.119 |
nce | -0.114 |
utton | -0.114 |
ody | -0.112 |
illery | -0.110 |
Token | teams |
Token ID | 3466 |
Feature activation | -9.79e-02 |
Pos logit contributions | |
�� | +1.579 |
sqor | +1.526 |
capacity | +1.383 |
ゴ | +1.375 |
ALSE | +1.336 |
Neg logit contributions | |
arial | -1.284 |
nce | -1.246 |
utton | -1.242 |
ody | -1.208 |
illery | -1.199 |
Token | are |
Token ID | 389 |
Feature activation | -2.06e-02 |
Pos logit contributions | |
arial | +0.514 |
nce | +0.496 |
utton | +0.491 |
ody | +0.484 |
illery | +0.479 |
Neg logit contributions | |
�� | -0.681 |
sqor | -0.657 |
ゴ | -0.591 |
capacity | -0.589 |
ALSE | -0.574 |
Token | manufacturing |
Token ID | 9138 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
arial | +0.108 |
nce | +0.104 |
utton | +0.103 |
ody | +0.101 |
illery | +0.099 |
Neg logit contributions | |
�� | -0.143 |
sqor | -0.139 |
ゴ | -0.125 |
capacity | -0.124 |
ALSE | -0.121 |
Token | all |
Token ID | 477 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
�� | +1.719 |
sqor | +1.666 |
capacity | +1.514 |
ゴ | +1.500 |
ALSE | +1.463 |
Neg logit contributions | |
arial | -1.392 |
nce | -1.351 |
utton | -1.348 |
ody | -1.308 |
illery | -1.304 |
Token | kinds |
Token ID | 6982 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
sqor | +6.202 |
�� | +5.856 |
capacity | +5.234 |
Sisters | +5.227 |
ゴ | +5.079 |
Neg logit contributions | |
arial | -10.042 |
nce | -9.915 |
utton | -9.713 |
illery | -9.644 |
izer | -9.446 |
Token | of |
Token ID | 286 |
Feature activation | +5.23e-01 |
Pos logit contributions | |
�� | +1.326 |
sqor | +1.270 |
capacity | +1.142 |
ゴ | +1.139 |
ALSE | +1.105 |
Neg logit contributions | |
arial | -1.138 |
nce | -1.103 |
utton | -1.099 |
ody | -1.071 |
illery | -1.062 |
Token | ways |
Token ID | 2842 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
�� | +3.017 |
sqor | +2.920 |
capacity | +2.650 |
ゴ | +2.600 |
Sisters | +2.554 |
Neg logit contributions | |
arial | -3.143 |
nce | -3.088 |
utton | -3.069 |
illery | -2.987 |
ody | -2.981 |
Token | for |
Token ID | 329 |
Feature activation | +2.51e-01 |
Pos logit contributions | |
arial | +0.573 |
nce | +0.557 |
utton | +0.554 |
ody | +0.536 |
illery | +0.535 |
Neg logit contributions | |
�� | -0.842 |
sqor | -0.820 |
capacity | -0.748 |
ゴ | -0.742 |
ALSE | -0.724 |
Token | them |
Token ID | 606 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
�� | +1.558 |
sqor | +1.493 |
capacity | +1.369 |
ゴ | +1.326 |
Sisters | +1.323 |
Neg logit contributions | |
arial | -1.426 |
utton | -1.393 |
nce | -1.372 |
illery | -1.351 |
ody | -1.340 |
Token | 001 |
Token ID | 8298 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
arial | +1.514 |
nce | +1.469 |
utton | +1.466 |
ody | +1.416 |
illery | +1.394 |
Neg logit contributions | |
�� | -2.819 |
sqor | -2.740 |
capacity | -2.507 |
ゴ | -2.505 |
ALSE | -2.446 |
Token | f |
Token ID | 69 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
�� | +3.530 |
sqor | +3.426 |
capacity | +3.226 |
ゴ | +3.130 |
Sisters | +2.982 |
Neg logit contributions | |
arial | -2.776 |
utton | -2.654 |
nce | -2.632 |
ody | -2.579 |
illery | -2.568 |
Token | 1 |
Token ID | 16 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
�� | +4.113 |
sqor | +3.964 |
capacity | +3.753 |
ゴ | +3.637 |
ALSE | +3.580 |
Neg logit contributions | |
arial | -2.929 |
utton | -2.758 |
nce | -2.727 |
illery | -2.710 |
ody | -2.632 |
Token | f |
Token ID | 69 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
�� | +4.788 |
sqor | +4.752 |
capacity | +4.446 |
ゴ | +4.311 |
Sisters | +4.165 |
Neg logit contributions | |
arial | -3.621 |
utton | -3.461 |
nce | -3.432 |
illery | -3.373 |
ody | -3.365 |
Token | 4 |
Token ID | 19 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
�� | +3.372 |
sqor | +3.215 |
capacity | +3.033 |
ALSE | +2.908 |
ゴ | +2.888 |
Neg logit contributions | |
arial | -2.587 |
utton | -2.445 |
nce | -2.439 |
illery | -2.433 |
izer | -2.341 |
Token | b |
Token ID | 65 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
sqor | +6.002 |
�� | +5.942 |
capacity | +5.720 |
ゴ | +5.409 |
jam | +5.244 |
Neg logit contributions | |
arial | -6.601 |
utton | -6.348 |
illery | -6.261 |
nce | -6.239 |
ody | -6.060 |
Token | be |
Token ID | 1350 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
sqor | +4.697 |
capacity | +4.675 |
�� | +4.430 |
ゴ | +4.006 |
jam | +3.972 |
Neg logit contributions | |
arial | -11.214 |
utton | -10.735 |
illery | -10.732 |
nce | -10.558 |
issance | -10.378 |
Token | 66 |
Token ID | 2791 |
Feature activation | +2.85e-01 |
Pos logit contributions | |
�� | +4.419 |
sqor | +4.362 |
capacity | +4.115 |
ゴ | +4.048 |
ALSE | +3.932 |
Neg logit contributions | |
arial | -2.280 |
utton | -2.163 |
nce | -2.161 |
illery | -2.092 |
ody | -2.058 |
Token | power |
Token ID | 1176 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
�� | +1.713 |
sqor | +1.657 |
capacity | +1.482 |
ゴ | +1.463 |
ALSE | +1.429 |
Neg logit contributions | |
arial | -1.701 |
nce | -1.644 |
utton | -1.642 |
illery | -1.605 |
ody | -1.600 |
Token | off |
Token ID | 572 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
arial | +1.560 |
nce | +1.517 |
utton | +1.501 |
ody | +1.466 |
illery | +1.434 |
Neg logit contributions | |
�� | -2.255 |
sqor | -2.186 |
ゴ | -1.987 |
capacity | -1.987 |
ALSE | -1.926 |
Token |
|
Token ID | 198 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
arial | +1.298 |
nce | +1.266 |
utton | +1.256 |
ody | +1.227 |
illery | +1.204 |
Neg logit contributions | |
�� | -1.665 |
sqor | -1.604 |
ゴ | -1.458 |
capacity | -1.456 |
ALSE | -1.408 |
Token | the |
Token ID | 262 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
�� | +2.742 |
sqor | +2.674 |
capacity | +2.474 |
ゴ | +2.469 |
ALSE | +2.395 |
Neg logit contributions | |
arial | -1.550 |
nce | -1.501 |
utton | -1.485 |
illery | -1.434 |
ody | -1.429 |
Token | relevant |
Token ID | 5981 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
�� | +1.624 |
sqor | +1.570 |
capacity | +1.431 |
ゴ | +1.424 |
ALSE | +1.386 |
Neg logit contributions | |
arial | -1.167 |
nce | -1.131 |
utton | -1.125 |
ody | -1.094 |
illery | -1.084 |
Token | portion |
Token ID | 6903 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
arial | +0.056 |
nce | +0.054 |
utton | +0.053 |
ody | +0.051 |
illery | +0.050 |
Neg logit contributions | |
�� | -0.103 |
sqor | -0.100 |
capacity | -0.092 |
ゴ | -0.091 |
ALSE | -0.089 |
Token | of |
Token ID | 286 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
�� | +0.732 |
sqor | +0.708 |
capacity | +0.637 |
ゴ | +0.635 |
ALSE | +0.615 |
Neg logit contributions | |
arial | -0.670 |
nce | -0.652 |
utton | -0.650 |
ody | -0.633 |
illery | -0.629 |
Token | which |
Token ID | 543 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
�� | +1.251 |
sqor | +1.210 |
capacity | +1.115 |
ゴ | +1.105 |
ALSE | +1.079 |
Neg logit contributions | |
arial | -0.882 |
utton | -0.850 |
nce | -0.847 |
illery | -0.822 |
ody | -0.816 |
Token | reads |
Token ID | 9743 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
�� | +1.801 |
sqor | +1.748 |
capacity | +1.603 |
ゴ | +1.595 |
ALSE | +1.555 |
Neg logit contributions | |
arial | -1.122 |
nce | -1.083 |
utton | -1.078 |
ody | -1.044 |
illery | -1.036 |
Token | : |
Token ID | 25 |
Feature activation | +7.47e-01 |
Pos logit contributions | |
�� | +7.027 |
sqor | +6.831 |
capacity | +6.024 |
ゴ | +5.992 |
ALSE | +5.935 |
Neg logit contributions | |
arial | -8.838 |
nce | -8.702 |
utton | -8.482 |
illery | -8.434 |
izer | -8.231 |
Token |
|
Token ID | 198 |
Feature activation | +5.84e-01 |
Pos logit contributions | |
�� | +4.187 |
sqor | +4.011 |
capacity | +3.692 |
ゴ | +3.598 |
Sisters | +3.540 |
Neg logit contributions | |
arial | -4.506 |
nce | -4.410 |
utton | -4.375 |
illery | -4.268 |
ody | -4.241 |
Token |
|
Token ID | 198 |
Feature activation | +6.03e-01 |
Pos logit contributions | |
�� | +3.335 |
sqor | +3.312 |
capacity | +3.083 |
ゴ | +3.010 |
ALSE | +2.920 |
Neg logit contributions | |
arial | -3.393 |
utton | -3.335 |
nce | -3.308 |
ody | -3.244 |
illery | -3.223 |
Token | He |
Token ID | 1544 |
Feature activation | +3.40e-01 |
Pos logit contributions | |
�� | +3.898 |
sqor | +3.743 |
capacity | +3.484 |
ゴ | +3.434 |
ALSE | +3.336 |
Neg logit contributions | |
arial | -3.258 |
utton | -3.170 |
nce | -3.165 |
illery | -3.066 |
ody | -3.055 |
Token | ( |
Token ID | 357 |
Feature activation | -1.51e-01 |
Pos logit contributions | |
�� | +2.368 |
sqor | +2.288 |
capacity | +2.110 |
ゴ | +2.092 |
ALSE | +2.033 |
Neg logit contributions | |
arial | -1.699 |
nce | -1.639 |
utton | -1.638 |
ody | -1.586 |
illery | -1.585 |
Token |
|
Token ID | 198 |
Feature activation | +5.91e-02 |
Pos logit contributions | |
�� | +1.124 |
sqor | +1.088 |
capacity | +0.989 |
ゴ | +0.984 |
ALSE | +0.957 |
Neg logit contributions | |
arial | -0.859 |
nce | -0.833 |
utton | -0.830 |
ody | -0.807 |
illery | -0.801 |
Token |
|
Token ID | 198 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
�� | +0.420 |
sqor | +0.401 |
ゴ | +0.361 |
capacity | +0.359 |
ALSE | +0.350 |
Neg logit contributions | |
arial | -0.305 |
nce | -0.295 |
utton | -0.291 |
ody | -0.283 |
illery | -0.281 |
Token | Sound |
Token ID | 21369 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
�� | +0.172 |
sqor | +0.168 |
capacity | +0.149 |
ゴ | +0.148 |
Sisters | +0.144 |
Neg logit contributions | |
arial | -0.132 |
nce | -0.127 |
utton | -0.126 |
ody | -0.123 |
illery | -0.121 |
Token | tracks |
Token ID | 46074 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
arial | +1.637 |
nce | +1.602 |
utton | +1.580 |
ody | +1.565 |
illery | +1.557 |
Neg logit contributions | |
�� | -1.371 |
sqor | -1.304 |
ゴ | -1.136 |
capacity | -1.135 |
ALSE | -1.102 |
Token | [ |
Token ID | 685 |
Feature activation | +4.71e-01 |
Pos logit contributions | |
�� | +0.864 |
sqor | +0.839 |
capacity | +0.759 |
ゴ | +0.754 |
ALSE | +0.733 |
Neg logit contributions | |
arial | -0.701 |
nce | -0.681 |
utton | -0.680 |
ody | -0.658 |
illery | -0.655 |
Token | edit |
Token ID | 4370 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
�� | +2.453 |
sqor | +2.379 |
capacity | +2.122 |
ゴ | +2.089 |
ALSE | +2.012 |
Neg logit contributions | |
arial | -3.146 |
nce | -3.066 |
utton | -3.065 |
ody | -3.004 |
illery | -2.984 |
Token | ] |
Token ID | 2361 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
sqor | +4.002 |
capacity | +3.708 |
�� | +3.698 |
ゴ | +3.577 |
jam | +3.378 |
Neg logit contributions | |
utton | -11.204 |
arial | -11.200 |
nce | -11.195 |
illery | -11.143 |
ody | -11.115 |
Token |
|
Token ID | 198 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
�� | +3.178 |
sqor | +3.116 |
capacity | +2.833 |
ゴ | +2.825 |
Sisters | +2.738 |
Neg logit contributions | |
arial | -3.248 |
utton | -3.179 |
nce | -3.174 |
ody | -3.096 |
illery | -3.060 |
Token |
|
Token ID | 198 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
�� | +0.363 |
sqor | +0.346 |
ゴ | +0.312 |
capacity | +0.311 |
ALSE | +0.303 |
Neg logit contributions | |
arial | -0.266 |
nce | -0.257 |
utton | -0.254 |
ody | -0.247 |
illery | -0.246 |
Token | Various |
Token ID | 40009 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
�� | +0.296 |
sqor | +0.288 |
capacity | +0.256 |
ゴ | +0.253 |
Sisters | +0.247 |
Neg logit contributions | |
arial | -0.237 |
nce | -0.229 |
utton | -0.227 |
ody | -0.223 |
illery | -0.219 |
Token | sound |
Token ID | 2128 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
arial | +0.958 |
nce | +0.923 |
utton | +0.918 |
ody | +0.897 |
illery | +0.880 |
Neg logit contributions | |
�� | -1.244 |
sqor | -1.184 |
capacity | -1.083 |
ゴ | -1.073 |
ALSE | -1.041 |
Token | bribery |
Token ID | 37388 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
�� | +1.884 |
sqor | +1.833 |
capacity | +1.665 |
ゴ | +1.648 |
ALSE | +1.611 |
Neg logit contributions | |
arial | -1.561 |
nce | -1.515 |
utton | -1.514 |
ody | -1.468 |
illery | -1.465 |
Token | . |
Token ID | 13 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
arial | +1.491 |
nce | +1.454 |
utton | +1.444 |
ody | +1.410 |
illery | +1.382 |
Neg logit contributions | |
�� | -2.053 |
sqor | -1.958 |
capacity | -1.798 |
ゴ | -1.784 |
ALSE | -1.724 |
Token | On |
Token ID | 1550 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
�� | +1.515 |
sqor | +1.465 |
capacity | +1.334 |
ゴ | +1.327 |
ALSE | +1.291 |
Neg logit contributions | |
arial | -1.106 |
nce | -1.072 |
utton | -1.067 |
ody | -1.036 |
illery | -1.029 |
Token | the |
Token ID | 262 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
arial | +0.888 |
nce | +0.864 |
utton | +0.855 |
ody | +0.832 |
illery | +0.821 |
Neg logit contributions | |
�� | -1.414 |
sqor | -1.369 |
capacity | -1.252 |
ゴ | -1.251 |
ALSE | -1.218 |
Token | other |
Token ID | 584 |
Feature activation | +8.06e-01 |
Pos logit contributions | |
�� | +0.882 |
sqor | +0.854 |
capacity | +0.773 |
ゴ | +0.767 |
ALSE | +0.746 |
Neg logit contributions | |
arial | -0.732 |
nce | -0.710 |
utton | -0.708 |
ody | -0.688 |
illery | -0.685 |
Token | hand |
Token ID | 1021 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
sqor | +3.760 |
�� | +3.759 |
capacity | +3.199 |
ALSE | +3.049 |
ゴ | +3.046 |
Neg logit contributions | |
arial | -5.548 |
nce | -5.456 |
utton | -5.376 |
illery | -5.362 |
issance | -5.136 |
Token | , |
Token ID | 11 |
Feature activation | +6.26e-01 |
Pos logit contributions | |
�� | +6.172 |
sqor | +5.880 |
Sisters | +4.948 |
capacity | +4.945 |
ゴ | +4.854 |
Neg logit contributions | |
arial | -9.307 |
nce | -9.211 |
utton | -8.959 |
ody | -8.744 |
illery | -8.712 |
Token | the |
Token ID | 262 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
�� | +4.089 |
sqor | +4.021 |
capacity | +3.659 |
ゴ | +3.564 |
Sisters | +3.546 |
Neg logit contributions | |
arial | -3.305 |
nce | -3.192 |
utton | -3.178 |
ody | -3.081 |
illery | -3.072 |
Token | Sent |
Token ID | 11352 |
Feature activation | -8.58e-02 |
Pos logit contributions | |
arial | +0.533 |
nce | +0.522 |
utton | +0.514 |
ody | +0.501 |
illery | +0.495 |
Neg logit contributions | |
�� | -0.775 |
sqor | -0.744 |
ゴ | -0.684 |
capacity | -0.678 |
ALSE | -0.661 |
Token | encing |
Token ID | 9532 |
Feature activation | -5.45e-02 |
Pos logit contributions | |
arial | +0.244 |
nce | +0.229 |
utton | +0.228 |
ody | +0.217 |
illery | +0.213 |
Neg logit contributions | |
�� | -0.794 |
sqor | -0.773 |
capacity | -0.720 |
ゴ | -0.719 |
ALSE | -0.703 |
Token | Guidelines |
Token ID | 31072 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
arial | +0.312 |
nce | +0.303 |
utton | +0.302 |
ody | +0.295 |
illery | +0.293 |
Neg logit contributions | |
�� | -0.344 |
sqor | -0.332 |
capacity | -0.299 |
ゴ | -0.297 |
ALSE | -0.289 |
Token | continues |
Token ID | 4477 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
�� | +3.258 |
sqor | +3.161 |
capacity | +2.886 |
ゴ | +2.866 |
ALSE | +2.795 |
Neg logit contributions | |
arial | -2.266 |
nce | -2.190 |
utton | -2.184 |
ody | -2.119 |
illery | -2.105 |
Token | playing |
Token ID | 2712 |
Feature activation | +5.31e-03 |
Pos logit contributions | |
�� | +2.898 |
sqor | +2.839 |
capacity | +2.576 |
ゴ | +2.559 |
ALSE | +2.488 |
Neg logit contributions | |
arial | -2.033 |
utton | -1.958 |
nce | -1.955 |
illery | -1.908 |
ody | -1.901 |
Token | next |
Token ID | 1306 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
�� | +0.036 |
sqor | +0.034 |
capacity | +0.031 |
ゴ | +0.031 |
ALSE | +0.030 |
Neg logit contributions | |
arial | -0.028 |
nce | -0.028 |
utton | -0.027 |
ody | -0.027 |
illery | -0.027 |
Token | season |
Token ID | 1622 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
�� | +1.200 |
sqor | +1.164 |
capacity | +1.049 |
ゴ | +1.041 |
ALSE | +1.005 |
Neg logit contributions | |
arial | -1.159 |
nce | -1.130 |
utton | -1.129 |
illery | -1.099 |
ody | -1.099 |
Token | as |
Token ID | 355 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
arial | +0.875 |
nce | +0.852 |
utton | +0.846 |
ody | +0.831 |
illery | +0.815 |
Neg logit contributions | |
�� | -1.032 |
sqor | -0.996 |
capacity | -0.900 |
ゴ | -0.899 |
ALSE | -0.870 |
Token | he |
Token ID | 339 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
�� | +0.943 |
sqor | +0.915 |
capacity | +0.838 |
ゴ | +0.831 |
ALSE | +0.809 |
Neg logit contributions | |
arial | -0.656 |
nce | -0.633 |
utton | -0.631 |
ody | -0.612 |
illery | -0.608 |
Token | has |
Token ID | 468 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
sqor | +8.147 |
�� | +8.121 |
capacity | +7.617 |
decomp | +7.521 |
Sisters | +7.359 |
Neg logit contributions | |
arial | -6.905 |
illery | -6.793 |
nce | -6.727 |
utton | -6.722 |
ody | -6.595 |
Token | the |
Token ID | 262 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
�� | +5.845 |
sqor | +5.757 |
capacity | +5.238 |
ゴ | +5.026 |
Sisters | +4.983 |
Neg logit contributions | |
arial | -5.740 |
utton | -5.613 |
nce | -5.550 |
illery | -5.502 |
ody | -5.356 |
Token | last |
Token ID | 938 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
�� | +1.882 |
sqor | +1.831 |
capacity | +1.661 |
ゴ | +1.630 |
Sisters | +1.593 |
Neg logit contributions | |
arial | -1.588 |
utton | -1.530 |
nce | -1.527 |
illery | -1.485 |
ody | -1.480 |
Token | few |
Token ID | 1178 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
�� | +1.728 |
sqor | +1.672 |
capacity | +1.517 |
ゴ | +1.507 |
ALSE | +1.465 |
Neg logit contributions | |
arial | -1.392 |
nce | -1.350 |
utton | -1.346 |
ody | -1.308 |
illery | -1.300 |
Token | , |
Token ID | 11 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
�� | +0.633 |
sqor | +0.610 |
capacity | +0.549 |
ゴ | +0.546 |
ALSE | +0.530 |
Neg logit contributions | |
arial | -0.579 |
nce | -0.563 |
utton | -0.560 |
ody | -0.546 |
illery | -0.542 |
Token | uk |
Token ID | 2724 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
�� | +0.762 |
sqor | +0.738 |
capacity | +0.671 |
ゴ | +0.667 |
ALSE | +0.649 |
Neg logit contributions | |
arial | -0.584 |
nce | -0.565 |
utton | -0.563 |
ody | -0.547 |
illery | -0.543 |
Token | hand |
Token ID | 1021 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
arial | +0.839 |
utton | +0.818 |
nce | +0.818 |
ody | +0.793 |
illery | +0.789 |
Neg logit contributions | |
�� | -1.079 |
sqor | -1.039 |
capacity | -0.944 |
ゴ | -0.943 |
ALSE | -0.917 |
Token | out |
Token ID | 448 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
�� | +0.769 |
sqor | +0.736 |
ゴ | +0.654 |
capacity | +0.653 |
ALSE | +0.634 |
Neg logit contributions | |
arial | -0.829 |
nce | -0.809 |
utton | -0.806 |
ody | -0.788 |
illery | -0.782 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.17e-01 |
Pos logit contributions | |
�� | +0.768 |
sqor | +0.741 |
capacity | +0.673 |
ゴ | +0.669 |
ALSE | +0.650 |
Neg logit contributions | |
arial | -0.619 |
nce | -0.601 |
utton | -0.598 |
ody | -0.582 |
illery | -0.578 |
Token | Or |
Token ID | 5574 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
�� | +1.423 |
sqor | +1.374 |
capacity | +1.245 |
ゴ | +1.238 |
ALSE | +1.203 |
Neg logit contributions | |
arial | -1.182 |
nce | -1.148 |
utton | -1.144 |
ody | -1.113 |
illery | -1.106 |
Token | at |
Token ID | 379 |
Feature activation | +1.37e+00 |
Pos logit contributions | |
arial | +0.099 |
nce | +0.096 |
utton | +0.096 |
ody | +0.093 |
illery | +0.092 |
Neg logit contributions | |
�� | -0.123 |
sqor | -0.118 |
capacity | -0.107 |
ゴ | -0.107 |
ALSE | -0.104 |
Token | least |
Token ID | 1551 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
�� | +5.692 |
sqor | +5.518 |
capacity | +4.877 |
Sisters | +4.786 |
ゴ | +4.572 |
Neg logit contributions | |
arial | -9.917 |
utton | -9.456 |
nce | -9.373 |
illery | -9.342 |
izer | -9.130 |
Token | 26 |
Token ID | 2608 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
�� | +3.633 |
sqor | +3.531 |
capacity | +3.179 |
ゴ | +3.144 |
Sisters | +3.109 |
Neg logit contributions | |
arial | -3.084 |
nce | -2.995 |
utton | -2.989 |
ody | -2.884 |
illery | -2.875 |
Token | of |
Token ID | 286 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
�� | +1.168 |
sqor | +1.127 |
capacity | +1.024 |
ゴ | +1.018 |
ALSE | +0.989 |
Neg logit contributions | |
arial | -0.930 |
nce | -0.904 |
utton | -0.901 |
ody | -0.876 |
illery | -0.869 |
Token | 27 |
Token ID | 2681 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
�� | +1.811 |
sqor | +1.756 |
capacity | +1.598 |
ゴ | +1.580 |
Sisters | +1.541 |
Neg logit contributions | |
arial | -1.439 |
utton | -1.388 |
nce | -1.385 |
ody | -1.346 |
illery | -1.341 |
Token | : |
Token ID | 25 |
Feature activation | -4.71e-02 |
Pos logit contributions | |
�� | +1.740 |
sqor | +1.684 |
capacity | +1.523 |
ゴ | +1.513 |
ALSE | +1.472 |
Neg logit contributions | |
arial | -1.455 |
nce | -1.412 |
utton | -1.407 |
ody | -1.370 |
illery | -1.361 |
Token | you |
Token ID | 345 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
�� | +1.616 |
sqor | +1.564 |
capacity | +1.421 |
ゴ | +1.412 |
ALSE | +1.373 |
Neg logit contributions | |
arial | -1.277 |
nce | -1.237 |
utton | -1.235 |
ody | -1.198 |
illery | -1.194 |
Token | on |
Token ID | 319 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
arial | +1.039 |
nce | +1.015 |
utton | +1.004 |
ody | +0.988 |
illery | +0.953 |
Neg logit contributions | |
�� | -1.520 |
sqor | -1.452 |
capacity | -1.322 |
ゴ | -1.318 |
ALSE | -1.285 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e-03 |
Pos logit contributions | |
�� | +1.012 |
sqor | +0.980 |
capacity | +0.893 |
ゴ | +0.888 |
ALSE | +0.864 |
Neg logit contributions | |
arial | -0.729 |
nce | -0.706 |
utton | -0.703 |
ody | -0.683 |
illery | -0.678 |
Token | front |
Token ID | 2166 |
Feature activation | +5.91e-01 |
Pos logit contributions | |
�� | +0.007 |
sqor | +0.007 |
capacity | +0.006 |
ゴ | +0.006 |
ALSE | +0.006 |
Neg logit contributions | |
arial | -0.005 |
nce | -0.005 |
utton | -0.005 |
ody | -0.005 |
illery | -0.005 |
Token | page |
Token ID | 2443 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
�� | +4.027 |
sqor | +3.969 |
capacity | +3.626 |
ゴ | +3.621 |
ALSE | +3.513 |
Neg logit contributions | |
arial | -2.907 |
nce | -2.837 |
utton | -2.793 |
ody | -2.693 |
illery | -2.681 |
Token | but |
Token ID | 475 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
�� | +0.788 |
sqor | +0.760 |
capacity | +0.688 |
ゴ | +0.684 |
ALSE | +0.664 |
Neg logit contributions | |
arial | -0.664 |
nce | -0.644 |
utton | -0.642 |
ody | -0.626 |
illery | -0.621 |
Token | rather |
Token ID | 2138 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
sqor | +7.069 |
�� | +6.973 |
Sisters | +6.360 |
capacity | +6.304 |
ALSE | +6.091 |
Neg logit contributions | |
arial | -7.831 |
utton | -7.726 |
nce | -7.672 |
illery | -7.526 |
ody | -7.354 |
Token | that |
Token ID | 326 |
Feature activation | +3.12e-01 |
Pos logit contributions | |
sqor | +6.711 |
�� | +6.708 |
Sisters | +6.010 |
capacity | +5.995 |
ALSE | +5.810 |
Neg logit contributions | |
arial | -7.079 |
utton | -6.937 |
nce | -6.911 |
illery | -6.762 |
ody | -6.606 |
Token | they |
Token ID | 484 |
Feature activation | +4.29e-01 |
Pos logit contributions | |
�� | +2.117 |
sqor | +2.053 |
capacity | +1.868 |
ゴ | +1.854 |
ALSE | +1.807 |
Neg logit contributions | |
arial | -1.623 |
utton | -1.570 |
nce | -1.569 |
ody | -1.521 |
illery | -1.511 |
Token | were |
Token ID | 547 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
�� | +2.674 |
sqor | +2.593 |
capacity | +2.337 |
ゴ | +2.313 |
ALSE | +2.252 |
Neg logit contributions | |
arial | -2.451 |
nce | -2.376 |
utton | -2.374 |
ody | -2.308 |
illery | -2.298 |
Token | stupid |
Token ID | 8531 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
�� | +1.571 |
sqor | +1.521 |
capacity | +1.379 |
ゴ | +1.368 |
ALSE | +1.329 |
Neg logit contributions | |
arial | -1.327 |
nce | -1.287 |
utton | -1.285 |
ody | -1.250 |
illery | -1.242 |
Token | | |
Token ID | 91 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
arial | +0.505 |
nce | +0.482 |
utton | +0.475 |
ody | +0.456 |
illery | +0.449 |
Neg logit contributions | |
�� | -1.141 |
sqor | -1.099 |
ゴ | -1.004 |
capacity | -1.000 |
ALSE | -0.980 |
Token | ex |
Token ID | 1069 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
�� | +0.071 |
sqor | +0.068 |
capacity | +0.062 |
ゴ | +0.062 |
ALSE | +0.060 |
Neg logit contributions | |
arial | -0.053 |
nce | -0.051 |
utton | -0.051 |
ody | -0.049 |
illery | -0.049 |
Token | : |
Token ID | 25 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
arial | +0.889 |
nce | +0.865 |
utton | +0.859 |
ody | +0.834 |
izer | +0.831 |
Neg logit contributions | |
�� | -0.986 |
sqor | -0.927 |
ゴ | -0.825 |
capacity | -0.813 |
ALSE | -0.799 |
Token | } |
Token ID | 92 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
arial | +1.373 |
nce | +1.331 |
utton | +1.326 |
ody | +1.289 |
illery | +1.280 |
Neg logit contributions | |
�� | -1.796 |
sqor | -1.737 |
capacity | -1.580 |
ゴ | -1.571 |
ALSE | -1.527 |
Token | the |
Token ID | 262 |
Feature activation | +7.66e-01 |
Pos logit contributions | |
�� | +1.579 |
sqor | +1.527 |
capacity | +1.398 |
ゴ | +1.387 |
ALSE | +1.355 |
Neg logit contributions | |
arial | -1.179 |
nce | -1.141 |
utton | -1.137 |
ody | -1.107 |
illery | -1.099 |
Token | string |
Token ID | 4731 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
�� | +3.198 |
sqor | +3.106 |
capacity | +2.703 |
ゴ | +2.602 |
ALSE | +2.535 |
Neg logit contributions | |
arial | -5.764 |
nce | -5.614 |
utton | -5.570 |
ody | -5.520 |
illery | -5.510 |
Token | " |
Token ID | 366 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
�� | +5.537 |
sqor | +5.298 |
capacity | +4.726 |
sql | +4.667 |
ALSE | +4.631 |
Neg logit contributions | |
utton | -9.244 |
arial | -9.206 |
nce | -9.135 |
illery | -9.009 |
ody | -8.951 |
Token | vi |
Token ID | 8903 |
Feature activation | +2.93e-01 |
Pos logit contributions | |
�� | +1.846 |
sqor | +1.789 |
capacity | +1.645 |
ゴ | +1.634 |
ALSE | +1.587 |
Neg logit contributions | |
arial | -1.256 |
utton | -1.220 |
nce | -1.214 |
ody | -1.180 |
illery | -1.179 |
Token | : |
Token ID | 25 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
�� | +1.521 |
sqor | +1.445 |
ゴ | +1.304 |
capacity | +1.303 |
ALSE | +1.254 |
Neg logit contributions | |
arial | -1.944 |
nce | -1.909 |
utton | -1.909 |
illery | -1.863 |
ody | -1.862 |
Token | ", |
Token ID | 1600 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
�� | +0.834 |
sqor | +0.801 |
capacity | +0.735 |
ゴ | +0.731 |
ALSE | +0.706 |
Neg logit contributions | |
arial | -0.657 |
utton | -0.641 |
nce | -0.637 |
ody | -0.623 |
illery | -0.621 |
Token | " |
Token ID | 366 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
�� | +1.600 |
sqor | +1.535 |
capacity | +1.368 |
ゴ | +1.362 |
ALSE | +1.316 |
Neg logit contributions | |
arial | -1.664 |
nce | -1.621 |
utton | -1.614 |
ody | -1.576 |
illery | -1.565 |
Token | adolescence |
Token ID | 37258 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
�� | +1.444 |
sqor | +1.399 |
capacity | +1.275 |
ゴ | +1.267 |
ALSE | +1.232 |
Neg logit contributions | |
arial | -1.060 |
nce | -1.025 |
utton | -1.022 |
ody | -0.992 |
illery | -0.987 |
Token | . |
Token ID | 764 |
Feature activation | +5.71e-01 |
Pos logit contributions | |
�� | +1.954 |
sqor | +1.892 |
capacity | +1.706 |
ゴ | +1.701 |
ALSE | +1.644 |
Neg logit contributions | |
arial | -1.810 |
nce | -1.761 |
utton | -1.745 |
ody | -1.700 |
illery | -1.696 |
Token | Journal |
Token ID | 4913 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
�� | +3.435 |
sqor | +3.304 |
capacity | +3.006 |
ゴ | +3.000 |
Sisters | +2.968 |
Neg logit contributions | |
arial | -3.330 |
nce | -3.226 |
utton | -3.196 |
ody | -3.134 |
illery | -3.122 |
Token | of |
Token ID | 286 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
�� | +1.719 |
sqor | +1.657 |
capacity | +1.495 |
ゴ | +1.486 |
ALSE | +1.440 |
Neg logit contributions | |
arial | -1.541 |
nce | -1.498 |
utton | -1.493 |
ody | -1.455 |
illery | -1.444 |
Token | Youth |
Token ID | 17582 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
�� | +2.340 |
sqor | +2.237 |
capacity | +2.038 |
ゴ | +2.012 |
Sisters | +1.981 |
Neg logit contributions | |
arial | -2.145 |
nce | -2.080 |
utton | -2.066 |
illery | -2.019 |
ody | -2.001 |
Token | and |
Token ID | 290 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
�� | +1.626 |
sqor | +1.561 |
capacity | +1.426 |
ゴ | +1.407 |
Sisters | +1.360 |
Neg logit contributions | |
arial | -1.607 |
nce | -1.532 |
utton | -1.531 |
illery | -1.497 |
ody | -1.474 |
Token | Ad |
Token ID | 1215 |
Feature activation | +6.48e-01 |
Pos logit contributions | |
�� | +5.241 |
Sisters | +4.934 |
sqor | +4.760 |
SAS | +4.336 |
capacity | +4.290 |
Neg logit contributions | |
arial | -9.737 |
nce | -9.469 |
illery | -9.168 |
utton | -9.072 |
issance | -9.044 |
Token | olesc |
Token ID | 16850 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
�� | +4.129 |
sqor | +3.850 |
capacity | +3.687 |
ゴ | +3.623 |
Sisters | +3.513 |
Neg logit contributions | |
arial | -3.463 |
nce | -3.356 |
utton | -3.266 |
illery | -3.173 |
ody | -3.146 |
Token | ence |
Token ID | 594 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
�� | +2.655 |
sqor | +2.604 |
capacity | +2.434 |
ゴ | +2.375 |
Sisters | +2.329 |
Neg logit contributions | |
arial | -1.691 |
utton | -1.566 |
nce | -1.563 |
illery | -1.514 |
ody | -1.502 |
Token | , |
Token ID | 11 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
�� | +2.700 |
sqor | +2.479 |
ゴ | +2.258 |
capacity | +2.244 |
Sisters | +2.209 |
Neg logit contributions | |
arial | -3.462 |
nce | -3.336 |
utton | -3.329 |
illery | -3.238 |
ody | -3.155 |
Token | 39 |
Token ID | 5014 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
�� | +2.017 |
sqor | +1.946 |
capacity | +1.766 |
ゴ | +1.759 |
ALSE | +1.710 |
Neg logit contributions | |
arial | -1.473 |
nce | -1.427 |
utton | -1.420 |
ody | -1.380 |
illery | -1.369 |
Token | : |
Token ID | 25 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
�� | +0.309 |
sqor | +0.292 |
ゴ | +0.261 |
capacity | +0.259 |
ALSE | +0.250 |
Neg logit contributions | |
arial | -0.301 |
nce | -0.293 |
utton | -0.291 |
ody | -0.284 |
illery | -0.282 |
Token | US |
Token ID | 1294 |
Feature activation | -3.75e-01 |
Pos logit contributions | |
arial | +1.673 |
nce | +1.633 |
utton | +1.624 |
ody | +1.586 |
illery | +1.576 |
Neg logit contributions | |
�� | -1.596 |
sqor | -1.535 |
capacity | -1.373 |
ゴ | -1.365 |
ALSE | -1.318 |
Token | Department |
Token ID | 2732 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
arial | +1.631 |
nce | +1.582 |
utton | +1.554 |
ody | +1.515 |
illery | +1.503 |
Neg logit contributions | |
�� | -2.889 |
sqor | -2.790 |
capacity | -2.567 |
ゴ | -2.564 |
ALSE | -2.497 |
Token | of |
Token ID | 286 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
�� | +1.303 |
sqor | +1.253 |
capacity | +1.128 |
ゴ | +1.123 |
ALSE | +1.089 |
Neg logit contributions | |
arial | -1.157 |
nce | -1.124 |
utton | -1.120 |
ody | -1.091 |
illery | -1.084 |
Token | Health |
Token ID | 3893 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
�� | +1.658 |
sqor | +1.606 |
capacity | +1.465 |
ゴ | +1.422 |
Sisters | +1.420 |
Neg logit contributions | |
arial | -1.739 |
nce | -1.696 |
utton | -1.693 |
ody | -1.641 |
illery | -1.639 |
Token | and |
Token ID | 290 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
arial | +0.767 |
utton | +0.747 |
nce | +0.743 |
ody | +0.729 |
illery | +0.718 |
Neg logit contributions | |
�� | -0.996 |
sqor | -0.947 |
ゴ | -0.863 |
capacity | -0.852 |
ALSE | -0.839 |
Token | Human |
Token ID | 5524 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
sqor | +7.377 |
Sisters | +7.224 |
�� | +7.067 |
capacity | +6.785 |
SIG | +6.737 |
Neg logit contributions | |
arial | -7.178 |
utton | -7.027 |
illery | -6.932 |
nce | -6.884 |
issance | -6.789 |
Token | Services |
Token ID | 6168 |
Feature activation | -4.23e-01 |
Pos logit contributions | |
�� | +1.820 |
sqor | +1.759 |
capacity | +1.592 |
ゴ | +1.570 |
Sisters | +1.531 |
Neg logit contributions | |
arial | -1.742 |
nce | -1.695 |
utton | -1.692 |
ody | -1.649 |
illery | -1.642 |
Token | , |
Token ID | 11 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
arial | +2.492 |
nce | +2.419 |
utton | +2.415 |
ody | +2.357 |
illery | +2.342 |
Neg logit contributions | |
�� | -2.603 |
sqor | -2.503 |
capacity | -2.252 |
ゴ | -2.240 |
ALSE | -2.172 |
Token | CDC |
Token ID | 20434 |
Feature activation | -3.63e-02 |
Pos logit contributions | |
arial | +2.544 |
nce | +2.492 |
utton | +2.472 |
ody | +2.419 |
illery | +2.405 |
Neg logit contributions | |
�� | -1.904 |
sqor | -1.815 |
capacity | -1.597 |
ゴ | -1.590 |
ALSE | -1.520 |
Token | ; |
Token ID | 26 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
arial | +0.210 |
nce | +0.204 |
utton | +0.204 |
ody | +0.198 |
illery | +0.197 |
Neg logit contributions | |
�� | -0.226 |
sqor | -0.219 |
capacity | -0.197 |
ゴ | -0.195 |
ALSE | -0.190 |
Token | ultimate |
Token ID | 8713 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
arial | +0.397 |
nce | +0.386 |
utton | +0.382 |
ody | +0.374 |
illery | +0.369 |
Neg logit contributions | |
�� | -0.578 |
sqor | -0.554 |
ゴ | -0.508 |
capacity | -0.499 |
ALSE | -0.490 |
Token | goals |
Token ID | 4661 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
�� | +2.555 |
sqor | +2.494 |
capacity | +2.308 |
ゴ | +2.285 |
ALSE | +2.240 |
Neg logit contributions | |
arial | -1.268 |
nce | -1.216 |
utton | -1.213 |
ody | -1.165 |
illery | -1.158 |
Token | of |
Token ID | 286 |
Feature activation | +4.06e-01 |
Pos logit contributions | |
arial | +0.680 |
nce | +0.659 |
utton | +0.657 |
ody | +0.644 |
illery | +0.637 |
Neg logit contributions | |
�� | -0.810 |
sqor | -0.781 |
capacity | -0.708 |
ゴ | -0.708 |
ALSE | -0.685 |
Token | preventing |
Token ID | 12174 |
Feature activation | +6.81e-01 |
Pos logit contributions | |
�� | +2.403 |
sqor | +2.331 |
capacity | +2.102 |
ゴ | +2.066 |
ALSE | +2.010 |
Neg logit contributions | |
arial | -2.448 |
nce | -2.386 |
utton | -2.381 |
ody | -2.316 |
illery | -2.314 |
Token | injuries |
Token ID | 6821 |
Feature activation | +4.61e-01 |
Pos logit contributions | |
�� | +3.789 |
sqor | +3.717 |
capacity | +3.324 |
ゴ | +3.219 |
ALSE | +3.167 |
Neg logit contributions | |
arial | -4.220 |
utton | -4.134 |
nce | -4.116 |
illery | -4.040 |
ody | -4.006 |
Token | and |
Token ID | 290 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
�� | +2.892 |
sqor | +2.818 |
capacity | +2.542 |
ゴ | +2.500 |
ALSE | +2.440 |
Neg logit contributions | |
arial | -2.586 |
utton | -2.525 |
nce | -2.518 |
illery | -2.445 |
ody | -2.422 |
Token | deaths |
Token ID | 7040 |
Feature activation | +7.39e-01 |
Pos logit contributions | |
sqor | +6.780 |
�� | +6.767 |
capacity | +6.322 |
decomp | +6.010 |
incapac | +5.991 |
Neg logit contributions | |
arial | -7.724 |
utton | -7.639 |
nce | -7.624 |
illery | -7.601 |
ody | -7.510 |
Token | . |
Token ID | 13 |
Feature activation | +4.66e-02 |
Pos logit contributions | |
�� | +4.514 |
sqor | +4.449 |
capacity | +3.983 |
ゴ | +3.917 |
ALSE | +3.829 |
Neg logit contributions | |
arial | -4.077 |
utton | -4.046 |
nce | -4.003 |
illery | -3.895 |
ody | -3.865 |
Token |
|
Token ID | 198 |
Feature activation | +5.92e-02 |
Pos logit contributions | |
�� | +0.327 |
sqor | +0.314 |
ゴ | +0.282 |
capacity | +0.281 |
ALSE | +0.274 |
Neg logit contributions | |
arial | -0.241 |
nce | -0.234 |
utton | -0.232 |
ody | -0.225 |
illery | -0.224 |
Token |
|
Token ID | 198 |
Feature activation | -3.04e-02 |
Pos logit contributions | |
�� | +0.413 |
sqor | +0.395 |
ゴ | +0.357 |
capacity | +0.355 |
ALSE | +0.345 |
Neg logit contributions | |
arial | -0.310 |
nce | -0.300 |
utton | -0.297 |
ody | -0.289 |
illery | -0.287 |
Token | Community |
Token ID | 20012 |
Feature activation | +7.69e-01 |
Pos logit contributions | |
arial | +0.162 |
nce | +0.156 |
utton | +0.155 |
ody | +0.152 |
illery | +0.148 |
Neg logit contributions | |
�� | -0.210 |
sqor | -0.203 |
ゴ | -0.178 |
capacity | -0.176 |
Sisters | -0.174 |
Token |
|
Token ID | 198 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
�� | +1.333 |
sqor | +1.294 |
capacity | +1.166 |
ゴ | +1.160 |
Sisters | +1.123 |
Neg logit contributions | |
arial | -1.251 |
nce | -1.224 |
utton | -1.213 |
ody | -1.191 |
illery | -1.172 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
arial | +0.134 |
nce | +0.130 |
utton | +0.128 |
ody | +0.124 |
illery | +0.123 |
Neg logit contributions | |
�� | -0.192 |
sqor | -0.182 |
ゴ | -0.164 |
capacity | -0.163 |
ALSE | -0.159 |
Token | Video |
Token ID | 10798 |
Feature activation | +7.84e-02 |
Pos logit contributions | |
arial | +0.593 |
nce | +0.571 |
utton | +0.568 |
ody | +0.553 |
illery | +0.543 |
Neg logit contributions | |
�� | -0.739 |
sqor | -0.718 |
capacity | -0.628 |
ゴ | -0.627 |
Sisters | -0.616 |
Token | games |
Token ID | 1830 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
�� | +0.528 |
sqor | +0.510 |
capacity | +0.462 |
ゴ | +0.460 |
ALSE | +0.446 |
Neg logit contributions | |
arial | -0.418 |
nce | -0.407 |
utton | -0.405 |
ody | -0.394 |
illery | -0.390 |
Token | [ |
Token ID | 685 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
�� | +1.479 |
sqor | +1.435 |
capacity | +1.300 |
ゴ | +1.285 |
ALSE | +1.251 |
Neg logit contributions | |
arial | -1.243 |
nce | -1.206 |
utton | -1.206 |
ody | -1.170 |
illery | -1.163 |
Token | edit |
Token ID | 4370 |
Feature activation | +1.30e+00 |
Pos logit contributions | |
�� | +2.072 |
sqor | +2.004 |
capacity | +1.786 |
ゴ | +1.762 |
ALSE | +1.699 |
Neg logit contributions | |
arial | -2.627 |
nce | -2.558 |
utton | -2.556 |
ody | -2.505 |
illery | -2.489 |
Token | ] |
Token ID | 2361 |
Feature activation | +4.93e-01 |
Pos logit contributions | |
sqor | +3.931 |
�� | +3.661 |
capacity | +3.589 |
ゴ | +3.485 |
jam | +3.314 |
Neg logit contributions | |
arial | -10.143 |
nce | -10.122 |
utton | -10.061 |
illery | -10.041 |
ody | -10.005 |
Token |
|
Token ID | 198 |
Feature activation | +1.79e-01 |
Pos logit contributions | |
�� | +2.854 |
sqor | +2.756 |
ゴ | +2.499 |
capacity | +2.483 |
Sisters | +2.408 |
Neg logit contributions | |
arial | -2.919 |
nce | -2.867 |
utton | -2.842 |
ody | -2.799 |
illery | -2.731 |
Token |
|
Token ID | 198 |
Feature activation | -9.65e-03 |
Pos logit contributions | |
�� | +1.215 |
sqor | +1.169 |
capacity | +1.055 |
ゴ | +1.052 |
ALSE | +1.023 |
Neg logit contributions | |
arial | -0.950 |
nce | -0.920 |
utton | -0.915 |
ody | -0.890 |
illery | -0.884 |
Token | In |
Token ID | 818 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
arial | +0.053 |
nce | +0.051 |
utton | +0.051 |
ody | +0.050 |
illery | +0.049 |
Neg logit contributions | |
�� | -0.064 |
sqor | -0.063 |
capacity | -0.055 |
ゴ | -0.055 |
Sisters | -0.053 |
Token | the |
Token ID | 262 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
arial | +0.938 |
nce | +0.914 |
utton | +0.902 |
ody | +0.882 |
illery | +0.872 |
Neg logit contributions | |
�� | -1.295 |
sqor | -1.256 |
capacity | -1.129 |
ゴ | -1.128 |
ALSE | -1.109 |
Token | of |
Token ID | 286 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
�� | +2.873 |
sqor | +2.784 |
capacity | +2.504 |
ゴ | +2.502 |
Sisters | +2.416 |
Neg logit contributions | |
arial | -2.438 |
nce | -2.385 |
utton | -2.358 |
illery | -2.283 |
ody | -2.273 |
Token | feeling |
Token ID | 4203 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
�� | +1.047 |
sqor | +1.012 |
capacity | +0.917 |
ゴ | +0.911 |
ALSE | +0.885 |
Neg logit contributions | |
arial | -0.867 |
nce | -0.841 |
utton | -0.839 |
ody | -0.816 |
illery | -0.810 |
Token | both |
Token ID | 1111 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
�� | +1.991 |
sqor | +1.919 |
capacity | +1.719 |
ゴ | +1.708 |
ALSE | +1.655 |
Neg logit contributions | |
arial | -1.972 |
nce | -1.918 |
utton | -1.914 |
ody | -1.865 |
illery | -1.855 |
Token | massive |
Token ID | 4858 |
Feature activation | +4.11e-01 |
Pos logit contributions | |
�� | +2.931 |
sqor | +2.846 |
capacity | +2.558 |
ゴ | +2.546 |
Sisters | +2.477 |
Neg logit contributions | |
arial | -2.597 |
nce | -2.523 |
utton | -2.515 |
illery | -2.438 |
ody | -2.433 |
Token | and |
Token ID | 290 |
Feature activation | +6.34e-01 |
Pos logit contributions | |
�� | +2.520 |
sqor | +2.450 |
capacity | +2.207 |
ゴ | +2.192 |
ALSE | +2.114 |
Neg logit contributions | |
arial | -2.399 |
nce | -2.327 |
utton | -2.317 |
ody | -2.259 |
illery | -2.251 |
Token | compact |
Token ID | 16001 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
�� | +3.785 |
sqor | +3.693 |
capacity | +3.292 |
ゴ | +3.242 |
Sisters | +3.159 |
Neg logit contributions | |
arial | -3.777 |
utton | -3.653 |
nce | -3.647 |
illery | -3.529 |
ody | -3.520 |
Token | , |
Token ID | 11 |
Feature activation | +3.87e-01 |
Pos logit contributions | |
�� | +7.519 |
sqor | +7.390 |
capacity | +6.657 |
ゴ | +6.643 |
ALSE | +6.345 |
Neg logit contributions | |
arial | -7.167 |
nce | -6.965 |
utton | -6.910 |
illery | -6.714 |
ody | -6.650 |
Token | with |
Token ID | 351 |
Feature activation | -4.60e-02 |
Pos logit contributions | |
�� | +2.569 |
sqor | +2.494 |
capacity | +2.264 |
ゴ | +2.249 |
ALSE | +2.178 |
Neg logit contributions | |
arial | -2.076 |
nce | -2.013 |
utton | -2.002 |
ody | -1.945 |
illery | -1.932 |
Token | a |
Token ID | 257 |
Feature activation | -8.85e-02 |
Pos logit contributions | |
arial | +0.230 |
nce | +0.223 |
utton | +0.222 |
ody | +0.216 |
illery | +0.214 |
Neg logit contributions | |
�� | -0.325 |
sqor | -0.312 |
capacity | -0.285 |
ゴ | -0.284 |
ALSE | -0.278 |
Token | clear |
Token ID | 1598 |
Feature activation | -4.28e-02 |
Pos logit contributions | |
arial | +0.501 |
nce | +0.490 |
utton | +0.485 |
ody | +0.471 |
illery | +0.470 |
Neg logit contributions | |
�� | -0.566 |
sqor | -0.542 |
ゴ | -0.490 |
capacity | -0.489 |
ALSE | -0.478 |
Token | purpose |
Token ID | 4007 |
Feature activation | -2.68e-01 |
Pos logit contributions | |
arial | +0.219 |
nce | +0.214 |
utton | +0.211 |
ody | +0.206 |
illery | +0.203 |
Neg logit contributions | |
�� | -0.298 |
sqor | -0.287 |
capacity | -0.263 |
ゴ | -0.262 |
ALSE | -0.255 |
Token | have |
Token ID | 423 |
Feature activation | +5.64e-01 |
Pos logit contributions | |
�� | +2.991 |
sqor | +2.918 |
capacity | +2.651 |
ゴ | +2.615 |
Sisters | +2.550 |
Neg logit contributions | |
arial | -2.367 |
utton | -2.289 |
nce | -2.278 |
ody | -2.221 |
illery | -2.208 |
Token | anything |
Token ID | 1997 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
�� | +3.746 |
sqor | +3.661 |
capacity | +3.354 |
ゴ | +3.264 |
Sisters | +3.243 |
Neg logit contributions | |
arial | -2.905 |
utton | -2.819 |
illery | -2.778 |
nce | -2.769 |
ody | -2.690 |
Token | more |
Token ID | 517 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
�� | +2.147 |
sqor | +2.101 |
capacity | +1.912 |
ゴ | +1.896 |
ALSE | +1.849 |
Neg logit contributions | |
arial | -1.474 |
utton | -1.432 |
nce | -1.421 |
illery | -1.378 |
ody | -1.367 |
Token | serious |
Token ID | 2726 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
�� | +1.646 |
sqor | +1.605 |
capacity | +1.468 |
ゴ | +1.456 |
ALSE | +1.418 |
Neg logit contributions | |
arial | -1.097 |
utton | -1.058 |
nce | -1.057 |
illery | -1.020 |
ody | -1.018 |
Token | than |
Token ID | 621 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
�� | +2.226 |
sqor | +2.189 |
capacity | +1.993 |
ゴ | +1.973 |
ALSE | +1.925 |
Neg logit contributions | |
arial | -1.512 |
utton | -1.469 |
nce | -1.455 |
illery | -1.423 |
ody | -1.409 |
Token | he |
Token ID | 339 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
�� | +1.564 |
sqor | +1.517 |
capacity | +1.383 |
ゴ | +1.371 |
ALSE | +1.337 |
Neg logit contributions | |
arial | -1.164 |
nce | -1.127 |
utton | -1.125 |
ody | -1.089 |
illery | -1.087 |
Token | had |
Token ID | 550 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
sqor | +6.844 |
�� | +6.743 |
decomp | +6.344 |
capacity | +6.339 |
Sisters | +6.216 |
Neg logit contributions | |
utton | -7.280 |
arial | -7.261 |
illery | -7.139 |
nce | -6.999 |
ody | -6.763 |
Token | . |
Token ID | 13 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
sqor | +6.333 |
�� | +6.177 |
capacity | +5.649 |
decomp | +5.579 |
Sisters | +5.577 |
Neg logit contributions | |
arial | -5.805 |
utton | -5.705 |
illery | -5.561 |
nce | -5.464 |
ody | -5.286 |
Token | But |
Token ID | 887 |
Feature activation | +4.26e-01 |
Pos logit contributions | |
�� | +1.936 |
sqor | +1.878 |
capacity | +1.718 |
ゴ | +1.708 |
ALSE | +1.664 |
Neg logit contributions | |
arial | -1.367 |
nce | -1.318 |
utton | -1.317 |
ody | -1.277 |
illery | -1.267 |
Token | the |
Token ID | 262 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
�� | +2.846 |
sqor | +2.778 |
capacity | +2.518 |
ゴ | +2.482 |
ALSE | +2.443 |
Neg logit contributions | |
arial | -2.240 |
utton | -2.166 |
nce | -2.144 |
ody | -2.091 |
illery | -2.086 |
Token | game |
Token ID | 983 |
Feature activation | +1.27e-01 |
Pos logit contributions | |
�� | +0.199 |
sqor | +0.192 |
ゴ | +0.177 |
capacity | +0.176 |
ALSE | +0.172 |
Neg logit contributions | |
arial | -0.124 |
nce | -0.122 |
utton | -0.119 |
ody | -0.116 |
illery | -0.115 |
Token | best |
Token ID | 1266 |
Feature activation | +9.38e-02 |
Pos logit contributions | |
arial | +1.095 |
utton | +1.058 |
nce | +1.055 |
ody | +1.023 |
illery | +1.005 |
Neg logit contributions | |
�� | -1.941 |
sqor | -1.879 |
capacity | -1.733 |
ゴ | -1.713 |
ALSE | -1.682 |
Token | to |
Token ID | 284 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
�� | +0.679 |
sqor | +0.655 |
ゴ | +0.599 |
capacity | +0.591 |
Sisters | +0.580 |
Neg logit contributions | |
arial | -0.450 |
nce | -0.443 |
utton | -0.429 |
illery | -0.423 |
ody | -0.418 |
Token | take |
Token ID | 1011 |
Feature activation | +1.09e-03 |
Pos logit contributions | |
�� | +0.799 |
sqor | +0.774 |
capacity | +0.710 |
ゴ | +0.704 |
ALSE | +0.689 |
Neg logit contributions | |
arial | -0.504 |
nce | -0.487 |
utton | -0.486 |
ody | -0.470 |
illery | -0.464 |
Token | advantage |
Token ID | 4621 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
�� | +0.008 |
sqor | +0.007 |
capacity | +0.007 |
ゴ | +0.007 |
ALSE | +0.007 |
Neg logit contributions | |
arial | -0.005 |
nce | -0.005 |
utton | -0.005 |
ody | -0.005 |
illery | -0.005 |
Token | of |
Token ID | 286 |
Feature activation | +2.87e-01 |
Pos logit contributions | |
�� | +1.542 |
sqor | +1.476 |
ゴ | +1.317 |
capacity | +1.293 |
Sisters | +1.260 |
Neg logit contributions | |
arial | -1.577 |
nce | -1.547 |
utton | -1.535 |
illery | -1.498 |
ody | -1.485 |
Token | Re |
Token ID | 797 |
Feature activation | +1.29e+00 |
Pos logit contributions | |
�� | +1.838 |
sqor | +1.776 |
capacity | +1.610 |
ゴ | +1.602 |
Sisters | +1.547 |
Neg logit contributions | |
arial | -1.603 |
nce | -1.557 |
utton | -1.547 |
illery | -1.506 |
ody | -1.503 |
Token | origin |
Token ID | 47103 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
�� | +8.319 |
sqor | +8.083 |
capacity | +7.946 |
ゴ | +7.462 |
Sisters | +7.253 |
Neg logit contributions | |
arial | -6.157 |
utton | -5.874 |
nce | -5.784 |
izer | -5.708 |
ody | -5.690 |
Token | while |
Token ID | 981 |
Feature activation | +5.33e-01 |
Pos logit contributions | |
�� | +2.091 |
sqor | +2.023 |
capacity | +1.828 |
ゴ | +1.819 |
ALSE | +1.762 |
Neg logit contributions | |
arial | -1.763 |
nce | -1.705 |
utton | -1.693 |
ody | -1.646 |
illery | -1.642 |
Token | avoiding |
Token ID | 14928 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
�� | +3.498 |
sqor | +3.363 |
ゴ | +3.061 |
capacity | +3.051 |
Sisters | +2.976 |
Neg logit contributions | |
arial | -2.877 |
nce | -2.782 |
utton | -2.765 |
ody | -2.700 |
illery | -2.698 |
Token | its |
Token ID | 663 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
�� | +2.115 |
sqor | +2.049 |
capacity | +1.865 |
ゴ | +1.855 |
ALSE | +1.800 |
Neg logit contributions | |
arial | -1.588 |
nce | -1.538 |
utton | -1.532 |
ody | -1.486 |
illery | -1.479 |
Token | steep |
Token ID | 14559 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
arial | +1.207 |
utton | +1.180 |
nce | +1.178 |
ody | +1.150 |
illery | +1.132 |
Neg logit contributions | |
�� | -1.542 |
sqor | -1.464 |
ゴ | -1.327 |
capacity | -1.321 |
ALSE | -1.294 |
Token | x |
Token ID | 87 |
Feature activation | -4.56e-02 |
Pos logit contributions | |
�� | +0.178 |
sqor | +0.174 |
capacity | +0.156 |
ゴ | +0.155 |
ALSE | +0.149 |
Neg logit contributions | |
arial | -0.173 |
nce | -0.167 |
utton | -0.166 |
illery | -0.162 |
ody | -0.162 |
Token | 001 |
Token ID | 8298 |
Feature activation | +6.45e-01 |
Pos logit contributions | |
arial | +0.204 |
nce | +0.197 |
utton | +0.196 |
ody | +0.190 |
illery | +0.188 |
Neg logit contributions | |
�� | -0.344 |
sqor | -0.334 |
capacity | -0.307 |
ゴ | -0.305 |
ALSE | -0.298 |
Token | f |
Token ID | 69 |
Feature activation | +7.01e-01 |
Pos logit contributions | |
�� | +4.138 |
sqor | +4.074 |
capacity | +3.818 |
ゴ | +3.710 |
ALSE | +3.525 |
Neg logit contributions | |
arial | -3.364 |
utton | -3.196 |
nce | -3.170 |
ody | -3.107 |
illery | -3.087 |
Token | 1 |
Token ID | 16 |
Feature activation | +7.87e-01 |
Pos logit contributions | |
�� | +4.744 |
sqor | +4.612 |
capacity | +4.344 |
ゴ | +4.227 |
ALSE | +4.143 |
Neg logit contributions | |
arial | -3.442 |
utton | -3.219 |
nce | -3.196 |
illery | -3.156 |
ody | -3.086 |
Token | f |
Token ID | 69 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
sqor | +5.125 |
�� | +5.111 |
capacity | +4.806 |
ゴ | +4.634 |
Sisters | +4.478 |
Neg logit contributions | |
arial | -3.972 |
utton | -3.779 |
nce | -3.749 |
illery | -3.684 |
ody | -3.679 |
Token | 4 |
Token ID | 19 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
�� | +3.759 |
sqor | +3.636 |
capacity | +3.395 |
ALSE | +3.262 |
ゴ | +3.255 |
Neg logit contributions | |
arial | -2.953 |
nce | -2.778 |
utton | -2.769 |
illery | -2.760 |
izer | -2.678 |
Token | b |
Token ID | 65 |
Feature activation | +1.52e+00 |
Pos logit contributions | |
sqor | +6.615 |
�� | +6.375 |
capacity | +6.328 |
ゴ | +5.898 |
jam | +5.788 |
Neg logit contributions | |
arial | -7.779 |
utton | -7.403 |
illery | -7.317 |
nce | -7.260 |
issance | -7.129 |
Token | be |
Token ID | 1350 |
Feature activation | +5.73e-01 |
Pos logit contributions | |
sqor | +4.776 |
capacity | +4.757 |
�� | +4.376 |
jam | +4.041 |
ゴ | +4.036 |
Neg logit contributions | |
arial | -11.737 |
illery | -11.181 |
utton | -11.166 |
nce | -10.982 |
issance | -10.863 |
Token | 66 |
Token ID | 2791 |
Feature activation | +4.22e-01 |
Pos logit contributions | |
�� | +4.394 |
sqor | +4.361 |
capacity | +4.103 |
ゴ | +4.024 |
ALSE | +3.899 |
Neg logit contributions | |
arial | -2.306 |
nce | -2.185 |
utton | -2.169 |
illery | -2.106 |
ody | -2.073 |
Token | . |
Token ID | 13 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
�� | +2.693 |
sqor | +2.624 |
capacity | +2.364 |
ゴ | +2.340 |
ALSE | +2.292 |
Neg logit contributions | |
arial | -2.342 |
nce | -2.260 |
utton | -2.250 |
illery | -2.195 |
ody | -2.191 |
Token | So |
Token ID | 1406 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
arial | +0.114 |
nce | +0.111 |
utton | +0.110 |
ody | +0.106 |
illery | +0.106 |
Neg logit contributions | |
�� | -0.166 |
sqor | -0.160 |
capacity | -0.146 |
ゴ | -0.145 |
ALSE | -0.141 |
Token | will |
Token ID | 481 |
Feature activation | -5.97e-02 |
Pos logit contributions | |
�� | +1.262 |
sqor | +1.226 |
capacity | +1.121 |
ゴ | +1.113 |
ALSE | +1.085 |
Neg logit contributions | |
arial | -0.856 |
nce | -0.826 |
utton | -0.825 |
ody | -0.800 |
illery | -0.794 |
Token | happen |
Token ID | 1645 |
Feature activation | -3.45e-02 |
Pos logit contributions | |
arial | +0.292 |
nce | +0.287 |
utton | +0.281 |
ody | +0.273 |
illery | +0.270 |
Neg logit contributions | |
�� | -0.430 |
sqor | -0.413 |
capacity | -0.377 |
ゴ | -0.376 |
ALSE | -0.367 |
Token | within |
Token ID | 1626 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
arial | +0.171 |
nce | +0.167 |
utton | +0.164 |
ody | +0.161 |
illery | +0.158 |
Neg logit contributions | |
�� | -0.246 |
sqor | -0.237 |
capacity | -0.217 |
ゴ | -0.216 |
ALSE | -0.209 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
arial | +0.532 |
nce | +0.522 |
utton | +0.513 |
ody | +0.504 |
illery | +0.492 |
Neg logit contributions | |
�� | -0.809 |
sqor | -0.779 |
ゴ | -0.716 |
capacity | -0.709 |
ALSE | -0.692 |
Token | blink |
Token ID | 21019 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
arial | +0.530 |
nce | +0.520 |
utton | +0.511 |
ody | +0.499 |
illery | +0.491 |
Neg logit contributions | |
�� | -0.719 |
sqor | -0.690 |
ゴ | -0.633 |
capacity | -0.628 |
ALSE | -0.612 |
Token | of |
Token ID | 286 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
arial | +2.136 |
nce | +2.078 |
utton | +2.067 |
ody | +2.018 |
illery | +1.997 |
Neg logit contributions | |
�� | -2.426 |
sqor | -2.343 |
capacity | -2.109 |
ゴ | -2.096 |
ALSE | -2.039 |
Token | an |
Token ID | 281 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
arial | +6.359 |
ody | +6.096 |
nce | +5.756 |
izer | +5.730 |
utton | +5.719 |
Neg logit contributions | |
�� | -12.990 |
sqor | -12.513 |
ゴ | -11.449 |
ALSE | -11.358 |
capacity | -11.255 |
Token | eye |
Token ID | 4151 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
arial | +4.188 |
ody | +4.010 |
izer | +3.679 |
utton | +3.475 |
nce | +3.229 |
Neg logit contributions | |
�� | -13.339 |
sqor | -12.710 |
ゴ | -12.218 |
capacity | -11.391 |
ALSE | -11.321 |
Token | . |
Token ID | 13 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
arial | +4.158 |
nce | +4.125 |
utton | +3.990 |
ody | +3.956 |
izer | +3.879 |
Neg logit contributions | |
�� | -6.792 |
sqor | -6.379 |
ゴ | -5.944 |
capacity | -5.916 |
ALSE | -5.756 |
Token | Everything |
Token ID | 11391 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
arial | +0.690 |
nce | +0.677 |
utton | +0.656 |
ody | +0.642 |
illery | +0.640 |
Neg logit contributions | |
�� | -1.093 |
sqor | -1.043 |
capacity | -0.944 |
ゴ | -0.941 |
ALSE | -0.918 |
Token | will |
Token ID | 481 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
�� | +1.331 |
sqor | +1.292 |
capacity | +1.180 |
ゴ | +1.174 |
ALSE | +1.142 |
Neg logit contributions | |
arial | -0.918 |
nce | -0.888 |
utton | -0.887 |
ody | -0.858 |
illery | -0.853 |
Token | / |
Token ID | 14 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
arial | +4.125 |
nce | +4.039 |
utton | +4.015 |
ody | +3.941 |
izer | +3.880 |
Neg logit contributions | |
�� | -7.095 |
sqor | -6.592 |
ゴ | -5.955 |
Sisters | -5.877 |
ALSE | -5.811 |
Token | AUT |
Token ID | 39371 |
Feature activation | -6.55e-01 |
Pos logit contributions | |
nce | +4.818 |
ody | +4.621 |
utton | +4.585 |
arial | +4.520 |
izer | +4.359 |
Neg logit contributions | |
sqor | -7.641 |
�� | -7.426 |
ゴ | -6.696 |
Sisters | -6.680 |
capacity | -6.672 |
Token | OC |
Token ID | 4503 |
Feature activation | -8.20e-01 |
Pos logit contributions | |
arial | +3.239 |
utton | +3.187 |
ody | +3.138 |
illery | +3.106 |
nce | +2.984 |
Neg logit contributions | |
�� | -4.582 |
sqor | -4.533 |
ゴ | -4.039 |
capacity | -4.010 |
Sisters | -4.003 |
Token | R |
Token ID | 49 |
Feature activation | -4.63e-01 |
Pos logit contributions | |
utton | +2.965 |
arial | +2.909 |
nce | +2.863 |
ody | +2.831 |
izer | +2.735 |
Neg logit contributions | |
�� | -6.501 |
sqor | -6.384 |
ゴ | -6.135 |
Sisters | -5.762 |
capacity | -5.754 |
Token | OP |
Token ID | 3185 |
Feature activation | -8.39e-01 |
Pos logit contributions | |
utton | +2.440 |
nce | +2.337 |
arial | +2.288 |
ody | +2.194 |
illery | +2.156 |
Neg logit contributions | |
�� | -3.254 |
sqor | -3.048 |
ゴ | -2.862 |
capacity | -2.819 |
Sisters | -2.739 |
Token | / |
Token ID | 14 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
nce | +3.543 |
arial | +3.503 |
utton | +3.449 |
ody | +3.368 |
illery | +3.138 |
Neg logit contributions | |
�� | -6.292 |
sqor | -6.275 |
ゴ | -5.874 |
capacity | -5.792 |
Sisters | -5.576 |
Token | h |
Token ID | 71 |
Feature activation | -6.18e-01 |
Pos logit contributions | |
arial | +4.638 |
nce | +4.142 |
ody | +4.092 |
izer | +4.041 |
utton | +3.893 |
Neg logit contributions | |
�� | -13.739 |
sqor | -13.149 |
ゴ | -12.697 |
ALSE | -12.242 |
覚醒 | -11.581 |
Token | 342 |
Token ID | 31575 |
Feature activation | -5.97e-01 |
Pos logit contributions | |
nce | +2.622 |
izer | +2.565 |
utton | +2.540 |
arial | +2.507 |
illery | +2.389 |
Neg logit contributions | |
�� | -4.849 |
sqor | -4.614 |
ゴ | -4.307 |
ALSE | -4.156 |
Sisters | -4.101 |
Token | / |
Token ID | 14 |
Feature activation | -7.21e-01 |
Pos logit contributions | |
arial | +2.673 |
nce | +2.642 |
utton | +2.561 |
illery | +2.502 |
ody | +2.457 |
Neg logit contributions | |
�� | -4.676 |
sqor | -4.298 |
ゴ | -3.951 |
ALSE | -3.889 |
Sisters | -3.867 |
Token | UST |
Token ID | 7759 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
arial | +4.119 |
nce | +3.955 |
utton | +3.951 |
ody | +3.846 |
illery | +3.722 |
Neg logit contributions | |
�� | -4.593 |
sqor | -4.357 |
ゴ | -3.818 |
Sisters | -3.742 |
capacity | -3.733 |
Token | r |
Token ID | 81 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
arial | +2.728 |
utton | +2.637 |
nce | +2.624 |
ody | +2.622 |
illery | +2.558 |
Neg logit contributions | |
�� | -3.544 |
sqor | -3.429 |
capacity | -3.082 |
ゴ | -3.062 |
Sisters | -2.992 |
Token | special |
Token ID | 2041 |
Feature activation | +6.37e-02 |
Pos logit contributions | |
arial | +0.703 |
nce | +0.686 |
utton | +0.681 |
ody | +0.664 |
illery | +0.655 |
Neg logit contributions | |
�� | -1.020 |
sqor | -0.987 |
capacity | -0.902 |
ゴ | -0.897 |
ALSE | -0.874 |
Token | teams |
Token ID | 3466 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
�� | +0.424 |
sqor | +0.410 |
capacity | +0.372 |
ゴ | +0.369 |
ALSE | +0.359 |
Neg logit contributions | |
arial | -0.343 |
nce | -0.333 |
utton | -0.332 |
ody | -0.322 |
illery | -0.320 |
Token | coordinator |
Token ID | 16052 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
arial | +0.721 |
nce | +0.702 |
utton | +0.701 |
ody | +0.679 |
illery | +0.675 |
Neg logit contributions | |
�� | -1.182 |
sqor | -1.144 |
capacity | -1.046 |
ゴ | -1.040 |
ALSE | -1.021 |
Token | D |
Token ID | 360 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
�� | +1.230 |
sqor | +1.195 |
capacity | +1.089 |
ゴ | +1.084 |
ALSE | +1.052 |
Neg logit contributions | |
arial | -0.942 |
utton | -0.912 |
nce | -0.906 |
ody | -0.879 |
illery | -0.876 |
Token | arr |
Token ID | 3258 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
arial | +1.373 |
utton | +1.337 |
nce | +1.334 |
ody | +1.310 |
illery | +1.293 |
Neg logit contributions | |
�� | -1.521 |
sqor | -1.465 |
capacity | -1.315 |
ゴ | -1.305 |
ALSE | -1.261 |
Token | in |
Token ID | 259 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
arial | +2.812 |
nce | +2.788 |
utton | +2.736 |
illery | +2.659 |
ody | +2.645 |
Neg logit contributions | |
�� | -3.469 |
sqor | -3.391 |
capacity | -2.999 |
ゴ | -2.993 |
ALSE | -2.904 |
Token | Simmons |
Token ID | 22553 |
Feature activation | -6.86e-01 |
Pos logit contributions | |
nce | +7.479 |
arial | +7.173 |
utton | +7.033 |
illery | +6.942 |
izer | +6.882 |
Neg logit contributions | |
�� | -10.379 |
sqor | -9.997 |
ALSE | -8.894 |
ゴ | -8.894 |
capacity | -8.680 |
Token | said |
Token ID | 531 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
arial | +3.540 |
nce | +3.495 |
utton | +3.476 |
ody | +3.414 |
izer | +3.379 |
Neg logit contributions | |
�� | -4.581 |
sqor | -4.376 |
capacity | -4.026 |
ゴ | -3.935 |
ALSE | -3.914 |
Token | . |
Token ID | 13 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
arial | +0.630 |
nce | +0.610 |
utton | +0.608 |
ody | +0.592 |
illery | +0.585 |
Neg logit contributions | |
�� | -0.868 |
sqor | -0.838 |
capacity | -0.766 |
ゴ | -0.760 |
ALSE | -0.741 |
Token | � |
Token ID | 564 |
Feature activation | -2.88e-01 |
Pos logit contributions | |
�� | +1.098 |
sqor | +1.064 |
capacity | +0.969 |
ゴ | +0.966 |
ALSE | +0.937 |
Neg logit contributions | |
arial | -0.867 |
utton | -0.838 |
nce | -0.838 |
ody | -0.815 |
illery | -0.809 |
Token | � |
Token ID | 250 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
arial | +1.237 |
nce | +1.191 |
utton | +1.186 |
ody | +1.145 |
illery | +1.134 |
Neg logit contributions | |
�� | -2.234 |
sqor | -2.170 |
capacity | -1.997 |
ゴ | -1.987 |
ALSE | -1.940 |
Token | , |
Token ID | 11 |
Feature activation | -8.33e-02 |
Pos logit contributions | |
arial | +0.357 |
utton | +0.345 |
nce | +0.345 |
ody | +0.339 |
illery | +0.332 |
Neg logit contributions | |
�� | -0.464 |
sqor | -0.446 |
capacity | -0.408 |
ゴ | -0.405 |
ALSE | -0.394 |
Token | this |
Token ID | 428 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
arial | +0.409 |
nce | +0.401 |
utton | +0.399 |
ody | +0.392 |
illery | +0.381 |
Neg logit contributions | |
�� | -0.594 |
sqor | -0.572 |
ゴ | -0.523 |
capacity | -0.521 |
ALSE | -0.503 |
Token | dé |
Token ID | 39073 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
�� | +1.077 |
sqor | +1.044 |
capacity | +0.953 |
ゴ | +0.947 |
ALSE | +0.923 |
Neg logit contributions | |
arial | -0.762 |
nce | -0.737 |
utton | -0.735 |
ody | -0.712 |
illery | -0.708 |
Token | j |
Token ID | 73 |
Feature activation | -6.87e-01 |
Pos logit contributions | |
arial | +0.188 |
nce | +0.184 |
utton | +0.183 |
ody | +0.178 |
illery | +0.177 |
Neg logit contributions | |
�� | -0.202 |
sqor | -0.193 |
capacity | -0.173 |
ゴ | -0.173 |
ALSE | -0.168 |
Token | à |
Token ID | 24247 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
arial | +4.350 |
utton | +4.301 |
ody | +4.241 |
nce | +4.230 |
illery | +4.054 |
Neg logit contributions | |
�� | -3.936 |
sqor | -3.725 |
ゴ | -3.386 |
ALSE | -3.263 |
capacity | -3.163 |
Token | v |
Token ID | 410 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
arial | +1.354 |
nce | +1.326 |
utton | +1.271 |
illery | +1.210 |
ody | +1.206 |
Neg logit contributions | |
�� | -3.837 |
sqor | -3.731 |
ゴ | -3.511 |
capacity | -3.449 |
ALSE | -3.392 |
Token | u |
Token ID | 84 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
utton | +6.247 |
nce | +6.235 |
arial | +6.106 |
ody | +6.082 |
izer | +6.045 |
Neg logit contributions | |
�� | -11.393 |
ゴ | -10.321 |
sqor | -10.262 |
Sisters | -9.557 |
capacity | -9.478 |
Token | isn |
Token ID | 2125 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
arial | +4.251 |
nce | +4.011 |
ody | +3.909 |
utton | +3.877 |
izer | +3.696 |
Neg logit contributions | |
�� | -6.976 |
sqor | -6.678 |
ゴ | -6.039 |
capacity | -6.009 |
ALSE | -5.868 |
Token | � |
Token ID | 447 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
arial | +1.172 |
utton | +1.116 |
nce | +1.109 |
ody | +1.064 |
izer | +1.036 |
Neg logit contributions | |
�� | -2.890 |
sqor | -2.771 |
capacity | -2.528 |
ゴ | -2.526 |
ALSE | -2.464 |
Token | � |
Token ID | 247 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
arial | +0.843 |
nce | +0.836 |
utton | +0.825 |
ody | +0.810 |
illery | +0.792 |
Neg logit contributions | |
�� | -1.111 |
sqor | -1.107 |
capacity | -0.997 |
ゴ | -0.993 |
Sisters | -0.962 |
Token | t |
Token ID | 83 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
arial | +1.034 |
nce | +1.014 |
utton | +0.997 |
ody | +0.975 |
illery | +0.957 |
Neg logit contributions | |
�� | -1.377 |
sqor | -1.321 |
ゴ | -1.191 |
capacity | -1.185 |
ALSE | -1.156 |
Token |
|
Token ID | 198 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
arial | +3.956 |
izer | +3.908 |
nce | +3.885 |
utton | +3.622 |
illery | +3.443 |
Neg logit contributions | |
�� | -9.899 |
sqor | -8.941 |
carbohyd | -8.429 |
ゴ | -8.082 |
satell | -8.053 |
Token | Reddit |
Token ID | 22367 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
nce | +5.426 |
arial | +5.383 |
izer | +5.218 |
utton | +5.214 |
ody | +5.191 |
Neg logit contributions | |
�� | -8.427 |
sqor | -7.948 |
ゴ | -7.233 |
capacity | -7.191 |
cov | -6.965 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
arial | +0.811 |
utton | +0.787 |
nce | +0.786 |
ody | +0.763 |
illery | +0.756 |
Neg logit contributions | |
�� | -1.365 |
sqor | -1.319 |
capacity | -1.207 |
ゴ | -1.201 |
ALSE | -1.173 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +4.402 |
izer | +4.293 |
nce | +4.189 |
utton | +3.872 |
illery | +3.761 |
Neg logit contributions | |
�� | -12.114 |
sqor | -11.019 |
carbohyd | -10.574 |
satell | -10.110 |
ゴ | -9.886 |
Token | Pocket |
Token ID | 45454 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
arial | +5.948 |
nce | +5.894 |
ody | +5.822 |
izer | +5.737 |
utton | +5.577 |
Neg logit contributions | |
�� | -10.861 |
sqor | -10.415 |
capacity | -9.428 |
ゴ | -9.358 |
cov | -9.174 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +0.749 |
nce | +0.732 |
utton | +0.725 |
ody | +0.711 |
illery | +0.704 |
Neg logit contributions | |
�� | -1.288 |
sqor | -1.246 |
capacity | -1.137 |
ゴ | -1.135 |
ALSE | -1.102 |
Token |
|
Token ID | 198 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
izer | +4.567 |
arial | +4.491 |
nce | +4.482 |
utton | +3.994 |
illery | +3.880 |
Neg logit contributions | |
�� | -13.576 |
sqor | -12.314 |
carbohyd | -12.090 |
satell | -11.304 |
practition | -11.123 |
Token | Print |
Token ID | 18557 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
nce | +5.910 |
arial | +5.823 |
ody | +5.724 |
izer | +5.708 |
utton | +5.594 |
Neg logit contributions | |
�� | -10.480 |
sqor | -10.305 |
cov | -9.065 |
ゴ | -9.045 |
capacity | -9.014 |
Token |
|
Token ID | 198 |
Feature activation | -8.74e-01 |
Pos logit contributions | |
�� | +1.437 |
sqor | +1.399 |
capacity | +1.288 |
ゴ | +1.275 |
Sisters | +1.243 |
Neg logit contributions | |
arial | -1.082 |
nce | -1.042 |
utton | -1.036 |
ody | -1.006 |
illery | -0.989 |
Token |
|
Token ID | 198 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
arial | +3.375 |
izer | +3.302 |
nce | +3.270 |
utton | +3.074 |
illery | +3.054 |
Neg logit contributions | |
�� | -7.591 |
sqor | -6.998 |
carbohyd | -6.320 |
ゴ | -6.158 |
cov | -6.116 |
Token | Email |
Token ID | 15333 |
Feature activation | +4.87e-01 |
Pos logit contributions | |
arial | +4.372 |
nce | +4.310 |
izer | +4.261 |
ody | +4.205 |
illery | +4.124 |
Neg logit contributions | |
�� | -6.761 |
sqor | -6.630 |
capacity | -5.764 |
ゴ | -5.626 |
cov | -5.594 |
Token | legraph |
Token ID | 16606 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
nce | +1.023 |
arial | +1.008 |
utton | +0.990 |
ody | +0.926 |
illery | +0.918 |
Neg logit contributions | |
�� | -3.653 |
sqor | -3.514 |
ゴ | -3.290 |
Sisters | -3.216 |
capacity | -3.204 |
Token | . |
Token ID | 13 |
Feature activation | -7.98e-01 |
Pos logit contributions | |
arial | +1.328 |
utton | +1.297 |
nce | +1.291 |
illery | +1.250 |
ody | +1.249 |
Neg logit contributions | |
�� | -2.421 |
sqor | -2.254 |
ゴ | -2.037 |
capacity | -2.019 |
ALSE | -1.994 |
Token | co |
Token ID | 1073 |
Feature activation | -6.55e-01 |
Pos logit contributions | |
arial | +4.210 |
nce | +4.183 |
izer | +4.048 |
utton | +4.040 |
ody | +4.022 |
Neg logit contributions | |
�� | -5.805 |
sqor | -5.284 |
ALSE | -4.641 |
ゴ | -4.590 |
Sisters | -4.544 |
Token | . |
Token ID | 13 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
arial | +2.673 |
nce | +2.671 |
utton | +2.606 |
izer | +2.568 |
ody | +2.540 |
Neg logit contributions | |
�� | -5.511 |
sqor | -5.097 |
ゴ | -4.633 |
ALSE | -4.521 |
capacity | -4.511 |
Token | uk |
Token ID | 2724 |
Feature activation | -7.50e-01 |
Pos logit contributions | |
nce | +4.408 |
arial | +4.213 |
utton | +4.157 |
ody | +3.918 |
izer | +3.868 |
Neg logit contributions | |
�� | -10.922 |
sqor | -9.977 |
carbohyd | -9.140 |
ゴ | -9.054 |
覚醒 | -8.849 |
Token | / |
Token ID | 14 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +3.287 |
nce | +3.237 |
utton | +3.140 |
izer | +3.057 |
illery | +3.052 |
Neg logit contributions | |
�� | -6.027 |
sqor | -5.612 |
ゴ | -5.017 |
capacity | -4.917 |
ALSE | -4.862 |
Token | in |
Token ID | 259 |
Feature activation | -7.62e-01 |
Pos logit contributions | |
nce | +6.894 |
arial | +6.834 |
ody | +6.800 |
utton | +6.760 |
illery | +6.354 |
Neg logit contributions | |
�� | -10.143 |
sqor | -9.647 |
ALSE | -8.741 |
ゴ | -8.396 |
Sisters | -8.325 |
Token | coming |
Token ID | 4976 |
Feature activation | -8.64e-01 |
Pos logit contributions | |
arial | +1.332 |
utton | +1.224 |
nce | +1.188 |
ody | +1.072 |
illery | +1.068 |
Neg logit contributions | |
�� | -7.870 |
sqor | -7.688 |
ALSE | -7.177 |
ゴ | -7.163 |
capacity | -6.998 |
Token | / |
Token ID | 14 |
Feature activation | -7.15e-01 |
Pos logit contributions | |
arial | +3.927 |
nce | +3.880 |
utton | +3.878 |
ody | +3.748 |
illery | +3.739 |
Neg logit contributions | |
�� | -6.417 |
sqor | -6.128 |
ゴ | -5.584 |
capacity | -5.459 |
Sisters | -5.451 |
Token | article |
Token ID | 20205 |
Feature activation | -7.64e-01 |
Pos logit contributions | |
arial | +3.281 |
utton | +3.256 |
nce | +3.249 |
ody | +3.146 |
izer | +2.991 |
Neg logit contributions | |
�� | -5.382 |
sqor | -5.023 |
ゴ | -4.610 |
ALSE | -4.576 |
Sisters | -4.501 |
Token | 35 |
Token ID | 2327 |
Feature activation | -6.17e-01 |
Pos logit contributions | |
arial | +3.819 |
ody | +3.725 |
nce | +3.724 |
utton | +3.724 |
illery | +3.721 |
Neg logit contributions | |
�� | -5.303 |
sqor | -4.898 |
ALSE | -4.455 |
capacity | -4.436 |
ゴ | -4.422 |
Token | polit |
Token ID | 34470 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
arial | +0.320 |
nce | +0.312 |
utton | +0.310 |
ody | +0.303 |
illery | +0.297 |
Neg logit contributions | |
�� | -0.406 |
sqor | -0.390 |
ゴ | -0.349 |
capacity | -0.349 |
Sisters | -0.338 |
Token | ically |
Token ID | 1146 |
Feature activation | +9.39e-02 |
Pos logit contributions | |
�� | +1.912 |
sqor | +1.844 |
capacity | +1.663 |
ゴ | +1.641 |
ALSE | +1.588 |
Neg logit contributions | |
arial | -1.986 |
nce | -1.938 |
utton | -1.929 |
ody | -1.877 |
illery | -1.868 |
Token | correct |
Token ID | 3376 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
�� | +0.606 |
sqor | +0.585 |
capacity | +0.528 |
ゴ | +0.525 |
ALSE | +0.509 |
Neg logit contributions | |
arial | -0.525 |
nce | -0.509 |
utton | -0.509 |
ody | -0.496 |
illery | -0.492 |
Token | o |
Token ID | 267 |
Feature activation | -4.20e-01 |
Pos logit contributions | |
�� | +0.664 |
sqor | +0.642 |
capacity | +0.582 |
ゴ | +0.579 |
ALSE | +0.562 |
Neg logit contributions | |
arial | -0.542 |
nce | -0.526 |
utton | -0.525 |
ody | -0.510 |
illery | -0.507 |
Token | omp |
Token ID | 3361 |
Feature activation | -3.18e-01 |
Pos logit contributions | |
arial | +2.336 |
nce | +2.334 |
utton | +2.308 |
ody | +2.292 |
izer | +2.188 |
Neg logit contributions | |
�� | -2.698 |
sqor | -2.606 |
capacity | -2.321 |
ゴ | -2.313 |
ALSE | -2.241 |
Token | a |
Token ID | 64 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +1.840 |
utton | +1.825 |
nce | +1.794 |
ody | +1.776 |
illery | +1.741 |
Neg logit contributions | |
�� | -1.980 |
sqor | -1.908 |
ゴ | -1.722 |
capacity | -1.699 |
ALSE | -1.650 |
Token | lo |
Token ID | 2376 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
utton | +6.528 |
izer | +6.193 |
nce | +6.184 |
arial | +6.162 |
illery | +6.093 |
Neg logit contributions | |
�� | -10.764 |
sqor | -9.761 |
capacity | -9.198 |
ゴ | -9.107 |
ALSE | -9.083 |
Token | omp |
Token ID | 3361 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
arial | +0.970 |
utton | +0.940 |
nce | +0.938 |
ody | +0.923 |
illery | +0.910 |
Neg logit contributions | |
�� | -1.352 |
sqor | -1.301 |
capacity | -1.193 |
ゴ | -1.187 |
ALSE | -1.151 |
Token | as |
Token ID | 292 |
Feature activation | -5.25e-01 |
Pos logit contributions | |
arial | +2.563 |
utton | +2.500 |
nce | +2.483 |
ody | +2.466 |
illery | +2.411 |
Neg logit contributions | |
�� | -2.300 |
sqor | -2.197 |
ゴ | -1.967 |
capacity | -1.941 |
ALSE | -1.865 |
Token | for |
Token ID | 329 |
Feature activation | -2.19e-01 |
Pos logit contributions | |
arial | +2.780 |
nce | +2.726 |
utton | +2.694 |
ody | +2.656 |
illery | +2.583 |
Neg logit contributions | |
�� | -3.521 |
sqor | -3.355 |
capacity | -3.068 |
ゴ | -3.031 |
ALSE | -2.932 |
Token | the |
Token ID | 262 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
arial | +1.170 |
nce | +1.143 |
utton | +1.134 |
ody | +1.105 |
illery | +1.085 |
Neg logit contributions | |
�� | -1.474 |
sqor | -1.418 |
capacity | -1.287 |
ゴ | -1.278 |
ALSE | -1.241 |
Token | LinkedIn |
Token ID | 40574 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
nce | +5.515 |
arial | +5.456 |
ody | +5.325 |
izer | +5.316 |
utton | +5.280 |
Neg logit contributions | |
�� | -8.893 |
sqor | -8.385 |
ゴ | -7.573 |
capacity | -7.563 |
ALSE | -7.263 |
Token |
|
Token ID | 198 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
�� | +1.396 |
sqor | +1.360 |
capacity | +1.237 |
ゴ | +1.232 |
Sisters | +1.204 |
Neg logit contributions | |
arial | -1.105 |
nce | -1.072 |
utton | -1.055 |
ody | -1.025 |
illery | -1.022 |
Token |
|
Token ID | 198 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
arial | +3.956 |
izer | +3.908 |
nce | +3.885 |
utton | +3.622 |
illery | +3.443 |
Neg logit contributions | |
�� | -9.899 |
sqor | -8.941 |
carbohyd | -8.429 |
ゴ | -8.082 |
satell | -8.053 |
Token | Reddit |
Token ID | 22367 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
nce | +5.426 |
arial | +5.383 |
izer | +5.218 |
utton | +5.214 |
ody | +5.191 |
Neg logit contributions | |
�� | -8.427 |
sqor | -7.948 |
ゴ | -7.233 |
capacity | -7.191 |
cov | -6.965 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
arial | +0.811 |
utton | +0.787 |
nce | +0.786 |
ody | +0.763 |
illery | +0.756 |
Neg logit contributions | |
�� | -1.365 |
sqor | -1.319 |
capacity | -1.207 |
ゴ | -1.201 |
ALSE | -1.173 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +4.402 |
izer | +4.293 |
nce | +4.189 |
utton | +3.872 |
illery | +3.761 |
Neg logit contributions | |
�� | -12.114 |
sqor | -11.019 |
carbohyd | -10.574 |
satell | -10.110 |
ゴ | -9.886 |
Token | Pocket |
Token ID | 45454 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
arial | +5.948 |
nce | +5.894 |
ody | +5.822 |
izer | +5.737 |
utton | +5.577 |
Neg logit contributions | |
�� | -10.861 |
sqor | -10.415 |
capacity | -9.428 |
ゴ | -9.358 |
cov | -9.174 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +0.749 |
nce | +0.732 |
utton | +0.725 |
ody | +0.711 |
illery | +0.704 |
Neg logit contributions | |
�� | -1.288 |
sqor | -1.246 |
capacity | -1.137 |
ゴ | -1.135 |
ALSE | -1.102 |
Token |
|
Token ID | 198 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
izer | +4.567 |
arial | +4.491 |
nce | +4.482 |
utton | +3.994 |
illery | +3.880 |
Neg logit contributions | |
�� | -13.576 |
sqor | -12.314 |
carbohyd | -12.090 |
satell | -11.304 |
practition | -11.123 |
Token | Print |
Token ID | 18557 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
nce | +5.910 |
arial | +5.823 |
ody | +5.724 |
izer | +5.708 |
utton | +5.594 |
Neg logit contributions | |
�� | -10.480 |
sqor | -10.305 |
cov | -9.065 |
ゴ | -9.045 |
capacity | -9.014 |
Token |
|
Token ID | 198 |
Feature activation | -8.74e-01 |
Pos logit contributions | |
�� | +1.437 |
sqor | +1.399 |
capacity | +1.288 |
ゴ | +1.275 |
Sisters | +1.243 |
Neg logit contributions | |
arial | -1.082 |
nce | -1.042 |
utton | -1.036 |
ody | -1.006 |
illery | -0.989 |
Token | happen |
Token ID | 1645 |
Feature activation | -3.45e-02 |
Pos logit contributions | |
arial | +0.292 |
nce | +0.287 |
utton | +0.281 |
ody | +0.273 |
illery | +0.270 |
Neg logit contributions | |
�� | -0.430 |
sqor | -0.413 |
capacity | -0.377 |
ゴ | -0.376 |
ALSE | -0.367 |
Token | within |
Token ID | 1626 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
arial | +0.171 |
nce | +0.167 |
utton | +0.164 |
ody | +0.161 |
illery | +0.158 |
Neg logit contributions | |
�� | -0.246 |
sqor | -0.237 |
capacity | -0.217 |
ゴ | -0.216 |
ALSE | -0.209 |
Token | the |
Token ID | 262 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
arial | +0.532 |
nce | +0.522 |
utton | +0.513 |
ody | +0.504 |
illery | +0.492 |
Neg logit contributions | |
�� | -0.809 |
sqor | -0.779 |
ゴ | -0.716 |
capacity | -0.709 |
ALSE | -0.692 |
Token | blink |
Token ID | 21019 |
Feature activation | -3.79e-01 |
Pos logit contributions | |
arial | +0.530 |
nce | +0.520 |
utton | +0.511 |
ody | +0.499 |
illery | +0.491 |
Neg logit contributions | |
�� | -0.719 |
sqor | -0.690 |
ゴ | -0.633 |
capacity | -0.628 |
ALSE | -0.612 |
Token | of |
Token ID | 286 |
Feature activation | -1.69e+00 |
Pos logit contributions | |
arial | +2.136 |
nce | +2.078 |
utton | +2.067 |
ody | +2.018 |
illery | +1.997 |
Neg logit contributions | |
�� | -2.426 |
sqor | -2.343 |
capacity | -2.109 |
ゴ | -2.096 |
ALSE | -2.039 |
Token | an |
Token ID | 281 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
arial | +6.359 |
ody | +6.096 |
nce | +5.756 |
izer | +5.730 |
utton | +5.719 |
Neg logit contributions | |
�� | -12.990 |
sqor | -12.513 |
ゴ | -11.449 |
ALSE | -11.358 |
capacity | -11.255 |
Token | eye |
Token ID | 4151 |
Feature activation | -9.25e-01 |
Pos logit contributions | |
arial | +4.188 |
ody | +4.010 |
izer | +3.679 |
utton | +3.475 |
nce | +3.229 |
Neg logit contributions | |
�� | -13.339 |
sqor | -12.710 |
ゴ | -12.218 |
capacity | -11.391 |
ALSE | -11.321 |
Token | . |
Token ID | 13 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
arial | +4.158 |
nce | +4.125 |
utton | +3.990 |
ody | +3.956 |
izer | +3.879 |
Neg logit contributions | |
�� | -6.792 |
sqor | -6.379 |
ゴ | -5.944 |
capacity | -5.916 |
ALSE | -5.756 |
Token | Everything |
Token ID | 11391 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
arial | +0.690 |
nce | +0.677 |
utton | +0.656 |
ody | +0.642 |
illery | +0.640 |
Neg logit contributions | |
�� | -1.093 |
sqor | -1.043 |
capacity | -0.944 |
ゴ | -0.941 |
ALSE | -0.918 |
Token | will |
Token ID | 481 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
�� | +1.331 |
sqor | +1.292 |
capacity | +1.180 |
ゴ | +1.174 |
ALSE | +1.142 |
Neg logit contributions | |
arial | -0.918 |
nce | -0.888 |
utton | -0.887 |
ody | -0.858 |
illery | -0.853 |
Token | begin |
Token ID | 2221 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
�� | +1.569 |
sqor | +1.516 |
capacity | +1.377 |
ゴ | +1.370 |
ALSE | +1.331 |
Neg logit contributions | |
arial | -1.223 |
nce | -1.187 |
utton | -1.182 |
ody | -1.149 |
illery | -1.140 |
Token | sweet |
Token ID | 6029 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
arial | +1.794 |
nce | +1.777 |
utton | +1.774 |
ody | +1.715 |
illery | +1.693 |
Neg logit contributions | |
�� | -2.134 |
sqor | -2.042 |
ゴ | -1.862 |
capacity | -1.859 |
ALSE | -1.795 |
Token | put |
Token ID | 1234 |
Feature activation | +7.72e-02 |
Pos logit contributions | |
�� | +0.989 |
sqor | +0.955 |
capacity | +0.863 |
ゴ | +0.857 |
ALSE | +0.832 |
Neg logit contributions | |
arial | -0.877 |
nce | -0.853 |
utton | -0.851 |
ody | -0.828 |
illery | -0.822 |
Token | ts |
Token ID | 912 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
�� | +0.519 |
sqor | +0.501 |
capacity | +0.454 |
ゴ | +0.452 |
ALSE | +0.440 |
Neg logit contributions | |
arial | -0.410 |
nce | -0.400 |
utton | -0.398 |
ody | -0.387 |
illery | -0.383 |
Token | . |
Token ID | 13 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
arial | +2.754 |
nce | +2.644 |
utton | +2.637 |
ody | +2.585 |
izer | +2.563 |
Neg logit contributions | |
�� | -4.093 |
sqor | -3.892 |
capacity | -3.587 |
ゴ | -3.568 |
ALSE | -3.461 |
Token | Wo |
Token ID | 22173 |
Feature activation | -6.30e-01 |
Pos logit contributions | |
arial | +2.343 |
nce | +2.323 |
utton | +2.250 |
illery | +2.197 |
izer | +2.192 |
Neg logit contributions | |
�� | -3.905 |
sqor | -3.706 |
ゴ | -3.354 |
capacity | -3.339 |
ALSE | -3.242 |
Token | oh |
Token ID | 1219 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
arial | +2.473 |
ody | +2.347 |
utton | +2.330 |
nce | +2.304 |
illery | +2.242 |
Neg logit contributions | |
�� | -5.086 |
sqor | -4.976 |
ゴ | -4.598 |
capacity | -4.594 |
ALSE | -4.453 |
Token | oo |
Token ID | 2238 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
ody | +5.357 |
nce | +5.245 |
arial | +5.136 |
utton | +5.123 |
izer | +4.723 |
Neg logit contributions | |
�� | -11.230 |
sqor | -10.741 |
ゴ | -10.207 |
capacity | -10.195 |
ALSE | -9.582 |
Token | ! |
Token ID | 0 |
Feature activation | -5.40e-01 |
Pos logit contributions | |
arial | +1.924 |
nce | +1.864 |
utton | +1.843 |
ody | +1.813 |
illery | +1.749 |
Neg logit contributions | |
�� | -3.665 |
sqor | -3.555 |
capacity | -3.285 |
ゴ | -3.279 |
ALSE | -3.165 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
arial | +2.438 |
nce | +2.427 |
utton | +2.335 |
ody | +2.292 |
illery | +2.284 |
Neg logit contributions | |
�� | -4.058 |
sqor | -3.857 |
ゴ | -3.529 |
capacity | -3.494 |
ALSE | -3.398 |
Token |
|
Token ID | 198 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
arial | +0.848 |
nce | +0.820 |
utton | +0.806 |
ody | +0.784 |
izer | +0.780 |
Neg logit contributions | |
�� | -1.289 |
sqor | -1.215 |
ゴ | -1.098 |
capacity | -1.079 |
ALSE | -1.061 |
Token | Now |
Token ID | 3844 |
Feature activation | -4.13e-01 |
Pos logit contributions | |
arial | +1.141 |
nce | +1.106 |
utton | +1.086 |
ody | +1.067 |
izer | +1.046 |
Neg logit contributions | |
�� | -1.704 |
sqor | -1.656 |
ゴ | -1.451 |
capacity | -1.450 |
Sisters | -1.425 |
Token | Reddit |
Token ID | 22367 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
nce | +5.426 |
arial | +5.383 |
izer | +5.218 |
utton | +5.214 |
ody | +5.191 |
Neg logit contributions | |
�� | -8.427 |
sqor | -7.948 |
ゴ | -7.233 |
capacity | -7.191 |
cov | -6.965 |
Token |
|
Token ID | 198 |
Feature activation | -1.34e+00 |
Pos logit contributions | |
arial | +0.811 |
utton | +0.787 |
nce | +0.786 |
ody | +0.763 |
illery | +0.756 |
Neg logit contributions | |
�� | -1.365 |
sqor | -1.319 |
capacity | -1.207 |
ゴ | -1.201 |
ALSE | -1.173 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +4.402 |
izer | +4.293 |
nce | +4.189 |
utton | +3.872 |
illery | +3.761 |
Neg logit contributions | |
�� | -12.114 |
sqor | -11.019 |
carbohyd | -10.574 |
satell | -10.110 |
ゴ | -9.886 |
Token | Pocket |
Token ID | 45454 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
arial | +5.948 |
nce | +5.894 |
ody | +5.822 |
izer | +5.737 |
utton | +5.577 |
Neg logit contributions | |
�� | -10.861 |
sqor | -10.415 |
capacity | -9.428 |
ゴ | -9.358 |
cov | -9.174 |
Token |
|
Token ID | 198 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
arial | +0.749 |
nce | +0.732 |
utton | +0.725 |
ody | +0.711 |
illery | +0.704 |
Neg logit contributions | |
�� | -1.288 |
sqor | -1.246 |
capacity | -1.137 |
ゴ | -1.135 |
ALSE | -1.102 |
Token |
|
Token ID | 198 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
izer | +4.567 |
arial | +4.491 |
nce | +4.482 |
utton | +3.994 |
illery | +3.880 |
Neg logit contributions | |
�� | -13.576 |
sqor | -12.314 |
carbohyd | -12.090 |
satell | -11.304 |
practition | -11.123 |
Token | Print |
Token ID | 18557 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
nce | +5.910 |
arial | +5.823 |
ody | +5.724 |
izer | +5.708 |
utton | +5.594 |
Neg logit contributions | |
�� | -10.480 |
sqor | -10.305 |
cov | -9.065 |
ゴ | -9.045 |
capacity | -9.014 |
Token |
|
Token ID | 198 |
Feature activation | -8.74e-01 |
Pos logit contributions | |
�� | +1.437 |
sqor | +1.399 |
capacity | +1.288 |
ゴ | +1.275 |
Sisters | +1.243 |
Neg logit contributions | |
arial | -1.082 |
nce | -1.042 |
utton | -1.036 |
ody | -1.006 |
illery | -0.989 |
Token |
|
Token ID | 198 |
Feature activation | -9.40e-01 |
Pos logit contributions | |
arial | +3.375 |
izer | +3.302 |
nce | +3.270 |
utton | +3.074 |
illery | +3.054 |
Neg logit contributions | |
�� | -7.591 |
sqor | -6.998 |
carbohyd | -6.320 |
ゴ | -6.158 |
cov | -6.116 |
Token | Email |
Token ID | 15333 |
Feature activation | +4.87e-01 |
Pos logit contributions | |
arial | +4.372 |
nce | +4.310 |
izer | +4.261 |
ody | +4.205 |
illery | +4.124 |
Neg logit contributions | |
�� | -6.761 |
sqor | -6.630 |
capacity | -5.764 |
ゴ | -5.626 |
cov | -5.594 |
Token |
|
Token ID | 198 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
�� | +3.126 |
sqor | +2.993 |
capacity | +2.808 |
ゴ | +2.791 |
Sisters | +2.704 |
Neg logit contributions | |
arial | -2.646 |
utton | -2.525 |
nce | -2.505 |
ody | -2.433 |
illery | -2.419 |
Token | of |
Token ID | 286 |
Feature activation | -1.10e+00 |
Pos logit contributions | |
arial | +2.721 |
nce | +2.651 |
utton | +2.643 |
ody | +2.580 |
illery | +2.559 |
Neg logit contributions | |
�� | -3.168 |
sqor | -3.047 |
capacity | -2.768 |
ゴ | -2.742 |
ALSE | -2.667 |
Token | Oregon |
Token ID | 8819 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
nce | +4.841 |
arial | +4.739 |
ody | +4.634 |
utton | +4.615 |
izer | +4.550 |
Neg logit contributions | |
�� | -8.081 |
sqor | -7.717 |
ゴ | -7.157 |
capacity | -6.958 |
ALSE | -6.850 |
Token | (@ |
Token ID | 4275 |
Feature activation | -3.48e-01 |
Pos logit contributions | |
nce | +3.278 |
arial | +3.233 |
utton | +3.209 |
izer | +3.121 |
ody | +3.080 |
Neg logit contributions | |
�� | -9.903 |
sqor | -9.189 |
capacity | -8.552 |
ゴ | -8.510 |
ALSE | -8.382 |
Token | AC |
Token ID | 2246 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
arial | +2.206 |
utton | +2.136 |
nce | +2.114 |
ody | +2.089 |
illery | +2.033 |
Neg logit contributions | |
�� | -2.097 |
sqor | -1.981 |
ゴ | -1.682 |
capacity | -1.644 |
Sisters | -1.631 |
Token | LU |
Token ID | 41596 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
arial | +2.460 |
utton | +2.437 |
nce | +2.434 |
ody | +2.403 |
illery | +2.371 |
Neg logit contributions | |
�� | -2.900 |
sqor | -2.726 |
ゴ | -2.456 |
capacity | -2.429 |
Sisters | -2.297 |
Token | _ |
Token ID | 62 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
arial | +3.354 |
utton | +3.180 |
nce | +3.170 |
ody | +3.008 |
izer | +2.971 |
Neg logit contributions | |
�� | -9.530 |
sqor | -8.931 |
ゴ | -8.047 |
cov | -7.853 |
capacity | -7.806 |
Token | OR |
Token ID | 1581 |
Feature activation | -8.48e-01 |
Pos logit contributions | |
arial | +4.529 |
ody | +4.454 |
utton | +4.371 |
nce | +4.370 |
izer | +3.940 |
Neg logit contributions | |
�� | -12.204 |
sqor | -11.839 |
carbohyd | -10.605 |
satell | -10.600 |
cov | -10.480 |
Token | ) |
Token ID | 8 |
Feature activation | -6.31e-01 |
Pos logit contributions | |
arial | +3.712 |
nce | +3.685 |
utton | +3.579 |
izer | +3.549 |
ody | +3.487 |
Neg logit contributions | |
�� | -6.825 |
sqor | -6.187 |
ゴ | -5.608 |
capacity | -5.487 |
ALSE | -5.368 |
Token | May |
Token ID | 1737 |
Feature activation | -1.14e+00 |
Pos logit contributions | |
arial | +3.440 |
nce | +3.369 |
utton | +3.315 |
ody | +3.268 |
illery | +3.244 |
Neg logit contributions | |
�� | -4.128 |
sqor | -3.926 |
capacity | -3.571 |
ゴ | -3.563 |
ALSE | -3.473 |
Token | 29 |
Token ID | 2808 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
nce | +5.209 |
utton | +5.093 |
arial | +5.082 |
illery | +5.015 |
ody | +4.915 |
Neg logit contributions | |
�� | -8.107 |
sqor | -7.809 |
ゴ | -7.156 |
capacity | -7.050 |
ALSE | -6.905 |
Token | , |
Token ID | 11 |
Feature activation | +4.21e-02 |
Pos logit contributions | |
arial | +3.032 |
nce | +2.909 |
utton | +2.878 |
izer | +2.829 |
ody | +2.820 |
Neg logit contributions | |
�� | -4.745 |
sqor | -4.303 |
ゴ | -3.865 |
capacity | -3.783 |
ALSE | -3.690 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
arial | +0.124 |
nce | +0.121 |
utton | +0.120 |
ody | +0.117 |
illery | +0.116 |
Neg logit contributions | |
�� | -0.165 |
sqor | -0.160 |
capacity | -0.145 |
ゴ | -0.144 |
ALSE | -0.141 |
Token | AL |
Token ID | 8355 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
arial | +0.074 |
nce | +0.072 |
utton | +0.072 |
ody | +0.070 |
illery | +0.069 |
Neg logit contributions | |
�� | -0.078 |
sqor | -0.075 |
capacity | -0.068 |
ゴ | -0.067 |
ALSE | -0.066 |
Token | READ |
Token ID | 15675 |
Feature activation | +5.71e-01 |
Pos logit contributions | |
�� | +1.013 |
sqor | +0.979 |
capacity | +0.894 |
ゴ | +0.889 |
ALSE | +0.865 |
Neg logit contributions | |
arial | -0.718 |
nce | -0.694 |
utton | -0.691 |
ody | -0.672 |
illery | -0.665 |
Token | Y |
Token ID | 56 |
Feature activation | +6.89e-02 |
Pos logit contributions | |
�� | +2.842 |
sqor | +2.702 |
capacity | +2.365 |
ゴ | +2.352 |
ALSE | +2.270 |
Neg logit contributions | |
arial | -4.008 |
nce | -3.916 |
utton | -3.902 |
illery | -3.814 |
ody | -3.810 |
Token | COMP |
Token ID | 24301 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
�� | +0.442 |
sqor | +0.427 |
capacity | +0.387 |
ゴ | +0.386 |
ALSE | +0.372 |
Neg logit contributions | |
arial | -0.388 |
nce | -0.376 |
utton | -0.374 |
ody | -0.366 |
illery | -0.361 |
Token | ET |
Token ID | 2767 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
�� | +1.661 |
sqor | +1.601 |
capacity | +1.434 |
ゴ | +1.422 |
ALSE | +1.368 |
Neg logit contributions | |
arial | -1.687 |
nce | -1.642 |
utton | -1.637 |
ody | -1.595 |
illery | -1.585 |
Token | ED |
Token ID | 1961 |
Feature activation | +4.57e-02 |
Pos logit contributions | |
arial | +6.851 |
nce | +6.675 |
utton | +6.658 |
izer | +6.541 |
illery | +6.280 |
Neg logit contributions | |
�� | -9.708 |
sqor | -9.103 |
capacity | -8.296 |
ゴ | -8.247 |
Sisters | -7.761 |
Token | : |
Token ID | 25 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
�� | +0.297 |
sqor | +0.286 |
capacity | +0.259 |
ゴ | +0.258 |
ALSE | +0.249 |
Neg logit contributions | |
arial | -0.254 |
nce | -0.247 |
utton | -0.246 |
ody | -0.240 |
illery | -0.238 |
Token | at |
Token ID | 379 |
Feature activation | +4.74e-02 |
Pos logit contributions | |
arial | +0.901 |
nce | +0.890 |
utton | +0.872 |
ody | +0.855 |
illery | +0.837 |
Neg logit contributions | |
�� | -1.275 |
sqor | -1.227 |
capacity | -1.118 |
ゴ | -1.114 |
ALSE | -1.085 |
Token | Arizona |
Token ID | 7943 |
Feature activation | +4.37e-02 |
Pos logit contributions | |
�� | +0.293 |
sqor | +0.282 |
capacity | +0.254 |
ゴ | +0.252 |
ALSE | +0.245 |
Neg logit contributions | |
arial | -0.277 |
nce | -0.270 |
utton | -0.269 |
ody | -0.262 |
illery | -0.260 |
Token | Cardinals |
Token ID | 18071 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
�� | +0.270 |
sqor | +0.260 |
capacity | +0.234 |
ゴ | +0.233 |
ALSE | +0.226 |
Neg logit contributions | |
arial | -0.256 |
nce | -0.249 |
utton | -0.248 |
ody | -0.242 |
illery | -0.241 |
Token | oust |
Token ID | 23968 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
�� | +0.778 |
sqor | +0.747 |
capacity | +0.664 |
ゴ | +0.664 |
ALSE | +0.639 |
Neg logit contributions | |
arial | -0.850 |
nce | -0.828 |
utton | -0.827 |
ody | -0.808 |
illery | -0.803 |
Token | ache |
Token ID | 4891 |
Feature activation | -2.31e-01 |
Pos logit contributions | |
�� | +1.937 |
sqor | +1.866 |
capacity | +1.671 |
ゴ | +1.656 |
ALSE | +1.603 |
Neg logit contributions | |
arial | -2.050 |
nce | -1.996 |
utton | -1.990 |
ody | -1.943 |
illery | -1.930 |
Token | and |
Token ID | 290 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
arial | +1.338 |
nce | +1.300 |
utton | +1.295 |
ody | +1.260 |
illery | +1.254 |
Neg logit contributions | |
�� | -1.438 |
sqor | -1.388 |
capacity | -1.250 |
ゴ | -1.243 |
ALSE | -1.202 |
Token | a |
Token ID | 257 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
arial | +1.705 |
nce | +1.651 |
utton | +1.616 |
ody | +1.605 |
izer | +1.535 |
Neg logit contributions | |
�� | -3.424 |
sqor | -3.267 |
ゴ | -2.976 |
capacity | -2.967 |
ALSE | -2.895 |
Token | bit |
Token ID | 1643 |
Feature activation | -4.39e-01 |
Pos logit contributions | |
arial | +1.307 |
nce | +1.298 |
utton | +1.271 |
ody | +1.248 |
izer | +1.215 |
Neg logit contributions | |
�� | -2.577 |
sqor | -2.466 |
capacity | -2.276 |
ゴ | -2.265 |
ALSE | -2.235 |
Token | of |
Token ID | 286 |
Feature activation | -1.42e+00 |
Pos logit contributions | |
arial | +2.160 |
nce | +2.084 |
utton | +2.028 |
izer | +1.995 |
ody | +1.984 |
Neg logit contributions | |
�� | -3.300 |
sqor | -3.080 |
ゴ | -2.765 |
capacity | -2.752 |
ALSE | -2.668 |
Token | Paul |
Token ID | 3362 |
Feature activation | -3.89e-01 |
Pos logit contributions | |
arial | +4.941 |
nce | +4.603 |
utton | +4.558 |
ody | +4.374 |
izer | +4.142 |
Neg logit contributions | |
�� | -11.758 |
sqor | -11.391 |
capacity | -10.409 |
ゴ | -10.239 |
ALSE | -10.094 |
Token | Newman |
Token ID | 27698 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
arial | +1.750 |
nce | +1.701 |
utton | +1.681 |
ody | +1.635 |
illery | +1.601 |
Neg logit contributions | |
�� | -3.002 |
sqor | -2.881 |
capacity | -2.622 |
ゴ | -2.613 |
ALSE | -2.517 |
Token | about |
Token ID | 546 |
Feature activation | -4.47e-01 |
Pos logit contributions | |
arial | +2.836 |
nce | +2.756 |
utton | +2.746 |
ody | +2.676 |
illery | +2.657 |
Neg logit contributions | |
�� | -3.194 |
sqor | -3.076 |
capacity | -2.781 |
ゴ | -2.755 |
ALSE | -2.678 |
Token | him |
Token ID | 683 |
Feature activation | -3.77e-01 |
Pos logit contributions | |
arial | +1.992 |
nce | +1.954 |
utton | +1.908 |
izer | +1.860 |
ody | +1.844 |
Neg logit contributions | |
�� | -3.452 |
sqor | -3.312 |
ゴ | -3.024 |
capacity | -3.003 |
ALSE | -2.927 |
Token | . |
Token ID | 13 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
arial | +1.977 |
utton | +1.910 |
nce | +1.909 |
ody | +1.863 |
illery | +1.842 |
Neg logit contributions | |
�� | -2.554 |
sqor | -2.444 |
capacity | -2.247 |
ゴ | -2.220 |
ALSE | -2.169 |
Token | , |
Token ID | 11 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
arial | +1.014 |
utton | +0.983 |
nce | +0.979 |
ody | +0.960 |
illery | +0.945 |
Neg logit contributions | |
�� | -1.366 |
sqor | -1.312 |
capacity | -1.195 |
ゴ | -1.194 |
ALSE | -1.159 |
Token | or |
Token ID | 393 |
Feature activation | -2.16e-01 |
Pos logit contributions | |
arial | +0.752 |
nce | +0.732 |
utton | +0.730 |
ody | +0.709 |
illery | +0.694 |
Neg logit contributions | |
�� | -1.197 |
sqor | -1.145 |
capacity | -1.055 |
ゴ | -1.051 |
ALSE | -1.024 |
Token | the |
Token ID | 262 |
Feature activation | -9.14e-02 |
Pos logit contributions | |
arial | +1.084 |
nce | +1.060 |
utton | +1.038 |
ody | +1.025 |
illery | +1.002 |
Neg logit contributions | |
�� | -1.532 |
sqor | -1.460 |
capacity | -1.341 |
ゴ | -1.337 |
ALSE | -1.294 |
Token | Cru |
Token ID | 6472 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
arial | +0.503 |
nce | +0.491 |
utton | +0.487 |
ody | +0.474 |
illery | +0.471 |
Neg logit contributions | |
�� | -0.599 |
sqor | -0.576 |
capacity | -0.522 |
ゴ | -0.520 |
ALSE | -0.504 |
Token | c |
Token ID | 66 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
�� | +1.689 |
sqor | +1.642 |
capacity | +1.505 |
ゴ | +1.491 |
ALSE | +1.455 |
Neg logit contributions | |
arial | -1.105 |
nce | -1.062 |
utton | -1.059 |
ody | -1.021 |
illery | -1.013 |
Token | if |
Token ID | 361 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
arial | +2.165 |
ody | +2.115 |
nce | +2.111 |
utton | +2.101 |
illery | +2.044 |
Neg logit contributions | |
�� | -4.840 |
sqor | -4.640 |
capacity | -4.318 |
ゴ | -4.295 |
ALSE | -4.214 |
Token | ux |
Token ID | 2821 |
Feature activation | +3.58e-01 |
Pos logit contributions | |
utton | +7.279 |
ody | +7.138 |
illery | +7.045 |
arial | +7.036 |
nce | +7.033 |
Neg logit contributions | |
�� | -9.113 |
sqor | -8.654 |
ゴ | -7.796 |
capacity | -7.452 |
ALSE | -7.247 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
�� | +2.307 |
sqor | +2.241 |
capacity | +2.025 |
ゴ | +2.008 |
Sisters | +1.991 |
Neg logit contributions | |
arial | -1.960 |
utton | -1.891 |
nce | -1.889 |
ody | -1.831 |
illery | -1.822 |
Token | Gr |
Token ID | 1902 |
Feature activation | -5.13e-02 |
Pos logit contributions | |
arial | +0.599 |
nce | +0.592 |
utton | +0.575 |
ody | +0.561 |
illery | +0.556 |
Neg logit contributions | |
�� | -0.938 |
sqor | -0.893 |
capacity | -0.814 |
ゴ | -0.800 |
ALSE | -0.784 |
Token | ong |
Token ID | 506 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
arial | +0.255 |
nce | +0.247 |
utton | +0.246 |
ody | +0.239 |
illery | +0.237 |
Neg logit contributions | |
�� | -0.362 |
sqor | -0.351 |
capacity | -0.320 |
ゴ | -0.318 |
ALSE | -0.310 |
Token | Gr |
Token ID | 1902 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
�� | +2.006 |
sqor | +1.948 |
capacity | +1.781 |
ゴ | +1.765 |
Sisters | +1.733 |
Neg logit contributions | |
arial | -1.274 |
utton | -1.216 |
nce | -1.215 |
ody | -1.168 |
illery | -1.167 |
Token | waiting |
Token ID | 4953 |
Feature activation | +9.16e-02 |
Pos logit contributions | |
arial | +1.388 |
nce | +1.325 |
utton | +1.308 |
ody | +1.282 |
izer | +1.262 |
Neg logit contributions | |
�� | -1.855 |
sqor | -1.779 |
ゴ | -1.621 |
capacity | -1.610 |
ALSE | -1.583 |
Token | : |
Token ID | 25 |
Feature activation | -8.38e-02 |
Pos logit contributions | |
�� | +0.668 |
sqor | +0.644 |
ゴ | +0.588 |
capacity | +0.586 |
ALSE | +0.572 |
Neg logit contributions | |
arial | -0.444 |
nce | -0.427 |
utton | -0.423 |
ody | -0.411 |
illery | -0.404 |
Token | " |
Token ID | 366 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
arial | +0.493 |
nce | +0.478 |
utton | +0.474 |
ody | +0.468 |
illery | +0.462 |
Neg logit contributions | |
�� | -0.523 |
sqor | -0.501 |
capacity | -0.447 |
ゴ | -0.446 |
ALSE | -0.430 |
Token | T |
Token ID | 51 |
Feature activation | -5.71e-02 |
Pos logit contributions | |
�� | +1.659 |
sqor | +1.603 |
capacity | +1.440 |
ゴ | +1.435 |
ALSE | +1.394 |
Neg logit contributions | |
arial | -1.340 |
nce | -1.298 |
utton | -1.287 |
ody | -1.260 |
illery | -1.247 |
Token | rev |
Token ID | 18218 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
arial | +0.321 |
nce | +0.313 |
utton | +0.313 |
ody | +0.307 |
illery | +0.305 |
Neg logit contributions | |
�� | -0.371 |
sqor | -0.354 |
ゴ | -0.319 |
capacity | -0.318 |
ALSE | -0.306 |
Token | or |
Token ID | 273 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
arial | +0.465 |
nce | +0.449 |
utton | +0.446 |
ody | +0.435 |
illery | +0.427 |
Neg logit contributions | |
�� | -0.828 |
sqor | -0.802 |
capacity | -0.737 |
ゴ | -0.736 |
ALSE | -0.718 |
Token | would |
Token ID | 561 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
arial | +6.503 |
nce | +6.478 |
izer | +6.384 |
ody | +6.186 |
utton | +6.092 |
Neg logit contributions | |
�� | -9.572 |
sqor | -8.958 |
ゴ | -8.226 |
capacity | -8.114 |
ALSE | -7.851 |
Token | just |
Token ID | 655 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
�� | +0.758 |
sqor | +0.731 |
ゴ | +0.667 |
capacity | +0.665 |
ALSE | +0.645 |
Neg logit contributions | |
arial | -0.539 |
nce | -0.523 |
utton | -0.518 |
ody | -0.503 |
illery | -0.500 |
Token | p |
Token ID | 279 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
�� | +2.896 |
sqor | +2.810 |
capacity | +2.553 |
ゴ | +2.525 |
ALSE | +2.464 |
Neg logit contributions | |
arial | -2.367 |
nce | -2.298 |
utton | -2.296 |
ody | -2.231 |
illery | -2.218 |
Token | ore |
Token ID | 382 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
arial | +1.094 |
nce | +1.074 |
utton | +1.059 |
ody | +1.039 |
illery | +1.018 |
Neg logit contributions | |
�� | -1.417 |
sqor | -1.366 |
ゴ | -1.240 |
capacity | -1.221 |
ALSE | -1.192 |
Token | over |
Token ID | 625 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
�� | +1.387 |
sqor | +1.336 |
capacity | +1.199 |
ゴ | +1.193 |
ALSE | +1.158 |
Neg logit contributions | |
arial | -1.300 |
nce | -1.266 |
utton | -1.260 |
ody | -1.230 |
illery | -1.220 |
Token | xx |
Token ID | 5324 |
Feature activation | -9.42e-02 |
Pos logit contributions | |
arial | +0.501 |
nce | +0.487 |
utton | +0.485 |
ody | +0.471 |
illery | +0.469 |
Neg logit contributions | |
�� | -0.578 |
sqor | -0.559 |
capacity | -0.508 |
ゴ | -0.503 |
ALSE | -0.487 |
Token | brand |
Token ID | 17938 |
Feature activation | +8.42e-02 |
Pos logit contributions | |
arial | +0.505 |
nce | +0.491 |
utton | +0.490 |
ody | +0.476 |
illery | +0.472 |
Neg logit contributions | |
�� | -0.631 |
sqor | -0.608 |
capacity | -0.549 |
ゴ | -0.547 |
ALSE | -0.535 |
Token | ? |
Token ID | 30 |
Feature activation | -3.83e-02 |
Pos logit contributions | |
�� | +0.566 |
sqor | +0.548 |
capacity | +0.497 |
ゴ | +0.495 |
ALSE | +0.480 |
Neg logit contributions | |
arial | -0.447 |
nce | -0.432 |
utton | -0.431 |
ody | -0.419 |
illery | -0.416 |
Token | f |
Token ID | 69 |
Feature activation | -3.66e-01 |
Pos logit contributions | |
arial | +0.168 |
nce | +0.162 |
utton | +0.161 |
ody | +0.156 |
illery | +0.153 |
Neg logit contributions | |
�� | -0.295 |
sqor | -0.282 |
capacity | -0.261 |
ゴ | -0.259 |
ALSE | -0.254 |
Token | ref |
Token ID | 5420 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
arial | +1.350 |
utton | +1.294 |
nce | +1.292 |
ody | +1.239 |
illery | +1.216 |
Neg logit contributions | |
�� | -3.067 |
sqor | -2.977 |
capacity | -2.755 |
ゴ | -2.745 |
ALSE | -2.676 |
Token | = |
Token ID | 28 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
utton | +4.965 |
nce | +4.880 |
arial | +4.876 |
ody | +4.824 |
izer | +4.648 |
Neg logit contributions | |
�� | -6.964 |
sqor | -6.552 |
ゴ | -6.003 |
capacity | -5.990 |
Sisters | -5.812 |
Token | ts |
Token ID | 912 |
Feature activation | -3.21e-01 |
Pos logit contributions | |
nce | +5.935 |
ody | +5.705 |
arial | +5.622 |
utton | +5.605 |
izer | +4.960 |
Neg logit contributions | |
�� | -10.911 |
sqor | -10.044 |
capacity | -9.167 |
ゴ | -9.103 |
decomp | -8.974 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
arial | +1.659 |
nce | +1.613 |
utton | +1.610 |
ody | +1.561 |
illery | +1.543 |
Neg logit contributions | |
�� | -2.217 |
sqor | -2.132 |
capacity | -1.938 |
ゴ | -1.924 |
ALSE | -1.871 |
Token | A |
Token ID | 32 |
Feature activation | +8.87e-02 |
Pos logit contributions | |
�� | +0.969 |
sqor | +0.937 |
capacity | +0.846 |
ゴ | +0.842 |
ALSE | +0.818 |
Neg logit contributions | |
arial | -0.804 |
nce | -0.780 |
utton | -0.777 |
ody | -0.757 |
illery | -0.751 |
Token | month |
Token ID | 1227 |
Feature activation | -5.34e-01 |
Pos logit contributions | |
�� | +0.579 |
sqor | +0.559 |
capacity | +0.506 |
ゴ | +0.503 |
ALSE | +0.488 |
Neg logit contributions | |
arial | -0.489 |
nce | -0.476 |
utton | -0.474 |
ody | -0.461 |
illery | -0.458 |
Token | before |
Token ID | 878 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
arial | +2.176 |
nce | +2.109 |
utton | +2.099 |
ody | +2.016 |
illery | +1.977 |
Neg logit contributions | |
�� | -4.234 |
sqor | -4.126 |
capacity | -3.786 |
ゴ | -3.757 |
ALSE | -3.685 |
Token | that |
Token ID | 326 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
arial | +0.586 |
nce | +0.572 |
utton | +0.564 |
ody | +0.554 |
illery | +0.539 |
Neg logit contributions | |
�� | -0.818 |
sqor | -0.786 |
ゴ | -0.724 |
capacity | -0.721 |
ALSE | -0.694 |
Token | game |
Token ID | 983 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
arial | +1.157 |
nce | +1.137 |
utton | +1.110 |
ody | +1.091 |
illery | +1.068 |
Neg logit contributions | |
�� | -1.587 |
sqor | -1.508 |
ゴ | -1.393 |
capacity | -1.384 |
ALSE | -1.340 |
Token | of |
Token ID | 286 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
arial | +0.818 |
nce | +0.795 |
utton | +0.788 |
ody | +0.769 |
illery | +0.758 |
Neg logit contributions | |
�� | -1.174 |
sqor | -1.140 |
capacity | -1.043 |
ゴ | -1.031 |
ALSE | -1.011 |
Token | peek |
Token ID | 27185 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
�� | +1.264 |
sqor | +1.216 |
capacity | +1.099 |
ゴ | +1.093 |
ALSE | +1.065 |
Neg logit contributions | |
arial | -1.095 |
nce | -1.065 |
utton | -1.060 |
ody | -1.030 |
illery | -1.026 |
Token | - |
Token ID | 12 |
Feature activation | -9.73e-01 |
Pos logit contributions | |
�� | +1.083 |
sqor | +1.048 |
capacity | +0.953 |
ゴ | +0.948 |
ALSE | +0.921 |
Neg logit contributions | |
arial | -0.823 |
nce | -0.798 |
utton | -0.795 |
ody | -0.772 |
illery | -0.767 |
Token | a |
Token ID | 64 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
arial | +5.547 |
utton | +5.452 |
nce | +5.348 |
ody | +5.273 |
illery | +5.190 |
Neg logit contributions | |
�� | -5.970 |
sqor | -5.798 |
ゴ | -5.139 |
ALSE | -5.100 |
capacity | -4.867 |
Token | - |
Token ID | 12 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
arial | +4.589 |
izer | +4.514 |
utton | +4.452 |
ody | +4.394 |
nce | +4.346 |
Neg logit contributions | |
�� | -11.547 |
sqor | -10.786 |
ゴ | -10.218 |
capacity | -9.991 |
ALSE | -9.844 |
Token | bo |
Token ID | 2127 |
Feature activation | -2.83e-01 |
Pos logit contributions | |
utton | +5.819 |
nce | +5.701 |
arial | +5.619 |
ody | +5.601 |
izer | +5.433 |
Neg logit contributions | |
�� | -6.522 |
sqor | -6.504 |
ゴ | -5.878 |
ALSE | -5.709 |
Sisters | -5.453 |
Token | o |
Token ID | 78 |
Feature activation | -9.65e-01 |
Pos logit contributions | |
arial | +1.510 |
utton | +1.467 |
nce | +1.465 |
ody | +1.431 |
illery | +1.416 |
Neg logit contributions | |
�� | -1.897 |
sqor | -1.839 |
capacity | -1.664 |
ゴ | -1.657 |
ALSE | -1.605 |
Token | that |
Token ID | 326 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
arial | +4.495 |
ody | +4.456 |
nce | +4.378 |
utton | +4.346 |
izer | +4.217 |
Neg logit contributions | |
�� | -6.732 |
sqor | -6.608 |
capacity | -6.020 |
ゴ | -5.977 |
ALSE | -5.795 |
Token | human |
Token ID | 1692 |
Feature activation | -6.38e-01 |
Pos logit contributions | |
arial | +0.776 |
nce | +0.756 |
utton | +0.749 |
ody | +0.734 |
illery | +0.717 |
Neg logit contributions | |
�� | -1.171 |
sqor | -1.142 |
capacity | -1.042 |
ゴ | -1.037 |
ALSE | -1.009 |
Token | state |
Token ID | 1181 |
Feature activation | -6.69e-01 |
Pos logit contributions | |
arial | +2.231 |
nce | +2.172 |
utton | +2.153 |
ody | +2.101 |
illery | +2.056 |
Neg logit contributions | |
�� | -3.682 |
sqor | -3.540 |
ゴ | -3.241 |
capacity | -3.236 |
ALSE | -3.154 |
Token | ( |
Token ID | 357 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
arial | +2.538 |
nce | +2.531 |
utton | +2.470 |
izer | +2.376 |
ody | +2.365 |
Neg logit contributions | |
�� | -5.648 |
sqor | -5.252 |
ゴ | -4.821 |
capacity | -4.771 |
ALSE | -4.695 |
Token | such |
Token ID | 10508 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
�� | +1.048 |
sqor | +0.998 |
ゴ | +0.865 |
capacity | +0.853 |
ALSE | +0.842 |
Neg logit contributions | |
arial | -1.284 |
nce | -1.258 |
utton | -1.250 |
ody | -1.231 |
illery | -1.206 |
Token | as |
Token ID | 355 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
arial | +2.358 |
nce | +2.273 |
utton | +2.226 |
izer | +2.210 |
ody | +2.200 |
Neg logit contributions | |
�� | -3.503 |
sqor | -3.295 |
ゴ | -2.968 |
capacity | -2.891 |
ALSE | -2.870 |
Token | through |
Token ID | 832 |
Feature activation | -5.83e-01 |
Pos logit contributions | |
arial | +2.732 |
nce | +2.706 |
utton | +2.672 |
ody | +2.647 |
illery | +2.565 |
Neg logit contributions | |
�� | -3.877 |
sqor | -3.756 |
capacity | -3.356 |
ゴ | -3.356 |
ALSE | -3.315 |
Token | a |
Token ID | 257 |
Feature activation | -1.38e+00 |
Pos logit contributions | |
nce | +2.186 |
arial | +2.162 |
utton | +2.123 |
ody | +2.089 |
izer | +2.023 |
Neg logit contributions | |
�� | -4.949 |
sqor | -4.638 |
ゴ | -4.276 |
capacity | -4.173 |
ALSE | -4.154 |
Token | or |
Token ID | 393 |
Feature activation | -5.49e-01 |
Pos logit contributions | |
nce | +5.608 |
arial | +5.537 |
utton | +5.483 |
ody | +5.395 |
illery | +5.299 |
Neg logit contributions | |
�� | -10.290 |
sqor | -9.828 |
ゴ | -8.929 |
capacity | -8.900 |
ALSE | -8.858 |
Token | ) |
Token ID | 1267 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
arial | +3.093 |
nce | +3.056 |
utton | +2.990 |
ody | +2.929 |
illery | +2.917 |
Neg logit contributions | |
�� | -3.511 |
sqor | -3.355 |
ゴ | -3.002 |
capacity | -2.990 |
ALSE | -2.914 |
Token | must |
Token ID | 1276 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
sqor | +2.847 |
�� | +2.815 |
capacity | +2.606 |
ゴ | +2.528 |
ALSE | +2.472 |
Neg logit contributions | |
arial | -2.655 |
utton | -2.595 |
nce | -2.545 |
ody | -2.507 |
illery | -2.505 |
Token | not |
Token ID | 407 |
Feature activation | -7.43e-02 |
Pos logit contributions | |
arial | +0.865 |
nce | +0.838 |
utton | +0.826 |
ody | +0.794 |
illery | +0.774 |
Neg logit contributions | |
�� | -2.073 |
sqor | -1.992 |
ゴ | -1.856 |
capacity | -1.848 |
ALSE | -1.796 |
Token | modify |
Token ID | 13096 |
Feature activation | -4.24e-01 |
Pos logit contributions | |
arial | +0.447 |
nce | +0.436 |
utton | +0.430 |
ody | +0.421 |
illery | +0.416 |
Neg logit contributions | |
�� | -0.459 |
sqor | -0.436 |
capacity | -0.391 |
ゴ | -0.390 |
ALSE | -0.374 |
Token | ux |
Token ID | 2821 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
�� | +0.579 |
sqor | +0.558 |
capacity | +0.499 |
ゴ | +0.496 |
ALSE | +0.481 |
Neg logit contributions | |
arial | -0.589 |
nce | -0.574 |
utton | -0.572 |
ody | -0.558 |
illery | -0.555 |
Token | s |
Token ID | 264 |
Feature activation | -5.10e-01 |
Pos logit contributions | |
�� | +0.978 |
sqor | +0.943 |
capacity | +0.850 |
ゴ | +0.845 |
ALSE | +0.820 |
Neg logit contributions | |
arial | -0.889 |
nce | -0.865 |
utton | -0.861 |
ody | -0.840 |
illery | -0.834 |
Token | ont |
Token ID | 756 |
Feature activation | +8.56e-02 |
Pos logit contributions | |
arial | +2.093 |
utton | +2.019 |
nce | +2.006 |
ody | +1.976 |
illery | +1.949 |
Neg logit contributions | |
�� | -4.111 |
sqor | -3.918 |
ゴ | -3.671 |
capacity | -3.611 |
ALSE | -3.570 |
Token | dé |
Token ID | 39073 |
Feature activation | +3.48e-01 |
Pos logit contributions | |
�� | +0.542 |
sqor | +0.524 |
capacity | +0.472 |
ゴ | +0.469 |
ALSE | +0.455 |
Neg logit contributions | |
arial | -0.487 |
nce | -0.473 |
utton | -0.473 |
ody | -0.460 |
illery | -0.457 |
Token | pl |
Token ID | 489 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
�� | +2.277 |
sqor | +2.212 |
capacity | +2.014 |
ゴ | +1.986 |
ALSE | +1.922 |
Neg logit contributions | |
arial | -1.885 |
utton | -1.825 |
nce | -1.818 |
ody | -1.773 |
illery | -1.757 |
Token | or |
Token ID | 273 |
Feature activation | -1.37e+00 |
Pos logit contributions | |
�� | +0.911 |
sqor | +0.883 |
capacity | +0.809 |
ゴ | +0.801 |
ALSE | +0.778 |
Neg logit contributions | |
arial | -0.657 |
nce | -0.639 |
utton | -0.633 |
ody | -0.615 |
illery | -0.610 |
Token | és |
Token ID | 20954 |
Feature activation | -4.88e-03 |
Pos logit contributions | |
arial | +6.986 |
nce | +6.838 |
izer | +6.516 |
utton | +6.457 |
ody | +6.428 |
Neg logit contributions | |
�� | -9.071 |
sqor | -8.633 |
ゴ | -7.923 |
ALSE | -7.613 |
capacity | -7.387 |
Token | et |
Token ID | 2123 |
Feature activation | +4.32e-02 |
Pos logit contributions | |
arial | +0.027 |
nce | +0.027 |
utton | +0.026 |
ody | +0.026 |
illery | +0.026 |
Neg logit contributions | |
�� | -0.031 |
sqor | -0.030 |
capacity | -0.027 |
ゴ | -0.027 |
ALSE | -0.026 |
Token | le |
Token ID | 443 |
Feature activation | +2.00e-01 |
Pos logit contributions | |
�� | +0.279 |
sqor | +0.269 |
capacity | +0.243 |
ゴ | +0.242 |
ALSE | +0.235 |
Neg logit contributions | |
arial | -0.241 |
nce | -0.234 |
utton | -0.233 |
ody | -0.227 |
illery | -0.226 |
Token | ur |
Token ID | 333 |
Feature activation | -6.13e-01 |
Pos logit contributions | |
�� | +1.230 |
sqor | +1.186 |
capacity | +1.066 |
ゴ | +1.058 |
ALSE | +1.026 |
Neg logit contributions | |
arial | -1.174 |
nce | -1.141 |
utton | -1.138 |
ody | -1.110 |
illery | -1.102 |
Token | dé |
Token ID | 39073 |
Feature activation | +2.21e-01 |
Pos logit contributions | |
arial | +3.596 |
nce | +3.531 |
utton | +3.369 |
illery | +3.367 |
ody | +3.342 |
Neg logit contributions | |
�� | -3.781 |
sqor | -3.482 |
ゴ | -3.256 |
capacity | -3.195 |
ALSE | -3.154 |
Token | Scotland |
Token ID | 8838 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
arial | +2.104 |
nce | +2.095 |
utton | +2.056 |
ody | +2.029 |
illery | +1.983 |
Neg logit contributions | |
�� | -3.060 |
sqor | -2.965 |
capacity | -2.678 |
ゴ | -2.676 |
ALSE | -2.579 |
Token | , |
Token ID | 11 |
Feature activation | -3.46e-01 |
Pos logit contributions | |
arial | +1.953 |
nce | +1.903 |
utton | +1.895 |
ody | +1.856 |
illery | +1.827 |
Neg logit contributions | |
�� | -2.850 |
sqor | -2.745 |
capacity | -2.505 |
ゴ | -2.492 |
ALSE | -2.419 |
Token | or |
Token ID | 393 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
arial | +1.538 |
nce | +1.507 |
utton | +1.501 |
ody | +1.463 |
illery | +1.424 |
Neg logit contributions | |
�� | -2.622 |
sqor | -2.513 |
ゴ | -2.308 |
capacity | -2.301 |
ALSE | -2.224 |
Token | whether |
Token ID | 1771 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
�� | +2.792 |
sqor | +2.729 |
capacity | +2.463 |
ゴ | +2.423 |
ALSE | +2.398 |
Neg logit contributions | |
arial | -2.299 |
nce | -2.222 |
utton | -2.211 |
ody | -2.154 |
illery | -2.146 |
Token | they |
Token ID | 484 |
Feature activation | +9.23e-01 |
Pos logit contributions | |
�� | +1.894 |
sqor | +1.839 |
capacity | +1.671 |
ゴ | +1.653 |
ALSE | +1.617 |
Neg logit contributions | |
arial | -1.446 |
nce | -1.396 |
utton | -1.394 |
ody | -1.353 |
illery | -1.348 |
Token | will |
Token ID | 481 |
Feature activation | +9.20e-01 |
Pos logit contributions | |
�� | +5.666 |
sqor | +5.592 |
capacity | +5.074 |
Sisters | +4.959 |
ゴ | +4.898 |
Neg logit contributions | |
arial | -4.954 |
utton | -4.784 |
nce | -4.688 |
illery | -4.638 |
ody | -4.617 |
Token | look |
Token ID | 804 |
Feature activation | +4.02e-01 |
Pos logit contributions | |
�� | +5.490 |
sqor | +5.389 |
capacity | +4.908 |
Sisters | +4.798 |
ゴ | +4.747 |
Neg logit contributions | |
arial | -5.128 |
utton | -5.003 |
ody | -4.905 |
nce | -4.881 |
illery | -4.797 |
Token | to |
Token ID | 284 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
�� | +2.791 |
sqor | +2.724 |
capacity | +2.485 |
ゴ | +2.461 |
Sisters | +2.430 |
Neg logit contributions | |
arial | -1.984 |
utton | -1.918 |
nce | -1.892 |
illery | -1.863 |
ody | -1.855 |
Token | be |
Token ID | 307 |
Feature activation | +7.30e-01 |
Pos logit contributions | |
�� | +3.110 |
sqor | +3.007 |
capacity | +2.721 |
ゴ | +2.686 |
Sisters | +2.629 |
Neg logit contributions | |
arial | -2.729 |
utton | -2.652 |
nce | -2.643 |
ody | -2.580 |
illery | -2.561 |
Token | independent |
Token ID | 4795 |
Feature activation | +6.57e-01 |
Pos logit contributions | |
�� | +4.962 |
sqor | +4.817 |
capacity | +4.410 |
ゴ | +4.366 |
Sisters | +4.351 |
Neg logit contributions | |
arial | -3.616 |
utton | -3.530 |
nce | -3.484 |
ody | -3.381 |
illery | -3.380 |
Token | from |
Token ID | 422 |
Feature activation | -3.58e-02 |
Pos logit contributions | |
�� | +4.241 |
sqor | +4.173 |
capacity | +3.746 |
ゴ | +3.692 |
Sisters | +3.652 |
Neg logit contributions | |
arial | -3.538 |
utton | -3.448 |
nce | -3.436 |
illery | -3.322 |
ody | -3.315 |
Token | care |
Token ID | 1337 |
Feature activation | +1.44e-01 |
Pos logit contributions | |
arial | +0.304 |
nce | +0.295 |
utton | +0.290 |
ody | +0.282 |
illery | +0.279 |
Neg logit contributions | |
�� | -0.474 |
sqor | -0.451 |
ゴ | -0.412 |
capacity | -0.411 |
ALSE | -0.404 |
Token | about |
Token ID | 546 |
Feature activation | +3.75e-01 |
Pos logit contributions | |
�� | +0.965 |
sqor | +0.934 |
capacity | +0.847 |
ゴ | +0.843 |
ALSE | +0.819 |
Neg logit contributions | |
arial | -0.763 |
nce | -0.740 |
utton | -0.738 |
ody | -0.717 |
illery | -0.712 |
Token | what |
Token ID | 644 |
Feature activation | +3.19e-01 |
Pos logit contributions | |
�� | +2.518 |
sqor | +2.447 |
capacity | +2.228 |
ゴ | +2.204 |
ALSE | +2.148 |
Neg logit contributions | |
arial | -1.972 |
utton | -1.904 |
nce | -1.901 |
ody | -1.844 |
illery | -1.842 |
Token | he |
Token ID | 339 |
Feature activation | +3.69e-01 |
Pos logit contributions | |
�� | +2.149 |
sqor | +2.086 |
capacity | +1.897 |
ゴ | +1.880 |
ALSE | +1.832 |
Neg logit contributions | |
arial | -1.673 |
utton | -1.617 |
nce | -1.614 |
ody | -1.568 |
illery | -1.564 |
Token | cares |
Token ID | 16609 |
Feature activation | +8.20e-01 |
Pos logit contributions | |
�� | +2.793 |
sqor | +2.720 |
capacity | +2.503 |
ゴ | +2.491 |
ALSE | +2.424 |
Neg logit contributions | |
arial | -1.622 |
nce | -1.564 |
utton | -1.563 |
ody | -1.508 |
illery | -1.495 |
Token | about |
Token ID | 546 |
Feature activation | +8.15e-01 |
Pos logit contributions | |
�� | +4.228 |
sqor | +4.143 |
capacity | +3.737 |
ゴ | +3.634 |
Sisters | +3.512 |
Neg logit contributions | |
arial | -5.255 |
utton | -5.159 |
nce | -5.118 |
illery | -5.033 |
ody | -4.911 |
Token | . |
Token ID | 13 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
�� | +4.755 |
sqor | +4.702 |
capacity | +4.251 |
ゴ | +4.202 |
Sisters | +4.111 |
Neg logit contributions | |
arial | -4.700 |
utton | -4.601 |
nce | -4.569 |
illery | -4.463 |
ody | -4.345 |
Token | It |
Token ID | 632 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
�� | +1.380 |
sqor | +1.328 |
capacity | +1.203 |
ゴ | +1.201 |
ALSE | +1.165 |
Neg logit contributions | |
arial | -0.992 |
nce | -0.965 |
utton | -0.955 |
ody | -0.928 |
illery | -0.924 |
Token | doesn |
Token ID | 1595 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
�� | +0.836 |
sqor | +0.810 |
capacity | +0.744 |
ゴ | +0.742 |
ALSE | +0.725 |
Neg logit contributions | |
arial | -0.463 |
nce | -0.446 |
utton | -0.443 |
ody | -0.428 |
illery | -0.424 |
Token | 't |
Token ID | 470 |
Feature activation | +3.29e-02 |
Pos logit contributions | |
�� | +1.905 |
sqor | +1.857 |
capacity | +1.723 |
ゴ | +1.713 |
ALSE | +1.675 |
Neg logit contributions | |
arial | -0.878 |
nce | -0.842 |
utton | -0.838 |
ody | -0.804 |
illery | -0.797 |
Token | care |
Token ID | 1337 |
Feature activation | +3.44e-01 |
Pos logit contributions | |
�� | +0.241 |
sqor | +0.232 |
capacity | +0.213 |
ゴ | +0.212 |
ALSE | +0.207 |
Neg logit contributions | |
arial | -0.156 |
nce | -0.151 |
utton | -0.150 |
ody | -0.145 |
illery | -0.144 |
Token | and |
Token ID | 290 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
�� | +0.178 |
sqor | +0.171 |
ゴ | +0.152 |
capacity | +0.151 |
ALSE | +0.148 |
Neg logit contributions | |
arial | -0.175 |
nce | -0.169 |
utton | -0.169 |
ody | -0.165 |
illery | -0.164 |
Token | somewhere |
Token ID | 7382 |
Feature activation | +5.00e-01 |
Pos logit contributions | |
�� | +0.945 |
sqor | +0.911 |
ゴ | +0.826 |
capacity | +0.824 |
ALSE | +0.800 |
Neg logit contributions | |
arial | -0.742 |
nce | -0.718 |
utton | -0.713 |
ody | -0.697 |
illery | -0.690 |
Token | between |
Token ID | 1022 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
�� | +3.064 |
sqor | +2.955 |
capacity | +2.683 |
ゴ | +2.630 |
ALSE | +2.574 |
Neg logit contributions | |
arial | -2.890 |
utton | -2.813 |
nce | -2.798 |
illery | -2.731 |
ody | -2.717 |
Token | 6 |
Token ID | 718 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
�� | +0.970 |
sqor | +0.934 |
ゴ | +0.849 |
capacity | +0.844 |
ALSE | +0.822 |
Neg logit contributions | |
arial | -0.710 |
nce | -0.688 |
utton | -0.683 |
ody | -0.667 |
illery | -0.658 |
Token | and |
Token ID | 290 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
�� | +0.906 |
sqor | +0.871 |
capacity | +0.776 |
ゴ | +0.771 |
ALSE | +0.745 |
Neg logit contributions | |
arial | -1.005 |
nce | -0.980 |
utton | -0.977 |
ody | -0.954 |
illery | -0.948 |
Token | 7 |
Token ID | 767 |
Feature activation | +7.94e-01 |
Pos logit contributions | |
�� | +2.529 |
sqor | +2.451 |
capacity | +2.226 |
ゴ | +2.205 |
ALSE | +2.144 |
Neg logit contributions | |
arial | -2.101 |
nce | -2.040 |
utton | -2.035 |
ody | -1.979 |
illery | -1.964 |
Token | GW |
Token ID | 27164 |
Feature activation | +3.96e-01 |
Pos logit contributions | |
�� | +3.966 |
sqor | +3.885 |
capacity | +3.412 |
ゴ | +3.345 |
ALSE | +3.184 |
Neg logit contributions | |
arial | -5.350 |
nce | -5.281 |
utton | -5.196 |
ody | -5.129 |
illery | -5.124 |
Token | of |
Token ID | 286 |
Feature activation | -3.57e-02 |
Pos logit contributions | |
�� | +2.262 |
sqor | +2.180 |
capacity | +2.002 |
ゴ | +1.898 |
ALSE | +1.884 |
Neg logit contributions | |
arial | -2.421 |
nce | -2.410 |
utton | -2.370 |
illery | -2.317 |
ody | -2.311 |
Token | solar |
Token ID | 6591 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
arial | +0.207 |
nce | +0.200 |
utton | +0.200 |
ody | +0.195 |
illery | +0.193 |
Neg logit contributions | |
�� | -0.224 |
sqor | -0.215 |
ゴ | -0.193 |
capacity | -0.193 |
ALSE | -0.187 |
Token | generating |
Token ID | 15453 |
Feature activation | +6.59e-02 |
Pos logit contributions | |
�� | +1.187 |
sqor | +1.149 |
capacity | +1.043 |
ゴ | +1.030 |
ALSE | +1.000 |
Neg logit contributions | |
arial | -1.070 |
nce | -1.042 |
utton | -1.037 |
ody | -1.009 |
illery | -1.005 |
Token | capacity |
Token ID | 5339 |
Feature activation | +3.08e-01 |
Pos logit contributions | |
�� | +0.299 |
sqor | +0.283 |
ゴ | +0.242 |
capacity | +0.241 |
ALSE | +0.231 |
Neg logit contributions | |
arial | -0.496 |
nce | -0.485 |
utton | -0.483 |
ody | -0.474 |
illery | -0.471 |
Token | received |
Token ID | 2722 |
Feature activation | -5.55e-02 |
Pos logit contributions | |
�� | +2.001 |
sqor | +1.944 |
capacity | +1.782 |
ゴ | +1.769 |
ALSE | +1.728 |
Neg logit contributions | |
arial | -1.344 |
nce | -1.295 |
utton | -1.294 |
ody | -1.252 |
illery | -1.243 |
Token | agreement |
Token ID | 4381 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
arial | +0.268 |
nce | +0.259 |
utton | +0.257 |
ody | +0.250 |
illery | +0.247 |
Neg logit contributions | |
�� | -0.403 |
sqor | -0.390 |
capacity | -0.355 |
ゴ | -0.354 |
ALSE | -0.345 |
Token | from |
Token ID | 422 |
Feature activation | +3.59e-01 |
Pos logit contributions | |
�� | +0.710 |
sqor | +0.687 |
capacity | +0.614 |
ゴ | +0.609 |
ALSE | +0.594 |
Neg logit contributions | |
arial | -0.746 |
utton | -0.737 |
nce | -0.735 |
illery | -0.715 |
ody | -0.711 |
Token | the |
Token ID | 262 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
�� | +2.425 |
sqor | +2.354 |
capacity | +2.156 |
ゴ | +2.127 |
Sisters | +2.094 |
Neg logit contributions | |
arial | -1.856 |
utton | -1.798 |
nce | -1.787 |
illery | -1.741 |
ody | -1.734 |
Token | Eth |
Token ID | 9956 |
Feature activation | +3.61e-01 |
Pos logit contributions | |
�� | +1.280 |
sqor | +1.237 |
capacity | +1.122 |
ゴ | +1.115 |
ALSE | +1.084 |
Neg logit contributions | |
arial | -1.043 |
nce | -1.011 |
utton | -1.009 |
ody | -0.981 |
illery | -0.974 |
Token | ical |
Token ID | 605 |
Feature activation | +7.79e-01 |
Pos logit contributions | |
�� | +2.113 |
sqor | +2.021 |
capacity | +1.831 |
ゴ | +1.773 |
ALSE | +1.747 |
Neg logit contributions | |
arial | -2.178 |
nce | -2.134 |
utton | -2.128 |
illery | -2.058 |
ody | -2.040 |
Token | Committee |
Token ID | 4606 |
Feature activation | +3.24e-01 |
Pos logit contributions | |
�� | +4.992 |
sqor | +4.920 |
capacity | +4.538 |
Sisters | +4.508 |
ゴ | +4.446 |
Neg logit contributions | |
arial | -3.967 |
nce | -3.945 |
utton | -3.924 |
illery | -3.758 |
ody | -3.718 |
Token | for |
Token ID | 329 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
�� | +2.135 |
sqor | +2.079 |
capacity | +1.878 |
ゴ | +1.859 |
ALSE | +1.821 |
Neg logit contributions | |
arial | -1.730 |
utton | -1.688 |
nce | -1.676 |
illery | -1.627 |
ody | -1.626 |
Token | Animal |
Token ID | 13792 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
�� | +2.211 |
sqor | +2.143 |
capacity | +1.971 |
ゴ | +1.935 |
Sisters | +1.910 |
Neg logit contributions | |
arial | -1.736 |
utton | -1.683 |
nce | -1.681 |
illery | -1.634 |
ody | -1.622 |
Token | Research |
Token ID | 4992 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
�� | +1.550 |
sqor | +1.499 |
capacity | +1.370 |
ゴ | +1.349 |
Sisters | +1.330 |
Neg logit contributions | |
arial | -1.304 |
nce | -1.269 |
utton | -1.265 |
illery | -1.229 |
ody | -1.213 |
Token | CE |
Token ID | 18671 |
Feature activation | -4.08e-02 |
Pos logit contributions | |
�� | +1.007 |
sqor | +0.973 |
capacity | +0.883 |
ゴ | +0.878 |
ALSE | +0.853 |
Neg logit contributions | |
arial | -0.808 |
nce | -0.784 |
utton | -0.781 |
ody | -0.760 |
illery | -0.755 |
Token | one |
Token ID | 530 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
arial | +2.437 |
nce | +2.359 |
ody | +2.306 |
utton | +2.274 |
izer | +2.198 |
Neg logit contributions | |
�� | -3.924 |
sqor | -3.775 |
ゴ | -3.465 |
capacity | -3.454 |
ALSE | -3.284 |
Token | 's |
Token ID | 338 |
Feature activation | -3.85e-01 |
Pos logit contributions | |
arial | +0.749 |
nce | +0.726 |
utton | +0.725 |
ody | +0.700 |
illery | +0.699 |
Neg logit contributions | |
�� | -1.045 |
sqor | -1.015 |
capacity | -0.925 |
ゴ | -0.918 |
ALSE | -0.897 |
Token | accuser |
Token ID | 43738 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
arial | +2.236 |
nce | +2.193 |
ody | +2.162 |
utton | +2.141 |
izer | +2.117 |
Neg logit contributions | |
�� | -2.434 |
sqor | -2.258 |
ゴ | -2.082 |
capacity | -2.026 |
ALSE | -1.937 |
Token | is |
Token ID | 318 |
Feature activation | -9.00e-02 |
Pos logit contributions | |
arial | +0.097 |
nce | +0.094 |
utton | +0.092 |
ody | +0.091 |
illery | +0.089 |
Neg logit contributions | |
�� | -0.145 |
sqor | -0.140 |
capacity | -0.127 |
ゴ | -0.127 |
ALSE | -0.123 |
Token | important |
Token ID | 1593 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
arial | +0.440 |
nce | +0.428 |
utton | +0.422 |
ody | +0.414 |
illery | +0.405 |
Neg logit contributions | |
�� | -0.650 |
sqor | -0.630 |
ゴ | -0.572 |
capacity | -0.569 |
ALSE | -0.553 |
Token | not |
Token ID | 407 |
Feature activation | +7.56e-01 |
Pos logit contributions | |
arial | +1.456 |
nce | +1.401 |
utton | +1.389 |
ody | +1.360 |
illery | +1.332 |
Neg logit contributions | |
�� | -2.175 |
sqor | -2.068 |
ゴ | -1.890 |
capacity | -1.887 |
ALSE | -1.840 |
Token | merely |
Token ID | 6974 |
Feature activation | +3.73e-01 |
Pos logit contributions | |
�� | +4.284 |
sqor | +4.244 |
capacity | +3.839 |
ゴ | +3.677 |
Sisters | +3.666 |
Neg logit contributions | |
nce | -4.399 |
utton | -4.376 |
arial | -4.354 |
illery | -4.263 |
ody | -4.213 |
Token | because |
Token ID | 780 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
�� | +2.585 |
sqor | +2.531 |
capacity | +2.321 |
ゴ | +2.292 |
ALSE | +2.232 |
Neg logit contributions | |
arial | -1.832 |
utton | -1.790 |
nce | -1.789 |
illery | -1.735 |
ody | -1.715 |
Token | it |
Token ID | 340 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
�� | +2.682 |
sqor | +2.595 |
capacity | +2.359 |
ゴ | +2.322 |
Sisters | +2.294 |
Neg logit contributions | |
arial | -2.305 |
utton | -2.245 |
nce | -2.233 |
illery | -2.175 |
ody | -2.165 |
Token | aids |
Token ID | 31378 |
Feature activation | +7.88e-02 |
Pos logit contributions | |
�� | +1.890 |
sqor | +1.834 |
capacity | +1.685 |
ゴ | +1.675 |
ALSE | +1.633 |
Neg logit contributions | |
arial | -1.161 |
nce | -1.120 |
utton | -1.118 |
ody | -1.081 |
illery | -1.074 |
Token | in |
Token ID | 287 |
Feature activation | +2.90e-01 |
Pos logit contributions | |
�� | +0.540 |
sqor | +0.523 |
capacity | +0.477 |
ゴ | +0.473 |
ALSE | +0.462 |
Neg logit contributions | |
arial | -0.406 |
nce | -0.393 |
utton | -0.392 |
ody | -0.380 |
illery | -0.378 |
Token | in |
Token ID | 287 |
Feature activation | -3.92e-01 |
Pos logit contributions | |
�� | +0.194 |
sqor | +0.188 |
capacity | +0.170 |
ゴ | +0.169 |
ALSE | +0.164 |
Neg logit contributions | |
arial | -0.163 |
nce | -0.158 |
utton | -0.158 |
ody | -0.153 |
illery | -0.152 |
Token | Pakistan |
Token ID | 7648 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
arial | +2.316 |
nce | +2.273 |
utton | +2.235 |
ody | +2.191 |
illery | +2.157 |
Neg logit contributions | |
�� | -2.400 |
sqor | -2.297 |
ゴ | -2.051 |
capacity | -2.036 |
ALSE | -1.996 |
Token |
|
Token ID | 198 |
Feature activation | -2.64e-01 |
Pos logit contributions | |
arial | +0.505 |
nce | +0.491 |
utton | +0.489 |
ody | +0.476 |
illery | +0.472 |
Neg logit contributions | |
�� | -0.617 |
sqor | -0.595 |
capacity | -0.539 |
ゴ | -0.537 |
ALSE | -0.522 |
Token |
|
Token ID | 198 |
Feature activation | -4.09e-01 |
Pos logit contributions | |
arial | +1.274 |
nce | +1.231 |
utton | +1.204 |
izer | +1.174 |
ody | +1.167 |
Neg logit contributions | |
�� | -2.016 |
sqor | -1.889 |
ゴ | -1.710 |
capacity | -1.681 |
ALSE | -1.654 |
Token | With |
Token ID | 3152 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
arial | +2.083 |
nce | +1.996 |
utton | +1.990 |
ody | +1.971 |
illery | +1.900 |
Neg logit contributions | |
�� | -2.851 |
sqor | -2.807 |
capacity | -2.430 |
ゴ | -2.411 |
ALSE | -2.368 |
Token | the |
Token ID | 262 |
Feature activation | -6.78e-02 |
Pos logit contributions | |
arial | +1.010 |
nce | +0.982 |
utton | +0.972 |
ody | +0.955 |
illery | +0.927 |
Neg logit contributions | |
�� | -1.431 |
sqor | -1.378 |
capacity | -1.246 |
ゴ | -1.244 |
ALSE | -1.217 |
Token | success |
Token ID | 1943 |
Feature activation | -4.72e-01 |
Pos logit contributions | |
arial | +0.353 |
nce | +0.344 |
utton | +0.341 |
ody | +0.331 |
illery | +0.327 |
Neg logit contributions | |
�� | -0.467 |
sqor | -0.448 |
ゴ | -0.406 |
capacity | -0.404 |
ALSE | -0.395 |
Token | of |
Token ID | 286 |
Feature activation | -9.53e-02 |
Pos logit contributions | |
arial | +2.545 |
nce | +2.483 |
utton | +2.466 |
ody | +2.408 |
illery | +2.379 |
Neg logit contributions | |
�� | -3.093 |
sqor | -3.000 |
capacity | -2.726 |
ゴ | -2.680 |
ALSE | -2.630 |
Token | online |
Token ID | 2691 |
Feature activation | -9.65e-02 |
Pos logit contributions | |
arial | +0.483 |
nce | +0.470 |
utton | +0.465 |
ody | +0.456 |
illery | +0.449 |
Neg logit contributions | |
�� | -0.665 |
sqor | -0.643 |
capacity | -0.583 |
ゴ | -0.578 |
ALSE | -0.567 |
Token | shopping |
Token ID | 9735 |
Feature activation | +3.62e-02 |
Pos logit contributions | |
arial | +0.489 |
nce | +0.473 |
utton | +0.472 |
ody | +0.459 |
illery | +0.454 |
Neg logit contributions | |
�� | -0.673 |
sqor | -0.652 |
capacity | -0.593 |
ゴ | -0.590 |
ALSE | -0.574 |
Token | in |
Token ID | 287 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
�� | +0.238 |
sqor | +0.230 |
capacity | +0.208 |
ゴ | +0.207 |
ALSE | +0.201 |
Neg logit contributions | |
arial | -0.198 |
nce | -0.193 |
utton | -0.192 |
ody | -0.186 |
illery | -0.185 |
Token | ly |
Token ID | 306 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
arial | +0.054 |
nce | +0.052 |
utton | +0.052 |
ody | +0.051 |
illery | +0.050 |
Neg logit contributions | |
�� | -0.065 |
sqor | -0.062 |
capacity | -0.056 |
ゴ | -0.056 |
ALSE | -0.055 |
Token | designed |
Token ID | 3562 |
Feature activation | -4.41e-01 |
Pos logit contributions | |
arial | +0.112 |
nce | +0.108 |
utton | +0.108 |
ody | +0.105 |
illery | +0.104 |
Neg logit contributions | |
�� | -0.151 |
sqor | -0.146 |
capacity | -0.133 |
ゴ | -0.132 |
ALSE | -0.129 |
Token | brain |
Token ID | 3632 |
Feature activation | -2.86e-01 |
Pos logit contributions | |
arial | +2.353 |
nce | +2.291 |
utton | +2.254 |
ody | +2.224 |
izer | +2.210 |
Neg logit contributions | |
�� | -2.960 |
sqor | -2.793 |
capacity | -2.566 |
ゴ | -2.544 |
ALSE | -2.474 |
Token | boosting |
Token ID | 27611 |
Feature activation | -5.77e-02 |
Pos logit contributions | |
arial | +1.567 |
utton | +1.516 |
nce | +1.507 |
ody | +1.493 |
illery | +1.461 |
Neg logit contributions | |
�� | -1.878 |
sqor | -1.812 |
ゴ | -1.621 |
capacity | -1.603 |
ALSE | -1.577 |
Token | toys |
Token ID | 14958 |
Feature activation | +7.05e-02 |
Pos logit contributions | |
arial | +0.320 |
nce | +0.310 |
utton | +0.309 |
ody | +0.301 |
illery | +0.298 |
Neg logit contributions | |
�� | -0.376 |
sqor | -0.362 |
capacity | -0.327 |
ゴ | -0.326 |
ALSE | -0.317 |
Token | , |
Token ID | 11 |
Feature activation | +8.88e-02 |
Pos logit contributions | |
�� | +0.449 |
sqor | +0.433 |
capacity | +0.391 |
ゴ | +0.388 |
ALSE | +0.377 |
Neg logit contributions | |
arial | -0.399 |
nce | -0.388 |
utton | -0.387 |
ody | -0.378 |
illery | -0.375 |
Token | there |
Token ID | 612 |
Feature activation | -2.28e-01 |
Pos logit contributions | |
�� | +0.617 |
sqor | +0.597 |
capacity | +0.543 |
ゴ | +0.540 |
ALSE | +0.526 |
Neg logit contributions | |
arial | -0.451 |
nce | -0.439 |
utton | -0.436 |
ody | -0.426 |
illery | -0.421 |
Token | is |
Token ID | 318 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
arial | +1.279 |
nce | +1.247 |
utton | +1.245 |
ody | +1.221 |
illery | +1.194 |
Neg logit contributions | |
�� | -1.464 |
sqor | -1.406 |
capacity | -1.269 |
ゴ | -1.265 |
ALSE | -1.222 |
Token | something |
Token ID | 1223 |
Feature activation | -4.13e-01 |
Pos logit contributions | |
arial | +1.124 |
nce | +1.090 |
utton | +1.078 |
ody | +1.061 |
izer | +1.018 |
Neg logit contributions | |
�� | -1.754 |
sqor | -1.693 |
capacity | -1.541 |
ゴ | -1.537 |
ALSE | -1.491 |
Token | for |
Token ID | 329 |
Feature activation | -3.92e-01 |
Pos logit contributions | |
arial | +1.875 |
nce | +1.794 |
utton | +1.784 |
ody | +1.750 |
izer | +1.711 |
Neg logit contributions | |
�� | -3.090 |
sqor | -2.974 |
capacity | -2.765 |
ゴ | -2.739 |
ALSE | -2.660 |
Token | every |
Token ID | 790 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
arial | +2.058 |
nce | +2.004 |
utton | +1.994 |
ody | +1.989 |
izer | +1.936 |
Neg logit contributions | |
�� | -2.607 |
sqor | -2.534 |
ゴ | -2.295 |
capacity | -2.294 |
ALSE | -2.211 |
Token | that |
Token ID | 326 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
arial | +0.790 |
nce | +0.758 |
utton | +0.756 |
ody | +0.738 |
illery | +0.728 |
Neg logit contributions | |
�� | -1.145 |
sqor | -1.101 |
capacity | -1.013 |
ゴ | -1.005 |
ALSE | -0.978 |
Token | myth |
Token ID | 7918 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
arial | +0.621 |
nce | +0.603 |
utton | +0.598 |
ody | +0.584 |
illery | +0.572 |
Neg logit contributions | |
�� | -0.887 |
sqor | -0.853 |
capacity | -0.783 |
ゴ | -0.778 |
ALSE | -0.756 |
Token | could |
Token ID | 714 |
Feature activation | -8.95e-02 |
Pos logit contributions | |
arial | +0.668 |
nce | +0.641 |
utton | +0.641 |
ody | +0.628 |
illery | +0.614 |
Neg logit contributions | |
�� | -1.055 |
sqor | -1.030 |
capacity | -0.939 |
ゴ | -0.931 |
ALSE | -0.909 |
Token | be |
Token ID | 307 |
Feature activation | +8.83e-02 |
Pos logit contributions | |
arial | +0.460 |
nce | +0.449 |
utton | +0.443 |
ody | +0.430 |
illery | +0.426 |
Neg logit contributions | |
�� | -0.620 |
sqor | -0.600 |
capacity | -0.544 |
ゴ | -0.544 |
ALSE | -0.529 |
Token | explained |
Token ID | 4893 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
�� | +0.564 |
sqor | +0.547 |
capacity | +0.491 |
ゴ | +0.489 |
ALSE | +0.475 |
Neg logit contributions | |
arial | -0.502 |
nce | -0.489 |
utton | -0.484 |
ody | -0.473 |
illery | -0.468 |
Token | away |
Token ID | 1497 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
arial | +1.562 |
nce | +1.509 |
utton | +1.486 |
ody | +1.468 |
izer | +1.431 |
Neg logit contributions | |
�� | -1.854 |
sqor | -1.785 |
capacity | -1.622 |
ゴ | -1.608 |
ALSE | -1.559 |
Token | as |
Token ID | 355 |
Feature activation | -2.72e-01 |
Pos logit contributions | |
arial | +0.054 |
nce | +0.052 |
utton | +0.052 |
ody | +0.051 |
illery | +0.050 |
Neg logit contributions | |
�� | -0.071 |
sqor | -0.068 |
capacity | -0.062 |
ゴ | -0.062 |
ALSE | -0.060 |
Token | an |
Token ID | 281 |
Feature activation | -2.76e-01 |
Pos logit contributions | |
arial | +1.366 |
nce | +1.314 |
utton | +1.312 |
ody | +1.285 |
illery | +1.251 |
Neg logit contributions | |
�� | -1.919 |
sqor | -1.845 |
capacity | -1.680 |
ゴ | -1.667 |
ALSE | -1.631 |
Token | aber |
Token ID | 42499 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
arial | +1.521 |
ody | +1.468 |
nce | +1.467 |
utton | +1.459 |
izer | +1.398 |
Neg logit contributions | |
�� | -1.823 |
sqor | -1.766 |
ゴ | -1.574 |
capacity | -1.571 |
ALSE | -1.521 |
Token | ration |
Token ID | 1358 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
arial | +0.597 |
nce | +0.577 |
utton | +0.573 |
ody | +0.554 |
illery | +0.548 |
Neg logit contributions | |
�� | -1.042 |
sqor | -1.012 |
capacity | -0.929 |
ゴ | -0.926 |
ALSE | -0.903 |
Token | of |
Token ID | 286 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
arial | +0.633 |
nce | +0.612 |
utton | +0.608 |
ody | +0.597 |
illery | +0.587 |
Neg logit contributions | |
�� | -0.794 |
sqor | -0.767 |
capacity | -0.695 |
ゴ | -0.689 |
ALSE | -0.672 |
Token | into |
Token ID | 656 |
Feature activation | -3.74e-02 |
Pos logit contributions | |
�� | +4.575 |
sqor | +4.521 |
capacity | +4.204 |
ゴ | +4.154 |
Sisters | +4.060 |
Neg logit contributions | |
arial | -2.346 |
utton | -2.274 |
nce | -2.253 |
illery | -2.189 |
ody | -2.160 |
Token | the |
Token ID | 262 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
arial | +0.186 |
nce | +0.180 |
utton | +0.179 |
ody | +0.174 |
illery | +0.172 |
Neg logit contributions | |
�� | -0.265 |
sqor | -0.256 |
capacity | -0.234 |
ゴ | -0.233 |
ALSE | -0.227 |
Token | Alberta |
Token ID | 15555 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
arial | +1.231 |
nce | +1.191 |
utton | +1.177 |
ody | +1.146 |
illery | +1.142 |
Neg logit contributions | |
�� | -1.598 |
sqor | -1.525 |
ゴ | -1.391 |
capacity | -1.383 |
ALSE | -1.348 |
Token | legislature |
Token ID | 15928 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
arial | +1.606 |
utton | +1.548 |
nce | +1.547 |
ody | +1.515 |
illery | +1.509 |
Neg logit contributions | |
�� | -2.036 |
sqor | -1.963 |
ゴ | -1.768 |
capacity | -1.763 |
ALSE | -1.725 |
Token | in |
Token ID | 287 |
Feature activation | +6.39e-02 |
Pos logit contributions | |
�� | +0.669 |
sqor | +0.647 |
capacity | +0.589 |
ゴ | +0.586 |
ALSE | +0.570 |
Neg logit contributions | |
arial | -0.493 |
nce | -0.477 |
utton | -0.476 |
ody | -0.462 |
illery | -0.459 |
Token | 2004 |
Token ID | 5472 |
Feature activation | +4.35e-02 |
Pos logit contributions | |
�� | +0.388 |
sqor | +0.373 |
capacity | +0.333 |
ゴ | +0.332 |
ALSE | +0.322 |
Neg logit contributions | |
arial | -0.383 |
nce | -0.373 |
utton | -0.372 |
ody | -0.363 |
illery | -0.361 |
Token | , |
Token ID | 11 |
Feature activation | +4.39e-02 |
Pos logit contributions | |
�� | +0.288 |
sqor | +0.278 |
capacity | +0.252 |
ゴ | +0.251 |
ALSE | +0.244 |
Neg logit contributions | |
arial | -0.235 |
nce | -0.228 |
utton | -0.228 |
ody | -0.222 |
illery | -0.220 |
Token | admits |
Token ID | 15534 |
Feature activation | -3.27e-01 |
Pos logit contributions | |
�� | +0.307 |
sqor | +0.297 |
capacity | +0.271 |
ゴ | +0.270 |
ALSE | +0.263 |
Neg logit contributions | |
arial | -0.221 |
nce | -0.214 |
utton | -0.213 |
ody | -0.207 |
illery | -0.205 |
Token | he |
Token ID | 339 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
arial | +1.562 |
nce | +1.496 |
utton | +1.489 |
ody | +1.457 |
illery | +1.444 |
Neg logit contributions | |
�� | -2.400 |
sqor | -2.300 |
ゴ | -2.103 |
capacity | -2.101 |
ALSE | -2.031 |
Token | once |
Token ID | 1752 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
arial | +1.554 |
nce | +1.493 |
utton | +1.466 |
ody | +1.441 |
izer | +1.435 |
Neg logit contributions | |
�� | -2.586 |
sqor | -2.480 |
ゴ | -2.259 |
capacity | -2.241 |
ALSE | -2.201 |
Token | told |
Token ID | 1297 |
Feature activation | -3.44e-01 |
Pos logit contributions | |
arial | +1.576 |
nce | +1.514 |
utton | +1.501 |
ody | +1.478 |
izer | +1.451 |
Neg logit contributions | |
�� | -2.136 |
sqor | -2.051 |
ゴ | -1.860 |
capacity | -1.860 |
ALSE | -1.812 |
Token | hit |
Token ID | 2277 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
�� | +0.316 |
sqor | +0.306 |
capacity | +0.277 |
ゴ | +0.276 |
ALSE | +0.268 |
Neg logit contributions | |
arial | -0.243 |
nce | -0.235 |
utton | -0.232 |
ody | -0.228 |
illery | -0.224 |
Token | it |
Token ID | 340 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
arial | +2.442 |
nce | +2.420 |
utton | +2.378 |
ody | +2.354 |
izer | +2.258 |
Neg logit contributions | |
�� | -4.021 |
sqor | -3.901 |
ゴ | -3.546 |
capacity | -3.514 |
ALSE | -3.479 |
Token | big |
Token ID | 1263 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
arial | +2.366 |
utton | +2.332 |
nce | +2.325 |
ody | +2.296 |
izer | +2.249 |
Neg logit contributions | |
�� | -3.753 |
sqor | -3.585 |
ゴ | -3.301 |
capacity | -3.282 |
ALSE | -3.237 |
Token | … |
Token ID | 3926 |
Feature activation | +2.74e-01 |
Pos logit contributions | |
arial | +0.642 |
nce | +0.622 |
utton | +0.618 |
ody | +0.609 |
izer | +0.592 |
Neg logit contributions | |
�� | -0.869 |
sqor | -0.840 |
capacity | -0.758 |
ゴ | -0.758 |
ALSE | -0.738 |
Token | until |
Token ID | 1566 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
�� | +1.727 |
sqor | +1.665 |
capacity | +1.505 |
ゴ | +1.495 |
ALSE | +1.449 |
Neg logit contributions | |
arial | -1.569 |
nce | -1.524 |
utton | -1.518 |
ody | -1.476 |
illery | -1.472 |
Token | this |
Token ID | 428 |
Feature activation | -5.34e-02 |
Pos logit contributions | |
arial | +0.492 |
nce | +0.475 |
utton | +0.471 |
ody | +0.465 |
illery | +0.457 |
Neg logit contributions | |
�� | -0.749 |
sqor | -0.724 |
ゴ | -0.660 |
capacity | -0.660 |
ALSE | -0.643 |
Token | month |
Token ID | 1227 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
arial | +0.281 |
nce | +0.273 |
utton | +0.271 |
ody | +0.265 |
illery | +0.262 |
Neg logit contributions | |
�� | -0.363 |
sqor | -0.350 |
capacity | -0.318 |
ゴ | -0.317 |
ALSE | -0.308 |
Token | . |
Token ID | 13 |
Feature activation | +9.80e-02 |
Pos logit contributions | |
arial | +1.846 |
utton | +1.799 |
nce | +1.787 |
ody | +1.770 |
illery | +1.732 |
Neg logit contributions | |
�� | -2.580 |
sqor | -2.502 |
capacity | -2.284 |
ゴ | -2.264 |
ALSE | -2.205 |
Token |
|
Token ID | 198 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
�� | +0.661 |
sqor | +0.639 |
capacity | +0.580 |
ゴ | +0.577 |
ALSE | +0.561 |
Neg logit contributions | |
arial | -0.519 |
nce | -0.503 |
utton | -0.502 |
ody | -0.488 |
illery | -0.484 |
Token |
|
Token ID | 198 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
�� | +0.901 |
sqor | +0.866 |
capacity | +0.782 |
ゴ | +0.782 |
ALSE | +0.759 |
Neg logit contributions | |
arial | -0.702 |
nce | -0.680 |
utton | -0.676 |
ody | -0.658 |
illery | -0.653 |
Token | The |
Token ID | 464 |
Feature activation | +3.00e-02 |
Pos logit contributions | |
�� | +0.727 |
sqor | +0.708 |
capacity | +0.635 |
ゴ | +0.629 |
ALSE | +0.614 |
Neg logit contributions | |
arial | -0.540 |
nce | -0.523 |
utton | -0.520 |
ody | -0.509 |
illery | -0.500 |
Token | trained |
Token ID | 8776 |
Feature activation | -5.25e-01 |
Pos logit contributions | |
arial | +0.878 |
nce | +0.863 |
utton | +0.849 |
ody | +0.832 |
illery | +0.820 |
Neg logit contributions | |
�� | -1.112 |
sqor | -1.074 |
ゴ | -0.982 |
capacity | -0.968 |
ALSE | -0.936 |
Token | to |
Token ID | 284 |
Feature activation | -4.55e-01 |
Pos logit contributions | |
arial | +2.253 |
nce | +2.169 |
utton | +2.160 |
ody | +2.101 |
illery | +2.064 |
Neg logit contributions | |
�� | -4.037 |
sqor | -3.927 |
capacity | -3.610 |
ゴ | -3.604 |
ALSE | -3.490 |
Token | follow |
Token ID | 1061 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
arial | +2.300 |
nce | +2.268 |
utton | +2.205 |
ody | +2.133 |
illery | +2.127 |
Neg logit contributions | |
�� | -3.179 |
sqor | -3.057 |
ゴ | -2.823 |
capacity | -2.760 |
ALSE | -2.640 |
Token | a |
Token ID | 257 |
Feature activation | -8.49e-02 |
Pos logit contributions | |
arial | +2.174 |
nce | +2.129 |
utton | +2.081 |
ody | +2.069 |
illery | +1.993 |
Neg logit contributions | |
�� | -3.548 |
sqor | -3.472 |
capacity | -3.178 |
ゴ | -3.166 |
ALSE | -3.045 |
Token | route |
Token ID | 6339 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
arial | +0.458 |
nce | +0.447 |
utton | +0.442 |
ody | +0.430 |
illery | +0.428 |
Neg logit contributions | |
�� | -0.564 |
sqor | -0.549 |
capacity | -0.495 |
ゴ | -0.494 |
ALSE | -0.477 |
Token | from |
Token ID | 422 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
arial | +0.702 |
nce | +0.680 |
utton | +0.671 |
ody | +0.660 |
illery | +0.651 |
Neg logit contributions | |
�� | -0.955 |
sqor | -0.922 |
ゴ | -0.841 |
capacity | -0.840 |
ALSE | -0.808 |
Token | room |
Token ID | 2119 |
Feature activation | -7.16e-01 |
Pos logit contributions | |
arial | +3.384 |
nce | +3.313 |
utton | +3.276 |
ody | +3.238 |
izer | +3.162 |
Neg logit contributions | |
�� | -5.741 |
sqor | -5.643 |
ゴ | -5.147 |
capacity | -5.088 |
ALSE | -4.939 |
Token | to |
Token ID | 284 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
arial | +3.016 |
nce | +2.867 |
utton | +2.816 |
ody | +2.780 |
izer | +2.728 |
Neg logit contributions | |
�� | -5.523 |
sqor | -5.415 |
ゴ | -4.984 |
capacity | -4.924 |
ALSE | -4.823 |
Token | room |
Token ID | 2119 |
Feature activation | -5.78e-01 |
Pos logit contributions | |
arial | +3.245 |
nce | +3.162 |
utton | +3.119 |
ody | +3.067 |
izer | +2.985 |
Neg logit contributions | |
�� | -5.469 |
sqor | -5.294 |
ゴ | -4.934 |
capacity | -4.866 |
ALSE | -4.761 |
Token | by |
Token ID | 416 |
Feature activation | +3.85e-02 |
Pos logit contributions | |
arial | +2.830 |
nce | +2.703 |
ody | +2.679 |
utton | +2.669 |
izer | +2.609 |
Neg logit contributions | |
�� | -4.122 |
sqor | -3.950 |
ゴ | -3.635 |
capacity | -3.619 |
ALSE | -3.463 |
Token | choosing |
Token ID | 11236 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
�� | +0.266 |
sqor | +0.258 |
capacity | +0.235 |
ゴ | +0.233 |
ALSE | +0.227 |
Neg logit contributions | |
arial | -0.197 |
nce | -0.191 |
utton | -0.190 |
ody | -0.185 |
illery | -0.183 |
Token | machine |
Token ID | 4572 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
arial | +1.992 |
nce | +1.970 |
utton | +1.912 |
ody | +1.850 |
illery | +1.830 |
Neg logit contributions | |
�� | -2.969 |
sqor | -2.837 |
ゴ | -2.604 |
capacity | -2.586 |
ALSE | -2.538 |
Token | will |
Token ID | 481 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
arial | +0.893 |
nce | +0.865 |
utton | +0.862 |
ody | +0.837 |
illery | +0.829 |
Neg logit contributions | |
�� | -1.281 |
sqor | -1.240 |
capacity | -1.127 |
ゴ | -1.121 |
ALSE | -1.095 |
Token | not |
Token ID | 407 |
Feature activation | -6.35e-02 |
Pos logit contributions | |
arial | +0.665 |
nce | +0.656 |
utton | +0.643 |
ody | +0.624 |
illery | +0.615 |
Neg logit contributions | |
�� | -1.090 |
sqor | -1.050 |
ゴ | -0.957 |
capacity | -0.956 |
ALSE | -0.939 |
Token | work |
Token ID | 670 |
Feature activation | -2.15e-01 |
Pos logit contributions | |
arial | +0.325 |
nce | +0.318 |
utton | +0.312 |
ody | +0.305 |
illery | +0.300 |
Neg logit contributions | |
�� | -0.450 |
sqor | -0.430 |
ゴ | -0.390 |
capacity | -0.387 |
ALSE | -0.381 |
Token | properly |
Token ID | 6105 |
Feature activation | -3.84e-01 |
Pos logit contributions | |
arial | +1.023 |
nce | +0.981 |
utton | +0.975 |
ody | +0.960 |
izer | +0.931 |
Neg logit contributions | |
�� | -1.591 |
sqor | -1.520 |
capacity | -1.397 |
ゴ | -1.394 |
ALSE | -1.348 |
Token | unless |
Token ID | 4556 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
arial | +1.687 |
nce | +1.641 |
utton | +1.619 |
ody | +1.608 |
izer | +1.559 |
Neg logit contributions | |
�� | -2.959 |
sqor | -2.820 |
ゴ | -2.600 |
capacity | -2.599 |
ALSE | -2.533 |
Token | it |
Token ID | 340 |
Feature activation | +8.92e-02 |
Pos logit contributions | |
arial | +2.113 |
nce | +2.066 |
utton | +2.047 |
ody | +2.023 |
izer | +1.955 |
Neg logit contributions | |
�� | -3.211 |
sqor | -3.095 |
capacity | -2.824 |
ゴ | -2.818 |
ALSE | -2.756 |
Token | is |
Token ID | 318 |
Feature activation | +5.79e-02 |
Pos logit contributions | |
�� | +0.670 |
sqor | +0.649 |
capacity | +0.596 |
ゴ | +0.593 |
ALSE | +0.579 |
Neg logit contributions | |
arial | -0.405 |
nce | -0.391 |
utton | -0.389 |
ody | -0.377 |
illery | -0.372 |
Token | threaded |
Token ID | 40945 |
Feature activation | -2.29e-01 |
Pos logit contributions | |
�� | +0.387 |
sqor | +0.373 |
capacity | +0.337 |
ゴ | +0.336 |
ALSE | +0.328 |
Neg logit contributions | |
arial | -0.313 |
nce | -0.304 |
utton | -0.302 |
ody | -0.295 |
illery | -0.291 |
Token | correctly |
Token ID | 9380 |
Feature activation | -8.69e-01 |
Pos logit contributions | |
arial | +1.118 |
nce | +1.084 |
utton | +1.077 |
ody | +1.058 |
izer | +1.031 |
Neg logit contributions | |
�� | -1.650 |
sqor | -1.571 |
ゴ | -1.439 |
capacity | -1.430 |
ALSE | -1.403 |
Token | and |
Token ID | 290 |
Feature activation | -5.22e-01 |
Pos logit contributions | |
arial | +3.762 |
nce | +3.640 |
utton | +3.636 |
ody | +3.616 |
izer | +3.532 |
Neg logit contributions | |
�� | -6.512 |
sqor | -6.104 |
ゴ | -5.715 |
capacity | -5.705 |
ALSE | -5.622 |
Token | machine |
Token ID | 4572 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
arial | +0.279 |
nce | +0.273 |
utton | +0.269 |
ody | +0.262 |
illery | +0.260 |
Neg logit contributions | |
�� | -0.345 |
sqor | -0.331 |
capacity | -0.300 |
ゴ | -0.298 |
ALSE | -0.291 |
Token | repaired |
Token ID | 27457 |
Feature activation | -3.90e-01 |
Pos logit contributions | |
�� | +0.173 |
sqor | +0.167 |
capacity | +0.151 |
ゴ | +0.151 |
ALSE | +0.147 |
Neg logit contributions | |
arial | -0.128 |
nce | -0.123 |
utton | -0.122 |
ody | -0.120 |
illery | -0.118 |
Token | , |
Token ID | 11 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
arial | +1.930 |
nce | +1.878 |
utton | +1.839 |
ody | +1.838 |
izer | +1.776 |
Neg logit contributions | |
�� | -2.762 |
sqor | -2.652 |
capacity | -2.415 |
ゴ | -2.400 |
ALSE | -2.363 |
Token | by |
Token ID | 416 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
arial | +1.045 |
utton | +1.013 |
nce | +1.007 |
ody | +0.995 |
illery | +0.966 |
Neg logit contributions | |
�� | -1.457 |
sqor | -1.403 |
capacity | -1.269 |
ゴ | -1.254 |
ALSE | -1.242 |
Token | Andrew |
Token ID | 6858 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
arial | +0.952 |
nce | +0.923 |
utton | +0.911 |
ody | +0.899 |
illery | +0.878 |
Neg logit contributions | |
�� | -1.238 |
sqor | -1.185 |
capacity | -1.077 |
ゴ | -1.067 |
ALSE | -1.054 |
Token | Baron |
Token ID | 21770 |
Feature activation | -2.82e-01 |
Pos logit contributions | |
arial | +1.023 |
nce | +0.996 |
utton | +0.989 |
ody | +0.964 |
illery | +0.955 |
Neg logit contributions | |
�� | -1.309 |
sqor | -1.261 |
capacity | -1.143 |
ゴ | -1.138 |
ALSE | -1.110 |
Token | , |
Token ID | 11 |
Feature activation | -2.70e-01 |
Pos logit contributions | |
arial | +1.561 |
nce | +1.529 |
utton | +1.520 |
ody | +1.497 |
illery | +1.468 |
Neg logit contributions | |
�� | -1.830 |
sqor | -1.759 |
capacity | -1.593 |
ゴ | -1.577 |
ALSE | -1.546 |
Token | a |
Token ID | 257 |
Feature activation | +8.05e-02 |
Pos logit contributions | |
arial | +1.233 |
nce | +1.199 |
utton | +1.195 |
ody | +1.164 |
illery | +1.138 |
Neg logit contributions | |
�� | -2.021 |
sqor | -1.950 |
capacity | -1.785 |
ゴ | -1.759 |
ALSE | -1.731 |
Token | designer |
Token ID | 11915 |
Feature activation | -9.04e-02 |
Pos logit contributions | |
�� | +0.527 |
sqor | +0.505 |
capacity | +0.457 |
ゴ | +0.453 |
ALSE | +0.443 |
Neg logit contributions | |
arial | -0.447 |
nce | -0.436 |
utton | -0.432 |
ody | -0.420 |
illery | -0.419 |
Token | of |
Token ID | 286 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
arial | +0.439 |
nce | +0.427 |
utton | +0.422 |
ody | +0.412 |
illery | +0.407 |
Neg logit contributions | |
�� | -0.650 |
sqor | -0.628 |
capacity | -0.575 |
ゴ | -0.570 |
ALSE | -0.557 |
Token | pop |
Token ID | 1461 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
�� | +1.083 |
sqor | +1.050 |
capacity | +0.956 |
ゴ | +0.952 |
ALSE | +0.925 |
Neg logit contributions | |
arial | -0.797 |
nce | -0.772 |
utton | -0.771 |
ody | -0.747 |
illery | -0.742 |
Token | to |
Token ID | 284 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
arial | +0.255 |
nce | +0.248 |
utton | +0.245 |
ody | +0.239 |
illery | +0.237 |
Neg logit contributions | |
�� | -0.395 |
sqor | -0.386 |
capacity | -0.351 |
ゴ | -0.350 |
ALSE | -0.341 |
Token | take |
Token ID | 1011 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
�� | +0.151 |
sqor | +0.145 |
ゴ | +0.132 |
capacity | +0.132 |
ALSE | +0.127 |
Neg logit contributions | |
arial | -0.116 |
nce | -0.113 |
utton | -0.112 |
ody | -0.108 |
illery | -0.108 |
Token | the |
Token ID | 262 |
Feature activation | +3.74e-01 |
Pos logit contributions | |
arial | +0.519 |
nce | +0.503 |
utton | +0.498 |
ody | +0.485 |
illery | +0.480 |
Neg logit contributions | |
�� | -0.734 |
sqor | -0.707 |
capacity | -0.644 |
ゴ | -0.644 |
ALSE | -0.625 |
Token | next |
Token ID | 1306 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
�� | +2.458 |
sqor | +2.397 |
capacity | +2.170 |
ゴ | +2.148 |
Sisters | +2.097 |
Neg logit contributions | |
arial | -1.991 |
nce | -1.928 |
utton | -1.926 |
ody | -1.873 |
illery | -1.863 |
Token | steps |
Token ID | 4831 |
Feature activation | -2.05e-01 |
Pos logit contributions | |
�� | +0.970 |
sqor | +0.937 |
capacity | +0.847 |
ゴ | +0.842 |
ALSE | +0.817 |
Neg logit contributions | |
arial | -0.834 |
nce | -0.810 |
utton | -0.807 |
ody | -0.786 |
illery | -0.781 |
Token | . |
Token ID | 13 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
arial | +1.035 |
utton | +0.997 |
nce | +0.996 |
ody | +0.971 |
illery | +0.958 |
Neg logit contributions | |
�� | -1.442 |
sqor | -1.387 |
capacity | -1.274 |
ゴ | -1.265 |
ALSE | -1.231 |
Token | � |
Token ID | 447 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
arial | +0.616 |
nce | +0.597 |
utton | +0.594 |
ody | +0.576 |
illery | +0.569 |
Neg logit contributions | |
�� | -0.993 |
sqor | -0.957 |
capacity | -0.876 |
ゴ | -0.873 |
ALSE | -0.851 |
Token | � |
Token ID | 251 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
�� | +0.131 |
sqor | +0.123 |
capacity | +0.110 |
ゴ | +0.110 |
ALSE | +0.105 |
Neg logit contributions | |
arial | -0.149 |
utton | -0.145 |
nce | -0.144 |
illery | -0.140 |
ody | -0.140 |
Token |
|
Token ID | 198 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
�� | +1.151 |
sqor | +1.116 |
capacity | +1.007 |
ゴ | +1.000 |
Sisters | +0.976 |
Neg logit contributions | |
arial | -0.990 |
nce | -0.957 |
utton | -0.952 |
illery | -0.926 |
ody | -0.922 |
Token |
|
Token ID | 198 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
arial | +0.778 |
nce | +0.754 |
utton | +0.743 |
ody | +0.724 |
izer | +0.720 |
Neg logit contributions | |
�� | -1.167 |
sqor | -1.101 |
ゴ | -0.998 |
capacity | -0.983 |
ALSE | -0.965 |
Token | But |
Token ID | 1537 |
Feature activation | +4.95e-02 |
Pos logit contributions | |
arial | +0.992 |
nce | +0.961 |
utton | +0.961 |
ody | +0.942 |
illery | +0.914 |
Neg logit contributions | |
�� | -1.422 |
sqor | -1.377 |
ゴ | -1.238 |
capacity | -1.235 |
ALSE | -1.203 |
Token | undred |
Token ID | 3229 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
arial | +0.145 |
utton | +0.143 |
nce | +0.142 |
ody | +0.138 |
illery | +0.137 |
Neg logit contributions | |
�� | -0.183 |
sqor | -0.177 |
capacity | -0.160 |
ゴ | -0.160 |
ALSE | -0.155 |
Token | times |
Token ID | 1661 |
Feature activation | -5.85e-02 |
Pos logit contributions | |
arial | +0.504 |
nce | +0.489 |
utton | +0.487 |
ody | +0.473 |
illery | +0.468 |
Neg logit contributions | |
�� | -0.753 |
sqor | -0.726 |
capacity | -0.662 |
ゴ | -0.661 |
ALSE | -0.643 |
Token | the |
Token ID | 262 |
Feature activation | +4.79e-01 |
Pos logit contributions | |
arial | +0.305 |
nce | +0.296 |
utton | +0.294 |
ody | +0.287 |
illery | +0.283 |
Neg logit contributions | |
�� | -0.405 |
sqor | -0.384 |
ゴ | -0.353 |
capacity | -0.349 |
ALSE | -0.337 |
Token | major |
Token ID | 1688 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
�� | +2.908 |
sqor | +2.832 |
capacity | +2.564 |
ゴ | +2.507 |
ALSE | +2.441 |
Neg logit contributions | |
arial | -2.798 |
nce | -2.719 |
utton | -2.718 |
ody | -2.649 |
illery | -2.636 |
Token | version |
Token ID | 2196 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
arial | +1.052 |
nce | +1.021 |
utton | +1.016 |
ody | +0.984 |
illery | +0.974 |
Neg logit contributions | |
�� | -1.485 |
sqor | -1.429 |
ゴ | -1.300 |
capacity | -1.294 |
ALSE | -1.263 |
Token | plus |
Token ID | 5556 |
Feature activation | -9.59e-02 |
Pos logit contributions | |
�� | +1.128 |
sqor | +1.086 |
capacity | +0.977 |
ゴ | +0.971 |
ALSE | +0.941 |
Neg logit contributions | |
arial | -1.067 |
nce | -1.038 |
utton | -1.034 |
ody | -1.008 |
illery | -1.002 |
Token | minor |
Token ID | 4159 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
arial | +0.490 |
nce | +0.476 |
utton | +0.474 |
ody | +0.461 |
illery | +0.459 |
Neg logit contributions | |
�� | -0.666 |
sqor | -0.642 |
capacity | -0.582 |
ゴ | -0.582 |
ALSE | -0.564 |
Token | ). |
Token ID | 737 |
Feature activation | +8.03e-02 |
Pos logit contributions | |
arial | +0.336 |
nce | +0.326 |
utton | +0.326 |
ody | +0.316 |
illery | +0.314 |
Neg logit contributions | |
�� | -0.403 |
sqor | -0.389 |
capacity | -0.352 |
ゴ | -0.350 |
ALSE | -0.340 |
Token | For |
Token ID | 1114 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
�� | +0.556 |
sqor | +0.536 |
capacity | +0.488 |
ゴ | +0.487 |
ALSE | +0.472 |
Neg logit contributions | |
arial | -0.413 |
nce | -0.401 |
utton | -0.399 |
ody | -0.387 |
illery | -0.385 |
Token | example |
Token ID | 1672 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
arial | +1.967 |
nce | +1.932 |
utton | +1.894 |
ody | +1.840 |
illery | +1.836 |
Neg logit contributions | |
�� | -2.363 |
sqor | -2.271 |
ゴ | -2.052 |
capacity | -2.041 |
ALSE | -1.980 |
Token | , |
Token ID | 11 |
Feature activation | -5.43e-01 |
Pos logit contributions | |
arial | +1.603 |
nce | +1.548 |
utton | +1.547 |
ody | +1.504 |
illery | +1.504 |
Neg logit contributions | |
�� | -1.741 |
sqor | -1.669 |
capacity | -1.505 |
ゴ | -1.505 |
ALSE | -1.450 |
Token | on |
Token ID | 319 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
�� | +2.261 |
sqor | +2.189 |
capacity | +2.011 |
ゴ | +1.998 |
ALSE | +1.943 |
Neg logit contributions | |
arial | -1.528 |
utton | -1.471 |
nce | -1.466 |
illery | -1.424 |
ody | -1.415 |
Token | all |
Token ID | 477 |
Feature activation | +7.02e-01 |
Pos logit contributions | |
�� | +1.632 |
sqor | +1.578 |
capacity | +1.430 |
ゴ | +1.423 |
ALSE | +1.383 |
Neg logit contributions | |
arial | -1.297 |
nce | -1.260 |
utton | -1.253 |
ody | -1.220 |
illery | -1.210 |
Token | the |
Token ID | 262 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
�� | +4.386 |
sqor | +4.255 |
capacity | +3.854 |
ゴ | +3.839 |
Sisters | +3.742 |
Neg logit contributions | |
arial | -3.931 |
utton | -3.795 |
nce | -3.782 |
illery | -3.707 |
ody | -3.651 |
Token | best |
Token ID | 1266 |
Feature activation | +3.16e-02 |
Pos logit contributions | |
�� | +2.960 |
sqor | +2.874 |
capacity | +2.607 |
ゴ | +2.583 |
Sisters | +2.509 |
Neg logit contributions | |
arial | -2.461 |
utton | -2.387 |
nce | -2.382 |
ody | -2.315 |
illery | -2.308 |
Token | - |
Token ID | 12 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
�� | +0.215 |
sqor | +0.208 |
capacity | +0.188 |
ゴ | +0.188 |
ALSE | +0.182 |
Neg logit contributions | |
arial | -0.166 |
nce | -0.160 |
utton | -0.160 |
ody | -0.157 |
illery | -0.154 |
Token | of |
Token ID | 1659 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
�� | +1.125 |
sqor | +1.085 |
capacity | +0.977 |
ゴ | +0.977 |
ALSE | +0.953 |
Neg logit contributions | |
arial | -0.903 |
nce | -0.874 |
utton | -0.873 |
ody | -0.851 |
illery | -0.838 |
Token | lists |
Token ID | 8341 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
arial | +4.737 |
nce | +4.646 |
utton | +4.575 |
ody | +4.529 |
izer | +4.351 |
Neg logit contributions | |
�� | -5.910 |
sqor | -5.667 |
capacity | -5.221 |
ゴ | -5.202 |
ALSE | -5.055 |
Token | , |
Token ID | 11 |
Feature activation | +2.27e-01 |
Pos logit contributions | |
�� | +2.064 |
sqor | +1.995 |
capacity | +1.789 |
ゴ | +1.780 |
ALSE | +1.719 |
Neg logit contributions | |
arial | -1.947 |
utton | -1.894 |
nce | -1.894 |
ody | -1.835 |
illery | -1.829 |
Token | even |
Token ID | 772 |
Feature activation | +4.46e-02 |
Pos logit contributions | |
�� | +1.532 |
sqor | +1.482 |
capacity | +1.345 |
ゴ | +1.338 |
ALSE | +1.301 |
Neg logit contributions | |
arial | -1.205 |
nce | -1.168 |
utton | -1.164 |
ody | -1.132 |
illery | -1.124 |
Token | influenced |
Token ID | 12824 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
�� | +0.318 |
sqor | +0.307 |
capacity | +0.280 |
ゴ | +0.278 |
ALSE | +0.272 |
Neg logit contributions | |
arial | -0.222 |
nce | -0.214 |
utton | -0.213 |
ody | -0.207 |
illery | -0.205 |
Token | fashion |
Token ID | 6977 |
Feature activation | -5.74e-02 |
Pos logit contributions | |
�� | +1.260 |
sqor | +1.221 |
capacity | +1.110 |
ゴ | +1.105 |
ALSE | +1.075 |
Neg logit contributions | |
arial | -0.940 |
nce | -0.910 |
utton | -0.907 |
ody | -0.880 |
illery | -0.875 |
Token | Res |
Token ID | 4965 |
Feature activation | -3.32e-01 |
Pos logit contributions | |
�� | +0.620 |
sqor | +0.600 |
capacity | +0.542 |
ゴ | +0.539 |
ALSE | +0.524 |
Neg logit contributions | |
arial | -0.495 |
nce | -0.480 |
utton | -0.478 |
ody | -0.466 |
illery | -0.462 |
Token | ign |
Token ID | 570 |
Feature activation | -5.69e-01 |
Pos logit contributions | |
arial | +1.545 |
utton | +1.499 |
nce | +1.485 |
ody | +1.456 |
illery | +1.431 |
Neg logit contributions | |
�� | -2.477 |
sqor | -2.373 |
capacity | -2.178 |
ゴ | -2.154 |
ALSE | -2.122 |
Token | ! |
Token ID | 0 |
Feature activation | -8.43e-01 |
Pos logit contributions | |
arial | +2.775 |
nce | +2.730 |
utton | +2.667 |
ody | +2.601 |
illery | +2.565 |
Neg logit contributions | |
�� | -4.055 |
sqor | -3.893 |
capacity | -3.590 |
ゴ | -3.554 |
ALSE | -3.428 |
Token | Res |
Token ID | 1874 |
Feature activation | -5.31e-01 |
Pos logit contributions | |
arial | +4.533 |
nce | +4.467 |
utton | +4.404 |
ody | +4.286 |
illery | +4.281 |
Neg logit contributions | |
�� | -5.439 |
sqor | -5.124 |
ゴ | -4.658 |
capacity | -4.617 |
ALSE | -4.470 |
Token | ign |
Token ID | 570 |
Feature activation | -9.61e-01 |
Pos logit contributions | |
arial | +3.283 |
nce | +3.221 |
utton | +3.216 |
ody | +3.160 |
illery | +3.114 |
Neg logit contributions | |
�� | -3.179 |
sqor | -2.966 |
ゴ | -2.657 |
capacity | -2.612 |
ALSE | -2.558 |
Token | ! |
Token ID | 0 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
arial | +3.729 |
nce | +3.627 |
utton | +3.534 |
ody | +3.461 |
illery | +3.396 |
Neg logit contributions | |
�� | -7.578 |
sqor | -7.325 |
capacity | -6.866 |
ゴ | -6.806 |
ALSE | -6.589 |
Token | � |
Token ID | 447 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
arial | +5.219 |
nce | +5.086 |
utton | +5.024 |
ody | +4.999 |
illery | +4.988 |
Neg logit contributions | |
�� | -6.488 |
sqor | -6.182 |
ゴ | -5.652 |
capacity | -5.600 |
ALSE | -5.455 |
Token | � |
Token ID | 251 |
Feature activation | +5.11e-02 |
Pos logit contributions | |
arial | +1.586 |
nce | +1.575 |
utton | +1.553 |
ody | +1.521 |
illery | +1.488 |
Neg logit contributions | |
�� | -1.785 |
sqor | -1.774 |
capacity | -1.585 |
ゴ | -1.564 |
Sisters | -1.520 |
Token | could |
Token ID | 714 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
�� | +0.344 |
sqor | +0.334 |
capacity | +0.302 |
ゴ | +0.300 |
ALSE | +0.292 |
Neg logit contributions | |
arial | -0.272 |
nce | -0.263 |
utton | -0.261 |
ody | -0.257 |
illery | -0.254 |
Token | be |
Token ID | 307 |
Feature activation | +5.32e-02 |
Pos logit contributions | |
�� | +0.806 |
sqor | +0.780 |
capacity | +0.712 |
ゴ | +0.704 |
ALSE | +0.687 |
Neg logit contributions | |
arial | -0.573 |
utton | -0.556 |
nce | -0.555 |
illery | -0.533 |
ody | -0.532 |
Token | heard |
Token ID | 2982 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
�� | +0.384 |
sqor | +0.372 |
capacity | +0.340 |
ゴ | +0.339 |
ALSE | +0.330 |
Neg logit contributions | |
arial | -0.256 |
nce | -0.247 |
utton | -0.246 |
ody | -0.239 |
illery | -0.237 |
Token | apples |
Token ID | 22514 |
Feature activation | -6.64e-01 |
Pos logit contributions | |
�� | +0.384 |
sqor | +0.373 |
capacity | +0.336 |
ゴ | +0.336 |
ALSE | +0.325 |
Neg logit contributions | |
arial | -0.281 |
nce | -0.270 |
utton | -0.270 |
ody | -0.265 |
illery | -0.259 |
Token | - |
Token ID | 12 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
arial | +3.061 |
utton | +2.944 |
nce | +2.912 |
ody | +2.848 |
illery | +2.796 |
Neg logit contributions | |
�� | -4.927 |
sqor | -4.725 |
capacity | -4.315 |
ゴ | -4.302 |
ALSE | -4.256 |
Token | to |
Token ID | 1462 |
Feature activation | -9.29e-01 |
Pos logit contributions | |
arial | +4.725 |
utton | +4.531 |
nce | +4.458 |
ody | +4.323 |
izer | +4.101 |
Neg logit contributions | |
�� | -7.981 |
sqor | -7.700 |
ゴ | -7.014 |
ALSE | -7.011 |
capacity | -6.644 |
Token | - |
Token ID | 12 |
Feature activation | -3.06e-01 |
Pos logit contributions | |
arial | +3.474 |
utton | +3.380 |
nce | +3.355 |
ody | +3.247 |
izer | +3.193 |
Neg logit contributions | |
�� | -7.866 |
sqor | -7.323 |
ゴ | -6.797 |
capacity | -6.591 |
ALSE | -6.518 |
Token | app |
Token ID | 1324 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
arial | +1.827 |
utton | +1.773 |
nce | +1.752 |
ody | +1.733 |
illery | +1.691 |
Neg logit contributions | |
�� | -1.895 |
sqor | -1.820 |
ゴ | -1.626 |
capacity | -1.600 |
ALSE | -1.569 |
Token | les |
Token ID | 829 |
Feature activation | -9.14e-01 |
Pos logit contributions | |
�� | +2.483 |
sqor | +2.390 |
capacity | +2.171 |
ゴ | +2.111 |
Sisters | +2.084 |
Neg logit contributions | |
arial | -2.752 |
nce | -2.660 |
utton | -2.635 |
illery | -2.553 |
ody | -2.545 |
Token | comparison |
Token ID | 7208 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
arial | +2.486 |
izer | +2.151 |
nce | +2.149 |
utton | +2.120 |
ody | +2.090 |
Neg logit contributions | |
�� | -8.525 |
sqor | -8.284 |
ゴ | -7.817 |
capacity | -7.638 |
ALSE | -7.545 |
Token | . |
Token ID | 13 |
Feature activation | -2.95e-01 |
Pos logit contributions | |
arial | +1.030 |
nce | +0.993 |
utton | +0.984 |
ody | +0.970 |
illery | +0.955 |
Neg logit contributions | |
�� | -1.303 |
sqor | -1.244 |
ゴ | -1.131 |
capacity | -1.129 |
ALSE | -1.094 |
Token |
|
Token ID | 198 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
arial | +1.424 |
nce | +1.377 |
utton | +1.352 |
illery | +1.325 |
ody | +1.316 |
Neg logit contributions | |
�� | -2.185 |
sqor | -2.085 |
capacity | -1.875 |
ゴ | -1.868 |
ALSE | -1.821 |
Token |
|
Token ID | 198 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
arial | +0.955 |
nce | +0.925 |
utton | +0.906 |
ody | +0.885 |
izer | +0.882 |
Neg logit contributions | |
�� | -1.474 |
sqor | -1.389 |
ゴ | -1.255 |
capacity | -1.235 |
ALSE | -1.214 |
Token | " |
Token ID | 1 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
arial | +0.945 |
nce | +0.906 |
utton | +0.901 |
ody | +0.889 |
illery | +0.864 |
Neg logit contributions | |
�� | -1.417 |
sqor | -1.382 |
capacity | -1.216 |
ゴ | -1.215 |
Sisters | -1.195 |
Token | this |
Token ID | 428 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
arial | +0.409 |
nce | +0.401 |
utton | +0.399 |
ody | +0.392 |
illery | +0.381 |
Neg logit contributions | |
�� | -0.594 |
sqor | -0.572 |
ゴ | -0.523 |
capacity | -0.521 |
ALSE | -0.503 |
Token | dé |
Token ID | 39073 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
�� | +1.077 |
sqor | +1.044 |
capacity | +0.953 |
ゴ | +0.947 |
ALSE | +0.923 |
Neg logit contributions | |
arial | -0.762 |
nce | -0.737 |
utton | -0.735 |
ody | -0.712 |
illery | -0.708 |
Token | j |
Token ID | 73 |
Feature activation | -6.87e-01 |
Pos logit contributions | |
arial | +0.188 |
nce | +0.184 |
utton | +0.183 |
ody | +0.178 |
illery | +0.177 |
Neg logit contributions | |
�� | -0.202 |
sqor | -0.193 |
capacity | -0.173 |
ゴ | -0.173 |
ALSE | -0.168 |
Token | à |
Token ID | 24247 |
Feature activation | -4.33e-01 |
Pos logit contributions | |
arial | +4.350 |
utton | +4.301 |
ody | +4.241 |
nce | +4.230 |
illery | +4.054 |
Neg logit contributions | |
�� | -3.936 |
sqor | -3.725 |
ゴ | -3.386 |
ALSE | -3.263 |
capacity | -3.163 |
Token | v |
Token ID | 410 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
arial | +1.354 |
nce | +1.326 |
utton | +1.271 |
illery | +1.210 |
ody | +1.206 |
Neg logit contributions | |
�� | -3.837 |
sqor | -3.731 |
ゴ | -3.511 |
capacity | -3.449 |
ALSE | -3.392 |
Token | u |
Token ID | 84 |
Feature activation | -9.18e-01 |
Pos logit contributions | |
utton | +6.247 |
nce | +6.235 |
arial | +6.106 |
ody | +6.082 |
izer | +6.045 |
Neg logit contributions | |
�� | -11.393 |
ゴ | -10.321 |
sqor | -10.262 |
Sisters | -9.557 |
capacity | -9.478 |
Token | isn |
Token ID | 2125 |
Feature activation | -3.30e-01 |
Pos logit contributions | |
arial | +4.251 |
nce | +4.011 |
ody | +3.909 |
utton | +3.877 |
izer | +3.696 |
Neg logit contributions | |
�� | -6.976 |
sqor | -6.678 |
ゴ | -6.039 |
capacity | -6.009 |
ALSE | -5.868 |
Token | � |
Token ID | 447 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
arial | +1.172 |
utton | +1.116 |
nce | +1.109 |
ody | +1.064 |
izer | +1.036 |
Neg logit contributions | |
�� | -2.890 |
sqor | -2.771 |
capacity | -2.528 |
ゴ | -2.526 |
ALSE | -2.464 |
Token | � |
Token ID | 247 |
Feature activation | -1.98e-01 |
Pos logit contributions | |
arial | +0.843 |
nce | +0.836 |
utton | +0.825 |
ody | +0.810 |
illery | +0.792 |
Neg logit contributions | |
�� | -1.111 |
sqor | -1.107 |
capacity | -0.997 |
ゴ | -0.993 |
Sisters | -0.962 |
Token | t |
Token ID | 83 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
arial | +1.034 |
nce | +1.014 |
utton | +0.997 |
ody | +0.975 |
illery | +0.957 |
Neg logit contributions | |
�� | -1.377 |
sqor | -1.321 |
ゴ | -1.191 |
capacity | -1.185 |
ALSE | -1.156 |
Token | just |
Token ID | 655 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
arial | +1.758 |
nce | +1.680 |
utton | +1.658 |
ody | +1.651 |
izer | +1.594 |
Neg logit contributions | |
�� | -2.342 |
sqor | -2.247 |
capacity | -2.026 |
ゴ | -2.026 |
ALSE | -1.938 |
Token | ahn |
Token ID | 15386 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
arial | +0.933 |
utton | +0.905 |
nce | +0.905 |
illery | +0.886 |
ody | +0.883 |
Neg logit contributions | |
�� | -0.723 |
sqor | -0.693 |
capacity | -0.613 |
ゴ | -0.603 |
ALSE | -0.587 |
Token | . |
Token ID | 13 |
Feature activation | -2.06e-01 |
Pos logit contributions | |
arial | +1.383 |
utton | +1.340 |
nce | +1.334 |
ody | +1.298 |
izer | +1.281 |
Neg logit contributions | |
�� | -1.918 |
sqor | -1.838 |
capacity | -1.679 |
ゴ | -1.665 |
ALSE | -1.633 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +2.20e-01 |
Pos logit contributions | |
arial | +1.100 |
nce | +1.067 |
utton | +1.063 |
ody | +1.034 |
illery | +1.027 |
Neg logit contributions | |
�� | -1.380 |
sqor | -1.335 |
capacity | -1.211 |
ゴ | -1.204 |
ALSE | -1.170 |
Token | SAN |
Token ID | 36753 |
Feature activation | +9.09e-02 |
Pos logit contributions | |
�� | +1.443 |
sqor | +1.394 |
capacity | +1.263 |
ゴ | +1.256 |
ALSE | +1.220 |
Neg logit contributions | |
arial | -1.199 |
nce | -1.164 |
utton | -1.159 |
ody | -1.128 |
illery | -1.121 |
Token | FR |
Token ID | 8782 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
�� | +0.496 |
sqor | +0.475 |
capacity | +0.420 |
ゴ | +0.417 |
ALSE | +0.400 |
Neg logit contributions | |
arial | -0.600 |
nce | -0.587 |
utton | -0.584 |
ody | -0.571 |
illery | -0.567 |
Token | ANC |
Token ID | 20940 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
arial | +0.814 |
nce | +0.804 |
utton | +0.791 |
ody | +0.773 |
illery | +0.771 |
Neg logit contributions | |
�� | -0.731 |
sqor | -0.700 |
capacity | -0.613 |
ゴ | -0.605 |
Sisters | -0.579 |
Token | IS |
Token ID | 1797 |
Feature activation | -8.93e-01 |
Pos logit contributions | |
arial | +4.937 |
nce | +4.882 |
izer | +4.840 |
illery | +4.789 |
utton | +4.685 |
Neg logit contributions | |
�� | -7.127 |
sqor | -6.625 |
capacity | -5.979 |
ゴ | -5.780 |
cov | -5.715 |
Token | CO |
Token ID | 8220 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
arial | +4.873 |
nce | +4.860 |
utton | +4.481 |
ody | +4.449 |
illery | +4.417 |
Neg logit contributions | |
�� | -5.847 |
sqor | -5.161 |
capacity | -4.888 |
cedes | -4.558 |
volunt | -4.478 |
Token | - |
Token ID | 532 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
arial | +0.511 |
nce | +0.495 |
utton | +0.493 |
ody | +0.479 |
illery | +0.475 |
Neg logit contributions | |
�� | -0.716 |
sqor | -0.693 |
capacity | -0.632 |
ゴ | -0.629 |
ALSE | -0.611 |
Token | Reddit |
Token ID | 10750 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
arial | +2.864 |
nce | +2.814 |
utton | +2.745 |
ody | +2.694 |
illery | +2.680 |
Neg logit contributions | |
�� | -3.834 |
sqor | -3.630 |
capacity | -3.234 |
ゴ | -3.204 |
ALSE | -3.084 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
�� | +1.689 |
sqor | +1.635 |
capacity | +1.487 |
ゴ | +1.478 |
ALSE | +1.439 |
Neg logit contributions | |
arial | -1.271 |
nce | -1.231 |
utton | -1.228 |
ody | -1.191 |
illery | -1.183 |