Token | Gu |
Token ID | 1962 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
ensed | +0.047 |
icably | +0.045 |
scam | +0.045 |
ous | +0.042 |
ighting | +0.041 |
Neg logit contributions | |
Marshal | -0.047 |
lator | -0.046 |
iler | -0.040 |
layer | -0.040 |
Gutenberg | -0.040 |
Token | zz |
Token ID | 3019 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
Marshal | +0.096 |
lator | +0.095 |
iler | +0.083 |
layer | +0.083 |
Gutenberg | +0.082 |
Neg logit contributions | |
ensed | -0.091 |
icably | -0.088 |
scam | -0.088 |
ous | -0.081 |
ighting | -0.080 |
Token | oni |
Token ID | 14651 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
Marshal | +0.011 |
lator | +0.011 |
iler | +0.010 |
layer | +0.010 |
Gutenberg | +0.010 |
Neg logit contributions | |
ensed | -0.009 |
icably | -0.008 |
scam | -0.008 |
ous | -0.008 |
ella | -0.008 |
Token | while |
Token ID | 981 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
Marshal | +0.222 |
lator | +0.217 |
iler | +0.191 |
layer | +0.190 |
Gutenberg | +0.188 |
Neg logit contributions | |
ensed | -0.217 |
icably | -0.211 |
scam | -0.209 |
ous | -0.192 |
ighting | -0.192 |
Token | Field |
Token ID | 7663 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Marshal | +0.155 |
lator | +0.153 |
iler | +0.135 |
layer | +0.134 |
Gutenberg | +0.132 |
Neg logit contributions | |
ensed | -0.145 |
icably | -0.141 |
scam | -0.140 |
ous | -0.129 |
ighting | -0.128 |
Token | Marshal |
Token ID | 37899 |
Feature activation | +6.79e-01 |
Pos logit contributions | |
Marshal | +0.004 |
lator | +0.001 |
iler | -0.016 |
layer | -0.017 |
Gutenberg | -0.018 |
Neg logit contributions | |
ensed | -0.281 |
icably | -0.277 |
scam | -0.276 |
ous | -0.265 |
ighting | -0.264 |
Token | Rod |
Token ID | 6882 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
Marshal | +0.492 |
lator | +0.480 |
iler | +0.419 |
layer | +0.416 |
Gutenberg | +0.411 |
Neg logit contributions | |
ensed | -0.539 |
icably | -0.525 |
scam | -0.521 |
ous | -0.481 |
ighting | -0.480 |
Token | olf |
Token ID | 4024 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
Marshal | +0.122 |
lator | +0.120 |
iler | +0.105 |
layer | +0.104 |
Gutenberg | +0.103 |
Neg logit contributions | |
ensed | -0.126 |
icably | -0.123 |
scam | -0.122 |
ous | -0.113 |
ighting | -0.112 |
Token | o |
Token ID | 78 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
Marshal | +0.141 |
lator | +0.138 |
iler | +0.126 |
layer | +0.125 |
Gutenberg | +0.124 |
Neg logit contributions | |
ensed | -0.068 |
icably | -0.064 |
scam | -0.064 |
recomm | -0.056 |
ighting | -0.056 |
Token | G |
Token ID | 402 |
Feature activation | +8.94e-02 |
Pos logit contributions | |
ensed | +0.029 |
icably | +0.028 |
scam | +0.028 |
ous | +0.026 |
ighting | +0.026 |
Neg logit contributions | |
Marshal | -0.031 |
lator | -0.030 |
iler | -0.027 |
layer | -0.026 |
Gutenberg | -0.026 |
Token | raz |
Token ID | 3247 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
Marshal | +0.066 |
lator | +0.064 |
iler | +0.057 |
layer | +0.056 |
Gutenberg | +0.055 |
Neg logit contributions | |
ensed | -0.070 |
icably | -0.068 |
scam | -0.067 |
ighting | -0.062 |
recomm | -0.062 |
Token | ral |
Token ID | 1373 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
ensed | +0.174 |
icably | +0.169 |
scam | +0.168 |
ous | +0.158 |
ella | +0.157 |
Neg logit contributions | |
Marshal | -0.117 |
lator | -0.114 |
iler | -0.097 |
layer | -0.096 |
Gutenberg | -0.095 |
Token | Process |
Token ID | 10854 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
Marshal | +0.141 |
lator | +0.139 |
iler | +0.121 |
layer | +0.120 |
Gutenberg | +0.118 |
Neg logit contributions | |
ensed | -0.163 |
icably | -0.158 |
scam | -0.158 |
ous | -0.147 |
ighting | -0.145 |
Token | ion |
Token ID | 295 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
Marshal | +0.116 |
lator | +0.114 |
iler | +0.102 |
layer | +0.101 |
Gutenberg | +0.100 |
Neg logit contributions | |
ensed | -0.089 |
icably | -0.087 |
scam | -0.086 |
ous | -0.078 |
ighting | -0.077 |
Token |
|
Token ID | 198 |
Feature activation | -8.68e-02 |
Pos logit contributions | |
ensed | +0.043 |
scam | +0.042 |
icably | +0.042 |
ous | +0.039 |
ella | +0.038 |
Neg logit contributions | |
Marshal | -0.049 |
lator | -0.048 |
iler | -0.043 |
layer | -0.042 |
Gutenberg | -0.042 |
Token |
|
Token ID | 198 |
Feature activation | -9.11e-02 |
Pos logit contributions | |
ensed | +0.063 |
icably | +0.061 |
scam | +0.061 |
ighting | +0.055 |
ous | +0.055 |
Neg logit contributions | |
Marshal | -0.069 |
lator | -0.067 |
iler | -0.060 |
layer | -0.059 |
Gutenberg | -0.059 |
Token | Pir |
Token ID | 46772 |
Feature activation | +6.59e-01 |
Pos logit contributions | |
ensed | +0.068 |
icably | +0.066 |
scam | +0.066 |
ous | +0.061 |
ighting | +0.060 |
Neg logit contributions | |
Marshal | -0.070 |
lator | -0.068 |
iler | -0.060 |
layer | -0.060 |
Gutenberg | -0.059 |
Token | acy |
Token ID | 1590 |
Feature activation | +7.04e-02 |
Pos logit contributions | |
Marshal | +0.510 |
lator | +0.500 |
iler | +0.442 |
layer | +0.439 |
Gutenberg | +0.432 |
Neg logit contributions | |
ensed | -0.487 |
icably | -0.474 |
scam | -0.471 |
recomm | -0.432 |
ighting | -0.429 |
Token | Charm |
Token ID | 30225 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
Marshal | +0.052 |
lator | +0.051 |
iler | +0.044 |
layer | +0.044 |
Gutenberg | +0.043 |
Neg logit contributions | |
ensed | -0.055 |
icably | -0.054 |
scam | -0.053 |
ous | -0.049 |
ighting | -0.049 |
Token | vs |
Token ID | 3691 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
Marshal | +0.012 |
lator | +0.012 |
iler | +0.010 |
layer | +0.010 |
Gutenberg | +0.010 |
Neg logit contributions | |
ensed | -0.015 |
icably | -0.014 |
scam | -0.014 |
ous | -0.013 |
ella | -0.013 |
Token | Talent |
Token ID | 29505 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.019 |
scam | +0.019 |
ous | +0.018 |
ighting | +0.018 |
Neg logit contributions | |
Marshal | -0.018 |
lator | -0.018 |
iler | -0.016 |
layer | -0.016 |
Gutenberg | -0.015 |
Token | of |
Token ID | 286 |
Feature activation | -5.67e-02 |
Pos logit contributions | |
ensed | +0.077 |
icably | +0.075 |
scam | +0.074 |
ous | +0.068 |
ighting | +0.068 |
Neg logit contributions | |
Marshal | -0.077 |
lator | -0.075 |
iler | -0.066 |
layer | -0.066 |
Gutenberg | -0.065 |
Token | formations |
Token ID | 30648 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
Marshal | +0.164 |
lator | +0.159 |
iler | +0.143 |
layer | +0.142 |
Gutenberg | +0.140 |
Neg logit contributions | |
ensed | -0.121 |
icably | -0.116 |
scam | -0.115 |
ella | -0.104 |
ous | -0.104 |
Token | . |
Token ID | 13 |
Feature activation | +5.99e-02 |
Pos logit contributions | |
Marshal | +0.023 |
lator | +0.022 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.019 |
Neg logit contributions | |
ensed | -0.022 |
icably | -0.021 |
scam | -0.021 |
ous | -0.019 |
ighting | -0.019 |
Token | This |
Token ID | 770 |
Feature activation | -6.25e-03 |
Pos logit contributions | |
Marshal | +0.049 |
lator | +0.047 |
iler | +0.042 |
layer | +0.042 |
Gutenberg | +0.042 |
Neg logit contributions | |
ensed | -0.043 |
icably | -0.041 |
scam | -0.041 |
ighting | -0.037 |
recomm | -0.037 |
Token | protocol |
Token ID | 8435 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ensed | +0.004 |
icably | +0.004 |
scam | +0.004 |
ighting | +0.003 |
ous | +0.003 |
Neg logit contributions | |
Marshal | -0.006 |
lator | -0.006 |
iler | -0.005 |
layer | -0.005 |
Gutenberg | -0.005 |
Token | allowed |
Token ID | 3142 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
Marshal | +0.103 |
lator | +0.101 |
iler | +0.090 |
layer | +0.089 |
Gutenberg | +0.088 |
Neg logit contributions | |
ensed | -0.079 |
icably | -0.076 |
scam | -0.075 |
ighting | -0.069 |
ous | -0.068 |
Token | Marshal |
Token ID | 37899 |
Feature activation | +6.41e-01 |
Pos logit contributions | |
ensed | +0.094 |
icably | +0.091 |
scam | +0.090 |
ighting | +0.082 |
ous | +0.082 |
Neg logit contributions | |
Marshal | -0.110 |
lator | -0.107 |
iler | -0.095 |
layer | -0.094 |
Gutenberg | -0.094 |
Token | Rod |
Token ID | 6882 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
Marshal | +0.443 |
lator | +0.433 |
iler | +0.375 |
layer | +0.372 |
Gutenberg | +0.368 |
Neg logit contributions | |
ensed | -0.530 |
icably | -0.516 |
scam | -0.513 |
ous | -0.476 |
ighting | -0.474 |
Token | olf |
Token ID | 4024 |
Feature activation | +7.42e-02 |
Pos logit contributions | |
Marshal | +0.104 |
lator | +0.103 |
iler | +0.090 |
layer | +0.090 |
Gutenberg | +0.089 |
Neg logit contributions | |
ensed | -0.103 |
icably | -0.100 |
scam | -0.099 |
ous | -0.092 |
ella | -0.091 |
Token | o |
Token ID | 78 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
Marshal | +0.069 |
lator | +0.068 |
iler | +0.062 |
layer | +0.061 |
Gutenberg | +0.061 |
Neg logit contributions | |
ensed | -0.043 |
icably | -0.041 |
scam | -0.041 |
ous | -0.037 |
ighting | -0.037 |
Token | G |
Token ID | 402 |
Feature activation | +8.80e-02 |
Pos logit contributions | |
ensed | +0.102 |
icably | +0.099 |
scam | +0.099 |
ous | +0.091 |
ella | +0.090 |
Neg logit contributions | |
Marshal | -0.101 |
lator | -0.099 |
iler | -0.087 |
layer | -0.087 |
Gutenberg | -0.085 |
Token | raz |
Token ID | 3247 |
Feature activation | +9.77e-02 |
Pos logit contributions | |
Marshal | +0.074 |
lator | +0.073 |
iler | +0.065 |
layer | +0.064 |
Gutenberg | +0.064 |
Neg logit contributions | |
ensed | -0.059 |
icably | -0.057 |
scam | -0.057 |
ous | -0.052 |
ighting | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
Marshal | +0.088 |
lator | +0.087 |
layer | +0.076 |
iler | +0.076 |
Gutenberg | +0.074 |
Neg logit contributions | |
ensed | -0.090 |
icably | -0.087 |
scam | -0.087 |
ighting | -0.080 |
recomm | -0.080 |
Token | The |
Token ID | 383 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
Marshal | +0.028 |
lator | +0.027 |
layer | +0.024 |
iler | +0.024 |
Gutenberg | +0.024 |
Neg logit contributions | |
ensed | -0.026 |
scam | -0.025 |
icably | -0.025 |
ighting | -0.023 |
recomm | -0.023 |
Token | bl |
Token ID | 698 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
ensed | +0.016 |
icably | +0.015 |
scam | +0.015 |
ighting | +0.014 |
ous | +0.014 |
Neg logit contributions | |
Marshal | -0.026 |
lator | -0.025 |
iler | -0.023 |
layer | -0.023 |
Gutenberg | -0.022 |
Token | uish |
Token ID | 32091 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
Marshal | +0.019 |
lator | +0.018 |
iler | +0.016 |
layer | +0.016 |
Gutenberg | +0.016 |
Neg logit contributions | |
ensed | -0.015 |
scam | -0.015 |
icably | -0.014 |
recomm | -0.013 |
ella | -0.013 |
Token | v |
Token ID | 410 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
ensed | +0.013 |
icably | +0.013 |
scam | +0.013 |
ighting | +0.012 |
ous | +0.012 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.010 |
layer | -0.010 |
Gutenberg | -0.010 |
Token | ort |
Token ID | 419 |
Feature activation | +6.23e-01 |
Pos logit contributions | |
Marshal | +0.081 |
lator | +0.078 |
iler | +0.062 |
layer | +0.062 |
Gutenberg | +0.061 |
Neg logit contributions | |
ensed | -0.177 |
icably | -0.173 |
scam | -0.172 |
ous | -0.163 |
ighting | -0.162 |
Token | on |
Token ID | 261 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Marshal | +0.486 |
lator | +0.478 |
iler | +0.423 |
layer | +0.421 |
Gutenberg | +0.411 |
Neg logit contributions | |
ensed | -0.455 |
icably | -0.443 |
scam | -0.442 |
ighting | -0.402 |
recomm | -0.402 |
Token | has |
Token ID | 468 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
Marshal | +0.103 |
lator | +0.102 |
iler | +0.090 |
layer | +0.090 |
Gutenberg | +0.089 |
Neg logit contributions | |
ensed | -0.085 |
icably | -0.083 |
scam | -0.082 |
ighting | -0.075 |
ous | -0.074 |
Token | a |
Token ID | 257 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
Marshal | +0.087 |
lator | +0.086 |
iler | +0.075 |
layer | +0.075 |
Gutenberg | +0.074 |
Neg logit contributions | |
ensed | -0.085 |
icably | -0.082 |
scam | -0.082 |
ous | -0.075 |
ighting | -0.075 |
Token | positive |
Token ID | 3967 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
Marshal | +0.117 |
lator | +0.115 |
iler | +0.104 |
layer | +0.104 |
Gutenberg | +0.103 |
Neg logit contributions | |
ensed | -0.068 |
icably | -0.066 |
scam | -0.065 |
ous | -0.058 |
ighting | -0.058 |
Token | density |
Token ID | 12109 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
ensed | +0.102 |
icably | +0.099 |
scam | +0.098 |
ighting | +0.091 |
ous | +0.091 |
Neg logit contributions | |
Marshal | -0.081 |
lator | -0.079 |
layer | -0.068 |
iler | -0.068 |
Gutenberg | -0.067 |
Token | Feed |
Token ID | 18272 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
ensed | +0.044 |
icably | +0.043 |
scam | +0.042 |
ous | +0.039 |
ighting | +0.039 |
Neg logit contributions | |
Marshal | -0.047 |
lator | -0.046 |
iler | -0.041 |
layer | -0.041 |
Gutenberg | -0.040 |
Token | books |
Token ID | 12106 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
ensed | +0.128 |
icably | +0.125 |
scam | +0.124 |
ous | +0.115 |
ella | +0.115 |
Neg logit contributions | |
Marshal | -0.111 |
lator | -0.109 |
iler | -0.095 |
layer | -0.094 |
Gutenberg | -0.092 |
Token | , |
Token ID | 11 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
Marshal | +0.093 |
lator | +0.091 |
iler | +0.080 |
layer | +0.080 |
Gutenberg | +0.079 |
Neg logit contributions | |
ensed | -0.090 |
icably | -0.088 |
scam | -0.087 |
ous | -0.080 |
ighting | -0.080 |
Token | try |
Token ID | 1949 |
Feature activation | -9.29e-02 |
Pos logit contributions | |
ensed | +0.001 |
icably | +0.001 |
scam | +0.001 |
ous | +0.001 |
ighting | +0.001 |
Neg logit contributions | |
Marshal | -0.002 |
lator | -0.002 |
iler | -0.002 |
layer | -0.002 |
Gutenberg | -0.002 |
Token | Project |
Token ID | 4935 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
ensed | +0.063 |
icably | +0.061 |
scam | +0.060 |
ighting | +0.055 |
ous | +0.055 |
Neg logit contributions | |
Marshal | -0.078 |
lator | -0.076 |
iler | -0.068 |
layer | -0.068 |
Gutenberg | -0.068 |
Token | Gutenberg |
Token ID | 20336 |
Feature activation | +6.20e-01 |
Pos logit contributions | |
Marshal | +0.096 |
lator | +0.093 |
iler | +0.071 |
layer | +0.070 |
Gutenberg | +0.069 |
Neg logit contributions | |
ensed | -0.269 |
icably | -0.264 |
scam | -0.262 |
ous | -0.248 |
ighting | -0.247 |
Token | ( |
Token ID | 357 |
Feature activation | -4.74e-02 |
Pos logit contributions | |
Marshal | +0.478 |
lator | +0.470 |
iler | +0.413 |
layer | +0.411 |
Gutenberg | +0.408 |
Neg logit contributions | |
ensed | -0.461 |
icably | -0.449 |
scam | -0.444 |
ous | -0.407 |
ighting | -0.407 |
Token | www |
Token ID | 2503 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
ensed | +0.038 |
icably | +0.037 |
scam | +0.036 |
ous | +0.034 |
ighting | +0.034 |
Neg logit contributions | |
Marshal | -0.034 |
lator | -0.033 |
iler | -0.029 |
layer | -0.029 |
Gutenberg | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
Marshal | +0.103 |
lator | +0.102 |
iler | +0.089 |
layer | +0.088 |
Gutenberg | +0.087 |
Neg logit contributions | |
ensed | -0.112 |
icably | -0.109 |
scam | -0.108 |
ighting | -0.099 |
ous | -0.099 |
Token | g |
Token ID | 70 |
Feature activation | -7.92e-02 |
Pos logit contributions | |
ensed | +0.024 |
icably | +0.024 |
scam | +0.023 |
ous | +0.022 |
ighting | +0.022 |
Neg logit contributions | |
Marshal | -0.022 |
lator | -0.021 |
iler | -0.018 |
layer | -0.018 |
Gutenberg | -0.018 |
Token | utenberg |
Token ID | 19028 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
ensed | +0.079 |
icably | +0.078 |
scam | +0.078 |
ous | +0.073 |
ighting | +0.073 |
Neg logit contributions | |
Marshal | -0.040 |
lator | -0.039 |
iler | -0.032 |
layer | -0.032 |
Gutenberg | -0.031 |
Token | wood |
Token ID | 3822 |
Feature activation | -6.92e-02 |
Pos logit contributions | |
Marshal | +0.209 |
lator | +0.205 |
iler | +0.180 |
layer | +0.179 |
Gutenberg | +0.177 |
Neg logit contributions | |
ensed | -0.197 |
icably | -0.192 |
scam | -0.190 |
ous | -0.174 |
ighting | -0.174 |
Token | met |
Token ID | 1138 |
Feature activation | +6.49e-02 |
Pos logit contributions | |
ensed | +0.049 |
icably | +0.048 |
scam | +0.047 |
ous | +0.043 |
ighting | +0.043 |
Neg logit contributions | |
Marshal | -0.056 |
lator | -0.055 |
iler | -0.048 |
layer | -0.048 |
Gutenberg | -0.048 |
Token | with |
Token ID | 351 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
Marshal | +0.050 |
lator | +0.049 |
iler | +0.043 |
layer | +0.043 |
Gutenberg | +0.043 |
Neg logit contributions | |
ensed | -0.048 |
icably | -0.047 |
scam | -0.046 |
ous | -0.043 |
ighting | -0.043 |
Token | the |
Token ID | 262 |
Feature activation | -9.06e-02 |
Pos logit contributions | |
ensed | +0.014 |
icably | +0.014 |
scam | +0.014 |
ous | +0.013 |
ighting | +0.013 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.014 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.013 |
Token | Carolina |
Token ID | 5913 |
Feature activation | +1.69e-01 |
Pos logit contributions | |
ensed | +0.069 |
icably | +0.067 |
scam | +0.067 |
ous | +0.061 |
ighting | +0.061 |
Neg logit contributions | |
Marshal | -0.068 |
lator | -0.067 |
iler | -0.059 |
layer | -0.058 |
Gutenberg | -0.058 |
Token | Panthers |
Token ID | 17782 |
Feature activation | +6.05e-01 |
Pos logit contributions | |
Marshal | +0.070 |
lator | +0.069 |
iler | +0.053 |
layer | +0.053 |
Gutenberg | +0.051 |
Neg logit contributions | |
ensed | -0.186 |
scam | -0.182 |
icably | -0.182 |
ous | -0.172 |
ighting | -0.171 |
Token | for |
Token ID | 329 |
Feature activation | -4.40e-02 |
Pos logit contributions | |
Marshal | +0.473 |
lator | +0.463 |
iler | +0.409 |
layer | +0.406 |
Gutenberg | +0.401 |
Neg logit contributions | |
ensed | -0.444 |
icably | -0.432 |
scam | -0.428 |
ous | -0.392 |
ighting | -0.391 |
Token | a |
Token ID | 257 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
ensed | +0.032 |
icably | +0.031 |
scam | +0.031 |
ous | +0.028 |
ighting | +0.028 |
Neg logit contributions | |
Marshal | -0.034 |
lator | -0.034 |
iler | -0.030 |
layer | -0.030 |
Gutenberg | -0.029 |
Token | workout |
Token ID | 17578 |
Feature activation | +4.53e-02 |
Pos logit contributions | |
Marshal | +0.011 |
lator | +0.011 |
iler | +0.010 |
layer | +0.010 |
Gutenberg | +0.009 |
Neg logit contributions | |
ensed | -0.009 |
icably | -0.009 |
scam | -0.009 |
ous | -0.008 |
recomm | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -3.54e-03 |
Pos logit contributions | |
Marshal | +0.034 |
lator | +0.034 |
iler | +0.030 |
layer | +0.029 |
Gutenberg | +0.029 |
Neg logit contributions | |
ensed | -0.034 |
icably | -0.033 |
scam | -0.033 |
ous | -0.031 |
ighting | -0.030 |
Token | according |
Token ID | 1864 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
ensed | +0.002 |
icably | +0.002 |
scam | +0.002 |
ous | +0.002 |
ighting | +0.002 |
Neg logit contributions | |
Marshal | -0.003 |
lator | -0.003 |
iler | -0.003 |
layer | -0.003 |
Gutenberg | -0.003 |
Token | showed |
Token ID | 3751 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Marshal | +0.072 |
lator | +0.071 |
iler | +0.063 |
layer | +0.062 |
Gutenberg | +0.062 |
Neg logit contributions | |
ensed | -0.054 |
icably | -0.052 |
scam | -0.052 |
ighting | -0.047 |
ous | -0.047 |
Token | an |
Token ID | 281 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
ensed | +0.126 |
icably | +0.123 |
scam | +0.122 |
ous | +0.113 |
ighting | +0.113 |
Neg logit contributions | |
Marshal | -0.108 |
lator | -0.105 |
iler | -0.091 |
layer | -0.091 |
Gutenberg | -0.090 |
Token | anx |
Token ID | 7296 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
Marshal | +0.086 |
lator | +0.083 |
iler | +0.071 |
layer | +0.071 |
Gutenberg | +0.070 |
Neg logit contributions | |
ensed | -0.123 |
icably | -0.120 |
scam | -0.119 |
ighting | -0.111 |
ous | -0.111 |
Token | io |
Token ID | 952 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ensed | +0.098 |
icably | +0.096 |
scam | +0.095 |
ous | +0.087 |
ighting | +0.087 |
Neg logit contributions | |
Marshal | -0.108 |
lator | -0.105 |
iler | -0.093 |
layer | -0.093 |
Gutenberg | -0.092 |
Token | ly |
Token ID | 306 |
Feature activation | +1.90e-01 |
Pos logit contributions | |
Marshal | +0.081 |
lator | +0.079 |
iler | +0.068 |
layer | +0.068 |
Gutenberg | +0.067 |
Neg logit contributions | |
ensed | -0.095 |
icably | -0.092 |
scam | -0.091 |
ous | -0.085 |
ighting | -0.084 |
Token | tic |
Token ID | 13370 |
Feature activation | +6.04e-01 |
Pos logit contributions | |
Marshal | +0.053 |
lator | +0.050 |
iler | +0.033 |
layer | +0.032 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.235 |
icably | -0.231 |
scam | -0.230 |
ous | -0.220 |
ighting | -0.218 |
Token | effect |
Token ID | 1245 |
Feature activation | -8.95e-02 |
Pos logit contributions | |
Marshal | +0.488 |
lator | +0.479 |
iler | +0.424 |
layer | +0.422 |
Gutenberg | +0.417 |
Neg logit contributions | |
ensed | -0.428 |
icably | -0.415 |
scam | -0.412 |
ighting | -0.376 |
ous | -0.376 |
Token | in |
Token ID | 287 |
Feature activation | +7.99e-02 |
Pos logit contributions | |
ensed | +0.065 |
icably | +0.063 |
scam | +0.063 |
ous | +0.058 |
ighting | +0.057 |
Neg logit contributions | |
Marshal | -0.070 |
lator | -0.069 |
iler | -0.061 |
layer | -0.061 |
Gutenberg | -0.060 |
Token | the |
Token ID | 262 |
Feature activation | +6.00e-02 |
Pos logit contributions | |
Marshal | +0.068 |
lator | +0.066 |
iler | +0.059 |
layer | +0.059 |
Gutenberg | +0.058 |
Neg logit contributions | |
ensed | -0.053 |
icably | -0.052 |
scam | -0.051 |
ighting | -0.047 |
ous | -0.047 |
Token | defensive |
Token ID | 6110 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
Marshal | +0.051 |
lator | +0.050 |
iler | +0.044 |
layer | +0.044 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.040 |
icably | -0.039 |
scam | -0.039 |
ous | -0.035 |
ighting | -0.035 |
Token | burying |
Token ID | 48360 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
Marshal | +0.193 |
lator | +0.188 |
iler | +0.170 |
layer | +0.169 |
Gutenberg | +0.167 |
Neg logit contributions | |
ensed | -0.138 |
icably | -0.133 |
scam | -0.130 |
ous | -0.118 |
ighting | -0.118 |
Token | ] |
Token ID | 60 |
Feature activation | +2.64e-01 |
Pos logit contributions | |
Marshal | +0.092 |
lator | +0.090 |
iler | +0.076 |
layer | +0.075 |
Gutenberg | +0.074 |
Neg logit contributions | |
ensed | -0.147 |
icably | -0.144 |
scam | -0.143 |
ous | -0.134 |
ighting | -0.133 |
Token |
|
Token ID | 198 |
Feature activation | +7.44e-02 |
Pos logit contributions | |
Marshal | +0.209 |
lator | +0.205 |
iler | +0.181 |
layer | +0.180 |
Gutenberg | +0.178 |
Neg logit contributions | |
ensed | -0.192 |
icably | -0.187 |
scam | -0.185 |
ous | -0.170 |
ighting | -0.169 |
Token |
|
Token ID | 198 |
Feature activation | +4.52e-02 |
Pos logit contributions | |
Marshal | +0.058 |
lator | +0.057 |
iler | +0.050 |
layer | +0.050 |
Gutenberg | +0.049 |
Neg logit contributions | |
ensed | -0.055 |
icably | -0.053 |
scam | -0.053 |
ighting | -0.048 |
recomm | -0.048 |
Token | According |
Token ID | 4821 |
Feature activation | +7.03e-02 |
Pos logit contributions | |
Marshal | +0.038 |
lator | +0.037 |
iler | +0.033 |
layer | +0.033 |
Gutenberg | +0.033 |
Neg logit contributions | |
ensed | -0.031 |
icably | -0.030 |
scam | -0.029 |
ous | -0.027 |
ighting | -0.027 |
Token | to |
Token ID | 284 |
Feature activation | +2.57e-03 |
Pos logit contributions | |
Marshal | +0.057 |
lator | +0.056 |
iler | +0.049 |
layer | +0.049 |
Gutenberg | +0.048 |
Neg logit contributions | |
ensed | -0.050 |
icably | -0.049 |
scam | -0.048 |
ous | -0.044 |
ighting | -0.044 |
Token | Marshal |
Token ID | 37899 |
Feature activation | +5.99e-01 |
Pos logit contributions | |
Marshal | +0.002 |
lator | +0.002 |
iler | +0.002 |
layer | +0.002 |
Gutenberg | +0.002 |
Neg logit contributions | |
ensed | -0.002 |
icably | -0.002 |
scam | -0.002 |
ous | -0.002 |
ighting | -0.002 |
Token | Ale |
Token ID | 9300 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
Marshal | +0.421 |
lator | +0.412 |
iler | +0.357 |
layer | +0.355 |
Gutenberg | +0.351 |
Neg logit contributions | |
ensed | -0.487 |
icably | -0.475 |
scam | -0.472 |
ous | -0.437 |
ighting | -0.435 |
Token | ks |
Token ID | 591 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
Marshal | +0.074 |
lator | +0.072 |
iler | +0.061 |
layer | +0.061 |
Gutenberg | +0.061 |
Neg logit contributions | |
ensed | -0.110 |
icably | -0.107 |
scam | -0.107 |
ous | -0.100 |
ella | -0.099 |
Token | andr |
Token ID | 46273 |
Feature activation | -7.82e-02 |
Pos logit contributions | |
Marshal | +0.245 |
lator | +0.242 |
iler | +0.215 |
layer | +0.214 |
Gutenberg | +0.212 |
Neg logit contributions | |
ensed | -0.180 |
icably | -0.174 |
scam | -0.173 |
ous | -0.158 |
ighting | -0.156 |
Token | Vas |
Token ID | 23663 |
Feature activation | +6.46e-02 |
Pos logit contributions | |
ensed | +0.062 |
icably | +0.060 |
scam | +0.060 |
ous | +0.056 |
ella | +0.055 |
Neg logit contributions | |
Marshal | -0.056 |
lator | -0.055 |
iler | -0.048 |
layer | -0.048 |
Gutenberg | -0.047 |
Token | ile |
Token ID | 576 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
Marshal | +0.047 |
lator | +0.046 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.040 |
Neg logit contributions | |
ensed | -0.050 |
icably | -0.049 |
scam | -0.049 |
ous | -0.045 |
ella | -0.045 |
Token | only |
Token ID | 691 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
Marshal | +0.095 |
lator | +0.093 |
iler | +0.083 |
layer | +0.082 |
Gutenberg | +0.081 |
Neg logit contributions | |
ensed | -0.086 |
icably | -0.083 |
scam | -0.082 |
ous | -0.076 |
ighting | -0.075 |
Token | Ravens |
Token ID | 20091 |
Feature activation | +8.53e-02 |
Pos logit contributions | |
Marshal | +0.013 |
lator | +0.013 |
iler | +0.011 |
layer | +0.011 |
Gutenberg | +0.011 |
Neg logit contributions | |
ensed | -0.013 |
icably | -0.013 |
scam | -0.013 |
ous | -0.012 |
ighting | -0.012 |
Token | All |
Token ID | 1439 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
Marshal | +0.063 |
lator | +0.062 |
iler | +0.054 |
layer | +0.054 |
Gutenberg | +0.054 |
Neg logit contributions | |
ensed | -0.066 |
icably | -0.064 |
scam | -0.064 |
ous | -0.059 |
ighting | -0.058 |
Token | - |
Token ID | 12 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
Marshal | +0.030 |
lator | +0.029 |
iler | +0.026 |
layer | +0.025 |
Gutenberg | +0.025 |
Neg logit contributions | |
ensed | -0.033 |
icably | -0.033 |
scam | -0.032 |
ighting | -0.030 |
ella | -0.030 |
Token | Pro |
Token ID | 2964 |
Feature activation | -7.95e-02 |
Pos logit contributions | |
Marshal | +0.082 |
lator | +0.081 |
iler | +0.072 |
layer | +0.071 |
Gutenberg | +0.070 |
Neg logit contributions | |
ensed | -0.071 |
icably | -0.069 |
scam | -0.068 |
ighting | -0.062 |
ous | -0.062 |
Token | Marshal |
Token ID | 37899 |
Feature activation | +5.98e-01 |
Pos logit contributions | |
ensed | +0.060 |
icably | +0.058 |
scam | +0.058 |
ous | +0.053 |
ighting | +0.053 |
Neg logit contributions | |
Marshal | -0.061 |
lator | -0.060 |
iler | -0.052 |
layer | -0.052 |
Gutenberg | -0.051 |
Token | Y |
Token ID | 575 |
Feature activation | -6.96e-02 |
Pos logit contributions | |
Marshal | +0.540 |
lator | +0.534 |
iler | +0.478 |
layer | +0.477 |
Gutenberg | +0.472 |
Neg logit contributions | |
ensed | -0.366 |
icably | -0.352 |
scam | -0.350 |
ous | -0.316 |
ella | -0.312 |
Token | anda |
Token ID | 5282 |
Feature activation | -4.83e-02 |
Pos logit contributions | |
ensed | +0.042 |
icably | +0.041 |
scam | +0.040 |
ighting | +0.036 |
recomm | +0.036 |
Neg logit contributions | |
Marshal | -0.063 |
lator | -0.062 |
iler | -0.056 |
layer | -0.056 |
Gutenberg | -0.055 |
Token | — |
Token ID | 851 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
ensed | +0.034 |
icably | +0.033 |
scam | +0.033 |
ous | +0.030 |
ighting | +0.030 |
Neg logit contributions | |
Marshal | -0.039 |
lator | -0.038 |
iler | -0.034 |
layer | -0.033 |
Gutenberg | -0.033 |
Token | per |
Token ID | 583 |
Feature activation | +2.28e-03 |
Pos logit contributions | |
ensed | +0.041 |
icably | +0.040 |
scam | +0.040 |
ous | +0.036 |
ighting | +0.036 |
Neg logit contributions | |
Marshal | -0.048 |
lator | -0.047 |
iler | -0.042 |
layer | -0.042 |
Gutenberg | -0.041 |
Token | Pro |
Token ID | 1041 |
Feature activation | +8.72e-02 |
Pos logit contributions | |
Marshal | +0.002 |
lator | +0.002 |
iler | +0.001 |
layer | +0.001 |
Gutenberg | +0.001 |
Neg logit contributions | |
ensed | -0.002 |
icably | -0.002 |
scam | -0.002 |
ous | -0.002 |
ighting | -0.002 |
Token | iazep |
Token ID | 48826 |
Feature activation | +9.02e-03 |
Pos logit contributions | |
ensed | +0.019 |
icably | +0.018 |
scam | +0.018 |
ous | +0.017 |
ighting | +0.017 |
Neg logit contributions | |
Marshal | -0.023 |
lator | -0.023 |
iler | -0.020 |
layer | -0.020 |
Gutenberg | -0.020 |
Token | ine |
Token ID | 500 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
Marshal | +0.009 |
lator | +0.009 |
iler | +0.009 |
layer | +0.009 |
Gutenberg | +0.008 |
Neg logit contributions | |
ensed | -0.004 |
icably | -0.004 |
scam | -0.004 |
ighting | -0.003 |
ous | -0.003 |
Token | anx |
Token ID | 7296 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
ensed | +0.163 |
icably | +0.159 |
scam | +0.157 |
ighting | +0.144 |
ous | +0.144 |
Neg logit contributions | |
Marshal | -0.170 |
lator | -0.167 |
iler | -0.147 |
layer | -0.146 |
Gutenberg | -0.144 |
Token | io |
Token ID | 952 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
ensed | +0.083 |
icably | +0.081 |
scam | +0.080 |
ous | +0.074 |
ighting | +0.073 |
Neg logit contributions | |
Marshal | -0.090 |
lator | -0.088 |
iler | -0.078 |
layer | -0.077 |
Gutenberg | -0.077 |
Token | ly |
Token ID | 306 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
Marshal | +0.077 |
lator | +0.075 |
iler | +0.066 |
layer | +0.065 |
Gutenberg | +0.064 |
Neg logit contributions | |
ensed | -0.087 |
icably | -0.084 |
scam | -0.083 |
ous | -0.078 |
ella | -0.077 |
Token | tic |
Token ID | 13370 |
Feature activation | +5.89e-01 |
Pos logit contributions | |
Marshal | +0.045 |
lator | +0.042 |
iler | +0.030 |
layer | +0.028 |
Gutenberg | +0.028 |
Neg logit contributions | |
ensed | -0.185 |
icably | -0.181 |
scam | -0.181 |
ous | -0.173 |
ella | -0.172 |
Token | agent |
Token ID | 5797 |
Feature activation | +3.68e-01 |
Pos logit contributions | |
Marshal | +0.447 |
lator | +0.439 |
iler | +0.385 |
layer | +0.382 |
Gutenberg | +0.377 |
Neg logit contributions | |
ensed | -0.444 |
icably | -0.433 |
scam | -0.428 |
ighting | -0.396 |
ous | -0.392 |
Token | , |
Token ID | 11 |
Feature activation | +5.42e-02 |
Pos logit contributions | |
Marshal | +0.285 |
lator | +0.280 |
iler | +0.246 |
layer | +0.244 |
Gutenberg | +0.241 |
Neg logit contributions | |
ensed | -0.273 |
icably | -0.266 |
scam | -0.263 |
ighting | -0.242 |
ous | -0.242 |
Token | also |
Token ID | 635 |
Feature activation | +8.32e-02 |
Pos logit contributions | |
Marshal | +0.046 |
lator | +0.045 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.040 |
Neg logit contributions | |
ensed | -0.036 |
icably | -0.035 |
scam | -0.035 |
ighting | -0.032 |
ous | -0.031 |
Token | showed |
Token ID | 3751 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
Marshal | +0.072 |
lator | +0.071 |
iler | +0.063 |
layer | +0.062 |
Gutenberg | +0.062 |
Neg logit contributions | |
ensed | -0.054 |
icably | -0.052 |
scam | -0.052 |
ighting | -0.047 |
ous | -0.047 |
Token | an |
Token ID | 281 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
ensed | +0.126 |
icably | +0.123 |
scam | +0.122 |
ous | +0.113 |
ighting | +0.113 |
Neg logit contributions | |
Marshal | -0.108 |
lator | -0.105 |
iler | -0.091 |
layer | -0.091 |
Gutenberg | -0.090 |
Token | by |
Token ID | 416 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
ensed | +0.078 |
icably | +0.076 |
scam | +0.076 |
ous | +0.070 |
ighting | +0.070 |
Neg logit contributions | |
Marshal | -0.062 |
lator | -0.061 |
iler | -0.053 |
layer | -0.052 |
Gutenberg | -0.051 |
Token | the |
Token ID | 262 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
Marshal | +0.110 |
lator | +0.108 |
iler | +0.095 |
layer | +0.095 |
Gutenberg | +0.094 |
Neg logit contributions | |
ensed | -0.099 |
icably | -0.097 |
scam | -0.096 |
ous | -0.088 |
ighting | -0.088 |
Token | talented |
Token ID | 12356 |
Feature activation | -3.08e-02 |
Pos logit contributions | |
ensed | +0.011 |
icably | +0.010 |
scam | +0.010 |
ighting | +0.009 |
ous | +0.009 |
Neg logit contributions | |
Marshal | -0.014 |
lator | -0.013 |
iler | -0.012 |
layer | -0.012 |
Gutenberg | -0.012 |
Token | Will |
Token ID | 2561 |
Feature activation | +3.76e-02 |
Pos logit contributions | |
ensed | +0.022 |
icably | +0.021 |
scam | +0.021 |
ous | +0.019 |
ighting | +0.019 |
Neg logit contributions | |
Marshal | -0.025 |
lator | -0.025 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | Lar |
Token ID | 25577 |
Feature activation | +1.80e-01 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.025 |
iler | +0.021 |
layer | +0.021 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.031 |
icably | -0.031 |
scam | -0.031 |
ous | -0.028 |
ella | -0.028 |
Token | che |
Token ID | 2395 |
Feature activation | +5.83e-01 |
Pos logit contributions | |
Marshal | +0.059 |
lator | +0.056 |
iler | +0.040 |
layer | +0.039 |
Gutenberg | +0.038 |
Neg logit contributions | |
ensed | -0.214 |
icably | -0.211 |
scam | -0.210 |
ous | -0.199 |
ighting | -0.199 |
Token | . |
Token ID | 13 |
Feature activation | +7.13e-02 |
Pos logit contributions | |
Marshal | +0.447 |
lator | +0.438 |
iler | +0.386 |
layer | +0.383 |
Gutenberg | +0.378 |
Neg logit contributions | |
ensed | -0.437 |
icably | -0.426 |
scam | -0.422 |
ous | -0.387 |
ighting | -0.387 |
Token |
|
Token ID | 198 |
Feature activation | +7.05e-02 |
Pos logit contributions | |
Marshal | +0.057 |
lator | +0.056 |
iler | +0.050 |
layer | +0.049 |
Gutenberg | +0.049 |
Neg logit contributions | |
ensed | -0.051 |
icably | -0.050 |
scam | -0.049 |
ous | -0.045 |
ighting | -0.045 |
Token |
|
Token ID | 198 |
Feature activation | +5.97e-02 |
Pos logit contributions | |
Marshal | +0.055 |
lator | +0.054 |
iler | +0.048 |
layer | +0.048 |
Gutenberg | +0.047 |
Neg logit contributions | |
ensed | -0.052 |
icably | -0.050 |
scam | -0.050 |
ighting | -0.046 |
ous | -0.045 |
Token | Thanks |
Token ID | 9690 |
Feature activation | -6.60e-02 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.048 |
iler | +0.042 |
layer | +0.042 |
Gutenberg | +0.041 |
Neg logit contributions | |
ensed | -0.042 |
icably | -0.041 |
scam | -0.041 |
ous | -0.037 |
ighting | -0.037 |
Token | again |
Token ID | 757 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
ensed | +0.045 |
icably | +0.044 |
scam | +0.044 |
ous | +0.040 |
ella | +0.040 |
Neg logit contributions | |
Marshal | -0.054 |
lator | -0.054 |
iler | -0.048 |
layer | -0.047 |
Gutenberg | -0.047 |
Token |
|
Token ID | 198 |
Feature activation | -1.87e-04 |
Pos logit contributions | |
Marshal | +0.015 |
lator | +0.015 |
layer | +0.013 |
iler | +0.013 |
Gutenberg | +0.013 |
Neg logit contributions | |
ensed | -0.015 |
icably | -0.014 |
scam | -0.014 |
ighting | -0.013 |
recomm | -0.013 |
Token | Over |
Token ID | 5886 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
ensed | +0.000 |
icably | +0.000 |
scam | +0.000 |
ous | +0.000 |
ighting | +0.000 |
Neg logit contributions | |
Marshal | -0.000 |
lator | -0.000 |
iler | -0.000 |
layer | -0.000 |
Gutenberg | -0.000 |
Token | on |
Token ID | 319 |
Feature activation | -2.19e-02 |
Pos logit contributions | |
ensed | +0.082 |
icably | +0.080 |
scam | +0.079 |
ous | +0.073 |
ighting | +0.072 |
Neg logit contributions | |
Marshal | -0.094 |
lator | -0.092 |
iler | -0.082 |
layer | -0.081 |
Gutenberg | -0.080 |
Token | Reddit |
Token ID | 10750 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
ensed | +0.017 |
icably | +0.016 |
scam | +0.016 |
ous | +0.015 |
ighting | +0.015 |
Neg logit contributions | |
Marshal | -0.016 |
lator | -0.016 |
iler | -0.014 |
layer | -0.014 |
Gutenberg | -0.014 |
Token | Oculus |
Token ID | 22334 |
Feature activation | +2.32e-01 |
Pos logit contributions | |
ensed | +0.079 |
icably | +0.077 |
scam | +0.077 |
ous | +0.070 |
ighting | +0.070 |
Neg logit contributions | |
Marshal | -0.083 |
lator | -0.081 |
iler | -0.072 |
layer | -0.071 |
Gutenberg | -0.070 |
Token | Rift |
Token ID | 21222 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Marshal | +0.190 |
lator | +0.187 |
iler | +0.166 |
layer | +0.165 |
Gutenberg | +0.163 |
Neg logit contributions | |
ensed | -0.162 |
icably | -0.157 |
scam | -0.156 |
ous | -0.142 |
ighting | -0.142 |
Token | creator |
Token ID | 13172 |
Feature activation | +3.21e-01 |
Pos logit contributions | |
Marshal | +0.459 |
lator | +0.451 |
iler | +0.398 |
layer | +0.396 |
Gutenberg | +0.391 |
Neg logit contributions | |
ensed | -0.420 |
icably | -0.408 |
scam | -0.404 |
ous | -0.370 |
ighting | -0.369 |
Token | Palmer |
Token ID | 18918 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
Marshal | +0.252 |
lator | +0.248 |
iler | +0.218 |
layer | +0.217 |
Gutenberg | +0.215 |
Neg logit contributions | |
ensed | -0.234 |
icably | -0.227 |
scam | -0.225 |
ous | -0.207 |
ighting | -0.206 |
Token | Luc |
Token ID | 7598 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
Marshal | +0.098 |
lator | +0.097 |
iler | +0.087 |
layer | +0.086 |
Gutenberg | +0.085 |
Neg logit contributions | |
ensed | -0.066 |
icably | -0.063 |
scam | -0.063 |
ous | -0.057 |
ighting | -0.056 |
Token | key |
Token ID | 2539 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
ensed | +0.096 |
icably | +0.093 |
scam | +0.093 |
ous | +0.087 |
ella | +0.086 |
Neg logit contributions | |
Marshal | -0.082 |
lator | -0.080 |
iler | -0.069 |
layer | -0.068 |
Gutenberg | -0.068 |
Token | has |
Token ID | 468 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
Marshal | +0.110 |
lator | +0.108 |
iler | +0.096 |
layer | +0.095 |
Gutenberg | +0.094 |
Neg logit contributions | |
ensed | -0.093 |
icably | -0.091 |
scam | -0.090 |
ous | -0.082 |
ighting | -0.082 |
Token | 4 |
Token ID | 604 |
Feature activation | -6.25e-03 |
Pos logit contributions | |
ensed | +0.035 |
icably | +0.034 |
scam | +0.033 |
ous | +0.031 |
ighting | +0.031 |
Neg logit contributions | |
Marshal | -0.034 |
lator | -0.034 |
iler | -0.030 |
layer | -0.029 |
Gutenberg | -0.029 |
Token | th |
Token ID | 400 |
Feature activation | +3.33e-01 |
Pos logit contributions | |
ensed | +0.007 |
icably | +0.007 |
scam | +0.007 |
ous | +0.007 |
ella | +0.007 |
Neg logit contributions | |
Marshal | -0.002 |
lator | -0.002 |
iler | -0.002 |
layer | -0.002 |
Gutenberg | -0.002 |
Token | Italian |
Token ID | 8200 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
Marshal | +0.246 |
lator | +0.241 |
iler | +0.211 |
layer | +0.209 |
Gutenberg | +0.207 |
Neg logit contributions | |
ensed | -0.259 |
icably | -0.252 |
scam | -0.250 |
ous | -0.231 |
ighting | -0.230 |
Token | " |
Token ID | 366 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
Marshal | +0.100 |
lator | +0.098 |
iler | +0.086 |
layer | +0.086 |
Gutenberg | +0.085 |
Neg logit contributions | |
ensed | -0.102 |
icably | -0.099 |
scam | -0.099 |
ous | -0.091 |
ighting | -0.090 |
Token | Mon |
Token ID | 9069 |
Feature activation | +6.93e-02 |
Pos logit contributions | |
Marshal | +0.046 |
lator | +0.045 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.039 |
Neg logit contributions | |
ensed | -0.046 |
icably | -0.045 |
scam | -0.045 |
ous | -0.041 |
ighting | -0.041 |
Token | ter |
Token ID | 353 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Marshal | +0.021 |
lator | +0.020 |
iler | +0.014 |
layer | +0.014 |
Gutenberg | +0.013 |
Neg logit contributions | |
ensed | -0.084 |
icably | -0.082 |
scam | -0.082 |
ous | -0.078 |
ighting | -0.077 |
Token | osa |
Token ID | 8546 |
Feature activation | -9.77e-02 |
Pos logit contributions | |
Marshal | +0.546 |
lator | +0.539 |
iler | +0.487 |
layer | +0.485 |
Gutenberg | +0.478 |
Neg logit contributions | |
ensed | -0.330 |
icably | -0.318 |
scam | -0.317 |
ighting | -0.281 |
recomm | -0.280 |
Token | Division |
Token ID | 7458 |
Feature activation | -7.27e-02 |
Pos logit contributions | |
ensed | +0.070 |
icably | +0.067 |
scam | +0.067 |
ous | +0.061 |
ella | +0.061 |
Neg logit contributions | |
Marshal | -0.078 |
lator | -0.077 |
iler | -0.068 |
layer | -0.068 |
Gutenberg | -0.067 |
Token | " |
Token ID | 1 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
ensed | +0.049 |
icably | +0.048 |
scam | +0.048 |
ous | +0.043 |
ighting | +0.043 |
Neg logit contributions | |
Marshal | -0.061 |
lator | -0.060 |
iler | -0.053 |
layer | -0.053 |
Gutenberg | -0.052 |
Token | Alpine |
Token ID | 46994 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
ensed | +0.022 |
icably | +0.022 |
scam | +0.022 |
ous | +0.020 |
ighting | +0.020 |
Neg logit contributions | |
Marshal | -0.026 |
lator | -0.026 |
iler | -0.023 |
layer | -0.023 |
Gutenberg | -0.022 |
Token | Division |
Token ID | 7458 |
Feature activation | -4.10e-02 |
Pos logit contributions | |
Marshal | +0.027 |
lator | +0.026 |
iler | +0.023 |
layer | +0.023 |
Gutenberg | +0.023 |
Neg logit contributions | |
ensed | -0.027 |
icably | -0.026 |
scam | -0.026 |
ous | -0.024 |
ighting | -0.024 |
Token | ] |
Token ID | 60 |
Feature activation | +1.82e-01 |
Pos logit contributions | |
Marshal | +0.127 |
lator | +0.124 |
iler | +0.103 |
layer | +0.102 |
Gutenberg | +0.100 |
Neg logit contributions | |
ensed | -0.215 |
icably | -0.211 |
scam | -0.209 |
ous | -0.196 |
ighting | -0.196 |
Token |
|
Token ID | 198 |
Feature activation | +8.79e-04 |
Pos logit contributions | |
Marshal | +0.147 |
lator | +0.145 |
iler | +0.128 |
layer | +0.127 |
Gutenberg | +0.125 |
Neg logit contributions | |
ensed | -0.128 |
icably | -0.124 |
scam | -0.124 |
ous | -0.113 |
ighting | -0.112 |
Token |
|
Token ID | 198 |
Feature activation | -1.84e-02 |
Pos logit contributions | |
Marshal | +0.001 |
lator | +0.001 |
iler | +0.001 |
layer | +0.001 |
Gutenberg | +0.001 |
Neg logit contributions | |
ensed | -0.001 |
icably | -0.001 |
scam | -0.001 |
ighting | -0.001 |
ous | -0.001 |
Token | The |
Token ID | 464 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
ensed | +0.014 |
icably | +0.013 |
scam | +0.013 |
ous | +0.012 |
ighting | +0.012 |
Neg logit contributions | |
Marshal | -0.014 |
lator | -0.014 |
iler | -0.012 |
layer | -0.012 |
Gutenberg | -0.012 |
Token | Android |
Token ID | 5565 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
ensed | +0.144 |
icably | +0.140 |
scam | +0.139 |
ous | +0.129 |
ighting | +0.128 |
Neg logit contributions | |
Marshal | -0.131 |
lator | -0.129 |
iler | -0.112 |
layer | -0.111 |
Gutenberg | -0.110 |
Token | Market |
Token ID | 5991 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
Marshal | +0.159 |
lator | +0.157 |
iler | +0.137 |
layer | +0.136 |
Gutenberg | +0.134 |
Neg logit contributions | |
ensed | -0.179 |
icably | -0.175 |
scam | -0.174 |
ous | -0.161 |
ighting | -0.160 |
Token | 's |
Token ID | 338 |
Feature activation | -4.71e-02 |
Pos logit contributions | |
Marshal | +0.454 |
lator | +0.445 |
iler | +0.392 |
layer | +0.390 |
Gutenberg | +0.385 |
Neg logit contributions | |
ensed | -0.426 |
icably | -0.413 |
scam | -0.410 |
ous | -0.376 |
ighting | -0.375 |
Token | a |
Token ID | 257 |
Feature activation | +3.25e-02 |
Pos logit contributions | |
ensed | +0.036 |
icably | +0.035 |
scam | +0.035 |
ous | +0.032 |
ighting | +0.032 |
Neg logit contributions | |
Marshal | -0.035 |
lator | -0.035 |
iler | -0.030 |
layer | -0.030 |
Gutenberg | -0.030 |
Token | big |
Token ID | 1263 |
Feature activation | -6.74e-02 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.024 |
iler | +0.021 |
layer | +0.021 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.025 |
icably | -0.024 |
scam | -0.024 |
ous | -0.022 |
ighting | -0.022 |
Token | place |
Token ID | 1295 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
ensed | +0.044 |
icably | +0.042 |
scam | +0.041 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.059 |
lator | -0.058 |
iler | -0.052 |
layer | -0.051 |
Gutenberg | -0.051 |
Token | , |
Token ID | 11 |
Feature activation | -5.70e-03 |
Pos logit contributions | |
ensed | +0.160 |
icably | +0.155 |
scam | +0.154 |
ous | +0.142 |
ighting | +0.141 |
Neg logit contributions | |
Marshal | -0.176 |
lator | -0.173 |
iler | -0.152 |
layer | -0.152 |
Gutenberg | -0.150 |
Token | caric |
Token ID | 33674 |
Feature activation | +3.63e-01 |
Pos logit contributions | |
ensed | +0.208 |
icably | +0.203 |
scam | +0.201 |
ous | +0.184 |
ighting | +0.183 |
Neg logit contributions | |
Marshal | -0.228 |
lator | -0.224 |
iler | -0.198 |
layer | -0.197 |
Gutenberg | -0.194 |
Token | atures |
Token ID | 6691 |
Feature activation | +3.35e-01 |
Pos logit contributions | |
Marshal | +0.223 |
lator | +0.218 |
iler | +0.185 |
layer | +0.183 |
Gutenberg | +0.181 |
Neg logit contributions | |
ensed | -0.328 |
icably | -0.320 |
scam | -0.318 |
ous | -0.298 |
ighting | -0.297 |
Token | of |
Token ID | 286 |
Feature activation | +4.72e-02 |
Pos logit contributions | |
Marshal | +0.290 |
lator | +0.284 |
iler | +0.254 |
layer | +0.253 |
Gutenberg | +0.250 |
Neg logit contributions | |
ensed | -0.218 |
icably | -0.212 |
scam | -0.209 |
ighting | -0.190 |
ous | -0.189 |
Token | Asians |
Token ID | 30852 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
Marshal | +0.036 |
lator | +0.036 |
iler | +0.031 |
layer | +0.031 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.035 |
icably | -0.034 |
scam | -0.034 |
ous | -0.031 |
ighting | -0.031 |
Token | mas |
Token ID | 12422 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
Marshal | +0.092 |
lator | +0.090 |
iler | +0.079 |
layer | +0.079 |
Gutenberg | +0.078 |
Neg logit contributions | |
ensed | -0.087 |
icably | -0.085 |
scam | -0.084 |
ous | -0.077 |
ighting | -0.077 |
Token | quer |
Token ID | 10819 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
ensed | +0.197 |
icably | +0.194 |
scam | +0.193 |
ous | +0.184 |
ighting | +0.183 |
Neg logit contributions | |
Marshal | -0.045 |
lator | -0.043 |
iler | -0.028 |
layer | -0.028 |
Gutenberg | -0.026 |
Token | ading |
Token ID | 4980 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
Marshal | +0.483 |
lator | +0.475 |
iler | +0.422 |
layer | +0.420 |
Gutenberg | +0.415 |
Neg logit contributions | |
ensed | -0.394 |
icably | -0.382 |
scam | -0.379 |
ous | -0.346 |
ighting | -0.344 |
Token | as |
Token ID | 355 |
Feature activation | +9.73e-02 |
Pos logit contributions | |
Marshal | +0.043 |
lator | +0.042 |
iler | +0.036 |
layer | +0.036 |
Gutenberg | +0.036 |
Neg logit contributions | |
ensed | -0.050 |
icably | -0.049 |
scam | -0.049 |
ous | -0.045 |
ash | -0.045 |
Token | humor |
Token ID | 14733 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
Marshal | +0.078 |
lator | +0.076 |
iler | +0.067 |
layer | +0.067 |
Gutenberg | +0.066 |
Neg logit contributions | |
ensed | -0.070 |
icably | -0.068 |
scam | -0.067 |
ighting | -0.062 |
ous | -0.062 |
Token | . |
Token ID | 13 |
Feature activation | +4.68e-02 |
Pos logit contributions | |
ensed | +0.014 |
icably | +0.013 |
scam | +0.013 |
ighting | +0.012 |
ella | +0.011 |
Neg logit contributions | |
Marshal | -0.021 |
lator | -0.021 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
Marshal | +0.037 |
lator | +0.036 |
iler | +0.032 |
layer | +0.032 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.034 |
icably | -0.033 |
scam | -0.033 |
ous | -0.030 |
ighting | -0.030 |
Token | though |
Token ID | 996 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
ensed | +0.009 |
icably | +0.008 |
scam | +0.008 |
ighting | +0.008 |
ella | +0.007 |
Neg logit contributions | |
Marshal | -0.014 |
lator | -0.014 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.012 |
Token | : |
Token ID | 25 |
Feature activation | -7.72e-02 |
Pos logit contributions | |
ensed | +0.189 |
scam | +0.184 |
icably | +0.183 |
ous | +0.169 |
recomm | +0.167 |
Neg logit contributions | |
Marshal | -0.198 |
lator | -0.195 |
iler | -0.172 |
layer | -0.171 |
Gutenberg | -0.170 |
Token | Would |
Token ID | 10928 |
Feature activation | -1.44e-01 |
Pos logit contributions | |
ensed | +0.062 |
icably | +0.060 |
scam | +0.060 |
ous | +0.056 |
ighting | +0.055 |
Neg logit contributions | |
Marshal | -0.055 |
lator | -0.054 |
iler | -0.047 |
layer | -0.047 |
Gutenberg | -0.046 |
Token | Os |
Token ID | 8834 |
Feature activation | +8.18e-02 |
Pos logit contributions | |
ensed | +0.101 |
icably | +0.098 |
scam | +0.097 |
ighting | +0.089 |
ella | +0.088 |
Neg logit contributions | |
Marshal | -0.117 |
lator | -0.114 |
iler | -0.102 |
layer | -0.101 |
Gutenberg | -0.100 |
Token | we |
Token ID | 732 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Marshal | +0.043 |
lator | +0.041 |
iler | +0.034 |
layer | +0.034 |
Gutenberg | +0.033 |
Neg logit contributions | |
ensed | -0.081 |
icably | -0.080 |
scam | -0.079 |
ous | -0.075 |
ighting | -0.074 |
Token | iler |
Token ID | 5329 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
Marshal | +0.027 |
lator | +0.024 |
iler | +0.000 |
layer | -0.001 |
Gutenberg | -0.004 |
Neg logit contributions | |
ensed | -0.376 |
icably | -0.371 |
scam | -0.370 |
ous | -0.354 |
ighting | -0.353 |
Token | , |
Token ID | 11 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
Marshal | +0.460 |
lator | +0.452 |
iler | +0.400 |
layer | +0.397 |
Gutenberg | +0.392 |
Neg logit contributions | |
ensed | -0.416 |
icably | -0.404 |
scam | -0.400 |
ous | -0.367 |
ighting | -0.366 |
Token | as |
Token ID | 355 |
Feature activation | +7.68e-02 |
Pos logit contributions | |
Marshal | +0.020 |
lator | +0.020 |
iler | +0.017 |
layer | +0.017 |
Gutenberg | +0.017 |
Neg logit contributions | |
ensed | -0.021 |
icably | -0.021 |
scam | -0.021 |
ighting | -0.019 |
ous | -0.019 |
Token | unprepared |
Token ID | 45102 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
Marshal | +0.060 |
lator | +0.059 |
iler | +0.052 |
layer | +0.052 |
Gutenberg | +0.051 |
Neg logit contributions | |
ensed | -0.056 |
icably | -0.055 |
scam | -0.054 |
ighting | -0.050 |
ous | -0.050 |
Token | as |
Token ID | 355 |
Feature activation | +6.28e-02 |
Pos logit contributions | |
Marshal | +0.089 |
lator | +0.088 |
iler | +0.077 |
layer | +0.076 |
Gutenberg | +0.075 |
Neg logit contributions | |
ensed | -0.094 |
icably | -0.091 |
scam | -0.091 |
ous | -0.084 |
recomm | -0.083 |
Token | he |
Token ID | 339 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
Marshal | +0.050 |
lator | +0.049 |
iler | +0.043 |
layer | +0.043 |
Gutenberg | +0.042 |
Neg logit contributions | |
ensed | -0.046 |
icably | -0.044 |
scam | -0.044 |
ighting | -0.040 |
ous | -0.040 |
Token | would |
Token ID | 561 |
Feature activation | -3.44e-02 |
Pos logit contributions | |
Marshal | +0.099 |
lator | +0.097 |
iler | +0.087 |
layer | +0.086 |
Gutenberg | +0.085 |
Neg logit contributions | |
ensed | -0.074 |
icably | -0.071 |
scam | -0.070 |
ighting | -0.064 |
ella | -0.063 |
Token | be |
Token ID | 307 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ensed | +0.026 |
icably | +0.026 |
scam | +0.025 |
ighting | +0.023 |
ous | +0.023 |
Neg logit contributions | |
Marshal | -0.026 |
lator | -0.025 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | problematic |
Token ID | 15833 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
Marshal | +0.123 |
lator | +0.121 |
iler | +0.107 |
layer | +0.106 |
Gutenberg | +0.105 |
Neg logit contributions | |
ensed | -0.108 |
icably | -0.104 |
scam | -0.103 |
ighting | -0.095 |
ous | -0.094 |
Token | if |
Token ID | 611 |
Feature activation | +7.74e-02 |
Pos logit contributions | |
ensed | +0.127 |
icably | +0.123 |
scam | +0.122 |
ous | +0.111 |
ighting | +0.111 |
Neg logit contributions | |
Marshal | -0.148 |
lator | -0.145 |
iler | -0.129 |
layer | -0.128 |
Gutenberg | -0.127 |
Token | the |
Token ID | 262 |
Feature activation | +8.10e-02 |
Pos logit contributions | |
Marshal | +0.061 |
lator | +0.060 |
iler | +0.053 |
layer | +0.052 |
Gutenberg | +0.052 |
Neg logit contributions | |
ensed | -0.056 |
icably | -0.055 |
scam | -0.054 |
ighting | -0.050 |
ous | -0.050 |
Token | Panthers |
Token ID | 17782 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
Marshal | +0.040 |
lator | +0.039 |
iler | +0.031 |
layer | +0.031 |
Gutenberg | +0.030 |
Neg logit contributions | |
ensed | -0.083 |
icably | -0.081 |
scam | -0.081 |
ous | -0.076 |
ighting | -0.076 |
Token | are |
Token ID | 389 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
Marshal | +0.503 |
lator | +0.491 |
iler | +0.442 |
layer | +0.440 |
Gutenberg | +0.431 |
Neg logit contributions | |
ensed | -0.374 |
icably | -0.362 |
scam | -0.355 |
ighting | -0.326 |
ous | -0.325 |
Token | asking |
Token ID | 4737 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
Marshal | +0.202 |
lator | +0.196 |
iler | +0.180 |
layer | +0.178 |
Gutenberg | +0.177 |
Neg logit contributions | |
ensed | -0.118 |
icably | -0.112 |
scam | -0.110 |
ighting | -0.101 |
ous | -0.100 |
Token | him |
Token ID | 683 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
Marshal | +0.129 |
lator | +0.125 |
iler | +0.111 |
layer | +0.110 |
Gutenberg | +0.109 |
Neg logit contributions | |
ensed | -0.113 |
icably | -0.109 |
scam | -0.108 |
ighting | -0.099 |
ella | -0.099 |
Token | to |
Token ID | 284 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
Marshal | +0.092 |
lator | +0.091 |
iler | +0.080 |
layer | +0.080 |
Gutenberg | +0.079 |
Neg logit contributions | |
ensed | -0.078 |
icably | -0.076 |
scam | -0.076 |
ous | -0.069 |
ighting | -0.069 |
Token | push |
Token ID | 4574 |
Feature activation | +9.99e-02 |
Pos logit contributions | |
Marshal | +0.113 |
lator | +0.110 |
iler | +0.098 |
layer | +0.097 |
Gutenberg | +0.096 |
Neg logit contributions | |
ensed | -0.099 |
icably | -0.096 |
scam | -0.094 |
ighting | -0.087 |
ous | -0.087 |
Token | against |
Token ID | 1028 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
Marshal | +0.141 |
lator | +0.139 |
iler | +0.123 |
layer | +0.122 |
Gutenberg | +0.120 |
Neg logit contributions | |
ensed | -0.132 |
icably | -0.128 |
scam | -0.127 |
ous | -0.116 |
ighting | -0.116 |
Token | Carolina |
Token ID | 5913 |
Feature activation | +1.71e-01 |
Pos logit contributions | |
Marshal | +0.114 |
lator | +0.112 |
iler | +0.099 |
layer | +0.098 |
Gutenberg | +0.097 |
Neg logit contributions | |
ensed | -0.103 |
icably | -0.100 |
scam | -0.099 |
ighting | -0.091 |
ella | -0.091 |
Token | , |
Token ID | 11 |
Feature activation | +1.41e-01 |
Pos logit contributions | |
Marshal | +0.137 |
lator | +0.135 |
iler | +0.119 |
layer | +0.119 |
Gutenberg | +0.117 |
Neg logit contributions | |
ensed | -0.122 |
icably | -0.118 |
scam | -0.117 |
ous | -0.107 |
ighting | -0.107 |
Token | and |
Token ID | 290 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
Marshal | +0.123 |
lator | +0.120 |
iler | +0.107 |
layer | +0.106 |
Gutenberg | +0.105 |
Neg logit contributions | |
ensed | -0.092 |
icably | -0.088 |
scam | -0.087 |
ighting | -0.079 |
ous | -0.079 |
Token | the |
Token ID | 262 |
Feature activation | +9.10e-02 |
Pos logit contributions | |
Marshal | +0.085 |
lator | +0.083 |
iler | +0.074 |
layer | +0.073 |
Gutenberg | +0.073 |
Neg logit contributions | |
ensed | -0.068 |
icably | -0.066 |
scam | -0.065 |
ighting | -0.059 |
ous | -0.059 |
Token | Panthers |
Token ID | 17782 |
Feature activation | +5.75e-01 |
Pos logit contributions | |
Marshal | +0.055 |
lator | +0.053 |
iler | +0.045 |
layer | +0.045 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.083 |
icably | -0.081 |
scam | -0.081 |
ous | -0.075 |
ighting | -0.075 |
Token | have |
Token ID | 423 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
Marshal | +0.450 |
lator | +0.441 |
iler | +0.390 |
layer | +0.387 |
Gutenberg | +0.381 |
Neg logit contributions | |
ensed | -0.422 |
icably | -0.410 |
scam | -0.405 |
ous | -0.372 |
ighting | -0.372 |
Token | allowed |
Token ID | 3142 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
Marshal | +0.150 |
lator | +0.148 |
iler | +0.134 |
layer | +0.134 |
Gutenberg | +0.133 |
Neg logit contributions | |
ensed | -0.073 |
icably | -0.070 |
scam | -0.069 |
ous | -0.060 |
ighting | -0.060 |
Token | 16 |
Token ID | 1467 |
Feature activation | +4.89e-02 |
Pos logit contributions | |
ensed | +0.077 |
icably | +0.074 |
scam | +0.074 |
ous | +0.068 |
ighting | +0.068 |
Neg logit contributions | |
Marshal | -0.080 |
lator | -0.078 |
iler | -0.069 |
layer | -0.068 |
Gutenberg | -0.068 |
Token | touchdowns |
Token ID | 17692 |
Feature activation | -4.67e-02 |
Pos logit contributions | |
Marshal | +0.037 |
lator | +0.036 |
iler | +0.031 |
layer | +0.031 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.038 |
icably | -0.037 |
scam | -0.036 |
ous | -0.033 |
ighting | -0.033 |
Token | compared |
Token ID | 3688 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
ensed | +0.033 |
icably | +0.032 |
scam | +0.032 |
ighting | +0.029 |
ous | +0.029 |
Neg logit contributions | |
Marshal | -0.037 |
lator | -0.037 |
iler | -0.032 |
layer | -0.032 |
Gutenberg | -0.032 |
Token | these |
Token ID | 777 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
ensed | +0.019 |
icably | +0.018 |
scam | +0.018 |
ous | +0.016 |
ighting | +0.016 |
Neg logit contributions | |
Marshal | -0.024 |
lator | -0.024 |
iler | -0.021 |
layer | -0.021 |
Gutenberg | -0.021 |
Token | first |
Token ID | 717 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
ensed | +0.041 |
icably | +0.040 |
scam | +0.039 |
ous | +0.036 |
ighting | +0.036 |
Neg logit contributions | |
Marshal | -0.049 |
lator | -0.048 |
iler | -0.043 |
layer | -0.043 |
Gutenberg | -0.042 |
Token | psych |
Token ID | 3795 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
Marshal | +0.099 |
lator | +0.097 |
iler | +0.086 |
Gutenberg | +0.086 |
layer | +0.086 |
Neg logit contributions | |
ensed | -0.081 |
icably | -0.078 |
scam | -0.077 |
ighting | -0.070 |
ous | -0.070 |
Token | oan |
Token ID | 24611 |
Feature activation | +2.96e-01 |
Pos logit contributions | |
Marshal | +0.066 |
lator | +0.065 |
iler | +0.054 |
layer | +0.054 |
Gutenberg | +0.053 |
Neg logit contributions | |
ensed | -0.110 |
icably | -0.108 |
scam | -0.107 |
ous | -0.100 |
ighting | -0.100 |
Token | aly |
Token ID | 3400 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
Marshal | +0.237 |
lator | +0.233 |
iler | +0.206 |
layer | +0.205 |
Gutenberg | +0.202 |
Neg logit contributions | |
ensed | -0.212 |
icably | -0.206 |
scam | -0.205 |
ous | -0.187 |
ighting | -0.186 |
Token | tic |
Token ID | 13370 |
Feature activation | +5.70e-01 |
Pos logit contributions | |
Marshal | +0.067 |
lator | +0.064 |
iler | +0.047 |
layer | +0.047 |
Gutenberg | +0.045 |
Neg logit contributions | |
ensed | -0.210 |
icably | -0.207 |
scam | -0.206 |
ous | -0.196 |
ella | -0.194 |
Token | approaches |
Token ID | 10581 |
Feature activation | +6.86e-03 |
Pos logit contributions | |
Marshal | +0.492 |
lator | +0.482 |
iler | +0.429 |
layer | +0.428 |
Gutenberg | +0.426 |
Neg logit contributions | |
ensed | -0.373 |
icably | -0.360 |
scam | -0.355 |
ighting | -0.322 |
ous | -0.322 |
Token | to |
Token ID | 284 |
Feature activation | -5.23e-02 |
Pos logit contributions | |
Marshal | +0.005 |
lator | +0.005 |
iler | +0.005 |
layer | +0.005 |
Gutenberg | +0.004 |
Neg logit contributions | |
ensed | -0.005 |
icably | -0.005 |
scam | -0.005 |
ous | -0.005 |
ighting | -0.005 |
Token | myth |
Token ID | 7918 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
ensed | +0.038 |
icably | +0.037 |
scam | +0.037 |
ous | +0.034 |
ighting | +0.034 |
Neg logit contributions | |
Marshal | -0.041 |
lator | -0.040 |
iler | -0.036 |
layer | -0.035 |
Gutenberg | -0.035 |
Token | , |
Token ID | 11 |
Feature activation | +3.15e-02 |
Pos logit contributions | |
ensed | +0.083 |
icably | +0.080 |
scam | +0.080 |
ighting | +0.073 |
recomm | +0.073 |
Neg logit contributions | |
Marshal | -0.082 |
lator | -0.080 |
iler | -0.071 |
layer | -0.070 |
Gutenberg | -0.070 |
Token | it |
Token ID | 340 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.025 |
iler | +0.022 |
layer | +0.022 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.023 |
icably | -0.022 |
scam | -0.022 |
ous | -0.020 |
ighting | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +8.19e-02 |
Pos logit contributions | |
ensed | +0.196 |
icably | +0.191 |
scam | +0.190 |
ous | +0.174 |
ighting | +0.174 |
Neg logit contributions | |
Marshal | -0.192 |
lator | -0.188 |
iler | -0.165 |
layer | -0.164 |
Gutenberg | -0.162 |
Token | Dr |
Token ID | 1583 |
Feature activation | +7.04e-02 |
Pos logit contributions | |
Marshal | +0.065 |
lator | +0.063 |
iler | +0.056 |
layer | +0.056 |
Gutenberg | +0.056 |
Neg logit contributions | |
ensed | -0.060 |
icably | -0.058 |
scam | -0.057 |
ighting | -0.052 |
recomm | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +5.42e-02 |
Pos logit contributions | |
Marshal | +0.053 |
lator | +0.052 |
iler | +0.046 |
layer | +0.045 |
Gutenberg | +0.045 |
Neg logit contributions | |
ensed | -0.054 |
icably | -0.052 |
scam | -0.052 |
ous | -0.048 |
ighting | -0.048 |
Token | Thomas |
Token ID | 5658 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
Marshal | +0.041 |
lator | +0.040 |
iler | +0.036 |
layer | +0.035 |
Gutenberg | +0.035 |
Neg logit contributions | |
ensed | -0.041 |
icably | -0.040 |
scam | -0.039 |
ous | -0.036 |
ighting | -0.036 |
Token | Se |
Token ID | 1001 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
ensed | +0.019 |
icably | +0.018 |
scam | +0.018 |
ous | +0.017 |
ighting | +0.017 |
Neg logit contributions | |
Marshal | -0.018 |
lator | -0.018 |
iler | -0.016 |
layer | -0.016 |
Gutenberg | -0.016 |
Token | iler |
Token ID | 5329 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
ensed | +0.146 |
icably | +0.142 |
scam | +0.142 |
ous | +0.131 |
ighting | +0.130 |
Neg logit contributions | |
Marshal | -0.136 |
lator | -0.133 |
iler | -0.116 |
layer | -0.116 |
Gutenberg | -0.114 |
Token | , |
Token ID | 11 |
Feature activation | +6.90e-02 |
Pos logit contributions | |
Marshal | +0.440 |
lator | +0.431 |
iler | +0.379 |
layer | +0.377 |
Gutenberg | +0.373 |
Neg logit contributions | |
ensed | -0.423 |
icably | -0.412 |
scam | -0.408 |
ighting | -0.374 |
ous | -0.374 |
Token | a |
Token ID | 257 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
Marshal | +0.053 |
lator | +0.052 |
iler | +0.046 |
layer | +0.045 |
Gutenberg | +0.045 |
Neg logit contributions | |
ensed | -0.052 |
icably | -0.050 |
scam | -0.050 |
ous | -0.046 |
ighting | -0.046 |
Token | physicist |
Token ID | 33013 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
Marshal | +0.027 |
lator | +0.026 |
iler | +0.024 |
layer | +0.024 |
Gutenberg | +0.023 |
Neg logit contributions | |
ensed | -0.018 |
icably | -0.017 |
scam | -0.017 |
ous | -0.015 |
ighting | -0.015 |
Token | from |
Token ID | 422 |
Feature activation | -3.71e-02 |
Pos logit contributions | |
ensed | +0.108 |
icably | +0.105 |
scam | +0.105 |
ous | +0.097 |
recomm | +0.096 |
Neg logit contributions | |
Marshal | -0.107 |
lator | -0.106 |
iler | -0.093 |
layer | -0.092 |
Gutenberg | -0.091 |
Token | Germany |
Token ID | 4486 |
Feature activation | +9.46e-02 |
Pos logit contributions | |
ensed | +0.026 |
icably | +0.025 |
scam | +0.025 |
ous | +0.023 |
ighting | +0.023 |
Neg logit contributions | |
Marshal | -0.031 |
lator | -0.030 |
iler | -0.027 |
layer | -0.026 |
Gutenberg | -0.026 |
Token | offered |
Token ID | 4438 |
Feature activation | -6.89e-02 |
Pos logit contributions | |
ensed | +0.062 |
icably | +0.060 |
scam | +0.059 |
ighting | +0.054 |
ous | +0.054 |
Neg logit contributions | |
Marshal | -0.078 |
lator | -0.076 |
iler | -0.068 |
layer | -0.068 |
Gutenberg | -0.067 |
Token | a |
Token ID | 257 |
Feature activation | -4.57e-02 |
Pos logit contributions | |
ensed | +0.051 |
icably | +0.049 |
scam | +0.049 |
ous | +0.045 |
ighting | +0.045 |
Neg logit contributions | |
Marshal | -0.053 |
lator | -0.052 |
iler | -0.046 |
layer | -0.046 |
Gutenberg | -0.045 |
Token | tweet |
Token ID | 6126 |
Feature activation | -5.51e-02 |
Pos logit contributions | |
ensed | +0.031 |
scam | +0.030 |
icably | +0.030 |
ous | +0.027 |
recomm | +0.027 |
Neg logit contributions | |
Marshal | -0.038 |
lator | -0.037 |
iler | -0.033 |
layer | -0.033 |
Gutenberg | -0.033 |
Token | of |
Token ID | 286 |
Feature activation | -9.02e-02 |
Pos logit contributions | |
ensed | +0.037 |
icably | +0.036 |
scam | +0.035 |
ous | +0.032 |
ighting | +0.032 |
Neg logit contributions | |
Marshal | -0.047 |
lator | -0.046 |
iler | -0.041 |
layer | -0.041 |
Gutenberg | -0.040 |
Token | condol |
Token ID | 35059 |
Feature activation | -3.84e-02 |
Pos logit contributions | |
ensed | +0.072 |
icably | +0.070 |
scam | +0.070 |
ous | +0.065 |
recomm | +0.064 |
Neg logit contributions | |
Marshal | -0.064 |
lator | -0.063 |
iler | -0.055 |
layer | -0.055 |
Gutenberg | -0.054 |
Token | ence |
Token ID | 594 |
Feature activation | -7.91e-01 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.010 |
recomm | +0.007 |
ash | +0.007 |
Neg logit contributions | |
Marshal | -0.047 |
lator | -0.047 |
iler | -0.044 |
layer | -0.043 |
Gutenberg | -0.043 |
Token | to |
Token ID | 284 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ensed | +0.567 |
icably | +0.550 |
scam | +0.546 |
ous | +0.500 |
ighting | +0.498 |
Neg logit contributions | |
Marshal | -0.632 |
lator | -0.621 |
iler | -0.549 |
layer | -0.546 |
Gutenberg | -0.540 |
Token | those |
Token ID | 883 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
ensed | +0.080 |
icably | +0.077 |
scam | +0.077 |
ous | +0.070 |
recomm | +0.069 |
Neg logit contributions | |
Marshal | -0.100 |
lator | -0.099 |
iler | -0.088 |
layer | -0.087 |
Gutenberg | -0.087 |
Token | affected |
Token ID | 5676 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ensed | +0.064 |
icably | +0.061 |
scam | +0.061 |
ous | +0.055 |
recomm | +0.054 |
Neg logit contributions | |
Marshal | -0.105 |
lator | -0.104 |
iler | -0.093 |
Gutenberg | -0.093 |
layer | -0.093 |
Token | by |
Token ID | 416 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
ensed | +0.126 |
scam | +0.122 |
icably | +0.121 |
ous | +0.113 |
ash | +0.111 |
Neg logit contributions | |
Marshal | -0.113 |
lator | -0.111 |
iler | -0.096 |
layer | -0.096 |
Gutenberg | -0.095 |
Token | the |
Token ID | 262 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
Marshal | +0.039 |
lator | +0.038 |
iler | +0.034 |
layer | +0.034 |
Gutenberg | +0.034 |
Neg logit contributions | |
ensed | -0.029 |
icably | -0.029 |
scam | -0.028 |
ous | -0.026 |
ighting | -0.026 |
Token | notion |
Token ID | 9495 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
ensed | +0.016 |
icably | +0.016 |
scam | +0.016 |
ous | +0.014 |
recomm | +0.014 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.015 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.013 |
Token | is |
Token ID | 318 |
Feature activation | -2.00e-03 |
Pos logit contributions | |
Marshal | +0.106 |
lator | +0.104 |
iler | +0.093 |
layer | +0.093 |
Gutenberg | +0.092 |
Neg logit contributions | |
ensed | -0.079 |
icably | -0.076 |
scam | -0.076 |
ous | -0.069 |
ella | -0.068 |
Token | � |
Token ID | 564 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
ensed | +0.001 |
icably | +0.001 |
scam | +0.001 |
ous | +0.001 |
ighting | +0.001 |
Neg logit contributions | |
Marshal | -0.002 |
lator | -0.002 |
iler | -0.002 |
layer | -0.002 |
Gutenberg | -0.002 |
Token | � |
Token ID | 246 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
ensed | +0.066 |
icably | +0.064 |
scam | +0.063 |
ous | +0.057 |
ighting | +0.056 |
Neg logit contributions | |
Marshal | -0.102 |
lator | -0.100 |
iler | -0.090 |
layer | -0.090 |
Gutenberg | -0.089 |
Token | nob |
Token ID | 34952 |
Feature activation | -2.10e-01 |
Pos logit contributions | |
ensed | +0.141 |
icably | +0.137 |
scam | +0.136 |
ous | +0.126 |
ighting | +0.125 |
Neg logit contributions | |
Marshal | -0.143 |
lator | -0.141 |
iler | -0.124 |
layer | -0.123 |
Gutenberg | -0.122 |
Token | ody |
Token ID | 1118 |
Feature activation | -7.87e-01 |
Pos logit contributions | |
ensed | +0.045 |
icably | +0.040 |
scam | +0.039 |
ighting | +0.027 |
ous | +0.026 |
Neg logit contributions | |
Marshal | -0.272 |
lator | -0.271 |
iler | -0.252 |
layer | -0.251 |
Gutenberg | -0.248 |
Token | gets |
Token ID | 3011 |
Feature activation | -6.15e-02 |
Pos logit contributions | |
ensed | +0.539 |
icably | +0.522 |
scam | +0.518 |
ous | +0.473 |
ighting | +0.470 |
Neg logit contributions | |
Marshal | -0.653 |
lator | -0.642 |
iler | -0.570 |
layer | -0.567 |
Gutenberg | -0.561 |
Token | to |
Token ID | 284 |
Feature activation | +9.97e-03 |
Pos logit contributions | |
ensed | +0.043 |
icably | +0.042 |
scam | +0.042 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.050 |
lator | -0.049 |
iler | -0.044 |
layer | -0.043 |
Gutenberg | -0.043 |
Token | tell |
Token ID | 1560 |
Feature activation | +9.28e-02 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.007 |
icably | -0.007 |
scam | -0.007 |
ous | -0.006 |
ighting | -0.006 |
Token | us |
Token ID | 514 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
Marshal | +0.074 |
lator | +0.073 |
iler | +0.064 |
layer | +0.064 |
Gutenberg | +0.063 |
Neg logit contributions | |
ensed | -0.067 |
icably | -0.065 |
scam | -0.064 |
ous | -0.059 |
ighting | -0.059 |
Token | what |
Token ID | 644 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
Marshal | +0.017 |
lator | +0.017 |
iler | +0.015 |
layer | +0.015 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.021 |
icably | -0.020 |
scam | -0.020 |
ous | -0.019 |
recomm | -0.019 |
Token | age |
Token ID | 496 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
ensed | +0.034 |
icably | +0.033 |
scam | +0.033 |
ous | +0.029 |
ella | +0.029 |
Neg logit contributions | |
Marshal | -0.050 |
lator | -0.049 |
iler | -0.044 |
layer | -0.044 |
Gutenberg | -0.044 |
Token | like |
Token ID | 588 |
Feature activation | +3.40e-02 |
Pos logit contributions | |
ensed | +0.212 |
icably | +0.206 |
scam | +0.204 |
ous | +0.188 |
ighting | +0.187 |
Neg logit contributions | |
Marshal | -0.227 |
lator | -0.223 |
iler | -0.197 |
layer | -0.196 |
Gutenberg | -0.193 |
Token | the |
Token ID | 262 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
Marshal | +0.028 |
lator | +0.028 |
iler | +0.025 |
layer | +0.025 |
Gutenberg | +0.024 |
Neg logit contributions | |
ensed | -0.023 |
icably | -0.022 |
scam | -0.022 |
ous | -0.020 |
ighting | -0.020 |
Token | old |
Token ID | 1468 |
Feature activation | -9.44e-02 |
Pos logit contributions | |
ensed | +0.015 |
icably | +0.015 |
scam | +0.014 |
ous | +0.013 |
ighting | +0.013 |
Neg logit contributions | |
Marshal | -0.017 |
lator | -0.017 |
iler | -0.015 |
layer | -0.015 |
Gutenberg | -0.014 |
Token | cattle |
Token ID | 17025 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
ensed | +0.067 |
icably | +0.065 |
scam | +0.065 |
ous | +0.059 |
ighting | +0.059 |
Neg logit contributions | |
Marshal | -0.076 |
lator | -0.075 |
iler | -0.066 |
layer | -0.066 |
Gutenberg | -0.065 |
Token | ranc |
Token ID | 32205 |
Feature activation | -7.86e-01 |
Pos logit contributions | |
ensed | +0.173 |
icably | +0.168 |
scam | +0.165 |
ous | +0.150 |
ighting | +0.149 |
Neg logit contributions | |
Marshal | -0.244 |
lator | -0.240 |
iler | -0.215 |
layer | -0.214 |
Gutenberg | -0.211 |
Token | hers |
Token ID | 7084 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
ensed | +0.881 |
icably | +0.864 |
scam | +0.860 |
ous | +0.815 |
ighting | +0.812 |
Neg logit contributions | |
Marshal | -0.310 |
lator | -0.298 |
iler | -0.226 |
layer | -0.224 |
Gutenberg | -0.218 |
Token | of |
Token ID | 286 |
Feature activation | -9.13e-02 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.024 |
iler | +0.022 |
layer | +0.022 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.020 |
icably | -0.019 |
scam | -0.019 |
ighting | -0.017 |
ous | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | -5.49e-02 |
Pos logit contributions | |
ensed | +0.067 |
icably | +0.065 |
scam | +0.064 |
ous | +0.059 |
ighting | +0.059 |
Neg logit contributions | |
Marshal | -0.072 |
lator | -0.071 |
iler | -0.062 |
layer | -0.062 |
Gutenberg | -0.061 |
Token | West |
Token ID | 2688 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
ensed | +0.043 |
icably | +0.042 |
scam | +0.041 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.040 |
lator | -0.039 |
iler | -0.034 |
layer | -0.034 |
Gutenberg | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +2.33e-03 |
Pos logit contributions | |
ensed | +0.012 |
icably | +0.012 |
scam | +0.012 |
ous | +0.011 |
ighting | +0.011 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.010 |
layer | -0.010 |
Gutenberg | -0.010 |
Token | official |
Token ID | 1743 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
ensed | +0.149 |
scam | +0.145 |
icably | +0.145 |
ous | +0.136 |
ash | +0.135 |
Neg logit contributions | |
Marshal | -0.095 |
lator | -0.094 |
iler | -0.080 |
layer | -0.079 |
Gutenberg | -0.078 |
Token | , |
Token ID | 11 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
Marshal | +0.189 |
lator | +0.186 |
iler | +0.163 |
layer | +0.162 |
Gutenberg | +0.161 |
Neg logit contributions | |
ensed | -0.186 |
scam | -0.181 |
icably | -0.180 |
ous | -0.167 |
recomm | -0.165 |
Token | according |
Token ID | 1864 |
Feature activation | +5.62e-02 |
Pos logit contributions | |
ensed | +0.013 |
icably | +0.012 |
scam | +0.012 |
ous | +0.011 |
ighting | +0.011 |
Neg logit contributions | |
Marshal | -0.013 |
lator | -0.013 |
iler | -0.011 |
layer | -0.011 |
Gutenberg | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -5.13e-02 |
Pos logit contributions | |
Marshal | +0.045 |
lator | +0.044 |
iler | +0.039 |
layer | +0.039 |
Gutenberg | +0.038 |
Neg logit contributions | |
ensed | -0.040 |
icably | -0.039 |
scam | -0.039 |
ighting | -0.035 |
ous | -0.035 |
Token | Ag |
Token ID | 2449 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ensed | +0.037 |
icably | +0.036 |
scam | +0.036 |
ous | +0.033 |
ighting | +0.033 |
Neg logit contributions | |
Marshal | -0.040 |
lator | -0.039 |
iler | -0.035 |
layer | -0.035 |
Gutenberg | -0.034 |
Token | ence |
Token ID | 594 |
Feature activation | -7.75e-01 |
Pos logit contributions | |
ensed | +0.064 |
icably | +0.062 |
scam | +0.061 |
recomm | +0.045 |
ighting | +0.045 |
Neg logit contributions | |
Marshal | -0.282 |
lator | -0.279 |
iler | -0.259 |
layer | -0.258 |
Gutenberg | -0.255 |
Token | - |
Token ID | 12 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
ensed | +0.635 |
icably | +0.623 |
scam | +0.615 |
ighting | +0.571 |
ous | +0.568 |
Neg logit contributions | |
Marshal | -0.540 |
lator | -0.525 |
iler | -0.453 |
layer | -0.453 |
Gutenberg | -0.450 |
Token | France |
Token ID | 28572 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
ensed | +0.018 |
icably | +0.018 |
scam | +0.018 |
ous | +0.016 |
ighting | +0.016 |
Neg logit contributions | |
Marshal | -0.017 |
lator | -0.017 |
iler | -0.015 |
layer | -0.015 |
Gutenberg | -0.015 |
Token | Pres |
Token ID | 1763 |
Feature activation | -9.15e-02 |
Pos logit contributions | |
ensed | +0.081 |
icably | +0.079 |
scam | +0.079 |
ous | +0.073 |
ighting | +0.072 |
Neg logit contributions | |
Marshal | -0.074 |
lator | -0.072 |
iler | -0.063 |
layer | -0.063 |
Gutenberg | -0.062 |
Token | se |
Token ID | 325 |
Feature activation | -2.97e-01 |
Pos logit contributions | |
icably | +0.061 |
ensed | +0.061 |
scam | +0.060 |
ighting | +0.055 |
recomm | +0.055 |
Neg logit contributions | |
Marshal | -0.076 |
lator | -0.076 |
iler | -0.066 |
layer | -0.066 |
Gutenberg | -0.065 |
Token | news |
Token ID | 1705 |
Feature activation | -8.99e-02 |
Pos logit contributions | |
ensed | +0.213 |
scam | +0.205 |
icably | +0.203 |
ous | +0.190 |
ella | +0.187 |
Neg logit contributions | |
Marshal | -0.237 |
lator | -0.234 |
layer | -0.206 |
iler | -0.204 |
Gutenberg | -0.203 |
Token | the |
Token ID | 262 |
Feature activation | -8.40e-02 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.009 |
scam | +0.009 |
ella | +0.009 |
ighting | +0.008 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.011 |
layer | -0.011 |
Gutenberg | -0.010 |
Token | company |
Token ID | 1664 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
ensed | +0.051 |
icably | +0.049 |
scam | +0.049 |
ighting | +0.044 |
ous | +0.044 |
Neg logit contributions | |
Marshal | -0.076 |
lator | -0.075 |
iler | -0.067 |
layer | -0.067 |
Gutenberg | -0.066 |
Token | � |
Token ID | 447 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
ensed | +0.155 |
icably | +0.150 |
scam | +0.149 |
ighting | +0.136 |
ous | +0.136 |
Neg logit contributions | |
Marshal | -0.182 |
lator | -0.178 |
iler | -0.158 |
layer | -0.157 |
Gutenberg | -0.156 |
Token | � |
Token ID | 247 |
Feature activation | -4.89e-02 |
Pos logit contributions | |
Marshal | +0.016 |
lator | +0.015 |
iler | +0.014 |
layer | +0.013 |
Gutenberg | +0.013 |
Neg logit contributions | |
ensed | -0.015 |
icably | -0.015 |
scam | -0.015 |
ous | -0.014 |
ighting | -0.014 |
Token | s |
Token ID | 82 |
Feature activation | +5.65e-02 |
Pos logit contributions | |
ensed | +0.047 |
icably | +0.046 |
scam | +0.045 |
ous | +0.042 |
ighting | +0.042 |
Neg logit contributions | |
Marshal | -0.027 |
lator | -0.027 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | ash |
Token ID | 12530 |
Feature activation | -7.65e-01 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.047 |
iler | +0.042 |
layer | +0.042 |
Gutenberg | +0.041 |
Neg logit contributions | |
ensed | -0.038 |
icably | -0.037 |
scam | -0.036 |
ighting | -0.033 |
ous | -0.033 |
Token | bas |
Token ID | 1615 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
ensed | +0.487 |
icably | +0.471 |
scam | +0.468 |
ous | +0.424 |
ighting | +0.420 |
Neg logit contributions | |
Marshal | -0.671 |
lator | -0.661 |
iler | -0.591 |
layer | -0.588 |
Gutenberg | -0.583 |
Token | ins |
Token ID | 1040 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
ensed | +0.089 |
icably | +0.086 |
scam | +0.086 |
ous | +0.078 |
ighting | +0.078 |
Neg logit contributions | |
Marshal | -0.096 |
lator | -0.094 |
iler | -0.083 |
layer | -0.083 |
Gutenberg | -0.082 |
Token | to |
Token ID | 284 |
Feature activation | -8.11e-03 |
Pos logit contributions | |
ensed | +0.028 |
icably | +0.027 |
scam | +0.027 |
ous | +0.025 |
ighting | +0.025 |
Neg logit contributions | |
Marshal | -0.032 |
lator | -0.031 |
iler | -0.027 |
layer | -0.027 |
Gutenberg | -0.027 |
Token | confirm |
Token ID | 6216 |
Feature activation | +3.64e-04 |
Pos logit contributions | |
ensed | +0.006 |
icably | +0.006 |
scam | +0.006 |
ous | +0.005 |
ighting | +0.005 |
Neg logit contributions | |
Marshal | -0.006 |
lator | -0.006 |
iler | -0.005 |
layer | -0.005 |
Gutenberg | -0.005 |
Token | structural |
Token ID | 13204 |
Feature activation | +2.66e-01 |
Pos logit contributions | |
Marshal | +0.000 |
lator | +0.000 |
iler | +0.000 |
layer | +0.000 |
Gutenberg | +0.000 |
Neg logit contributions | |
ensed | -0.000 |
icably | -0.000 |
scam | -0.000 |
ella | -0.000 |
ighting | -0.000 |
Token | formed |
Token ID | 7042 |
Feature activation | -2.82e-02 |
Pos logit contributions | |
Marshal | +0.053 |
lator | +0.052 |
iler | +0.046 |
layer | +0.046 |
Gutenberg | +0.045 |
Neg logit contributions | |
ensed | -0.041 |
icably | -0.039 |
scam | -0.039 |
ous | -0.035 |
ighting | -0.035 |
Token | an |
Token ID | 281 |
Feature activation | +3.18e-03 |
Pos logit contributions | |
ensed | +0.021 |
icably | +0.020 |
scam | +0.020 |
ous | +0.019 |
ighting | +0.018 |
Neg logit contributions | |
Marshal | -0.022 |
lator | -0.022 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.019 |
Token | alliance |
Token ID | 12801 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
Marshal | +0.003 |
lator | +0.003 |
iler | +0.002 |
layer | +0.002 |
Gutenberg | +0.002 |
Neg logit contributions | |
ensed | -0.002 |
icably | -0.002 |
scam | -0.002 |
ous | -0.002 |
ighting | -0.002 |
Token | with |
Token ID | 351 |
Feature activation | +2.98e-02 |
Pos logit contributions | |
ensed | +0.144 |
icably | +0.140 |
scam | +0.139 |
ous | +0.129 |
ighting | +0.128 |
Neg logit contributions | |
Marshal | -0.132 |
lator | -0.130 |
iler | -0.113 |
layer | -0.113 |
Gutenberg | -0.111 |
Token | Ag |
Token ID | 2449 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
Marshal | +0.023 |
lator | +0.022 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.019 |
Neg logit contributions | |
ensed | -0.022 |
icably | -0.022 |
scam | -0.021 |
ous | -0.020 |
ighting | -0.020 |
Token | ence |
Token ID | 594 |
Feature activation | -7.21e-01 |
Pos logit contributions | |
ensed | +0.222 |
icably | +0.217 |
scam | +0.216 |
recomm | +0.195 |
ighting | +0.195 |
Neg logit contributions | |
Marshal | -0.264 |
lator | -0.259 |
iler | -0.232 |
layer | -0.230 |
Gutenberg | -0.226 |
Token | Franç |
Token ID | 40178 |
Feature activation | -2.01e-01 |
Pos logit contributions | |
ensed | +0.579 |
icably | +0.564 |
scam | +0.560 |
ous | +0.518 |
ighting | +0.516 |
Neg logit contributions | |
Marshal | -0.513 |
lator | -0.502 |
iler | -0.437 |
layer | -0.434 |
Gutenberg | -0.429 |
Token | a |
Token ID | 64 |
Feature activation | -3.98e-01 |
Pos logit contributions | |
ensed | +0.123 |
icably | +0.119 |
scam | +0.118 |
ous | +0.106 |
ella | +0.105 |
Neg logit contributions | |
Marshal | -0.182 |
lator | -0.179 |
iler | -0.161 |
layer | -0.160 |
Gutenberg | -0.159 |
Token | ise |
Token ID | 786 |
Feature activation | -2.90e-01 |
Pos logit contributions | |
ensed | +0.227 |
icably | +0.219 |
scam | +0.218 |
ous | +0.194 |
ighting | +0.193 |
Neg logit contributions | |
Marshal | -0.376 |
lator | -0.370 |
iler | -0.334 |
layer | -0.332 |
Gutenberg | -0.329 |
Token | In |
Token ID | 554 |
Feature activation | -7.54e-02 |
Pos logit contributions | |
ensed | +0.211 |
icably | +0.205 |
scam | +0.203 |
ous | +0.187 |
ighting | +0.185 |
Neg logit contributions | |
Marshal | -0.229 |
lator | -0.225 |
iler | -0.198 |
layer | -0.198 |
Gutenberg | -0.195 |
Token | format |
Token ID | 18982 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
ensed | +0.051 |
icably | +0.049 |
scam | +0.049 |
ous | +0.044 |
ighting | +0.044 |
Neg logit contributions | |
Marshal | -0.064 |
lator | -0.062 |
iler | -0.056 |
layer | -0.055 |
Gutenberg | -0.055 |
Token | � |
Token ID | 447 |
Feature activation | +9.83e-02 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.010 |
ous | +0.009 |
ighting | +0.009 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.010 |
layer | -0.010 |
Gutenberg | -0.010 |
Token | � |
Token ID | 247 |
Feature activation | +3.34e-02 |
Pos logit contributions | |
Marshal | +0.073 |
lator | +0.072 |
iler | +0.063 |
layer | +0.062 |
Gutenberg | +0.061 |
Neg logit contributions | |
ensed | -0.076 |
icably | -0.074 |
scam | -0.073 |
ous | -0.068 |
ighting | -0.067 |
Token | s |
Token ID | 82 |
Feature activation | +5.58e-02 |
Pos logit contributions | |
Marshal | +0.019 |
lator | +0.018 |
iler | +0.015 |
layer | +0.015 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.032 |
icably | -0.031 |
scam | -0.031 |
ous | -0.029 |
ighting | -0.029 |
Token | final |
Token ID | 2457 |
Feature activation | -7.79e-03 |
Pos logit contributions | |
Marshal | +0.042 |
lator | +0.041 |
iler | +0.036 |
layer | +0.036 |
Gutenberg | +0.036 |
Neg logit contributions | |
ensed | -0.042 |
icably | -0.041 |
scam | -0.041 |
ous | -0.037 |
ighting | -0.037 |
Token | coal |
Token ID | 5655 |
Feature activation | -3.90e-02 |
Pos logit contributions | |
ensed | +0.006 |
icably | +0.006 |
scam | +0.006 |
ous | +0.005 |
ighting | +0.005 |
Neg logit contributions | |
Marshal | -0.006 |
lator | -0.006 |
iler | -0.005 |
layer | -0.005 |
Gutenberg | -0.005 |
Token | ash |
Token ID | 12530 |
Feature activation | -7.17e-01 |
Pos logit contributions | |
ensed | +0.028 |
icably | +0.027 |
scam | +0.026 |
ous | +0.024 |
ighting | +0.024 |
Neg logit contributions | |
Marshal | -0.031 |
lator | -0.031 |
iler | -0.027 |
layer | -0.027 |
Gutenberg | -0.027 |
Token | rule |
Token ID | 3896 |
Feature activation | +9.08e-02 |
Pos logit contributions | |
ensed | +0.527 |
icably | +0.512 |
scam | +0.509 |
ous | +0.467 |
ighting | +0.464 |
Neg logit contributions | |
Marshal | -0.560 |
lator | -0.550 |
iler | -0.485 |
layer | -0.482 |
Gutenberg | -0.476 |
Token | — |
Token ID | 960 |
Feature activation | +4.96e-02 |
Pos logit contributions | |
Marshal | +0.071 |
lator | +0.070 |
iler | +0.061 |
layer | +0.061 |
Gutenberg | +0.060 |
Neg logit contributions | |
ensed | -0.067 |
icably | -0.065 |
scam | -0.065 |
ighting | -0.059 |
ous | -0.059 |
Token | expected |
Token ID | 40319 |
Feature activation | +9.52e-02 |
Pos logit contributions | |
Marshal | +0.042 |
lator | +0.042 |
iler | +0.037 |
layer | +0.037 |
Gutenberg | +0.037 |
Neg logit contributions | |
ensed | -0.033 |
icably | -0.032 |
scam | -0.032 |
ous | -0.029 |
ighting | -0.029 |
Token | to |
Token ID | 284 |
Feature activation | -3.73e-02 |
Pos logit contributions | |
Marshal | +0.076 |
lator | +0.075 |
iler | +0.066 |
layer | +0.066 |
Gutenberg | +0.065 |
Neg logit contributions | |
ensed | -0.068 |
icably | -0.066 |
scam | -0.065 |
ous | -0.060 |
ighting | -0.060 |
Token | be |
Token ID | 307 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ensed | +0.030 |
icably | +0.029 |
scam | +0.029 |
ous | +0.027 |
ighting | +0.027 |
Neg logit contributions | |
Marshal | -0.027 |
lator | -0.026 |
iler | -0.023 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | -5.29e-02 |
Pos logit contributions | |
ensed | +0.215 |
icably | +0.210 |
scam | +0.209 |
ous | +0.195 |
ighting | +0.192 |
Neg logit contributions | |
Marshal | -0.187 |
lator | -0.184 |
iler | -0.159 |
layer | -0.158 |
Gutenberg | -0.157 |
Token |
|
Token ID | 198 |
Feature activation | -5.39e-02 |
Pos logit contributions | |
ensed | +0.037 |
icably | +0.036 |
scam | +0.036 |
ous | +0.033 |
ighting | +0.033 |
Neg logit contributions | |
Marshal | -0.043 |
lator | -0.042 |
iler | -0.037 |
layer | -0.037 |
Gutenberg | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | -5.81e-02 |
Pos logit contributions | |
ensed | +0.040 |
icably | +0.039 |
scam | +0.038 |
ighting | +0.035 |
recomm | +0.035 |
Neg logit contributions | |
Marshal | -0.042 |
lator | -0.041 |
iler | -0.037 |
layer | -0.036 |
Gutenberg | -0.036 |
Token | The |
Token ID | 464 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
ensed | +0.036 |
icably | +0.035 |
scam | +0.035 |
ous | +0.031 |
ighting | +0.031 |
Neg logit contributions | |
Marshal | -0.052 |
lator | -0.051 |
iler | -0.046 |
layer | -0.045 |
Gutenberg | -0.045 |
Token | insol |
Token ID | 35831 |
Feature activation | -3.01e-02 |
Pos logit contributions | |
ensed | +0.144 |
icably | +0.140 |
scam | +0.139 |
ous | +0.126 |
ighting | +0.126 |
Neg logit contributions | |
Marshal | -0.180 |
lator | -0.176 |
iler | -0.157 |
layer | -0.156 |
Gutenberg | -0.155 |
Token | ence |
Token ID | 594 |
Feature activation | -7.07e-01 |
Pos logit contributions | |
ensed | +0.014 |
icably | +0.013 |
scam | +0.013 |
ighting | +0.011 |
recomm | +0.011 |
Neg logit contributions | |
Marshal | -0.031 |
lator | -0.031 |
iler | -0.028 |
layer | -0.028 |
Gutenberg | -0.028 |
Token | of |
Token ID | 286 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
ensed | +0.450 |
icably | +0.435 |
scam | +0.434 |
ous | +0.394 |
ighting | +0.389 |
Neg logit contributions | |
Marshal | -0.619 |
lator | -0.611 |
iler | -0.545 |
layer | -0.542 |
Gutenberg | -0.538 |
Token | office |
Token ID | 2607 |
Feature activation | -9.57e-02 |
Pos logit contributions | |
ensed | +0.069 |
icably | +0.067 |
scam | +0.067 |
ous | +0.061 |
ighting | +0.061 |
Neg logit contributions | |
Marshal | -0.073 |
lator | -0.072 |
iler | -0.063 |
layer | -0.063 |
Gutenberg | -0.062 |
Token | , |
Token ID | 11 |
Feature activation | -7.26e-02 |
Pos logit contributions | |
ensed | +0.074 |
icably | +0.072 |
scam | +0.072 |
ous | +0.066 |
ighting | +0.066 |
Neg logit contributions | |
Marshal | -0.071 |
lator | -0.070 |
iler | -0.061 |
layer | -0.060 |
Gutenberg | -0.060 |
Token | and |
Token ID | 290 |
Feature activation | -6.39e-02 |
Pos logit contributions | |
ensed | +0.049 |
icably | +0.047 |
scam | +0.047 |
ous | +0.043 |
ighting | +0.043 |
Neg logit contributions | |
Marshal | -0.061 |
lator | -0.060 |
iler | -0.053 |
layer | -0.053 |
Gutenberg | -0.053 |
Token | the |
Token ID | 262 |
Feature activation | -9.09e-02 |
Pos logit contributions | |
ensed | +0.044 |
icably | +0.042 |
scam | +0.042 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.053 |
lator | -0.052 |
iler | -0.046 |
layer | -0.046 |
Gutenberg | -0.046 |
Token | landfill |
Token ID | 47712 |
Feature activation | +9.59e-02 |
Pos logit contributions | |
ensed | +0.012 |
icably | +0.011 |
scam | +0.011 |
ous | +0.010 |
ash | +0.010 |
Neg logit contributions | |
Marshal | -0.010 |
lator | -0.010 |
iler | -0.009 |
layer | -0.009 |
Gutenberg | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-03 |
Pos logit contributions | |
Marshal | +0.072 |
lator | +0.070 |
iler | +0.062 |
layer | +0.061 |
Gutenberg | +0.060 |
Neg logit contributions | |
ensed | -0.074 |
icably | -0.072 |
scam | -0.071 |
ighting | -0.066 |
ous | -0.065 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ensed | +0.001 |
icably | +0.001 |
scam | +0.001 |
ous | +0.001 |
ighting | +0.001 |
Neg logit contributions | |
Marshal | -0.001 |
lator | -0.001 |
iler | -0.001 |
layer | -0.001 |
Gutenberg | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -3.01e-02 |
Pos logit contributions | |
ensed | +0.012 |
icably | +0.012 |
scam | +0.012 |
ighting | +0.011 |
ous | +0.011 |
Neg logit contributions | |
Marshal | -0.013 |
lator | -0.013 |
iler | -0.011 |
layer | -0.011 |
Gutenberg | -0.011 |
Token | Moving |
Token ID | 33622 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.020 |
scam | +0.020 |
ighting | +0.018 |
ella | +0.018 |
Neg logit contributions | |
Marshal | -0.025 |
lator | -0.025 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.90e-01 |
Pos logit contributions | |
ensed | +0.035 |
icably | +0.030 |
scam | +0.029 |
ous | +0.017 |
ighting | +0.017 |
Neg logit contributions | |
Marshal | -0.275 |
lator | -0.272 |
iler | -0.254 |
layer | -0.253 |
Gutenberg | -0.251 |
Token | from |
Token ID | 422 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
ensed | +0.479 |
icably | +0.465 |
scam | +0.461 |
ous | +0.421 |
ighting | +0.419 |
Neg logit contributions | |
Marshal | -0.566 |
lator | -0.556 |
iler | -0.494 |
layer | -0.492 |
Gutenberg | -0.485 |
Token | the |
Token ID | 262 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
ensed | +0.081 |
icably | +0.078 |
scam | +0.077 |
ous | +0.071 |
ighting | +0.070 |
Neg logit contributions | |
Marshal | -0.096 |
lator | -0.094 |
iler | -0.083 |
layer | -0.083 |
Gutenberg | -0.082 |
Token | Asheville |
Token ID | 49362 |
Feature activation | -8.81e-02 |
Pos logit contributions | |
ensed | +0.090 |
icably | +0.088 |
scam | +0.087 |
ous | +0.080 |
ighting | +0.080 |
Neg logit contributions | |
Marshal | -0.086 |
lator | -0.085 |
iler | -0.074 |
layer | -0.074 |
Gutenberg | -0.073 |
Token | plant |
Token ID | 4618 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
ensed | +0.050 |
icably | +0.048 |
scam | +0.048 |
ous | +0.043 |
ighting | +0.043 |
Neg logit contributions | |
Marshal | -0.083 |
lator | -0.082 |
iler | -0.074 |
layer | -0.074 |
Gutenberg | -0.073 |
Token | to |
Token ID | 284 |
Feature activation | -6.65e-02 |
Pos logit contributions | |
ensed | +0.127 |
icably | +0.123 |
scam | +0.121 |
ighting | +0.110 |
ous | +0.110 |
Neg logit contributions | |
Marshal | -0.152 |
lator | -0.150 |
iler | -0.133 |
layer | -0.133 |
Gutenberg | -0.131 |
Token | serves |
Token ID | 9179 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
ensed | +0.017 |
icably | +0.016 |
scam | +0.016 |
ighting | +0.015 |
ous | +0.015 |
Neg logit contributions | |
Marshal | -0.019 |
lator | -0.019 |
iler | -0.017 |
layer | -0.017 |
Gutenberg | -0.016 |
Token | powerful |
Token ID | 3665 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
Marshal | +0.083 |
lator | +0.082 |
iler | +0.072 |
layer | +0.072 |
Gutenberg | +0.071 |
Neg logit contributions | |
ensed | -0.073 |
icably | -0.071 |
scam | -0.070 |
ous | -0.064 |
ighting | -0.064 |
Token | corporate |
Token ID | 6355 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
ensed | +0.087 |
icably | +0.084 |
scam | +0.083 |
ous | +0.076 |
ighting | +0.076 |
Neg logit contributions | |
Marshal | -0.096 |
lator | -0.094 |
iler | -0.083 |
layer | -0.083 |
Gutenberg | -0.082 |
Token | interests |
Token ID | 5353 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
Marshal | +0.016 |
lator | +0.016 |
iler | +0.014 |
layer | +0.014 |
Gutenberg | +0.014 |
Neg logit contributions | |
ensed | -0.014 |
icably | -0.014 |
scam | -0.014 |
ous | -0.013 |
ighting | -0.013 |
Token | unab |
Token ID | 40986 |
Feature activation | -9.81e-02 |
Pos logit contributions | |
ensed | +0.093 |
icably | +0.090 |
scam | +0.090 |
ous | +0.082 |
ighting | +0.081 |
Neg logit contributions | |
Marshal | -0.103 |
lator | -0.101 |
iler | -0.089 |
layer | -0.089 |
Gutenberg | -0.088 |
Token | ashed |
Token ID | 5263 |
Feature activation | -6.88e-01 |
Pos logit contributions | |
ensed | +0.014 |
icably | +0.012 |
scam | +0.012 |
ous | +0.006 |
ighting | +0.006 |
Neg logit contributions | |
Marshal | -0.134 |
lator | -0.133 |
iler | -0.124 |
layer | -0.124 |
Gutenberg | -0.123 |
Token | ly |
Token ID | 306 |
Feature activation | +5.60e-02 |
Pos logit contributions | |
ensed | +0.542 |
scam | +0.531 |
icably | +0.526 |
ous | +0.492 |
recomm | +0.484 |
Neg logit contributions | |
Marshal | -0.499 |
lator | -0.489 |
layer | -0.422 |
iler | -0.422 |
Gutenberg | -0.418 |
Token | , |
Token ID | 11 |
Feature activation | -7.98e-02 |
Pos logit contributions | |
Marshal | +0.044 |
lator | +0.043 |
iler | +0.038 |
layer | +0.038 |
Gutenberg | +0.038 |
Neg logit contributions | |
ensed | -0.041 |
icably | -0.039 |
scam | -0.039 |
ous | -0.036 |
ighting | -0.036 |
Token | and |
Token ID | 290 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
ensed | +0.055 |
icably | +0.053 |
scam | +0.052 |
ous | +0.048 |
ighting | +0.048 |
Neg logit contributions | |
Marshal | -0.066 |
lator | -0.065 |
iler | -0.058 |
layer | -0.058 |
Gutenberg | -0.057 |
Token | another |
Token ID | 1194 |
Feature activation | +9.85e-02 |
Pos logit contributions | |
ensed | +0.047 |
icably | +0.046 |
scam | +0.045 |
ous | +0.041 |
ighting | +0.041 |
Neg logit contributions | |
Marshal | -0.056 |
lator | -0.055 |
iler | -0.049 |
layer | -0.049 |
Gutenberg | -0.048 |
Token | party |
Token ID | 2151 |
Feature activation | +3.48e-02 |
Pos logit contributions | |
Marshal | +0.084 |
lator | +0.083 |
iler | +0.074 |
layer | +0.073 |
Gutenberg | +0.073 |
Neg logit contributions | |
ensed | -0.065 |
icably | -0.063 |
scam | -0.062 |
ous | -0.056 |
ighting | -0.056 |
Token | River |
Token ID | 5866 |
Feature activation | -2.01e-03 |
Pos logit contributions | |
Marshal | +0.007 |
lator | +0.007 |
iler | +0.006 |
layer | +0.006 |
Gutenberg | +0.006 |
Neg logit contributions | |
ensed | -0.008 |
icably | -0.007 |
scam | -0.007 |
ous | -0.007 |
ella | -0.007 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.12e-01 |
Pos logit contributions | |
ensed | +0.002 |
icably | +0.001 |
scam | +0.001 |
ous | +0.001 |
ighting | +0.001 |
Neg logit contributions | |
Marshal | -0.002 |
lator | -0.002 |
iler | -0.001 |
layer | -0.001 |
Gutenberg | -0.001 |
Token | ponds |
Token ID | 47339 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ensed | +0.416 |
icably | +0.402 |
scam | +0.402 |
ous | +0.365 |
ash | +0.363 |
Neg logit contributions | |
Marshal | -0.511 |
lator | -0.502 |
iler | -0.446 |
layer | -0.442 |
Gutenberg | -0.440 |
Token | and |
Token ID | 290 |
Feature activation | +1.68e-03 |
Pos logit contributions | |
ensed | +0.152 |
icably | +0.147 |
scam | +0.146 |
ous | +0.134 |
ighting | +0.134 |
Neg logit contributions | |
Marshal | -0.162 |
lator | -0.159 |
iler | -0.141 |
layer | -0.140 |
Gutenberg | -0.138 |
Token | moving |
Token ID | 3867 |
Feature activation | -2.34e-01 |
Pos logit contributions | |
Marshal | +0.001 |
lator | +0.001 |
iler | +0.001 |
layer | +0.001 |
Gutenberg | +0.001 |
Neg logit contributions | |
ensed | -0.001 |
icably | -0.001 |
scam | -0.001 |
ighting | -0.001 |
ous | -0.001 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.87e-01 |
Pos logit contributions | |
ensed | +0.165 |
icably | +0.160 |
scam | +0.159 |
ous | +0.145 |
ighting | +0.144 |
Neg logit contributions | |
Marshal | -0.189 |
lator | -0.186 |
iler | -0.165 |
layer | -0.164 |
Gutenberg | -0.162 |
Token | to |
Token ID | 284 |
Feature activation | -5.05e-02 |
Pos logit contributions | |
ensed | +0.457 |
icably | +0.443 |
scam | +0.439 |
ous | +0.398 |
ighting | +0.397 |
Neg logit contributions | |
Marshal | -0.584 |
lator | -0.574 |
iler | -0.512 |
layer | -0.510 |
Gutenberg | -0.503 |
Token | a |
Token ID | 257 |
Feature activation | -5.01e-03 |
Pos logit contributions | |
ensed | +0.037 |
icably | +0.036 |
scam | +0.036 |
ous | +0.033 |
ighting | +0.032 |
Neg logit contributions | |
Marshal | -0.040 |
lator | -0.039 |
iler | -0.034 |
layer | -0.034 |
Gutenberg | -0.034 |
Token | lined |
Token ID | 16566 |
Feature activation | -3.45e-02 |
Pos logit contributions | |
ensed | +0.004 |
icably | +0.004 |
scam | +0.004 |
ous | +0.003 |
ighting | +0.003 |
Neg logit contributions | |
Marshal | -0.004 |
lator | -0.004 |
iler | -0.003 |
layer | -0.003 |
Gutenberg | -0.003 |
Token | structural |
Token ID | 13204 |
Feature activation | +2.56e-01 |
Pos logit contributions | |
ensed | +0.024 |
icably | +0.023 |
scam | +0.023 |
ous | +0.021 |
ighting | +0.021 |
Neg logit contributions | |
Marshal | -0.028 |
lator | -0.028 |
iler | -0.025 |
layer | -0.025 |
Gutenberg | -0.024 |
Token | fill |
Token ID | 6070 |
Feature activation | +5.16e-02 |
Pos logit contributions | |
Marshal | +0.218 |
lator | +0.214 |
iler | +0.191 |
layer | +0.191 |
Gutenberg | +0.187 |
Neg logit contributions | |
ensed | -0.171 |
icably | -0.166 |
scam | -0.163 |
ighting | -0.149 |
ous | -0.148 |
Token | be |
Token ID | 307 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
Marshal | +0.042 |
lator | +0.042 |
iler | +0.037 |
layer | +0.037 |
Gutenberg | +0.036 |
Neg logit contributions | |
ensed | -0.038 |
icably | -0.037 |
scam | -0.037 |
ous | -0.034 |
ighting | -0.034 |
Token | elected |
Token ID | 7018 |
Feature activation | -9.64e-02 |
Pos logit contributions | |
Marshal | +0.097 |
lator | +0.096 |
iler | +0.085 |
layer | +0.084 |
Gutenberg | +0.084 |
Neg logit contributions | |
ensed | -0.085 |
icably | -0.082 |
scam | -0.081 |
ous | -0.075 |
ighting | -0.074 |
Token | and |
Token ID | 290 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ensed | +0.070 |
icably | +0.068 |
scam | +0.068 |
ous | +0.062 |
ella | +0.062 |
Neg logit contributions | |
Marshal | -0.075 |
lator | -0.075 |
iler | -0.066 |
layer | -0.066 |
Gutenberg | -0.065 |
Token | Arab |
Token ID | 4498 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Marshal | +0.012 |
lator | +0.012 |
iler | +0.010 |
layer | +0.010 |
Gutenberg | +0.010 |
Neg logit contributions | |
ensed | -0.011 |
icably | -0.011 |
scam | -0.011 |
ous | -0.010 |
recomm | -0.010 |
Token | parliament |
Token ID | 8540 |
Feature activation | -7.56e-02 |
Pos logit contributions | |
Marshal | +0.083 |
lator | +0.081 |
iler | +0.071 |
layer | +0.070 |
Gutenberg | +0.069 |
Neg logit contributions | |
ensed | -0.094 |
icably | -0.091 |
scam | -0.091 |
ous | -0.084 |
ighting | -0.084 |
Token | arians |
Token ID | 13517 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
ensed | +0.034 |
icably | +0.033 |
scam | +0.032 |
ous | +0.028 |
ighting | +0.028 |
Neg logit contributions | |
Marshal | -0.080 |
lator | -0.079 |
iler | -0.072 |
layer | -0.072 |
Gutenberg | -0.071 |
Token | are |
Token ID | 389 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
ensed | +0.445 |
icably | +0.430 |
scam | +0.427 |
ous | +0.388 |
ighting | +0.385 |
Neg logit contributions | |
Marshal | -0.584 |
lator | -0.574 |
iler | -0.513 |
layer | -0.510 |
Gutenberg | -0.505 |
Token | free |
Token ID | 1479 |
Feature activation | -4.95e-02 |
Pos logit contributions | |
Marshal | +0.038 |
lator | +0.038 |
iler | +0.034 |
layer | +0.033 |
Gutenberg | +0.033 |
Neg logit contributions | |
ensed | -0.030 |
icably | -0.029 |
scam | -0.029 |
ous | -0.026 |
ighting | -0.026 |
Token | to |
Token ID | 284 |
Feature activation | -3.43e-02 |
Pos logit contributions | |
ensed | +0.035 |
icably | +0.034 |
scam | +0.034 |
ous | +0.031 |
ighting | +0.031 |
Neg logit contributions | |
Marshal | -0.040 |
lator | -0.039 |
iler | -0.035 |
layer | -0.034 |
Gutenberg | -0.034 |
Token | say |
Token ID | 910 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
ensed | +0.026 |
icably | +0.025 |
scam | +0.025 |
ous | +0.023 |
ighting | +0.023 |
Neg logit contributions | |
Marshal | -0.026 |
lator | -0.026 |
iler | -0.023 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | mean |
Token ID | 1612 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
Marshal | +0.079 |
lator | +0.078 |
iler | +0.067 |
layer | +0.067 |
Gutenberg | +0.066 |
Neg logit contributions | |
ensed | -0.092 |
icably | -0.090 |
scam | -0.089 |
ous | -0.083 |
ighting | -0.082 |
Token | celer |
Token ID | 7015 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
ensed | +0.180 |
icably | +0.176 |
scam | +0.175 |
ous | +0.163 |
ighting | +0.162 |
Neg logit contributions | |
Marshal | -0.140 |
lator | -0.137 |
iler | -0.117 |
layer | -0.117 |
Gutenberg | -0.115 |
Token | ating |
Token ID | 803 |
Feature activation | +5.87e-02 |
Pos logit contributions | |
Marshal | +0.155 |
lator | +0.152 |
iler | +0.136 |
layer | +0.135 |
Gutenberg | +0.133 |
Neg logit contributions | |
ensed | -0.118 |
scam | -0.114 |
icably | -0.114 |
ighting | -0.102 |
ella | -0.102 |
Token | water |
Token ID | 1660 |
Feature activation | +4.29e-02 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.047 |
iler | +0.041 |
layer | +0.041 |
Gutenberg | +0.041 |
Neg logit contributions | |
ensed | -0.041 |
icably | -0.040 |
scam | -0.040 |
ous | -0.036 |
ighting | -0.036 |
Token | removal |
Token ID | 9934 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
Marshal | +0.036 |
lator | +0.036 |
iler | +0.032 |
layer | +0.032 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.029 |
icably | -0.028 |
scam | -0.028 |
ous | -0.025 |
ella | -0.025 |
Token | from |
Token ID | 422 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
ensed | +0.139 |
icably | +0.135 |
scam | +0.133 |
ighting | +0.121 |
ella | +0.121 |
Neg logit contributions | |
Marshal | -0.165 |
lator | -0.161 |
iler | -0.143 |
layer | -0.142 |
Gutenberg | -0.141 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.73e-01 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.010 |
ous | +0.009 |
ighting | +0.009 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.011 |
layer | -0.011 |
Gutenberg | -0.011 |
Token | ponds |
Token ID | 47339 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
ensed | +0.434 |
icably | +0.419 |
scam | +0.416 |
ous | +0.377 |
ighting | +0.375 |
Neg logit contributions | |
Marshal | -0.586 |
lator | -0.576 |
iler | -0.515 |
layer | -0.513 |
Gutenberg | -0.507 |
Token | at |
Token ID | 379 |
Feature activation | -3.75e-02 |
Pos logit contributions | |
ensed | +0.155 |
icably | +0.150 |
scam | +0.149 |
ous | +0.136 |
ighting | +0.136 |
Neg logit contributions | |
Marshal | -0.166 |
lator | -0.162 |
iler | -0.143 |
layer | -0.142 |
Gutenberg | -0.141 |
Token | all |
Token ID | 477 |
Feature activation | -4.35e-02 |
Pos logit contributions | |
ensed | +0.027 |
icably | +0.026 |
scam | +0.026 |
ous | +0.023 |
ighting | +0.023 |
Neg logit contributions | |
Marshal | -0.030 |
lator | -0.030 |
iler | -0.026 |
layer | -0.026 |
Gutenberg | -0.026 |
Token | retired |
Token ID | 9880 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
ensed | +0.029 |
icably | +0.028 |
scam | +0.028 |
ella | +0.025 |
ighting | +0.025 |
Neg logit contributions | |
Marshal | -0.037 |
lator | -0.037 |
iler | -0.033 |
layer | -0.033 |
Gutenberg | -0.032 |
Token | coal |
Token ID | 5655 |
Feature activation | -9.83e-02 |
Pos logit contributions | |
ensed | +0.200 |
icably | +0.190 |
scam | +0.188 |
ighting | +0.164 |
ous | +0.164 |
Neg logit contributions | |
Marshal | -0.409 |
lator | -0.402 |
iler | -0.366 |
layer | -0.364 |
Gutenberg | -0.362 |
Token | for |
Token ID | 329 |
Feature activation | -5.22e-02 |
Pos logit contributions | |
Marshal | +0.014 |
lator | +0.014 |
iler | +0.012 |
layer | +0.012 |
Gutenberg | +0.012 |
Neg logit contributions | |
ensed | -0.011 |
icably | -0.011 |
scam | -0.011 |
ous | -0.010 |
ighting | -0.010 |
Token | reuse |
Token ID | 32349 |
Feature activation | -1.17e-01 |
Pos logit contributions | |
ensed | +0.036 |
icably | +0.035 |
scam | +0.034 |
ous | +0.031 |
ighting | +0.031 |
Neg logit contributions | |
Marshal | -0.043 |
lator | -0.042 |
iler | -0.038 |
layer | -0.038 |
Gutenberg | -0.037 |
Token | opportunities |
Token ID | 6443 |
Feature activation | -3.79e-02 |
Pos logit contributions | |
ensed | +0.078 |
icably | +0.076 |
scam | +0.075 |
ighting | +0.068 |
ella | +0.068 |
Neg logit contributions | |
Marshal | -0.099 |
lator | -0.097 |
iler | -0.086 |
layer | -0.086 |
Gutenberg | -0.085 |
Token | for |
Token ID | 329 |
Feature activation | -3.97e-02 |
Pos logit contributions | |
ensed | +0.028 |
icably | +0.028 |
scam | +0.027 |
ous | +0.025 |
ighting | +0.025 |
Neg logit contributions | |
Marshal | -0.029 |
lator | -0.028 |
iler | -0.025 |
layer | -0.025 |
Gutenberg | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | -3.17e-02 |
Pos logit contributions | |
ensed | +0.025 |
icably | +0.024 |
scam | +0.023 |
ous | +0.021 |
ighting | +0.021 |
Neg logit contributions | |
Marshal | -0.036 |
lator | -0.035 |
iler | -0.031 |
layer | -0.031 |
Gutenberg | -0.031 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.70e-01 |
Pos logit contributions | |
ensed | +0.021 |
icably | +0.020 |
scam | +0.020 |
ous | +0.018 |
ighting | +0.018 |
Neg logit contributions | |
Marshal | -0.027 |
lator | -0.027 |
iler | -0.024 |
layer | -0.024 |
Gutenberg | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
ensed | +0.429 |
icably | +0.414 |
scam | +0.413 |
ous | +0.374 |
ash | +0.371 |
Neg logit contributions | |
Marshal | -0.585 |
lator | -0.577 |
iler | -0.516 |
layer | -0.512 |
Gutenberg | -0.509 |
Token |
|
Token ID | 198 |
Feature activation | -5.55e-03 |
Pos logit contributions | |
ensed | +0.008 |
icably | +0.007 |
scam | +0.007 |
ous | +0.007 |
ighting | +0.007 |
Neg logit contributions | |
Marshal | -0.008 |
lator | -0.008 |
iler | -0.007 |
layer | -0.007 |
Gutenberg | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -3.01e-02 |
Pos logit contributions | |
ensed | +0.004 |
icably | +0.004 |
scam | +0.004 |
ighting | +0.004 |
recomm | +0.004 |
Neg logit contributions | |
Marshal | -0.004 |
lator | -0.004 |
iler | -0.004 |
layer | -0.004 |
Gutenberg | -0.004 |
Token | Ac |
Token ID | 12832 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.019 |
scam | +0.019 |
ighting | +0.017 |
ous | +0.017 |
Neg logit contributions | |
Marshal | -0.025 |
lator | -0.025 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.022 |
Token | celer |
Token ID | 7015 |
Feature activation | +1.81e-01 |
Pos logit contributions | |
ensed | +0.180 |
icably | +0.176 |
scam | +0.175 |
ous | +0.163 |
ighting | +0.162 |
Neg logit contributions | |
Marshal | -0.140 |
lator | -0.137 |
iler | -0.117 |
layer | -0.117 |
Gutenberg | -0.115 |
Token | evaluated |
Token ID | 16726 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
Marshal | +0.054 |
lator | +0.053 |
iler | +0.048 |
layer | +0.047 |
Gutenberg | +0.047 |
Neg logit contributions | |
ensed | -0.040 |
icably | -0.038 |
scam | -0.038 |
ighting | -0.035 |
ous | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | +4.90e-02 |
Pos logit contributions | |
Marshal | +0.087 |
lator | +0.086 |
iler | +0.075 |
layer | +0.075 |
Gutenberg | +0.074 |
Neg logit contributions | |
ensed | -0.087 |
icably | -0.084 |
scam | -0.084 |
ous | -0.077 |
ighting | -0.077 |
Token |
|
Token ID | 198 |
Feature activation | +3.00e-02 |
Pos logit contributions | |
Marshal | +0.039 |
lator | +0.038 |
iler | +0.034 |
layer | +0.034 |
Gutenberg | +0.033 |
Neg logit contributions | |
ensed | -0.035 |
icably | -0.034 |
scam | -0.034 |
ous | -0.031 |
ighting | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | +3.99e-03 |
Pos logit contributions | |
Marshal | +0.024 |
lator | +0.023 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.020 |
Neg logit contributions | |
ensed | -0.022 |
icably | -0.021 |
scam | -0.021 |
ighting | -0.019 |
recomm | -0.019 |
Token | Moving |
Token ID | 33622 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
Marshal | +0.003 |
lator | +0.003 |
iler | +0.003 |
layer | +0.003 |
Gutenberg | +0.003 |
Neg logit contributions | |
ensed | -0.003 |
scam | -0.003 |
icably | -0.003 |
ighting | -0.002 |
ous | -0.002 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.67e-01 |
Pos logit contributions | |
ensed | +0.072 |
icably | +0.067 |
scam | +0.066 |
ous | +0.055 |
ighting | +0.055 |
Neg logit contributions | |
Marshal | -0.220 |
lator | -0.217 |
iler | -0.200 |
layer | -0.199 |
Gutenberg | -0.198 |
Token | from |
Token ID | 422 |
Feature activation | -7.91e-02 |
Pos logit contributions | |
ensed | +0.467 |
icably | +0.453 |
scam | +0.449 |
ous | +0.410 |
ighting | +0.409 |
Neg logit contributions | |
Marshal | -0.544 |
lator | -0.534 |
iler | -0.474 |
layer | -0.472 |
Gutenberg | -0.466 |
Token | the |
Token ID | 262 |
Feature activation | -8.20e-02 |
Pos logit contributions | |
ensed | +0.056 |
icably | +0.054 |
scam | +0.053 |
ighting | +0.048 |
ous | +0.048 |
Neg logit contributions | |
Marshal | -0.065 |
lator | -0.063 |
iler | -0.056 |
layer | -0.056 |
Gutenberg | -0.056 |
Token | River |
Token ID | 5866 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ensed | +0.060 |
icably | +0.058 |
scam | +0.058 |
ous | +0.053 |
ighting | +0.053 |
Neg logit contributions | |
Marshal | -0.064 |
lator | -0.063 |
iler | -0.056 |
layer | -0.055 |
Gutenberg | -0.055 |
Token | b |
Token ID | 65 |
Feature activation | -4.27e-02 |
Pos logit contributions | |
ensed | +0.073 |
icably | +0.071 |
scam | +0.070 |
ous | +0.063 |
ighting | +0.063 |
Neg logit contributions | |
Marshal | -0.098 |
lator | -0.096 |
iler | -0.086 |
layer | -0.086 |
Gutenberg | -0.085 |
Token | end |
Token ID | 437 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
ensed | +0.041 |
icably | +0.040 |
scam | +0.040 |
ighting | +0.037 |
ous | +0.037 |
Neg logit contributions | |
Marshal | -0.024 |
lator | -0.023 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.018 |
Token | year |
Token ID | 614 |
Feature activation | -8.24e-02 |
Pos logit contributions | |
Marshal | +0.230 |
lator | +0.226 |
iler | +0.204 |
layer | +0.203 |
Gutenberg | +0.201 |
Neg logit contributions | |
ensed | -0.143 |
icably | -0.138 |
scam | -0.136 |
ighting | -0.122 |
ous | -0.122 |
Token | , |
Token ID | 11 |
Feature activation | +2.14e-02 |
Pos logit contributions | |
ensed | +0.062 |
icably | +0.061 |
scam | +0.061 |
ous | +0.056 |
ighting | +0.055 |
Neg logit contributions | |
Marshal | -0.062 |
lator | -0.061 |
iler | -0.054 |
layer | -0.054 |
Gutenberg | -0.053 |
Token | its |
Token ID | 663 |
Feature activation | -5.08e-02 |
Pos logit contributions | |
Marshal | +0.016 |
lator | +0.016 |
iler | +0.014 |
layer | +0.014 |
Gutenberg | +0.014 |
Neg logit contributions | |
ensed | -0.016 |
icably | -0.016 |
scam | -0.015 |
ous | -0.014 |
ighting | -0.014 |
Token | website |
Token ID | 3052 |
Feature activation | -2.63e-02 |
Pos logit contributions | |
ensed | +0.039 |
icably | +0.038 |
scam | +0.038 |
ous | +0.035 |
ighting | +0.034 |
Neg logit contributions | |
Marshal | -0.038 |
lator | -0.037 |
iler | -0.033 |
layer | -0.033 |
Gutenberg | -0.032 |
Token | disp |
Token ID | 4596 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
ensed | +0.017 |
icably | +0.017 |
scam | +0.016 |
ous | +0.015 |
ighting | +0.015 |
Neg logit contributions | |
Marshal | -0.023 |
lator | -0.022 |
iler | -0.020 |
layer | -0.020 |
Gutenberg | -0.020 |
Token | ensed |
Token ID | 15385 |
Feature activation | -6.63e-01 |
Pos logit contributions | |
ensed | +0.005 |
scam | +0.004 |
icably | +0.004 |
recomm | -0.004 |
ous | -0.004 |
Neg logit contributions | |
Marshal | -0.176 |
lator | -0.175 |
iler | -0.165 |
layer | -0.164 |
Gutenberg | -0.162 |
Token | with |
Token ID | 351 |
Feature activation | +6.36e-02 |
Pos logit contributions | |
ensed | +0.503 |
scam | +0.490 |
icably | +0.488 |
ous | +0.449 |
ash | +0.446 |
Neg logit contributions | |
Marshal | -0.499 |
lator | -0.493 |
iler | -0.431 |
layer | -0.429 |
Gutenberg | -0.421 |
Token | nudity |
Token ID | 42156 |
Feature activation | -1.65e-01 |
Pos logit contributions | |
Marshal | +0.054 |
lator | +0.053 |
iler | +0.047 |
layer | +0.047 |
Gutenberg | +0.046 |
Neg logit contributions | |
ensed | -0.043 |
icably | -0.041 |
scam | -0.041 |
ous | -0.037 |
ighting | -0.037 |
Token | . |
Token ID | 13 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
ensed | +0.122 |
icably | +0.119 |
scam | +0.117 |
ighting | +0.107 |
ella | +0.107 |
Neg logit contributions | |
Marshal | -0.128 |
lator | -0.126 |
iler | -0.111 |
layer | -0.111 |
Gutenberg | -0.110 |
Token | As |
Token ID | 1081 |
Feature activation | +1.24e-01 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.025 |
iler | +0.022 |
layer | +0.022 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.023 |
icably | -0.023 |
scam | -0.022 |
ous | -0.021 |
ighting | -0.020 |
Token | a |
Token ID | 257 |
Feature activation | +9.67e-02 |
Pos logit contributions | |
Marshal | +0.099 |
lator | +0.097 |
iler | +0.086 |
layer | +0.086 |
Gutenberg | +0.085 |
Neg logit contributions | |
ensed | -0.088 |
icably | -0.086 |
scam | -0.085 |
ous | -0.078 |
ighting | -0.077 |
Token | ate |
Token ID | 15063 |
Feature activation | -3.81e-02 |
Pos logit contributions | |
ensed | +0.083 |
icably | +0.081 |
scam | +0.080 |
ous | +0.073 |
ighting | +0.073 |
Neg logit contributions | |
Marshal | -0.093 |
lator | -0.092 |
iler | -0.081 |
layer | -0.081 |
Gutenberg | -0.080 |
Token | lunch |
Token ID | 9965 |
Feature activation | +2.41e-01 |
Pos logit contributions | |
ensed | +0.028 |
icably | +0.027 |
scam | +0.027 |
ous | +0.025 |
ash | +0.025 |
Neg logit contributions | |
Marshal | -0.030 |
lator | -0.029 |
iler | -0.026 |
layer | -0.026 |
Gutenberg | -0.025 |
Token | with |
Token ID | 351 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
Marshal | +0.177 |
lator | +0.173 |
iler | +0.151 |
layer | +0.151 |
Gutenberg | +0.149 |
Neg logit contributions | |
ensed | -0.189 |
icably | -0.184 |
scam | -0.182 |
ous | -0.168 |
ighting | -0.168 |
Token | fellow |
Token ID | 5891 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.008 |
icably | -0.008 |
scam | -0.008 |
ous | -0.007 |
ighting | -0.007 |
Token | parliament |
Token ID | 8540 |
Feature activation | -1.47e-01 |
Pos logit contributions | |
ensed | +0.154 |
icably | +0.149 |
scam | +0.147 |
ous | +0.136 |
ighting | +0.136 |
Neg logit contributions | |
Marshal | -0.164 |
lator | -0.160 |
iler | -0.141 |
layer | -0.140 |
Gutenberg | -0.139 |
Token | arians |
Token ID | 13517 |
Feature activation | -6.61e-01 |
Pos logit contributions | |
ensed | +0.041 |
icably | +0.038 |
scam | +0.037 |
ous | +0.029 |
ighting | +0.028 |
Neg logit contributions | |
Marshal | -0.182 |
lator | -0.180 |
iler | -0.167 |
layer | -0.166 |
Gutenberg | -0.164 |
Token | . |
Token ID | 13 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ensed | +0.500 |
icably | +0.486 |
scam | +0.482 |
ous | +0.444 |
ighting | +0.442 |
Neg logit contributions | |
Marshal | -0.502 |
lator | -0.491 |
iler | -0.431 |
layer | -0.429 |
Gutenberg | -0.424 |
Token |
|
Token ID | 198 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
ensed | +0.100 |
icably | +0.097 |
scam | +0.096 |
recomm | +0.088 |
ous | +0.088 |
Neg logit contributions | |
Marshal | -0.106 |
lator | -0.102 |
iler | -0.090 |
layer | -0.090 |
Gutenberg | -0.089 |
Token |
|
Token ID | 198 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
ensed | +0.119 |
icably | +0.116 |
scam | +0.114 |
ighting | +0.105 |
ous | +0.104 |
Neg logit contributions | |
Marshal | -0.129 |
lator | -0.126 |
iler | -0.111 |
layer | -0.111 |
Gutenberg | -0.109 |
Token | With |
Token ID | 3152 |
Feature activation | -9.02e-02 |
Pos logit contributions | |
ensed | +0.122 |
icably | +0.118 |
scam | +0.117 |
recomm | +0.105 |
ighting | +0.105 |
Neg logit contributions | |
Marshal | -0.161 |
lator | -0.158 |
layer | -0.141 |
iler | -0.141 |
Gutenberg | -0.139 |
Token | the |
Token ID | 262 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
ensed | +0.066 |
icably | +0.064 |
scam | +0.064 |
ous | +0.058 |
ella | +0.058 |
Neg logit contributions | |
Marshal | -0.071 |
lator | -0.069 |
iler | -0.061 |
layer | -0.061 |
Gutenberg | -0.060 |
Token |
|
Token ID | 198 |
Feature activation | -4.72e-02 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.019 |
scam | +0.019 |
ighting | +0.018 |
recomm | +0.017 |
Neg logit contributions | |
Marshal | -0.021 |
lator | -0.021 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.018 |
Token | Cl |
Token ID | 2601 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ensed | +0.035 |
icably | +0.034 |
scam | +0.034 |
ighting | +0.031 |
ous | +0.031 |
Neg logit contributions | |
Marshal | -0.037 |
lator | -0.036 |
iler | -0.032 |
layer | -0.032 |
Gutenberg | -0.031 |
Token | osing |
Token ID | 2752 |
Feature activation | +9.37e-03 |
Pos logit contributions | |
ensed | +0.206 |
icably | +0.199 |
scam | +0.198 |
recomm | +0.177 |
ous | +0.176 |
Neg logit contributions | |
Marshal | -0.327 |
lator | -0.323 |
iler | -0.292 |
layer | -0.290 |
Gutenberg | -0.286 |
Token | the |
Token ID | 262 |
Feature activation | -3.91e-02 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.007 |
icably | -0.006 |
scam | -0.006 |
ous | -0.006 |
ighting | -0.006 |
Token | Sutton |
Token ID | 39964 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ensed | +0.029 |
icably | +0.028 |
scam | +0.028 |
ous | +0.026 |
ighting | +0.026 |
Neg logit contributions | |
Marshal | -0.030 |
lator | -0.030 |
iler | -0.026 |
layer | -0.026 |
Gutenberg | -0.026 |
Token | ash |
Token ID | 12530 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
Marshal | +0.154 |
lator | +0.151 |
iler | +0.133 |
layer | +0.132 |
Gutenberg | +0.130 |
Neg logit contributions | |
ensed | -0.155 |
icably | -0.151 |
scam | -0.150 |
ous | -0.138 |
ighting | -0.137 |
Token | ponds |
Token ID | 47339 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
ensed | +0.413 |
icably | +0.399 |
scam | +0.398 |
ous | +0.360 |
ighting | +0.356 |
Neg logit contributions | |
Marshal | -0.576 |
lator | -0.567 |
iler | -0.508 |
layer | -0.504 |
Gutenberg | -0.500 |
Token | once |
Token ID | 1752 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
ensed | +0.165 |
icably | +0.160 |
scam | +0.159 |
ous | +0.145 |
ighting | +0.145 |
Neg logit contributions | |
Marshal | -0.196 |
lator | -0.193 |
iler | -0.171 |
layer | -0.170 |
Gutenberg | -0.168 |
Token | lined |
Token ID | 16566 |
Feature activation | -5.89e-02 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.010 |
ighting | +0.009 |
ous | +0.009 |
Neg logit contributions | |
Marshal | -0.012 |
lator | -0.012 |
iler | -0.011 |
layer | -0.011 |
Gutenberg | -0.010 |
Token | structural |
Token ID | 13204 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ensed | +0.043 |
icably | +0.042 |
scam | +0.042 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.046 |
lator | -0.045 |
iler | -0.040 |
layer | -0.040 |
Gutenberg | -0.039 |
Token | fill |
Token ID | 6070 |
Feature activation | +4.88e-02 |
Pos logit contributions | |
Marshal | +0.185 |
lator | +0.182 |
iler | +0.161 |
layer | +0.160 |
Gutenberg | +0.158 |
Neg logit contributions | |
ensed | -0.169 |
icably | -0.164 |
scam | -0.163 |
ous | -0.149 |
ighting | -0.149 |
Token | Brennan |
Token ID | 26577 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ensed | +0.134 |
icably | +0.130 |
scam | +0.129 |
ous | +0.120 |
ighting | +0.120 |
Neg logit contributions | |
Marshal | -0.115 |
lator | -0.112 |
iler | -0.097 |
layer | -0.097 |
Gutenberg | -0.096 |
Token | Center |
Token ID | 3337 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
ensed | +0.112 |
icably | +0.108 |
scam | +0.108 |
ous | +0.099 |
ighting | +0.099 |
Neg logit contributions | |
Marshal | -0.112 |
lator | -0.110 |
iler | -0.097 |
layer | -0.096 |
Gutenberg | -0.095 |
Token | filed |
Token ID | 5717 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
Marshal | +0.018 |
lator | +0.018 |
iler | +0.016 |
layer | +0.016 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.015 |
icably | -0.014 |
scam | -0.014 |
ighting | -0.013 |
ous | -0.013 |
Token | an |
Token ID | 281 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
ensed | +0.194 |
icably | +0.189 |
scam | +0.187 |
ous | +0.172 |
ighting | +0.171 |
Neg logit contributions | |
Marshal | -0.201 |
lator | -0.197 |
iler | -0.173 |
layer | -0.172 |
Gutenberg | -0.170 |
Token | am |
Token ID | 716 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.009 |
ighting | +0.009 |
ous | +0.009 |
Neg logit contributions | |
Marshal | -0.010 |
lator | -0.010 |
iler | -0.009 |
layer | -0.009 |
Gutenberg | -0.009 |
Token | icus |
Token ID | 24552 |
Feature activation | -6.53e-01 |
Pos logit contributions | |
ensed | +0.052 |
scam | +0.047 |
icably | +0.046 |
ighting | +0.035 |
recomm | +0.035 |
Neg logit contributions | |
Marshal | -0.250 |
lator | -0.247 |
iler | -0.230 |
layer | -0.229 |
Gutenberg | -0.226 |
Token | brief |
Token ID | 4506 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
ensed | +0.370 |
icably | +0.359 |
scam | +0.354 |
ighting | +0.319 |
ella | +0.311 |
Neg logit contributions | |
Marshal | -0.618 |
lator | -0.604 |
iler | -0.551 |
layer | -0.546 |
Gutenberg | -0.538 |
Token | calling |
Token ID | 4585 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
ensed | +0.175 |
icably | +0.171 |
scam | +0.169 |
ighting | +0.154 |
ous | +0.154 |
Neg logit contributions | |
Marshal | -0.198 |
lator | -0.194 |
iler | -0.172 |
layer | -0.171 |
Gutenberg | -0.169 |
Token | for |
Token ID | 329 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
Marshal | +0.133 |
lator | +0.130 |
iler | +0.117 |
layer | +0.115 |
Gutenberg | +0.115 |
Neg logit contributions | |
ensed | -0.108 |
icably | -0.104 |
scam | -0.103 |
ighting | -0.094 |
ella | -0.093 |
Token | the |
Token ID | 262 |
Feature activation | -6.66e-02 |
Pos logit contributions | |
ensed | +0.087 |
icably | +0.084 |
scam | +0.083 |
ous | +0.076 |
ighting | +0.076 |
Neg logit contributions | |
Marshal | -0.094 |
lator | -0.092 |
iler | -0.081 |
layer | -0.081 |
Gutenberg | -0.080 |
Token | Court |
Token ID | 3078 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
ensed | +0.053 |
icably | +0.052 |
scam | +0.051 |
ous | +0.047 |
ighting | +0.047 |
Neg logit contributions | |
Marshal | -0.048 |
lator | -0.047 |
iler | -0.041 |
layer | -0.041 |
Gutenberg | -0.040 |
Token | that |
Token ID | 326 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
Marshal | +0.025 |
lator | +0.024 |
iler | +0.022 |
layer | +0.022 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.019 |
icably | -0.018 |
scam | -0.018 |
ighting | -0.017 |
ous | -0.017 |
Token | two |
Token ID | 734 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
ensed | +0.076 |
icably | +0.074 |
scam | +0.073 |
ous | +0.067 |
ighting | +0.067 |
Neg logit contributions | |
Marshal | -0.081 |
lator | -0.079 |
iler | -0.070 |
layer | -0.070 |
Gutenberg | -0.069 |
Token | separate |
Token ID | 4553 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
ensed | +0.022 |
icably | +0.021 |
scam | +0.021 |
ous | +0.019 |
ighting | +0.019 |
Neg logit contributions | |
Marshal | -0.025 |
lator | -0.025 |
iler | -0.022 |
layer | -0.022 |
Gutenberg | -0.021 |
Token | Russian |
Token ID | 3394 |
Feature activation | +6.53e-02 |
Pos logit contributions | |
Marshal | +0.081 |
lator | +0.080 |
iler | +0.071 |
layer | +0.070 |
Gutenberg | +0.070 |
Neg logit contributions | |
ensed | -0.071 |
icably | -0.069 |
scam | -0.068 |
ous | -0.062 |
ighting | -0.062 |
Token | intelligence |
Token ID | 4430 |
Feature activation | +5.43e-03 |
Pos logit contributions | |
Marshal | +0.052 |
lator | +0.052 |
iler | +0.046 |
layer | +0.045 |
Gutenberg | +0.045 |
Neg logit contributions | |
ensed | -0.047 |
icably | -0.045 |
scam | -0.045 |
ous | -0.041 |
ighting | -0.041 |
Token | groups |
Token ID | 2628 |
Feature activation | -6.43e-01 |
Pos logit contributions | |
Marshal | +0.005 |
lator | +0.005 |
iler | +0.005 |
layer | +0.005 |
Gutenberg | +0.005 |
Neg logit contributions | |
ensed | -0.003 |
icably | -0.003 |
scam | -0.003 |
ous | -0.003 |
ighting | -0.003 |
Token | had |
Token ID | 550 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
ensed | +0.446 |
icably | +0.434 |
scam | +0.426 |
ighting | +0.391 |
ous | +0.391 |
Neg logit contributions | |
Marshal | -0.528 |
lator | -0.517 |
iler | -0.460 |
layer | -0.458 |
Gutenberg | -0.453 |
Token | gained |
Token ID | 8618 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
ensed | +0.048 |
icably | +0.047 |
scam | +0.046 |
ighting | +0.043 |
ous | +0.042 |
Neg logit contributions | |
Marshal | -0.059 |
lator | -0.057 |
iler | -0.051 |
layer | -0.051 |
Gutenberg | -0.050 |
Token | access |
Token ID | 1895 |
Feature activation | -4.50e-02 |
Pos logit contributions | |
ensed | +0.087 |
icably | +0.084 |
scam | +0.083 |
ous | +0.076 |
recomm | +0.075 |
Neg logit contributions | |
Marshal | -0.114 |
lator | -0.112 |
iler | -0.100 |
layer | -0.099 |
Gutenberg | -0.098 |
Token | to |
Token ID | 284 |
Feature activation | -6.28e-02 |
Pos logit contributions | |
ensed | +0.031 |
icably | +0.030 |
scam | +0.030 |
ous | +0.028 |
ighting | +0.027 |
Neg logit contributions | |
Marshal | -0.037 |
lator | -0.036 |
iler | -0.032 |
layer | -0.032 |
Gutenberg | -0.032 |
Token | the |
Token ID | 262 |
Feature activation | -7.04e-02 |
Pos logit contributions | |
ensed | +0.045 |
icably | +0.044 |
scam | +0.043 |
ous | +0.040 |
ighting | +0.040 |
Neg logit contributions | |
Marshal | -0.050 |
lator | -0.049 |
iler | -0.044 |
layer | -0.043 |
Gutenberg | -0.043 |
Token | aylor |
Token ID | 7167 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
ensed | +0.008 |
icably | +0.007 |
scam | +0.007 |
recomm | +0.006 |
ighting | +0.006 |
Neg logit contributions | |
Marshal | -0.018 |
lator | -0.018 |
iler | -0.016 |
layer | -0.016 |
Gutenberg | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -3.73e-02 |
Pos logit contributions | |
ensed | +0.174 |
scam | +0.168 |
icably | +0.168 |
ous | +0.156 |
ella | +0.155 |
Neg logit contributions | |
Marshal | -0.178 |
lator | -0.175 |
iler | -0.153 |
layer | -0.153 |
Gutenberg | -0.152 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
ensed | +0.027 |
icably | +0.026 |
scam | +0.026 |
ous | +0.024 |
ella | +0.024 |
Neg logit contributions | |
Marshal | -0.030 |
lator | -0.029 |
iler | -0.026 |
layer | -0.026 |
Gutenberg | -0.025 |
Token | Chief |
Token ID | 23675 |
Feature activation | +2.17e-01 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.019 |
scam | +0.019 |
ous | +0.018 |
ighting | +0.017 |
Neg logit contributions | |
Marshal | -0.023 |
lator | -0.023 |
iler | -0.020 |
layer | -0.020 |
Gutenberg | -0.020 |
Token | Special |
Token ID | 6093 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
Marshal | +0.145 |
lator | +0.142 |
iler | +0.122 |
layer | +0.121 |
Gutenberg | +0.120 |
Neg logit contributions | |
ensed | -0.184 |
icably | -0.180 |
scam | -0.179 |
ous | -0.166 |
ighting | -0.165 |
Token | Prosecutor |
Token ID | 37478 |
Feature activation | +3.16e-01 |
Pos logit contributions | |
Marshal | +0.107 |
lator | +0.105 |
iler | +0.091 |
layer | +0.090 |
Gutenberg | +0.089 |
Neg logit contributions | |
ensed | -0.129 |
icably | -0.126 |
scam | -0.125 |
ous | -0.116 |
ighting | -0.116 |
Token | , |
Token ID | 11 |
Feature activation | -6.75e-02 |
Pos logit contributions | |
Marshal | +0.245 |
lator | +0.241 |
iler | +0.212 |
layer | +0.211 |
Gutenberg | +0.208 |
Neg logit contributions | |
ensed | -0.234 |
icably | -0.227 |
scam | -0.226 |
ous | -0.208 |
ighting | -0.206 |
Token | K |
Token ID | 509 |
Feature activation | +5.85e-02 |
Pos logit contributions | |
ensed | +0.052 |
icably | +0.051 |
scam | +0.050 |
ous | +0.046 |
ighting | +0.046 |
Neg logit contributions | |
Marshal | -0.050 |
lator | -0.049 |
iler | -0.043 |
layer | -0.043 |
Gutenberg | -0.042 |
Token | atic |
Token ID | 1512 |
Feature activation | -7.65e-02 |
Pos logit contributions | |
Marshal | +0.046 |
lator | +0.045 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.039 |
Neg logit contributions | |
ensed | -0.042 |
icably | -0.041 |
scam | -0.041 |
ous | -0.038 |
ighting | -0.037 |
Token | a |
Token ID | 64 |
Feature activation | -2.21e-01 |
Pos logit contributions | |
ensed | +0.057 |
icably | +0.055 |
scam | +0.055 |
ous | +0.051 |
ella | +0.050 |
Neg logit contributions | |
Marshal | -0.059 |
lator | -0.058 |
iler | -0.051 |
layer | -0.051 |
Gutenberg | -0.050 |
Token | Jane |
Token ID | 12091 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
ensed | +0.169 |
icably | +0.164 |
scam | +0.164 |
ous | +0.151 |
ella | +0.150 |
Neg logit contributions | |
Marshal | -0.166 |
lator | -0.163 |
iler | -0.143 |
layer | -0.142 |
Gutenberg | -0.140 |
Token | Human |
Token ID | 20490 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
Marshal | +0.035 |
lator | +0.034 |
iler | +0.030 |
layer | +0.030 |
Gutenberg | +0.029 |
Neg logit contributions | |
ensed | -0.036 |
icably | -0.035 |
scam | -0.035 |
ous | -0.032 |
ighting | -0.032 |
Token | Resource |
Token ID | 20857 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
Marshal | +0.136 |
lator | +0.133 |
iler | +0.117 |
layer | +0.117 |
Gutenberg | +0.115 |
Neg logit contributions | |
ensed | -0.128 |
icably | -0.125 |
scam | -0.124 |
ous | -0.114 |
ighting | -0.113 |
Token | Management |
Token ID | 8549 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
ensed | +0.135 |
icably | +0.131 |
scam | +0.130 |
ous | +0.121 |
ighting | +0.120 |
Neg logit contributions | |
Marshal | -0.114 |
lator | -0.112 |
iler | -0.097 |
layer | -0.096 |
Gutenberg | -0.095 |
Token | from |
Token ID | 422 |
Feature activation | -7.12e-02 |
Pos logit contributions | |
Marshal | +0.097 |
lator | +0.095 |
iler | +0.084 |
layer | +0.083 |
Gutenberg | +0.082 |
Neg logit contributions | |
ensed | -0.094 |
icably | -0.092 |
scam | -0.091 |
ous | -0.083 |
ighting | -0.083 |
Token | Louisiana |
Token ID | 13340 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ensed | +0.047 |
icably | +0.046 |
scam | +0.046 |
ighting | +0.041 |
ous | +0.041 |
Neg logit contributions | |
Marshal | -0.061 |
lator | -0.059 |
iler | -0.053 |
layer | -0.053 |
Gutenberg | -0.052 |
Token | State |
Token ID | 1812 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
ensed | +0.139 |
icably | +0.136 |
scam | +0.135 |
ous | +0.127 |
ighting | +0.126 |
Neg logit contributions | |
Marshal | -0.078 |
lator | -0.076 |
iler | -0.063 |
layer | -0.063 |
Gutenberg | -0.061 |
Token | University |
Token ID | 2059 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
Marshal | +0.243 |
lator | +0.239 |
iler | +0.210 |
layer | +0.209 |
Gutenberg | +0.207 |
Neg logit contributions | |
ensed | -0.234 |
icably | -0.227 |
scam | -0.226 |
ous | -0.208 |
recomm | -0.206 |
Token | . |
Token ID | 13 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
ensed | +0.085 |
icably | +0.082 |
scam | +0.082 |
ous | +0.076 |
ighting | +0.075 |
Neg logit contributions | |
Marshal | -0.077 |
lator | -0.075 |
iler | -0.065 |
layer | -0.065 |
Gutenberg | -0.064 |
Token | How |
Token ID | 1374 |
Feature activation | +1.17e-01 |
Pos logit contributions | |
Marshal | +0.016 |
lator | +0.016 |
iler | +0.014 |
layer | +0.014 |
Gutenberg | +0.013 |
Neg logit contributions | |
ensed | -0.021 |
icably | -0.021 |
scam | -0.021 |
ous | -0.019 |
ighting | -0.019 |
Token | common |
Token ID | 2219 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
Marshal | +0.097 |
lator | +0.095 |
iler | +0.085 |
layer | +0.084 |
Gutenberg | +0.084 |
Neg logit contributions | |
ensed | -0.080 |
icably | -0.077 |
scam | -0.076 |
ighting | -0.070 |
ous | -0.069 |
Token | is |
Token ID | 318 |
Feature activation | +7.31e-02 |
Pos logit contributions | |
Marshal | +0.112 |
lator | +0.110 |
iler | +0.096 |
layer | +0.096 |
Gutenberg | +0.094 |
Neg logit contributions | |
ensed | -0.122 |
icably | -0.118 |
scam | -0.117 |
ighting | -0.108 |
ous | -0.108 |
Token | B |
Token ID | 347 |
Feature activation | +6.59e-02 |
Pos logit contributions | |
Marshal | +0.134 |
lator | +0.131 |
iler | +0.115 |
layer | +0.114 |
Gutenberg | +0.113 |
Neg logit contributions | |
ensed | -0.138 |
icably | -0.134 |
scam | -0.133 |
ous | -0.123 |
ighting | -0.122 |
Token | erc |
Token ID | 2798 |
Feature activation | -3.03e-02 |
Pos logit contributions | |
Marshal | +0.053 |
lator | +0.052 |
iler | +0.046 |
layer | +0.046 |
Gutenberg | +0.046 |
Neg logit contributions | |
ensed | -0.046 |
icably | -0.045 |
scam | -0.045 |
ous | -0.041 |
ighting | -0.041 |
Token | owitz |
Token ID | 20951 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
ensed | +0.023 |
icably | +0.022 |
scam | +0.022 |
ighting | +0.020 |
recomm | +0.020 |
Neg logit contributions | |
Marshal | -0.023 |
lator | -0.022 |
iler | -0.020 |
layer | -0.020 |
Gutenberg | -0.019 |
Token | noted |
Token ID | 4367 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
Marshal | +0.159 |
lator | +0.155 |
iler | +0.138 |
layer | +0.137 |
Gutenberg | +0.135 |
Neg logit contributions | |
ensed | -0.139 |
icably | -0.135 |
scam | -0.134 |
ous | -0.122 |
ighting | -0.122 |
Token | four |
Token ID | 1440 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
Marshal | +0.022 |
lator | +0.022 |
iler | +0.019 |
layer | +0.019 |
Gutenberg | +0.019 |
Neg logit contributions | |
ensed | -0.017 |
icably | -0.017 |
scam | -0.017 |
ous | -0.015 |
ighting | -0.015 |
Token | primary |
Token ID | 4165 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
ensed | +0.003 |
icably | +0.003 |
scam | +0.003 |
ous | +0.003 |
ighting | +0.003 |
Neg logit contributions | |
Marshal | -0.004 |
lator | -0.003 |
iler | -0.003 |
layer | -0.003 |
Gutenberg | -0.003 |
Token | factions |
Token ID | 18783 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
Marshal | +0.269 |
lator | +0.264 |
iler | +0.235 |
layer | +0.234 |
Gutenberg | +0.232 |
Neg logit contributions | |
ensed | -0.219 |
icably | -0.211 |
scam | -0.209 |
ous | -0.191 |
ighting | -0.190 |
Token | at |
Token ID | 379 |
Feature activation | +6.69e-02 |
Pos logit contributions | |
ensed | +0.113 |
icably | +0.110 |
scam | +0.108 |
ella | +0.099 |
ous | +0.099 |
Neg logit contributions | |
Marshal | -0.132 |
lator | -0.128 |
iler | -0.115 |
layer | -0.114 |
Gutenberg | -0.112 |
Token | this |
Token ID | 428 |
Feature activation | +5.72e-02 |
Pos logit contributions | |
Marshal | +0.057 |
lator | +0.056 |
iler | +0.050 |
layer | +0.049 |
Gutenberg | +0.049 |
Neg logit contributions | |
ensed | -0.045 |
icably | -0.043 |
scam | -0.043 |
ous | -0.039 |
ighting | -0.039 |
Token | gathering |
Token ID | 11228 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.047 |
iler | +0.042 |
layer | +0.042 |
Gutenberg | +0.041 |
Neg logit contributions | |
ensed | -0.039 |
icably | -0.038 |
scam | -0.037 |
ous | -0.034 |
ighting | -0.034 |
Token | , |
Token ID | 11 |
Feature activation | +7.48e-02 |
Pos logit contributions | |
ensed | +0.146 |
icably | +0.142 |
scam | +0.140 |
ighting | +0.129 |
ous | +0.129 |
Neg logit contributions | |
Marshal | -0.141 |
lator | -0.137 |
iler | -0.120 |
layer | -0.120 |
Gutenberg | -0.118 |
Token | have |
Token ID | 423 |
Feature activation | +7.09e-02 |
Pos logit contributions | |
ensed | +0.043 |
icably | +0.042 |
scam | +0.041 |
ous | +0.038 |
ighting | +0.038 |
Neg logit contributions | |
Marshal | -0.045 |
lator | -0.044 |
iler | -0.039 |
layer | -0.038 |
Gutenberg | -0.038 |
Token | a |
Token ID | 257 |
Feature activation | +7.77e-02 |
Pos logit contributions | |
Marshal | +0.058 |
lator | +0.057 |
iler | +0.050 |
layer | +0.050 |
Gutenberg | +0.049 |
Neg logit contributions | |
ensed | -0.050 |
icably | -0.048 |
scam | -0.048 |
ous | -0.044 |
ighting | -0.043 |
Token | hot |
Token ID | 3024 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
Marshal | +0.065 |
lator | +0.064 |
iler | +0.057 |
layer | +0.056 |
Gutenberg | +0.056 |
Neg logit contributions | |
ensed | -0.053 |
icably | -0.051 |
scam | -0.051 |
ous | -0.047 |
ighting | -0.046 |
Token | bod |
Token ID | 16429 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
Marshal | +0.109 |
lator | +0.107 |
iler | +0.096 |
layer | +0.095 |
Gutenberg | +0.094 |
Neg logit contributions | |
ensed | -0.093 |
icably | -0.091 |
scam | -0.090 |
ous | -0.082 |
ighting | -0.082 |
Token | . |
Token ID | 13 |
Feature activation | +3.67e-02 |
Pos logit contributions | |
Marshal | +0.191 |
lator | +0.187 |
iler | +0.166 |
layer | +0.165 |
Gutenberg | +0.163 |
Neg logit contributions | |
ensed | -0.166 |
icably | -0.161 |
scam | -0.160 |
ous | -0.146 |
ighting | -0.145 |
Token | Let |
Token ID | 3914 |
Feature activation | +3.26e-01 |
Pos logit contributions | |
Marshal | +0.029 |
lator | +0.028 |
iler | +0.025 |
layer | +0.025 |
Gutenberg | +0.024 |
Neg logit contributions | |
ensed | -0.027 |
icably | -0.026 |
scam | -0.026 |
ous | -0.024 |
ighting | -0.024 |
Token | 's |
Token ID | 338 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
Marshal | +0.265 |
lator | +0.260 |
iler | +0.231 |
layer | +0.229 |
Gutenberg | +0.227 |
Neg logit contributions | |
ensed | -0.228 |
icably | -0.221 |
scam | -0.219 |
ous | -0.200 |
ighting | -0.200 |
Token | not |
Token ID | 407 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
Marshal | +0.020 |
lator | +0.020 |
iler | +0.018 |
layer | +0.018 |
Gutenberg | +0.017 |
Neg logit contributions | |
ensed | -0.017 |
icably | -0.017 |
scam | -0.017 |
ous | -0.015 |
ighting | -0.015 |
Token | pretend |
Token ID | 16614 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
Marshal | +0.118 |
lator | +0.115 |
iler | +0.103 |
layer | +0.102 |
Gutenberg | +0.101 |
Neg logit contributions | |
ensed | -0.099 |
icably | -0.095 |
scam | -0.094 |
ous | -0.086 |
ighting | -0.086 |
Token | we |
Token ID | 356 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
Marshal | +0.144 |
lator | +0.142 |
iler | +0.127 |
layer | +0.127 |
Gutenberg | +0.125 |
Neg logit contributions | |
ensed | -0.101 |
icably | -0.097 |
scam | -0.096 |
ous | -0.087 |
ighting | -0.087 |
Token | 're |
Token ID | 821 |
Feature activation | +8.79e-02 |
Pos logit contributions | |
Marshal | +0.082 |
lator | +0.080 |
iler | +0.071 |
layer | +0.070 |
Gutenberg | +0.069 |
Neg logit contributions | |
ensed | -0.080 |
icably | -0.077 |
scam | -0.076 |
ous | -0.070 |
ighting | -0.070 |
Token | ground |
Token ID | 2323 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Marshal | +0.108 |
lator | +0.105 |
iler | +0.094 |
layer | +0.093 |
Gutenberg | +0.092 |
Neg logit contributions | |
ensed | -0.089 |
icably | -0.086 |
scam | -0.085 |
ous | -0.078 |
ella | -0.078 |
Token | testing |
Token ID | 4856 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
Marshal | +0.105 |
lator | +0.103 |
iler | +0.091 |
layer | +0.091 |
Gutenberg | +0.089 |
Neg logit contributions | |
ensed | -0.093 |
icably | -0.091 |
scam | -0.089 |
ous | -0.081 |
ella | -0.081 |
Token | and |
Token ID | 290 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
ensed | +0.114 |
icably | +0.110 |
scam | +0.109 |
ous | +0.099 |
ighting | +0.099 |
Neg logit contributions | |
Marshal | -0.134 |
lator | -0.132 |
iler | -0.117 |
layer | -0.116 |
Gutenberg | -0.115 |
Token | in |
Token ID | 287 |
Feature activation | +6.04e-02 |
Pos logit contributions | |
Marshal | +0.031 |
lator | +0.031 |
iler | +0.027 |
layer | +0.027 |
Gutenberg | +0.027 |
Neg logit contributions | |
ensed | -0.028 |
icably | -0.027 |
scam | -0.027 |
ous | -0.024 |
ighting | -0.024 |
Token | - |
Token ID | 12 |
Feature activation | +8.80e-02 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.047 |
iler | +0.042 |
layer | +0.041 |
Gutenberg | +0.041 |
Neg logit contributions | |
ensed | -0.044 |
icably | -0.043 |
scam | -0.042 |
ous | -0.039 |
ighting | -0.038 |
Token | flight |
Token ID | 22560 |
Feature activation | +3.83e-01 |
Pos logit contributions | |
Marshal | +0.045 |
lator | +0.044 |
layer | +0.036 |
iler | +0.036 |
Gutenberg | +0.034 |
Neg logit contributions | |
ensed | -0.088 |
icably | -0.086 |
scam | -0.086 |
ous | -0.081 |
recomm | -0.080 |
Token | operation |
Token ID | 4905 |
Feature activation | -8.88e-02 |
Pos logit contributions | |
Marshal | +0.319 |
lator | +0.312 |
iler | +0.278 |
layer | +0.276 |
Gutenberg | +0.273 |
Neg logit contributions | |
ensed | -0.263 |
icably | -0.256 |
scam | -0.251 |
ous | -0.229 |
ella | -0.229 |
Token | , |
Token ID | 11 |
Feature activation | +2.66e-02 |
Pos logit contributions | |
ensed | +0.065 |
icably | +0.063 |
scam | +0.063 |
ous | +0.058 |
ighting | +0.057 |
Neg logit contributions | |
Marshal | -0.069 |
lator | -0.068 |
iler | -0.060 |
layer | -0.060 |
Gutenberg | -0.059 |
Token | tele |
Token ID | 5735 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
Marshal | +0.023 |
lator | +0.022 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.020 |
Neg logit contributions | |
ensed | -0.017 |
icably | -0.017 |
scam | -0.017 |
ous | -0.015 |
ighting | -0.015 |
Token | metry |
Token ID | 41935 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
ensed | +0.151 |
icably | +0.147 |
scam | +0.146 |
ous | +0.135 |
ighting | +0.135 |
Neg logit contributions | |
Marshal | -0.126 |
lator | -0.123 |
iler | -0.107 |
layer | -0.106 |
Gutenberg | -0.105 |
Token | system |
Token ID | 1080 |
Feature activation | -6.94e-02 |
Pos logit contributions | |
ensed | +0.011 |
icably | +0.011 |
scam | +0.011 |
ighting | +0.010 |
ella | +0.010 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.015 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.013 |
Token | media |
Token ID | 2056 |
Feature activation | +6.31e-02 |
Pos logit contributions | |
Marshal | +0.173 |
lator | +0.170 |
iler | +0.152 |
layer | +0.151 |
Gutenberg | +0.149 |
Neg logit contributions | |
ensed | -0.133 |
icably | -0.128 |
scam | -0.127 |
ous | -0.116 |
ighting | -0.115 |
Token | pages |
Token ID | 5468 |
Feature activation | +2.51e-02 |
Pos logit contributions | |
Marshal | +0.052 |
lator | +0.050 |
iler | +0.045 |
layer | +0.044 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.044 |
icably | -0.043 |
scam | -0.042 |
ighting | -0.038 |
ous | -0.038 |
Token | , |
Token ID | 11 |
Feature activation | +8.60e-02 |
Pos logit contributions | |
Marshal | +0.020 |
lator | +0.020 |
iler | +0.017 |
layer | +0.017 |
Gutenberg | +0.017 |
Neg logit contributions | |
ensed | -0.018 |
icably | -0.017 |
scam | -0.017 |
ous | -0.016 |
ighting | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
Marshal | +0.072 |
lator | +0.071 |
iler | +0.063 |
layer | +0.063 |
Gutenberg | +0.062 |
Neg logit contributions | |
ensed | -0.059 |
icably | -0.056 |
scam | -0.056 |
ous | -0.051 |
ighting | -0.051 |
Token | you |
Token ID | 345 |
Feature activation | -5.66e-02 |
Pos logit contributions | |
Marshal | +0.049 |
lator | +0.048 |
iler | +0.043 |
layer | +0.043 |
Gutenberg | +0.042 |
Neg logit contributions | |
ensed | -0.043 |
icably | -0.042 |
scam | -0.041 |
ous | -0.038 |
ighting | -0.038 |
Token | can |
Token ID | 460 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
ensed | +0.037 |
icably | +0.036 |
scam | +0.036 |
ous | +0.033 |
ighting | +0.032 |
Neg logit contributions | |
Marshal | -0.048 |
lator | -0.048 |
iler | -0.042 |
layer | -0.042 |
Gutenberg | -0.042 |
Token | get |
Token ID | 651 |
Feature activation | +1.51e-02 |
Pos logit contributions | |
ensed | +0.018 |
icably | +0.017 |
scam | +0.017 |
ous | +0.016 |
ighting | +0.016 |
Neg logit contributions | |
Marshal | -0.022 |
lator | -0.021 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.019 |
Token | a |
Token ID | 257 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
Marshal | +0.012 |
lator | +0.012 |
iler | +0.010 |
layer | +0.010 |
Gutenberg | +0.010 |
Neg logit contributions | |
ensed | -0.011 |
icably | -0.010 |
scam | -0.010 |
ous | -0.010 |
ighting | -0.009 |
Token | hint |
Token ID | 9254 |
Feature activation | +1.01e-03 |
Pos logit contributions | |
Marshal | +0.102 |
lator | +0.100 |
iler | +0.089 |
layer | +0.088 |
Gutenberg | +0.087 |
Neg logit contributions | |
ensed | -0.088 |
icably | -0.086 |
scam | -0.085 |
ous | -0.078 |
recomm | -0.077 |
Token | of |
Token ID | 286 |
Feature activation | +2.93e-02 |
Pos logit contributions | |
Marshal | +0.001 |
lator | +0.001 |
iler | +0.001 |
layer | +0.001 |
Gutenberg | +0.001 |
Neg logit contributions | |
ensed | -0.001 |
icably | -0.001 |
scam | -0.001 |
ous | -0.001 |
ighting | -0.001 |
Token | what |
Token ID | 644 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
Marshal | +0.019 |
lator | +0.019 |
iler | +0.016 |
layer | +0.016 |
Gutenberg | +0.016 |
Neg logit contributions | |
ensed | -0.025 |
icably | -0.025 |
scam | -0.025 |
ous | -0.023 |
ighting | -0.023 |
Token | which |
Token ID | 543 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
Marshal | +0.071 |
lator | +0.070 |
iler | +0.063 |
layer | +0.062 |
Gutenberg | +0.062 |
Neg logit contributions | |
ensed | -0.054 |
icably | -0.053 |
scam | -0.052 |
ighting | -0.047 |
ella | -0.047 |
Token | make |
Token ID | 787 |
Feature activation | +1.25e-01 |
Pos logit contributions | |
ensed | +0.029 |
icably | +0.028 |
scam | +0.028 |
ighting | +0.026 |
ous | +0.026 |
Neg logit contributions | |
Marshal | -0.034 |
lator | -0.033 |
iler | -0.029 |
layer | -0.029 |
Gutenberg | -0.029 |
Token | them |
Token ID | 606 |
Feature activation | +8.83e-02 |
Pos logit contributions | |
Marshal | +0.101 |
lator | +0.098 |
iler | +0.088 |
layer | +0.087 |
Gutenberg | +0.087 |
Neg logit contributions | |
ensed | -0.089 |
icably | -0.086 |
scam | -0.085 |
ella | -0.078 |
ighting | -0.077 |
Token | more |
Token ID | 517 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
Marshal | +0.074 |
lator | +0.073 |
iler | +0.065 |
layer | +0.065 |
Gutenberg | +0.064 |
Neg logit contributions | |
ensed | -0.060 |
icably | -0.057 |
scam | -0.057 |
ighting | -0.052 |
ous | -0.052 |
Token | suitable |
Token ID | 11080 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
Marshal | +0.146 |
lator | +0.143 |
iler | +0.128 |
layer | +0.127 |
Gutenberg | +0.126 |
Neg logit contributions | |
ensed | -0.115 |
icably | -0.110 |
scam | -0.109 |
ighting | -0.100 |
ella | -0.099 |
Token | overall |
Token ID | 4045 |
Feature activation | +2.98e-01 |
Pos logit contributions | |
ensed | +0.088 |
icably | +0.085 |
scam | +0.085 |
ous | +0.077 |
ighting | +0.077 |
Neg logit contributions | |
Marshal | -0.109 |
lator | -0.107 |
iler | -0.096 |
layer | -0.095 |
Gutenberg | -0.094 |
Token | for |
Token ID | 329 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
Marshal | +0.242 |
lator | +0.238 |
iler | +0.211 |
layer | +0.210 |
Gutenberg | +0.207 |
Neg logit contributions | |
ensed | -0.210 |
icably | -0.204 |
scam | -0.202 |
ous | -0.184 |
ighting | -0.184 |
Token | gaming |
Token ID | 7776 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ensed | +0.017 |
icably | +0.017 |
scam | +0.016 |
ighting | +0.015 |
ella | +0.015 |
Neg logit contributions | |
Marshal | -0.021 |
lator | -0.020 |
iler | -0.018 |
layer | -0.018 |
Gutenberg | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +5.76e-02 |
Pos logit contributions | |
Marshal | +0.010 |
lator | +0.010 |
iler | +0.009 |
layer | +0.009 |
Gutenberg | +0.009 |
Neg logit contributions | |
ensed | -0.009 |
icably | -0.009 |
scam | -0.009 |
ighting | -0.008 |
ella | -0.008 |
Token | Firstly |
Token ID | 41039 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
Marshal | +0.046 |
lator | +0.045 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.039 |
Neg logit contributions | |
ensed | -0.042 |
icably | -0.040 |
scam | -0.040 |
recomm | -0.036 |
ighting | -0.036 |
Token | there |
Token ID | 612 |
Feature activation | +4.10e-03 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.008 |
icably | -0.008 |
scam | -0.007 |
ous | -0.007 |
ighting | -0.007 |
Token | 7 |
Token ID | 22 |
Feature activation | +1.00e-01 |
Pos logit contributions | |
Marshal | +0.031 |
lator | +0.031 |
iler | +0.027 |
layer | +0.027 |
Gutenberg | +0.027 |
Neg logit contributions | |
ensed | -0.029 |
icably | -0.028 |
scam | -0.028 |
ous | -0.026 |
ighting | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
Marshal | +0.088 |
lator | +0.087 |
iler | +0.077 |
layer | +0.077 |
Gutenberg | +0.076 |
Neg logit contributions | |
ensed | -0.064 |
icably | -0.061 |
scam | -0.061 |
ous | -0.056 |
ighting | -0.055 |
Token | 2 |
Token ID | 362 |
Feature activation | -4.98e-03 |
Pos logit contributions | |
Marshal | +0.014 |
lator | +0.014 |
iler | +0.013 |
layer | +0.012 |
Gutenberg | +0.012 |
Neg logit contributions | |
ensed | -0.013 |
icably | -0.012 |
scam | -0.012 |
ous | -0.011 |
ighting | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +5.92e-02 |
Pos logit contributions | |
ensed | +0.004 |
icably | +0.004 |
scam | +0.004 |
ous | +0.003 |
ella | +0.003 |
Neg logit contributions | |
Marshal | -0.004 |
lator | -0.004 |
iler | -0.003 |
layer | -0.003 |
Gutenberg | -0.003 |
Token | 1 |
Token ID | 16 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
Marshal | +0.046 |
lator | +0.045 |
iler | +0.040 |
layer | +0.040 |
Gutenberg | +0.039 |
Neg logit contributions | |
ensed | -0.044 |
icably | -0.042 |
scam | -0.042 |
ous | -0.038 |
ighting | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | +4.50e-02 |
Pos logit contributions | |
ensed | +0.072 |
icably | +0.070 |
scam | +0.070 |
ous | +0.063 |
recomm | +0.062 |
Neg logit contributions | |
Marshal | -0.103 |
lator | -0.101 |
iler | -0.090 |
layer | -0.090 |
Gutenberg | -0.089 |
Token |
|
Token ID | 198 |
Feature activation | +5.33e-02 |
Pos logit contributions | |
Marshal | +0.036 |
lator | +0.035 |
iler | +0.031 |
layer | +0.031 |
Gutenberg | +0.030 |
Neg logit contributions | |
ensed | -0.033 |
icably | -0.032 |
scam | -0.031 |
ous | -0.029 |
ighting | -0.029 |
Token |
|
Token ID | 198 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
Marshal | +0.042 |
lator | +0.041 |
iler | +0.036 |
layer | +0.036 |
Gutenberg | +0.036 |
Neg logit contributions | |
ensed | -0.039 |
icably | -0.038 |
scam | -0.038 |
ighting | -0.034 |
ous | -0.034 |
Token | Some |
Token ID | 4366 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
Marshal | +0.022 |
lator | +0.021 |
iler | +0.019 |
layer | +0.019 |
Gutenberg | +0.019 |
Neg logit contributions | |
ensed | -0.017 |
icably | -0.016 |
scam | -0.016 |
ighting | -0.015 |
ous | -0.015 |
Token | bureaucrats |
Token ID | 34025 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
ensed | +0.068 |
icably | +0.066 |
scam | +0.065 |
ous | +0.059 |
ighting | +0.059 |
Neg logit contributions | |
Marshal | -0.083 |
lator | -0.082 |
iler | -0.073 |
layer | -0.073 |
Gutenberg | -0.071 |
Token | say |
Token ID | 910 |
Feature activation | +6.93e-02 |
Pos logit contributions | |
Marshal | +0.021 |
lator | +0.020 |
iler | +0.018 |
layer | +0.018 |
Gutenberg | +0.017 |
Neg logit contributions | |
ensed | -0.019 |
icably | -0.019 |
scam | -0.019 |
ous | -0.017 |
ighting | -0.017 |
Token | " |
Token ID | 1 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
ensed | +0.040 |
icably | +0.039 |
scam | +0.038 |
ous | +0.035 |
ighting | +0.035 |
Neg logit contributions | |
Marshal | -0.044 |
lator | -0.044 |
iler | -0.038 |
layer | -0.038 |
Gutenberg | -0.038 |
Token | & |
Token ID | 1222 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
Marshal | +0.017 |
lator | +0.017 |
iler | +0.015 |
layer | +0.015 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.016 |
icably | -0.016 |
scam | -0.015 |
ous | -0.014 |
ighting | -0.014 |
Token | ] |
Token ID | 60 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
ensed | +0.009 |
scam | +0.009 |
icably | +0.009 |
ous | +0.008 |
recomm | +0.008 |
Neg logit contributions | |
Marshal | -0.006 |
lator | -0.006 |
iler | -0.005 |
Gutenberg | -0.005 |
layer | -0.005 |
Token | @ |
Token ID | 31 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
Marshal | +0.191 |
lator | +0.189 |
iler | +0.167 |
Gutenberg | +0.166 |
layer | +0.165 |
Neg logit contributions | |
ensed | -0.179 |
icably | -0.174 |
scam | -0.174 |
ous | -0.161 |
ighting | -0.159 |
Token | Key |
Token ID | 7383 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
ensed | +0.028 |
icably | +0.028 |
scam | +0.027 |
ous | +0.026 |
ella | +0.026 |
Neg logit contributions | |
Marshal | -0.022 |
lator | -0.021 |
iler | -0.018 |
Gutenberg | -0.018 |
layer | -0.018 |
Token | Take |
Token ID | 12322 |
Feature activation | +7.66e-02 |
Pos logit contributions | |
Marshal | +0.145 |
lator | +0.143 |
iler | +0.128 |
layer | +0.127 |
Gutenberg | +0.126 |
Neg logit contributions | |
ensed | -0.105 |
icably | -0.102 |
scam | -0.101 |
ous | -0.092 |
ighting | -0.091 |
Token | [ |
Token ID | 58 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
Marshal | +0.052 |
lator | +0.051 |
iler | +0.044 |
layer | +0.044 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.064 |
icably | -0.062 |
scam | -0.061 |
ous | -0.058 |
ighting | -0.057 |
Token | index |
Token ID | 9630 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
Marshal | +0.110 |
lator | +0.109 |
iler | +0.095 |
Gutenberg | +0.094 |
layer | +0.093 |
Neg logit contributions | |
ensed | -0.119 |
icably | -0.116 |
scam | -0.116 |
ous | -0.108 |
ighting | -0.106 |
Token | State |
Token ID | 9012 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
Marshal | +0.034 |
lator | +0.034 |
iler | +0.027 |
Gutenberg | +0.027 |
layer | +0.027 |
Neg logit contributions | |
ensed | -0.065 |
icably | -0.064 |
scam | -0.064 |
ous | -0.060 |
ighting | -0.060 |
Token | , |
Token ID | 11 |
Feature activation | +2.98e-02 |
Pos logit contributions | |
Marshal | +0.214 |
lator | +0.212 |
iler | +0.184 |
layer | +0.182 |
Gutenberg | +0.182 |
Neg logit contributions | |
ensed | -0.239 |
icably | -0.232 |
scam | -0.232 |
ous | -0.216 |
ighting | -0.214 |
Token | Fl |
Token ID | 1610 |
Feature activation | -3.81e-02 |
Pos logit contributions | |
Marshal | +0.023 |
lator | +0.023 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.020 |
Neg logit contributions | |
ensed | -0.022 |
scam | -0.022 |
icably | -0.022 |
ous | -0.020 |
recomm | -0.020 |
Token | had |
Token ID | 18108 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
ensed | +0.020 |
icably | +0.020 |
scam | +0.019 |
ous | +0.018 |
ighting | +0.018 |
Neg logit contributions | |
Marshal | -0.019 |
lator | -0.019 |
iler | -0.017 |
layer | -0.017 |
Gutenberg | -0.016 |
Token | style |
Token ID | 3918 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
ensed | +0.087 |
icably | +0.084 |
scam | +0.083 |
ous | +0.076 |
ighting | +0.076 |
Neg logit contributions | |
Marshal | -0.099 |
lator | -0.097 |
iler | -0.086 |
layer | -0.086 |
Gutenberg | -0.085 |
Token | and |
Token ID | 290 |
Feature activation | +2.23e-02 |
Pos logit contributions | |
ensed | +0.015 |
icably | +0.015 |
scam | +0.014 |
ighting | +0.013 |
ous | +0.013 |
Neg logit contributions | |
Marshal | -0.021 |
lator | -0.021 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.019 |
Token | sw |
Token ID | 1509 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
Marshal | +0.018 |
lator | +0.018 |
iler | +0.016 |
layer | +0.016 |
Gutenberg | +0.016 |
Neg logit contributions | |
ensed | -0.016 |
icably | -0.015 |
scam | -0.015 |
ous | -0.014 |
ighting | -0.014 |
Token | agger |
Token ID | 7928 |
Feature activation | +3.99e-02 |
Pos logit contributions | |
Marshal | +0.164 |
lator | +0.162 |
iler | +0.146 |
layer | +0.145 |
Gutenberg | +0.143 |
Neg logit contributions | |
ensed | -0.114 |
icably | -0.111 |
scam | -0.110 |
recomm | -0.099 |
ous | -0.098 |
Token | , |
Token ID | 11 |
Feature activation | +6.07e-02 |
Pos logit contributions | |
Marshal | +0.032 |
lator | +0.032 |
iler | +0.028 |
layer | +0.028 |
Gutenberg | +0.027 |
Neg logit contributions | |
ensed | -0.028 |
icably | -0.028 |
scam | -0.027 |
ighting | -0.025 |
ous | -0.025 |
Token | and |
Token ID | 290 |
Feature activation | +3.60e-02 |
Pos logit contributions | |
Marshal | +0.051 |
lator | +0.050 |
iler | +0.044 |
layer | +0.044 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.041 |
icably | -0.040 |
scam | -0.039 |
ous | -0.036 |
ighting | -0.036 |
Token | they |
Token ID | 484 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
Marshal | +0.029 |
lator | +0.028 |
iler | +0.025 |
layer | +0.025 |
Gutenberg | +0.025 |
Neg logit contributions | |
ensed | -0.025 |
icably | -0.025 |
scam | -0.025 |
ous | -0.022 |
ighting | -0.022 |
Token | seemed |
Token ID | 3947 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
ensed | +0.093 |
icably | +0.090 |
scam | +0.089 |
ous | +0.081 |
ighting | +0.081 |
Neg logit contributions | |
Marshal | -0.119 |
lator | -0.117 |
iler | -0.104 |
layer | -0.103 |
Gutenberg | -0.102 |
Token | afraid |
Token ID | 7787 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
ensed | +0.093 |
icably | +0.090 |
scam | +0.089 |
ous | +0.081 |
ighting | +0.081 |
Neg logit contributions | |
Marshal | -0.111 |
lator | -0.109 |
iler | -0.097 |
layer | -0.096 |
Gutenberg | -0.095 |
Token | of |
Token ID | 286 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
ensed | +0.105 |
icably | +0.102 |
scam | +0.101 |
ous | +0.091 |
ighting | +0.091 |
Neg logit contributions | |
Marshal | -0.138 |
lator | -0.135 |
iler | -0.121 |
layer | -0.120 |
Gutenberg | -0.119 |
Token | acts |
Token ID | 6529 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
Marshal | +0.017 |
lator | +0.017 |
iler | +0.015 |
layer | +0.015 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.015 |
icably | -0.015 |
scam | -0.014 |
ous | -0.013 |
ighting | -0.013 |
Token | , |
Token ID | 11 |
Feature activation | +7.44e-02 |
Pos logit contributions | |
ensed | +0.030 |
icably | +0.029 |
scam | +0.029 |
ous | +0.026 |
ighting | +0.026 |
Neg logit contributions | |
Marshal | -0.030 |
lator | -0.030 |
iler | -0.026 |
layer | -0.026 |
Gutenberg | -0.026 |
Token | he |
Token ID | 339 |
Feature activation | +6.89e-02 |
Pos logit contributions | |
Marshal | +0.062 |
lator | +0.060 |
iler | +0.054 |
layer | +0.053 |
Gutenberg | +0.053 |
Neg logit contributions | |
ensed | -0.051 |
icably | -0.050 |
scam | -0.049 |
ous | -0.045 |
ighting | -0.045 |
Token | wrote |
Token ID | 2630 |
Feature activation | +9.81e-02 |
Pos logit contributions | |
Marshal | +0.054 |
lator | +0.053 |
iler | +0.047 |
layer | +0.047 |
Gutenberg | +0.046 |
Neg logit contributions | |
ensed | -0.050 |
icably | -0.049 |
scam | -0.048 |
ous | -0.044 |
ighting | -0.044 |
Token | :" |
Token ID | 11097 |
Feature activation | +7.46e-02 |
Pos logit contributions | |
Marshal | +0.078 |
lator | +0.077 |
iler | +0.068 |
layer | +0.067 |
Gutenberg | +0.067 |
Neg logit contributions | |
ensed | -0.071 |
icably | -0.069 |
scam | -0.068 |
ous | -0.062 |
ighting | -0.062 |
Token | To |
Token ID | 2514 |
Feature activation | -8.99e-02 |
Pos logit contributions | |
Marshal | +0.067 |
lator | +0.065 |
iler | +0.059 |
layer | +0.058 |
Gutenberg | +0.058 |
Neg logit contributions | |
ensed | -0.047 |
icably | -0.045 |
scam | -0.045 |
ous | -0.040 |
ighting | -0.040 |
Token | date |
Token ID | 3128 |
Feature activation | +1.68e-02 |
Pos logit contributions | |
ensed | +0.065 |
icably | +0.063 |
scam | +0.063 |
ous | +0.058 |
recomm | +0.057 |
Neg logit contributions | |
Marshal | -0.071 |
lator | -0.070 |
iler | -0.062 |
layer | -0.062 |
Gutenberg | -0.061 |
Token | [ |
Token ID | 685 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
Marshal | +0.013 |
lator | +0.013 |
iler | +0.012 |
layer | +0.012 |
Gutenberg | +0.011 |
Neg logit contributions | |
ensed | -0.012 |
icably | -0.012 |
scam | -0.012 |
ous | -0.011 |
ighting | -0.011 |
Token | May |
Token ID | 6747 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
Marshal | +0.102 |
lator | +0.100 |
iler | +0.089 |
layer | +0.088 |
Gutenberg | +0.087 |
Neg logit contributions | |
ensed | -0.095 |
icably | -0.092 |
scam | -0.092 |
ous | -0.084 |
ighting | -0.084 |
Token | 1928 |
Token ID | 35768 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
ensed | +0.107 |
icably | +0.104 |
scam | +0.103 |
ighting | +0.095 |
ous | +0.094 |
Neg logit contributions | |
Marshal | -0.107 |
lator | -0.105 |
iler | -0.092 |
layer | -0.091 |
Gutenberg | -0.090 |
Token | ], |
Token ID | 4357 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
ensed | +0.023 |
icably | +0.022 |
scam | +0.022 |
ous | +0.021 |
ighting | +0.021 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.015 |
iler | -0.012 |
layer | -0.012 |
Gutenberg | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -6.42e-02 |
Pos logit contributions | |
ensed | +0.080 |
icably | +0.078 |
scam | +0.077 |
ous | +0.071 |
ighting | +0.071 |
Neg logit contributions | |
Marshal | -0.086 |
lator | -0.085 |
iler | -0.075 |
layer | -0.074 |
Gutenberg | -0.073 |
Token |
|
Token ID | 198 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
ensed | +0.047 |
icably | +0.046 |
scam | +0.045 |
recomm | +0.042 |
ighting | +0.041 |
Neg logit contributions | |
Marshal | -0.051 |
lator | -0.049 |
iler | -0.043 |
layer | -0.043 |
Gutenberg | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | -4.85e-02 |
Pos logit contributions | |
ensed | +0.018 |
icably | +0.018 |
scam | +0.018 |
ighting | +0.016 |
ous | +0.016 |
Neg logit contributions | |
Marshal | -0.020 |
lator | -0.019 |
iler | -0.017 |
layer | -0.017 |
Gutenberg | -0.017 |
Token | " |
Token ID | 1 |
Feature activation | -4.53e-02 |
Pos logit contributions | |
ensed | +0.034 |
icably | +0.033 |
scam | +0.033 |
recomm | +0.030 |
ighting | +0.030 |
Neg logit contributions | |
Marshal | -0.039 |
lator | -0.039 |
layer | -0.035 |
iler | -0.034 |
Gutenberg | -0.034 |
Token | These |
Token ID | 4711 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
ensed | +0.030 |
icably | +0.029 |
scam | +0.029 |
ighting | +0.026 |
recomm | +0.026 |
Neg logit contributions | |
Marshal | -0.039 |
lator | -0.038 |
layer | -0.034 |
iler | -0.034 |
Gutenberg | -0.033 |
Token | programs |
Token ID | 4056 |
Feature activation | -4.02e-01 |
Pos logit contributions | |
ensed | +0.110 |
icably | +0.107 |
scam | +0.106 |
ous | +0.097 |
ighting | +0.097 |
Neg logit contributions | |
Marshal | -0.123 |
lator | -0.121 |
iler | -0.107 |
layer | -0.106 |
Gutenberg | -0.105 |
Token | can |
Token ID | 460 |
Feature activation | -9.11e-02 |
Pos logit contributions | |
ensed | +0.290 |
icably | +0.281 |
scam | +0.279 |
ous | +0.256 |
ighting | +0.255 |
Neg logit contributions | |
Marshal | -0.319 |
lator | -0.313 |
iler | -0.276 |
layer | -0.275 |
Gutenberg | -0.272 |
Token | protect |
Token ID | 1805 |
Feature activation | +3.18e-01 |
Pos logit contributions | |
ensed | +0.067 |
icably | +0.065 |
scam | +0.065 |
ous | +0.059 |
ighting | +0.059 |
Neg logit contributions | |
Marshal | -0.071 |
lator | -0.069 |
iler | -0.061 |
layer | -0.061 |
Gutenberg | -0.060 |
Token | consumers |
Token ID | 7008 |
Feature activation | +2.07e-01 |
Pos logit contributions | |
Marshal | +0.244 |
lator | +0.240 |
iler | +0.211 |
layer | +0.210 |
Gutenberg | +0.207 |
Neg logit contributions | |
ensed | -0.238 |
icably | -0.231 |
scam | -0.229 |
ous | -0.211 |
ighting | -0.210 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
Marshal | +0.167 |
lator | +0.164 |
iler | +0.145 |
layer | +0.144 |
Gutenberg | +0.143 |
Neg logit contributions | |
ensed | -0.147 |
icably | -0.142 |
scam | -0.142 |
ous | -0.130 |
ella | -0.129 |
Token | reduce |
Token ID | 4646 |
Feature activation | +3.37e-02 |
Pos logit contributions | |
ensed | +0.007 |
icably | +0.007 |
scam | +0.007 |
ous | +0.007 |
ighting | +0.007 |
Neg logit contributions | |
Marshal | -0.008 |
lator | -0.008 |
iler | -0.007 |
layer | -0.007 |
Gutenberg | -0.007 |
Token | enezuel |
Token ID | 12596 |
Feature activation | +6.74e-02 |
Pos logit contributions | |
ensed | +0.015 |
icably | +0.014 |
scam | +0.014 |
ighting | +0.013 |
recomm | +0.013 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.015 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.013 |
Token | a |
Token ID | 64 |
Feature activation | -2.13e-01 |
Pos logit contributions | |
Marshal | +0.059 |
lator | +0.058 |
iler | +0.052 |
layer | +0.052 |
Gutenberg | +0.051 |
Neg logit contributions | |
ensed | -0.043 |
icably | -0.041 |
scam | -0.040 |
ighting | -0.037 |
recomm | -0.037 |
Token | relationship |
Token ID | 2776 |
Feature activation | -9.46e-02 |
Pos logit contributions | |
ensed | +0.147 |
icably | +0.142 |
scam | +0.141 |
ous | +0.129 |
ighting | +0.128 |
Neg logit contributions | |
Marshal | -0.176 |
lator | -0.173 |
iler | -0.153 |
layer | -0.153 |
Gutenberg | -0.151 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
ensed | +0.071 |
icably | +0.069 |
scam | +0.068 |
ous | +0.063 |
ighting | +0.062 |
Neg logit contributions | |
Marshal | -0.073 |
lator | -0.071 |
iler | -0.063 |
layer | -0.062 |
Gutenberg | -0.062 |
Token | The |
Token ID | 383 |
Feature activation | -6.35e-02 |
Pos logit contributions | |
Marshal | +0.015 |
lator | +0.014 |
iler | +0.013 |
layer | +0.013 |
Gutenberg | +0.012 |
Neg logit contributions | |
ensed | -0.014 |
icably | -0.013 |
scam | -0.013 |
ous | -0.012 |
ighting | -0.012 |
Token | U |
Token ID | 471 |
Feature activation | -8.38e-02 |
Pos logit contributions | |
ensed | +0.048 |
icably | +0.047 |
scam | +0.047 |
ous | +0.043 |
ighting | +0.043 |
Neg logit contributions | |
Marshal | -0.048 |
lator | -0.047 |
iler | -0.041 |
layer | -0.041 |
Gutenberg | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -4.74e-02 |
Pos logit contributions | |
ensed | +0.065 |
icably | +0.064 |
scam | +0.063 |
ous | +0.058 |
ighting | +0.058 |
Neg logit contributions | |
Marshal | -0.062 |
lator | -0.060 |
iler | -0.053 |
layer | -0.052 |
Gutenberg | -0.052 |
Token | S |
Token ID | 50 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
ensed | +0.035 |
icably | +0.033 |
scam | +0.033 |
ous | +0.030 |
ighting | +0.030 |
Neg logit contributions | |
Marshal | -0.038 |
lator | -0.037 |
iler | -0.032 |
layer | -0.032 |
Gutenberg | -0.032 |
Token | . |
Token ID | 13 |
Feature activation | -3.55e-02 |
Pos logit contributions | |
ensed | +0.112 |
icably | +0.108 |
scam | +0.108 |
ous | +0.099 |
recomm | +0.098 |
Neg logit contributions | |
Marshal | -0.115 |
lator | -0.113 |
iler | -0.100 |
layer | -0.099 |
Gutenberg | -0.098 |
Token | is |
Token ID | 318 |
Feature activation | +7.02e-02 |
Pos logit contributions | |
ensed | +0.027 |
icably | +0.026 |
scam | +0.026 |
ous | +0.024 |
ighting | +0.024 |
Neg logit contributions | |
Marshal | -0.027 |
lator | -0.026 |
iler | -0.023 |
layer | -0.023 |
Gutenberg | -0.023 |
Token | inevitably |
Token ID | 16857 |
Feature activation | +3.49e-02 |
Pos logit contributions | |
Marshal | +0.060 |
lator | +0.059 |
iler | +0.053 |
layer | +0.052 |
Gutenberg | +0.052 |
Neg logit contributions | |
ensed | -0.046 |
icably | -0.044 |
scam | -0.044 |
ighting | -0.040 |
ous | -0.040 |
Token | binding |
Token ID | 30786 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
Marshal | +0.057 |
lator | +0.056 |
iler | +0.049 |
layer | +0.048 |
Gutenberg | +0.047 |
Neg logit contributions | |
ensed | -0.068 |
icably | -0.067 |
scam | -0.066 |
ous | -0.061 |
ighting | -0.061 |
Token | feature |
Token ID | 3895 |
Feature activation | -4.34e-02 |
Pos logit contributions | |
Marshal | +0.196 |
lator | +0.192 |
iler | +0.170 |
layer | +0.169 |
Gutenberg | +0.167 |
Neg logit contributions | |
ensed | -0.177 |
icably | -0.171 |
scam | -0.170 |
ous | -0.156 |
ighting | -0.155 |
Token | is |
Token ID | 318 |
Feature activation | +6.29e-02 |
Pos logit contributions | |
ensed | +0.030 |
icably | +0.029 |
scam | +0.028 |
ighting | +0.026 |
ous | +0.026 |
Neg logit contributions | |
Marshal | -0.036 |
lator | -0.035 |
iler | -0.031 |
layer | -0.031 |
Gutenberg | -0.031 |
Token | awesome |
Token ID | 7427 |
Feature activation | +4.95e-02 |
Pos logit contributions | |
Marshal | +0.052 |
lator | +0.051 |
iler | +0.045 |
layer | +0.045 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.044 |
icably | -0.042 |
scam | -0.042 |
ighting | -0.038 |
ous | -0.038 |
Token | . |
Token ID | 13 |
Feature activation | -8.36e-03 |
Pos logit contributions | |
Marshal | +0.037 |
lator | +0.037 |
iler | +0.032 |
layer | +0.032 |
Gutenberg | +0.031 |
Neg logit contributions | |
ensed | -0.038 |
icably | -0.037 |
scam | -0.036 |
ighting | -0.033 |
ous | -0.033 |
Token | However |
Token ID | 2102 |
Feature activation | -8.44e-02 |
Pos logit contributions | |
ensed | +0.006 |
icably | +0.006 |
scam | +0.006 |
ous | +0.005 |
ighting | +0.005 |
Neg logit contributions | |
Marshal | -0.007 |
lator | -0.007 |
iler | -0.006 |
layer | -0.006 |
Gutenberg | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +3.98e-02 |
Pos logit contributions | |
ensed | +0.063 |
icably | +0.061 |
scam | +0.061 |
ous | +0.056 |
ighting | +0.055 |
Neg logit contributions | |
Marshal | -0.065 |
lator | -0.064 |
iler | -0.056 |
layer | -0.056 |
Gutenberg | -0.055 |
Token | it |
Token ID | 340 |
Feature activation | +1.88e-02 |
Pos logit contributions | |
Marshal | +0.033 |
lator | +0.032 |
iler | +0.029 |
layer | +0.029 |
Gutenberg | +0.028 |
Neg logit contributions | |
ensed | -0.027 |
icably | -0.027 |
scam | -0.026 |
ous | -0.024 |
ighting | -0.024 |
Token | does |
Token ID | 857 |
Feature activation | +2.76e-02 |
Pos logit contributions | |
Marshal | +0.016 |
lator | +0.016 |
iler | +0.014 |
layer | +0.014 |
Gutenberg | +0.014 |
Neg logit contributions | |
ensed | -0.013 |
icably | -0.012 |
scam | -0.012 |
ighting | -0.011 |
ous | -0.011 |
Token | have |
Token ID | 423 |
Feature activation | +6.17e-02 |
Pos logit contributions | |
Marshal | +0.022 |
lator | +0.021 |
iler | +0.019 |
layer | +0.019 |
Gutenberg | +0.018 |
Neg logit contributions | |
ensed | -0.020 |
icably | -0.020 |
scam | -0.019 |
ous | -0.018 |
ighting | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | +7.22e-02 |
Pos logit contributions | |
Marshal | +0.048 |
lator | +0.046 |
iler | +0.041 |
layer | +0.041 |
Gutenberg | +0.040 |
Neg logit contributions | |
ensed | -0.046 |
icably | -0.045 |
scam | -0.044 |
ous | -0.041 |
ighting | -0.041 |
Token | your |
Token ID | 534 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
Marshal | +0.063 |
lator | +0.062 |
iler | +0.054 |
layer | +0.054 |
Gutenberg | +0.053 |
Neg logit contributions | |
ensed | -0.062 |
icably | -0.060 |
scam | -0.060 |
ous | -0.055 |
recomm | -0.055 |
Token | own |
Token ID | 898 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
Marshal | +0.112 |
lator | +0.110 |
iler | +0.095 |
layer | +0.095 |
Gutenberg | +0.093 |
Neg logit contributions | |
ensed | -0.126 |
icably | -0.122 |
scam | -0.122 |
ous | -0.113 |
ighting | -0.112 |
Token | due |
Token ID | 2233 |
Feature activation | -7.59e-03 |
Pos logit contributions | |
Marshal | +0.174 |
lator | +0.171 |
iler | +0.153 |
layer | +0.153 |
Gutenberg | +0.151 |
Neg logit contributions | |
ensed | -0.121 |
icably | -0.116 |
scam | -0.116 |
ous | -0.104 |
ighting | -0.104 |
Token | diligence |
Token ID | 34136 |
Feature activation | +8.72e-02 |
Pos logit contributions | |
ensed | +0.006 |
icably | +0.006 |
scam | +0.006 |
ous | +0.005 |
recomm | +0.005 |
Neg logit contributions | |
Marshal | -0.006 |
lator | -0.006 |
iler | -0.005 |
Gutenberg | -0.005 |
layer | -0.005 |
Token | when |
Token ID | 618 |
Feature activation | +9.96e-03 |
Pos logit contributions | |
Marshal | +0.068 |
lator | +0.067 |
iler | +0.059 |
layer | +0.058 |
Gutenberg | +0.058 |
Neg logit contributions | |
ensed | -0.064 |
icably | -0.063 |
scam | -0.062 |
ous | -0.057 |
ighting | -0.057 |
Token | considering |
Token ID | 6402 |
Feature activation | -2.24e-01 |
Pos logit contributions | |
Marshal | +0.009 |
lator | +0.009 |
iler | +0.008 |
Gutenberg | +0.008 |
layer | +0.008 |
Neg logit contributions | |
ensed | -0.006 |
icably | -0.006 |
scam | -0.006 |
ighting | -0.005 |
ella | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
ensed | +0.167 |
icably | +0.162 |
scam | +0.159 |
ighting | +0.148 |
ous | +0.147 |
Neg logit contributions | |
Marshal | -0.174 |
lator | -0.169 |
iler | -0.149 |
layer | -0.148 |
Gutenberg | -0.147 |
Token | offerings |
Token ID | 18369 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
ensed | +0.017 |
icably | +0.016 |
scam | +0.016 |
ighting | +0.015 |
ous | +0.015 |
Neg logit contributions | |
Marshal | -0.021 |
lator | -0.021 |
iler | -0.019 |
layer | -0.019 |
Gutenberg | -0.018 |
Token | of |
Token ID | 286 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
Marshal | +0.117 |
lator | +0.114 |
iler | +0.102 |
layer | +0.102 |
Gutenberg | +0.101 |
Neg logit contributions | |
ensed | -0.086 |
icably | -0.084 |
scam | -0.083 |
ighting | -0.075 |
ous | -0.075 |
Token | third |
Token ID | 2368 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.009 |
scam | +0.009 |
ighting | +0.009 |
ous | +0.009 |
Neg logit contributions | |
Marshal | -0.011 |
lator | -0.011 |
iler | -0.009 |
layer | -0.009 |
Gutenberg | -0.009 |
Token | party |
Token ID | 2151 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
Marshal | +0.185 |
lator | +0.182 |
iler | +0.160 |
layer | +0.159 |
Gutenberg | +0.157 |
Neg logit contributions | |
ensed | -0.178 |
icably | -0.173 |
scam | -0.172 |
ous | -0.158 |
ighting | -0.157 |
Token | many |
Token ID | 867 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
ensed | +0.045 |
icably | +0.044 |
scam | +0.044 |
ighting | +0.040 |
ous | +0.040 |
Neg logit contributions | |
Marshal | -0.055 |
lator | -0.054 |
iler | -0.049 |
layer | -0.048 |
Gutenberg | -0.048 |
Token | ; |
Token ID | 26 |
Feature activation | +7.82e-02 |
Pos logit contributions | |
ensed | +0.055 |
icably | +0.053 |
scam | +0.053 |
ighting | +0.048 |
ous | +0.048 |
Neg logit contributions | |
Marshal | -0.061 |
lator | -0.060 |
iler | -0.053 |
layer | -0.053 |
Gutenberg | -0.052 |
Token | when |
Token ID | 618 |
Feature activation | -6.31e-02 |
Pos logit contributions | |
Marshal | +0.066 |
lator | +0.065 |
iler | +0.058 |
layer | +0.058 |
Gutenberg | +0.057 |
Neg logit contributions | |
ensed | -0.052 |
icably | -0.051 |
scam | -0.050 |
ous | -0.046 |
ighting | -0.046 |
Token | many |
Token ID | 867 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
ensed | +0.041 |
icably | +0.039 |
scam | +0.039 |
ous | +0.036 |
ighting | +0.035 |
Neg logit contributions | |
Marshal | -0.055 |
lator | -0.054 |
iler | -0.048 |
layer | -0.048 |
Gutenberg | -0.047 |
Token | politicians |
Token ID | 7602 |
Feature activation | -9.11e-02 |
Pos logit contributions | |
ensed | +0.010 |
icably | +0.010 |
scam | +0.010 |
ous | +0.009 |
ighting | +0.009 |
Neg logit contributions | |
Marshal | -0.011 |
lator | -0.011 |
iler | -0.010 |
layer | -0.010 |
Gutenberg | -0.010 |
Token | shy |
Token ID | 15800 |
Feature activation | -4.52e-01 |
Pos logit contributions | |
ensed | +0.066 |
icably | +0.064 |
scam | +0.062 |
ighting | +0.058 |
ella | +0.058 |
Neg logit contributions | |
Marshal | -0.072 |
lator | -0.071 |
iler | -0.063 |
layer | -0.063 |
Gutenberg | -0.061 |
Token | away |
Token ID | 1497 |
Feature activation | -5.31e-02 |
Pos logit contributions | |
ensed | +0.319 |
icably | +0.310 |
scam | +0.308 |
ous | +0.282 |
ighting | +0.280 |
Neg logit contributions | |
Marshal | -0.365 |
lator | -0.359 |
iler | -0.318 |
layer | -0.316 |
Gutenberg | -0.313 |
Token | from |
Token ID | 422 |
Feature activation | -3.73e-02 |
Pos logit contributions | |
ensed | +0.036 |
icably | +0.035 |
scam | +0.035 |
ous | +0.032 |
ighting | +0.032 |
Neg logit contributions | |
Marshal | -0.044 |
lator | -0.043 |
iler | -0.038 |
layer | -0.038 |
Gutenberg | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | -2.61e-04 |
Pos logit contributions | |
ensed | +0.025 |
icably | +0.024 |
scam | +0.023 |
ighting | +0.021 |
ous | +0.021 |
Neg logit contributions | |
Marshal | -0.032 |
lator | -0.031 |
iler | -0.028 |
layer | -0.028 |
Gutenberg | -0.028 |
Token | long |
Token ID | 890 |
Feature activation | +2.70e-02 |
Pos logit contributions | |
ensed | +0.000 |
icably | +0.000 |
scam | +0.000 |
ous | +0.000 |
ighting | +0.000 |
Neg logit contributions | |
Marshal | -0.000 |
lator | -0.000 |
iler | -0.000 |
layer | -0.000 |
Gutenberg | -0.000 |
Token | suffering |
Token ID | 7195 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
Marshal | +0.020 |
lator | +0.019 |
iler | +0.017 |
layer | +0.017 |
Gutenberg | +0.017 |
Neg logit contributions | |
ensed | -0.021 |
icably | -0.021 |
scam | -0.020 |
ous | -0.019 |
ighting | -0.019 |
Token | Like |
Token ID | 4525 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
ensed | +0.001 |
icably | +0.001 |
scam | +0.001 |
ighting | +0.001 |
ous | +0.001 |
Neg logit contributions | |
Marshal | -0.001 |
lator | -0.001 |
iler | -0.001 |
layer | -0.001 |
Gutenberg | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
Marshal | +0.115 |
lator | +0.113 |
iler | +0.102 |
layer | +0.101 |
Gutenberg | +0.101 |
Neg logit contributions | |
ensed | -0.067 |
icably | -0.064 |
scam | -0.063 |
ighting | -0.057 |
ella | -0.056 |
Token | infected |
Token ID | 14112 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ensed | +0.011 |
icably | +0.011 |
scam | +0.011 |
ous | +0.010 |
ighting | +0.010 |
Neg logit contributions | |
Marshal | -0.008 |
lator | -0.008 |
iler | -0.007 |
layer | -0.007 |
Gutenberg | -0.007 |
Token | populations |
Token ID | 9684 |
Feature activation | +6.79e-02 |
Pos logit contributions | |
Marshal | +0.153 |
lator | +0.150 |
iler | +0.131 |
layer | +0.131 |
Gutenberg | +0.129 |
Neg logit contributions | |
ensed | -0.156 |
icably | -0.151 |
scam | -0.151 |
ous | -0.139 |
ighting | -0.138 |
Token | in |
Token ID | 287 |
Feature activation | +4.99e-02 |
Pos logit contributions | |
Marshal | +0.055 |
lator | +0.055 |
iler | +0.048 |
layer | +0.048 |
Gutenberg | +0.048 |
Neg logit contributions | |
ensed | -0.047 |
icably | -0.046 |
scam | -0.046 |
ous | -0.042 |
ighting | -0.042 |
Token | Saskatchewan |
Token ID | 31346 |
Feature activation | -4.42e-01 |
Pos logit contributions | |
Marshal | +0.043 |
lator | +0.042 |
iler | +0.037 |
layer | +0.037 |
Gutenberg | +0.037 |
Neg logit contributions | |
ensed | -0.033 |
icably | -0.032 |
scam | -0.031 |
ighting | -0.029 |
ella | -0.029 |
Token | , |
Token ID | 11 |
Feature activation | -2.76e-03 |
Pos logit contributions | |
ensed | +0.332 |
icably | +0.322 |
scam | +0.321 |
ous | +0.296 |
ella | +0.293 |
Neg logit contributions | |
Marshal | -0.337 |
lator | -0.331 |
iler | -0.291 |
layer | -0.290 |
Gutenberg | -0.286 |
Token | many |
Token ID | 867 |
Feature activation | -8.23e-02 |
Pos logit contributions | |
ensed | +0.002 |
icably | +0.002 |
scam | +0.002 |
ighting | +0.002 |
ous | +0.002 |
Neg logit contributions | |
Marshal | -0.002 |
lator | -0.002 |
iler | -0.002 |
layer | -0.002 |
Gutenberg | -0.002 |
Token | live |
Token ID | 2107 |
Feature activation | -6.46e-02 |
Pos logit contributions | |
ensed | +0.059 |
icably | +0.058 |
scam | +0.057 |
ighting | +0.052 |
ous | +0.052 |
Neg logit contributions | |
Marshal | -0.065 |
lator | -0.064 |
iler | -0.057 |
layer | -0.056 |
Gutenberg | -0.056 |
Token | in |
Token ID | 287 |
Feature activation | -4.97e-02 |
Pos logit contributions | |
ensed | +0.048 |
icably | +0.046 |
scam | +0.046 |
ighting | +0.042 |
ous | +0.042 |
Neg logit contributions | |
Marshal | -0.050 |
lator | -0.049 |
iler | -0.043 |
layer | -0.043 |
Gutenberg | -0.043 |
Token | areas |
Token ID | 3006 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
ensed | +0.036 |
icably | +0.035 |
scam | +0.035 |
ighting | +0.032 |
ous | +0.032 |
Neg logit contributions | |
Marshal | -0.039 |
lator | -0.038 |
iler | -0.034 |
layer | -0.034 |
Gutenberg | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
Marshal | +0.080 |
lator | +0.078 |
iler | +0.069 |
layer | +0.068 |
Gutenberg | +0.067 |
Neg logit contributions | |
ensed | -0.080 |
icably | -0.078 |
scam | -0.077 |
ous | -0.071 |
ighting | -0.071 |
Token |
|
Token ID | 198 |
Feature activation | +5.15e-02 |
Pos logit contributions | |
Marshal | +0.018 |
lator | +0.017 |
iler | +0.015 |
layer | +0.015 |
Gutenberg | +0.015 |
Neg logit contributions | |
ensed | -0.016 |
icably | -0.016 |
scam | -0.015 |
ous | -0.014 |
ighting | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | +3.68e-02 |
Pos logit contributions | |
Marshal | +0.041 |
lator | +0.040 |
iler | +0.035 |
layer | +0.035 |
Gutenberg | +0.034 |
Neg logit contributions | |
ensed | -0.038 |
icably | -0.037 |
scam | -0.036 |
ighting | -0.033 |
ous | -0.033 |
Token | Watch |
Token ID | 10723 |
Feature activation | +1.55e-01 |
Pos logit contributions | |
Marshal | +0.032 |
lator | +0.031 |
iler | +0.028 |
layer | +0.028 |
Gutenberg | +0.027 |
Neg logit contributions | |
ensed | -0.024 |
icably | -0.023 |
scam | -0.023 |
ighting | -0.021 |
ous | -0.021 |
Token | dog |
Token ID | 9703 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
Marshal | +0.145 |
lator | +0.143 |
iler | +0.129 |
layer | +0.129 |
Gutenberg | +0.127 |
Neg logit contributions | |
ensed | -0.090 |
icably | -0.086 |
scam | -0.086 |
ous | -0.077 |
ighting | -0.076 |
Token | groups |
Token ID | 2628 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
ensed | +0.127 |
icably | +0.124 |
scam | +0.122 |
ous | +0.111 |
ighting | +0.111 |
Neg logit contributions | |
Marshal | -0.161 |
lator | -0.156 |
iler | -0.139 |
layer | -0.139 |
Gutenberg | -0.138 |
Token | filed |
Token ID | 5717 |
Feature activation | -2.23e-01 |
Pos logit contributions | |
ensed | +0.340 |
icably | +0.330 |
scam | +0.326 |
ous | +0.299 |
ighting | +0.298 |
Neg logit contributions | |
Marshal | -0.393 |
lator | -0.384 |
iler | -0.341 |
layer | -0.340 |
Gutenberg | -0.336 |
Token | Federal |
Token ID | 5618 |
Feature activation | +3.70e-01 |
Pos logit contributions | |
ensed | +0.162 |
icably | +0.157 |
scam | +0.156 |
ous | +0.143 |
ighting | +0.142 |
Neg logit contributions | |
Marshal | -0.175 |
lator | -0.172 |
iler | -0.152 |
layer | -0.151 |
Gutenberg | -0.149 |
Token | Election |
Token ID | 14219 |
Feature activation | +9.30e-02 |
Pos logit contributions | |
Marshal | +0.221 |
lator | +0.212 |
iler | +0.181 |
layer | +0.177 |
Gutenberg | +0.176 |
Neg logit contributions | |
ensed | -0.341 |
icably | -0.334 |
scam | -0.330 |
ous | -0.310 |
ighting | -0.309 |
Token | Commission |
Token ID | 4513 |
Feature activation | +2.71e-01 |
Pos logit contributions | |
Marshal | +0.051 |
lator | +0.048 |
iler | +0.039 |
layer | +0.039 |
Gutenberg | +0.038 |
Neg logit contributions | |
ensed | -0.092 |
icably | -0.090 |
scam | -0.089 |
ous | -0.084 |
recomm | -0.083 |
Token | complaints |
Token ID | 9687 |
Feature activation | -1.45e-01 |
Pos logit contributions | |
Marshal | +0.256 |
lator | +0.252 |
iler | +0.227 |
layer | +0.226 |
Gutenberg | +0.224 |
Neg logit contributions | |
ensed | -0.155 |
icably | -0.150 |
scam | -0.148 |
ous | -0.132 |
ighting | -0.131 |
Token | 0 |
Token ID | 657 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.008 |
icably | -0.008 |
scam | -0.008 |
ous | -0.007 |
ighting | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -7.02e-02 |
Pos logit contributions | |
Marshal | +0.008 |
lator | +0.008 |
iler | +0.007 |
layer | +0.007 |
Gutenberg | +0.007 |
Neg logit contributions | |
ensed | -0.008 |
icably | -0.008 |
scam | -0.008 |
ous | -0.007 |
ighting | -0.007 |
Token | 0 |
Token ID | 15 |
Feature activation | -2.00e-02 |
Pos logit contributions | |
ensed | +0.054 |
icably | +0.053 |
scam | +0.052 |
ous | +0.048 |
ighting | +0.048 |
Neg logit contributions | |
Marshal | -0.053 |
lator | -0.051 |
iler | -0.045 |
layer | -0.045 |
Gutenberg | -0.044 |
Token | f |
Token ID | 69 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
ensed | +0.022 |
icably | +0.021 |
scam | +0.021 |
ous | +0.020 |
ighting | +0.020 |
Neg logit contributions | |
Marshal | -0.009 |
lator | -0.008 |
iler | -0.007 |
layer | -0.007 |
Gutenberg | -0.006 |
Token | ); |
Token ID | 1776 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
Marshal | +0.191 |
lator | +0.187 |
iler | +0.165 |
layer | +0.163 |
Gutenberg | +0.161 |
Neg logit contributions | |
ensed | -0.187 |
icably | -0.181 |
scam | -0.180 |
ighting | -0.165 |
recomm | -0.164 |
Token | RAW |
Token ID | 33782 |
Feature activation | -5.25e-01 |
Pos logit contributions | |
ensed | +0.056 |
icably | +0.053 |
scam | +0.053 |
ous | +0.046 |
ighting | +0.045 |
Neg logit contributions | |
Marshal | -0.133 |
lator | -0.132 |
iler | -0.120 |
layer | -0.120 |
Gutenberg | -0.119 |
Token | _ |
Token ID | 62 |
Feature activation | +3.81e-02 |
Pos logit contributions | |
ensed | +0.455 |
icably | +0.444 |
scam | +0.442 |
ous | +0.411 |
ighting | +0.410 |
Neg logit contributions | |
Marshal | -0.340 |
lator | -0.333 |
iler | -0.285 |
layer | -0.283 |
Gutenberg | -0.279 |
Token | ASS |
Token ID | 10705 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
Marshal | +0.035 |
lator | +0.034 |
iler | +0.031 |
layer | +0.030 |
Gutenberg | +0.030 |
Neg logit contributions | |
ensed | -0.023 |
icably | -0.022 |
scam | -0.022 |
ous | -0.020 |
ighting | -0.020 |
Token | ERT |
Token ID | 17395 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
ensed | +0.125 |
icably | +0.121 |
scam | +0.120 |
ous | +0.108 |
ighting | +0.108 |
Neg logit contributions | |
Marshal | -0.170 |
lator | -0.166 |
iler | -0.149 |
layer | -0.148 |
Gutenberg | -0.147 |
Token | ( |
Token ID | 7 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
ensed | +0.070 |
icably | +0.067 |
scam | +0.067 |
ous | +0.060 |
ighting | +0.060 |
Neg logit contributions | |
Marshal | -0.093 |
lator | -0.091 |
iler | -0.081 |
layer | -0.081 |
Gutenberg | -0.080 |
Token | it |
Token ID | 270 |
Feature activation | +5.35e-02 |
Pos logit contributions | |
ensed | +0.089 |
icably | +0.087 |
scam | +0.086 |
ous | +0.079 |
ighting | +0.079 |
Neg logit contributions | |
Marshal | -0.087 |
lator | -0.085 |
iler | -0.075 |
layer | -0.075 |
Gutenberg | -0.073 |
Token | also |
Token ID | 635 |
Feature activation | +3.87e-03 |
Pos logit contributions | |
Marshal | +0.023 |
lator | +0.023 |
iler | +0.020 |
layer | +0.020 |
Gutenberg | +0.020 |
Neg logit contributions | |
ensed | -0.020 |
icably | -0.019 |
scam | -0.019 |
ous | -0.017 |
ighting | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
Marshal | +0.003 |
lator | +0.003 |
iler | +0.003 |
layer | +0.003 |
Gutenberg | +0.003 |
Neg logit contributions | |
ensed | -0.003 |
icably | -0.003 |
scam | -0.003 |
ous | -0.002 |
ighting | -0.002 |
Token | style |
Token ID | 3918 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
ensed | +0.013 |
icably | +0.013 |
scam | +0.013 |
ous | +0.012 |
ighting | +0.012 |
Neg logit contributions | |
Marshal | -0.015 |
lator | -0.015 |
iler | -0.013 |
layer | -0.013 |
Gutenberg | -0.013 |
Token | of |
Token ID | 286 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
Marshal | +0.014 |
lator | +0.014 |
iler | +0.012 |
layer | +0.012 |
Gutenberg | +0.012 |
Neg logit contributions | |
ensed | -0.011 |
icably | -0.010 |
scam | -0.010 |
ighting | -0.009 |
ous | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | -8.70e-03 |
Pos logit contributions | |
Marshal | +0.037 |
lator | +0.036 |
iler | +0.032 |
layer | +0.032 |
Gutenberg | +0.032 |
Neg logit contributions | |
ensed | -0.030 |
icably | -0.029 |
scam | -0.029 |
ighting | -0.026 |
ous | -0.026 |
Token | show |
Token ID | 905 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
ensed | +0.004 |
icably | +0.004 |
scam | +0.004 |
ighting | +0.003 |
ous | +0.003 |
Neg logit contributions | |
Marshal | -0.009 |
lator | -0.009 |
iler | -0.008 |
layer | -0.008 |
Gutenberg | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
ensed | +0.320 |
icably | +0.311 |
scam | +0.310 |
ous | +0.285 |
recomm | +0.283 |
Neg logit contributions | |
Marshal | -0.330 |
lator | -0.324 |
iler | -0.285 |
layer | -0.284 |
Gutenberg | -0.280 |
Token | The |
Token ID | 383 |
Feature activation | -7.07e-02 |
Pos logit contributions | |
Marshal | +0.024 |
lator | +0.024 |
iler | +0.021 |
layer | +0.021 |
Gutenberg | +0.021 |
Neg logit contributions | |
ensed | -0.024 |
icably | -0.023 |
scam | -0.023 |
ighting | -0.021 |
ous | -0.021 |
Token | story |
Token ID | 1621 |
Feature activation | +5.97e-02 |
Pos logit contributions | |
ensed | +0.051 |
icably | +0.050 |
scam | +0.049 |
ous | +0.045 |
ighting | +0.045 |
Neg logit contributions | |
Marshal | -0.056 |
lator | -0.055 |
iler | -0.048 |
layer | -0.048 |
Gutenberg | -0.048 |
Token | where |
Token ID | 810 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
Marshal | +0.051 |
lator | +0.050 |
iler | +0.044 |
layer | +0.044 |
Gutenberg | +0.044 |
Neg logit contributions | |
ensed | -0.040 |
icably | -0.038 |
scam | -0.038 |
ighting | -0.035 |
ella | -0.034 |
Token | Cyborg |
Token ID | 46114 |
Feature activation | -5.91e-02 |
Pos logit contributions | |
Marshal | +0.031 |
lator | +0.030 |
iler | +0.026 |
layer | +0.026 |
Gutenberg | +0.026 |
Neg logit contributions | |
ensed | -0.029 |
icably | -0.028 |
scam | -0.027 |
ighting | -0.025 |
ous | -0.025 |