Token | Sports |
Token ID | 7092 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
fitt | +0.291 |
slic | +0.275 |
hof | +0.266 |
leakage | +0.265 |
stamped | +0.264 |
Neg logit contributions | |
ˈ | -0.257 |
Redd | -0.208 |
Wan | -0.202 |
claw | -0.200 |
Neph | -0.190 |
Token | ,[ |
Token ID | 17414 |
Feature activation | -2.34e-02 |
Pos logit contributions | |
ˈ | +0.246 |
Redd | +0.198 |
Wan | +0.192 |
claw | +0.191 |
Neph | +0.181 |
Neg logit contributions | |
fitt | -0.291 |
slic | -0.275 |
hof | -0.266 |
leakage | -0.265 |
stamped | -0.264 |
Token | 97 |
Token ID | 5607 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
ˈ | +0.070 |
Redd | +0.059 |
Wan | +0.057 |
claw | +0.057 |
Neph | +0.054 |
Neg logit contributions | |
fitt | -0.054 |
slic | -0.050 |
hof | -0.048 |
leakage | -0.048 |
stamped | -0.048 |
Token | ] |
Token ID | 60 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
fitt | +0.370 |
slic | +0.351 |
hof | +0.345 |
stamped | +0.342 |
leakage | +0.341 |
Neg logit contributions | |
ˈ | -0.270 |
Redd | -0.216 |
Wan | -0.209 |
claw | -0.205 |
Neph | -0.191 |
Token | Ble |
Token ID | 17175 |
Feature activation | -5.70e-02 |
Pos logit contributions | |
ˈ | +0.510 |
Redd | +0.424 |
Wan | +0.414 |
claw | +0.412 |
Neph | +0.396 |
Neg logit contributions | |
fitt | -0.425 |
slic | -0.398 |
hof | -0.381 |
leakage | -0.380 |
stamped | -0.378 |
Token | acher |
Token ID | 3493 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
ˈ | +0.212 |
Redd | +0.185 |
Wan | +0.182 |
claw | +0.181 |
Neph | +0.175 |
Neg logit contributions | |
fitt | -0.089 |
slic | -0.079 |
hof | -0.075 |
leakage | -0.074 |
stamped | -0.074 |
Token | Report |
Token ID | 6358 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
fitt | +1.179 |
slic | +1.091 |
hof | +1.048 |
leakage | +1.045 |
stamped | +1.043 |
Neg logit contributions | |
ˈ | -1.658 |
Redd | -1.396 |
Wan | -1.366 |
claw | -1.358 |
Neph | -1.302 |
Token | ,[ |
Token ID | 17414 |
Feature activation | -2.71e-02 |
Pos logit contributions | |
fitt | +0.606 |
slic | +0.573 |
hof | +0.557 |
leakage | +0.555 |
stamped | +0.555 |
Neg logit contributions | |
ˈ | -0.437 |
Redd | -0.343 |
Wan | -0.332 |
claw | -0.327 |
Neph | -0.308 |
Token | 98 |
Token ID | 4089 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ˈ | +0.089 |
Redd | +0.076 |
Wan | +0.074 |
claw | +0.074 |
Neph | +0.071 |
Neg logit contributions | |
fitt | -0.055 |
slic | -0.050 |
hof | -0.048 |
leakage | -0.048 |
stamped | -0.047 |
Token | ] |
Token ID | 60 |
Feature activation | -1.91e-01 |
Pos logit contributions | |
fitt | +0.405 |
slic | +0.383 |
hof | +0.377 |
stamped | +0.375 |
leakage | +0.373 |
Neg logit contributions | |
ˈ | -0.302 |
Redd | -0.242 |
Wan | -0.234 |
claw | -0.230 |
Neph | -0.212 |
Token | Sporting |
Token ID | 31790 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
ˈ | +0.529 |
Redd | +0.437 |
Wan | +0.426 |
claw | +0.424 |
Neph | +0.408 |
Neg logit contributions | |
fitt | -0.478 |
slic | -0.448 |
hof | -0.430 |
leakage | -0.428 |
stamped | -0.426 |
Token | UCLA |
Token ID | 21750 |
Feature activation | -4.98e-02 |
Pos logit contributions | |
ˈ | +0.065 |
Redd | +0.052 |
Wan | +0.051 |
claw | +0.050 |
Neph | +0.048 |
Neg logit contributions | |
fitt | -0.075 |
slic | -0.071 |
hof | -0.068 |
leakage | -0.068 |
stamped | -0.068 |
Token | on |
Token ID | 319 |
Feature activation | +2.01e-02 |
Pos logit contributions | |
ˈ | +0.142 |
Redd | +0.118 |
Wan | +0.116 |
claw | +0.115 |
Neph | +0.110 |
Neg logit contributions | |
fitt | -0.120 |
slic | -0.113 |
hof | -0.108 |
leakage | -0.108 |
stamped | -0.107 |
Token | Friday |
Token ID | 3217 |
Feature activation | -4.77e-02 |
Pos logit contributions | |
fitt | +0.052 |
slic | +0.049 |
hof | +0.048 |
leakage | +0.047 |
stamped | +0.047 |
Neg logit contributions | |
ˈ | -0.054 |
Redd | -0.044 |
Wan | -0.043 |
claw | -0.042 |
Neph | -0.041 |
Token | via |
Token ID | 2884 |
Feature activation | -6.49e-02 |
Pos logit contributions | |
ˈ | +0.135 |
Redd | +0.112 |
Wan | +0.109 |
claw | +0.109 |
Neph | +0.104 |
Neg logit contributions | |
fitt | -0.117 |
slic | -0.110 |
hof | -0.105 |
leakage | -0.105 |
stamped | -0.104 |
Token | Ble |
Token ID | 17175 |
Feature activation | -9.09e-02 |
Pos logit contributions | |
ˈ | +0.192 |
Redd | +0.161 |
Wan | +0.157 |
claw | +0.156 |
Neph | +0.149 |
Neg logit contributions | |
fitt | -0.151 |
slic | -0.141 |
hof | -0.135 |
leakage | -0.134 |
stamped | -0.134 |
Token | acher |
Token ID | 3493 |
Feature activation | +5.33e-01 |
Pos logit contributions | |
ˈ | +0.340 |
Redd | +0.297 |
Wan | +0.291 |
claw | +0.289 |
Neph | +0.281 |
Neg logit contributions | |
fitt | -0.139 |
slic | -0.125 |
hof | -0.117 |
leakage | -0.117 |
stamped | -0.116 |
Token | Report |
Token ID | 6358 |
Feature activation | +2.23e-01 |
Pos logit contributions | |
fitt | +1.170 |
slic | +1.079 |
hof | +1.038 |
leakage | +1.035 |
stamped | +1.034 |
Neg logit contributions | |
ˈ | -1.639 |
Redd | -1.380 |
Wan | -1.350 |
claw | -1.342 |
Neph | -1.288 |
Token | video |
Token ID | 2008 |
Feature activation | -3.84e-02 |
Pos logit contributions | |
fitt | +0.541 |
slic | +0.505 |
hof | +0.487 |
leakage | +0.485 |
stamped | +0.484 |
Neg logit contributions | |
ˈ | -0.637 |
Redd | -0.529 |
Wan | -0.517 |
claw | -0.512 |
Neph | -0.490 |
Token | . |
Token ID | 13 |
Feature activation | -3.86e-02 |
Pos logit contributions | |
ˈ | +0.112 |
Redd | +0.094 |
Wan | +0.092 |
claw | +0.091 |
Neph | +0.087 |
Neg logit contributions | |
fitt | -0.090 |
slic | -0.084 |
hof | -0.081 |
leakage | -0.080 |
stamped | -0.080 |
Token |
|
Token ID | 198 |
Feature activation | -5.87e-02 |
Pos logit contributions | |
ˈ | +0.108 |
Redd | +0.090 |
Wan | +0.088 |
claw | +0.087 |
Neph | +0.083 |
Neg logit contributions | |
fitt | -0.095 |
slic | -0.089 |
hof | -0.086 |
leakage | -0.086 |
stamped | -0.085 |
Token |
|
Token ID | 198 |
Feature activation | -6.50e-02 |
Pos logit contributions | |
ˈ | +0.171 |
Redd | +0.143 |
Wan | +0.139 |
claw | +0.138 |
Neph | +0.133 |
Neg logit contributions | |
fitt | -0.140 |
slic | -0.131 |
leakage | -0.125 |
hof | -0.125 |
stamped | -0.124 |
Token | the |
Token ID | 262 |
Feature activation | +2.72e-02 |
Pos logit contributions | |
fitt | +0.141 |
slic | +0.132 |
hof | +0.129 |
leakage | +0.125 |
stamped | +0.124 |
Neg logit contributions | |
ˈ | -0.198 |
Redd | -0.166 |
Wan | -0.163 |
claw | -0.162 |
Neph | -0.157 |
Token | reference |
Token ID | 4941 |
Feature activation | -5.00e-02 |
Pos logit contributions | |
fitt | +0.056 |
slic | +0.052 |
hof | +0.051 |
leakage | +0.049 |
stamped | +0.048 |
Neg logit contributions | |
ˈ | -0.086 |
Redd | -0.072 |
Wan | -0.071 |
claw | -0.071 |
Neph | -0.069 |
Token | design |
Token ID | 1486 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
ˈ | +0.189 |
Redd | +0.165 |
Wan | +0.163 |
claw | +0.162 |
Neph | +0.159 |
Neg logit contributions | |
fitt | -0.071 |
slic | -0.064 |
hof | -0.062 |
leakage | -0.058 |
stamped | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
fitt | +0.243 |
slic | +0.227 |
hof | +0.220 |
leakage | +0.215 |
stamped | +0.215 |
Neg logit contributions | |
ˈ | -0.317 |
Redd | -0.266 |
Wan | -0.261 |
claw | -0.259 |
Neph | -0.250 |
Token | Equ |
Token ID | 7889 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
fitt | +0.066 |
slic | +0.062 |
hof | +0.059 |
leakage | +0.059 |
stamped | +0.058 |
Neg logit contributions | |
ˈ | -0.074 |
Redd | -0.061 |
Wan | -0.060 |
claw | -0.059 |
Neph | -0.057 |
Token | ipped |
Token ID | 3949 |
Feature activation | +5.05e-01 |
Pos logit contributions | |
fitt | +0.257 |
slic | +0.234 |
hof | +0.221 |
leakage | +0.221 |
stamped | +0.220 |
Neg logit contributions | |
ˈ | -0.493 |
Redd | -0.425 |
Wan | -0.417 |
claw | -0.414 |
Neph | -0.401 |
Token | with |
Token ID | 351 |
Feature activation | +7.06e-02 |
Pos logit contributions | |
fitt | +1.172 |
slic | +1.086 |
stamped | +1.040 |
hof | +1.039 |
leakage | +1.039 |
Neg logit contributions | |
ˈ | -1.506 |
Redd | -1.262 |
Wan | -1.229 |
claw | -1.218 |
Neph | -1.167 |
Token | Un |
Token ID | 791 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
fitt | +0.160 |
slic | +0.149 |
hof | +0.146 |
leakage | +0.142 |
stamped | +0.141 |
Neg logit contributions | |
ˈ | -0.210 |
Redd | -0.176 |
Wan | -0.172 |
claw | -0.171 |
Neph | -0.165 |
Token | locked |
Token ID | 24162 |
Feature activation | +3.78e-02 |
Pos logit contributions | |
ˈ | +0.293 |
Redd | +0.244 |
claw | +0.239 |
Wan | +0.237 |
Neph | +0.220 |
Neg logit contributions | |
fitt | -0.267 |
slic | -0.250 |
leakage | -0.237 |
hof | -0.236 |
stamped | -0.235 |
Token | Digital |
Token ID | 10231 |
Feature activation | +1.57e-02 |
Pos logit contributions | |
fitt | +0.098 |
slic | +0.092 |
hof | +0.089 |
leakage | +0.088 |
stamped | +0.088 |
Neg logit contributions | |
ˈ | -0.102 |
Redd | -0.084 |
Wan | -0.081 |
claw | -0.081 |
Neph | -0.077 |
Token | Power |
Token ID | 13434 |
Feature activation | +3.90e-02 |
Pos logit contributions | |
fitt | +0.046 |
slic | +0.044 |
hof | +0.042 |
leakage | +0.042 |
stamped | +0.042 |
Neg logit contributions | |
ˈ | -0.037 |
Redd | -0.029 |
Wan | -0.028 |
claw | -0.028 |
Neph | -0.026 |
Token | the |
Token ID | 262 |
Feature activation | +2.53e-02 |
Pos logit contributions | |
ˈ | +0.128 |
Redd | +0.107 |
Wan | +0.105 |
claw | +0.104 |
Neph | +0.100 |
Neg logit contributions | |
fitt | -0.097 |
slic | -0.090 |
hof | -0.086 |
leakage | -0.086 |
stamped | -0.085 |
Token | 64 |
Token ID | 5598 |
Feature activation | -8.56e-02 |
Pos logit contributions | |
fitt | +0.058 |
slic | +0.054 |
hof | +0.052 |
leakage | +0.052 |
stamped | +0.052 |
Neg logit contributions | |
ˈ | -0.075 |
Redd | -0.063 |
Wan | -0.062 |
claw | -0.061 |
Neph | -0.059 |
Token | - |
Token ID | 12 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
ˈ | +0.246 |
Redd | +0.205 |
Wan | +0.202 |
claw | +0.200 |
Neph | +0.191 |
Neg logit contributions | |
fitt | -0.205 |
slic | -0.191 |
hof | -0.184 |
leakage | -0.184 |
stamped | -0.181 |
Token | bit |
Token ID | 2545 |
Feature activation | +5.53e-02 |
Pos logit contributions | |
fitt | +0.073 |
slic | +0.067 |
leakage | +0.064 |
hof | +0.064 |
stamped | +0.064 |
Neg logit contributions | |
ˈ | -0.109 |
Redd | -0.093 |
Wan | -0.091 |
claw | -0.090 |
Neph | -0.087 |
Token | Hy |
Token ID | 6707 |
Feature activation | +1.21e-01 |
Pos logit contributions | |
fitt | +0.129 |
slic | +0.120 |
hof | +0.116 |
leakage | +0.115 |
stamped | +0.114 |
Neg logit contributions | |
ˈ | -0.163 |
Redd | -0.136 |
Wan | -0.133 |
claw | -0.132 |
Neph | -0.128 |
Token | rule |
Token ID | 25135 |
Feature activation | +5.03e-01 |
Pos logit contributions | |
fitt | +0.250 |
slic | +0.232 |
hof | +0.220 |
leakage | +0.220 |
stamped | +0.218 |
Neg logit contributions | |
ˈ | -0.391 |
Redd | -0.331 |
Wan | -0.327 |
claw | -0.324 |
Neph | -0.312 |
Token | Fi |
Token ID | 23238 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
fitt | +1.180 |
slic | +1.099 |
hof | +1.056 |
stamped | +1.051 |
leakage | +1.049 |
Neg logit contributions | |
ˈ | -1.477 |
Redd | -1.237 |
Wan | -1.206 |
claw | -1.196 |
Neph | -1.147 |
Token | end |
Token ID | 437 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ˈ | +0.412 |
Redd | +0.343 |
Wan | +0.335 |
claw | +0.334 |
Neph | +0.317 |
Neg logit contributions | |
fitt | -0.333 |
slic | -0.311 |
leakage | -0.298 |
hof | -0.297 |
stamped | -0.295 |
Token | , |
Token ID | 11 |
Feature activation | +2.63e-02 |
Pos logit contributions | |
fitt | +0.350 |
slic | +0.327 |
leakage | +0.314 |
hof | +0.313 |
stamped | +0.311 |
Neg logit contributions | |
ˈ | -0.414 |
Redd | -0.344 |
Wan | -0.338 |
claw | -0.336 |
Neph | -0.321 |
Token | O |
Token ID | 440 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
fitt | +0.058 |
slic | +0.054 |
hof | +0.052 |
leakage | +0.051 |
stamped | +0.051 |
Neg logit contributions | |
ˈ | -0.081 |
Redd | -0.067 |
Wan | -0.067 |
claw | -0.066 |
Neph | -0.064 |
Token | car |
Token ID | 7718 |
Feature activation | -9.41e-02 |
Pos logit contributions | |
fitt | +0.042 |
slic | +0.040 |
leakage | +0.038 |
hof | +0.038 |
stamped | +0.038 |
Neg logit contributions | |
ˈ | -0.040 |
Redd | -0.032 |
Wan | -0.031 |
claw | -0.031 |
Neph | -0.030 |
Token | � |
Token ID | 247 |
Feature activation | +2.92e-02 |
Pos logit contributions | |
ˈ | +0.017 |
Redd | +0.014 |
Wan | +0.013 |
claw | +0.013 |
Neph | +0.012 |
Neg logit contributions | |
fitt | -0.024 |
slic | -0.023 |
hof | -0.022 |
leakage | -0.022 |
stamped | -0.022 |
Token | t |
Token ID | 83 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
fitt | +0.090 |
slic | +0.086 |
leakage | +0.083 |
hof | +0.083 |
stamped | +0.081 |
Neg logit contributions | |
ˈ | -0.066 |
Redd | -0.049 |
Wan | -0.048 |
claw | -0.048 |
Neph | -0.045 |
Token | stopped |
Token ID | 5025 |
Feature activation | +4.64e-02 |
Pos logit contributions | |
fitt | +0.031 |
slic | +0.029 |
hof | +0.027 |
leakage | +0.027 |
stamped | +0.026 |
Neg logit contributions | |
ˈ | -0.046 |
Redd | -0.038 |
claw | -0.038 |
Wan | -0.037 |
Neph | -0.036 |
Token | Sch |
Token ID | 3059 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
fitt | +0.099 |
slic | +0.091 |
hof | +0.086 |
leakage | +0.086 |
stamped | +0.085 |
Neg logit contributions | |
ˈ | -0.146 |
Redd | -0.124 |
Wan | -0.122 |
claw | -0.122 |
Neph | -0.117 |
Token | um |
Token ID | 388 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
fitt | +0.469 |
slic | +0.440 |
hof | +0.424 |
leakage | +0.422 |
stamped | +0.421 |
Neg logit contributions | |
ˈ | -0.497 |
Redd | -0.410 |
Wan | -0.400 |
claw | -0.396 |
Neph | -0.378 |
Token | acher |
Token ID | 3493 |
Feature activation | +4.73e-01 |
Pos logit contributions | |
ˈ | +0.213 |
Redd | +0.183 |
claw | +0.181 |
Wan | +0.180 |
Neph | +0.172 |
Neg logit contributions | |
fitt | -0.100 |
slic | -0.090 |
leakage | -0.084 |
stamped | -0.082 |
hof | -0.082 |
Token | from |
Token ID | 422 |
Feature activation | +6.77e-04 |
Pos logit contributions | |
fitt | +1.364 |
slic | +1.289 |
hof | +1.247 |
leakage | +1.243 |
stamped | +1.242 |
Neg logit contributions | |
ˈ | -1.129 |
Redd | -0.906 |
Wan | -0.879 |
claw | -0.867 |
Neph | -0.824 |
Token | asking |
Token ID | 4737 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
fitt | +0.001 |
slic | +0.001 |
hof | +0.001 |
leakage | +0.001 |
stamped | +0.001 |
Neg logit contributions | |
ˈ | -0.002 |
Redd | -0.002 |
claw | -0.002 |
Wan | -0.002 |
Neph | -0.002 |
Token | .) |
Token ID | 2014 |
Feature activation | -6.87e-02 |
Pos logit contributions | |
fitt | +0.243 |
slic | +0.226 |
hof | +0.217 |
leakage | +0.215 |
stamped | +0.214 |
Neg logit contributions | |
ˈ | -0.334 |
Redd | -0.281 |
Wan | -0.276 |
claw | -0.274 |
Neph | -0.263 |
Token |
|
Token ID | 198 |
Feature activation | -4.87e-02 |
Pos logit contributions | |
ˈ | +0.191 |
Redd | +0.158 |
Wan | +0.155 |
claw | +0.155 |
Neph | +0.149 |
Neg logit contributions | |
fitt | -0.172 |
slic | -0.162 |
leakage | -0.155 |
hof | -0.154 |
stamped | -0.154 |
Token |
|
Token ID | 198 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
ˈ | +0.139 |
Redd | +0.116 |
Wan | +0.113 |
claw | +0.112 |
Neph | +0.108 |
Neg logit contributions | |
fitt | -0.120 |
slic | -0.112 |
leakage | -0.107 |
hof | -0.106 |
stamped | -0.106 |
Token | haunted |
Token ID | 26688 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
ˈ | +0.069 |
Redd | +0.058 |
Wan | +0.057 |
claw | +0.057 |
Neph | +0.055 |
Neg logit contributions | |
fitt | -0.048 |
slic | -0.044 |
hof | -0.043 |
leakage | -0.042 |
stamped | -0.042 |
Token | by |
Token ID | 416 |
Feature activation | -7.55e-02 |
Pos logit contributions | |
ˈ | +0.049 |
Redd | +0.041 |
Wan | +0.041 |
claw | +0.040 |
Neph | +0.039 |
Neg logit contributions | |
fitt | -0.034 |
slic | -0.032 |
hof | -0.030 |
leakage | -0.030 |
stamped | -0.030 |
Token | Joel |
Token ID | 18623 |
Feature activation | +8.08e-02 |
Pos logit contributions | |
ˈ | +0.224 |
Redd | +0.189 |
Wan | +0.184 |
claw | +0.183 |
Neph | +0.176 |
Neg logit contributions | |
fitt | -0.174 |
slic | -0.162 |
hof | -0.156 |
leakage | -0.154 |
stamped | -0.154 |
Token | Sch |
Token ID | 3059 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
fitt | +0.197 |
slic | +0.185 |
hof | +0.177 |
leakage | +0.177 |
stamped | +0.176 |
Neg logit contributions | |
ˈ | -0.229 |
Redd | -0.190 |
Wan | -0.186 |
claw | -0.184 |
Neph | -0.176 |
Token | um |
Token ID | 388 |
Feature activation | -5.02e-02 |
Pos logit contributions | |
fitt | +0.397 |
hof | +0.367 |
slic | +0.366 |
stamped | +0.354 |
leakage | +0.354 |
Neg logit contributions | |
ˈ | -0.458 |
Redd | -0.383 |
Wan | -0.376 |
claw | -0.369 |
Neph | -0.355 |
Token | acher |
Token ID | 3493 |
Feature activation | +4.69e-01 |
Pos logit contributions | |
ˈ | +0.186 |
Redd | +0.162 |
Wan | +0.159 |
claw | +0.158 |
Neph | +0.153 |
Neg logit contributions | |
fitt | -0.079 |
slic | -0.071 |
hof | -0.066 |
leakage | -0.066 |
stamped | -0.066 |
Token | � |
Token ID | 447 |
Feature activation | +9.38e-03 |
Pos logit contributions | |
fitt | +1.265 |
slic | +1.189 |
hof | +1.152 |
stamped | +1.149 |
leakage | +1.146 |
Neg logit contributions | |
ˈ | -1.198 |
Redd | -0.985 |
Wan | -0.959 |
claw | -0.939 |
Neph | -0.901 |
Token | � |
Token ID | 247 |
Feature activation | +3.69e-02 |
Pos logit contributions | |
fitt | +0.028 |
slic | +0.027 |
hof | +0.026 |
leakage | +0.026 |
stamped | +0.026 |
Neg logit contributions | |
ˈ | -0.021 |
Redd | -0.017 |
Wan | -0.016 |
claw | -0.016 |
Neph | -0.015 |
Token | s |
Token ID | 82 |
Feature activation | -9.61e-03 |
Pos logit contributions | |
fitt | +0.093 |
slic | +0.088 |
hof | +0.084 |
leakage | +0.084 |
stamped | +0.084 |
Neg logit contributions | |
ˈ | -0.101 |
Redd | -0.084 |
Wan | -0.081 |
claw | -0.081 |
Neph | -0.077 |
Token | 1997 |
Token ID | 8309 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
ˈ | +0.028 |
Redd | +0.023 |
Wan | +0.023 |
claw | +0.023 |
Neph | +0.022 |
Neg logit contributions | |
fitt | -0.023 |
slic | -0.021 |
hof | -0.021 |
leakage | -0.020 |
stamped | -0.020 |
Token | debacle |
Token ID | 40943 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
fitt | +0.161 |
slic | +0.149 |
hof | +0.144 |
leakage | +0.142 |
stamped | +0.141 |
Neg logit contributions | |
ˈ | -0.198 |
Redd | -0.164 |
Wan | -0.161 |
claw | -0.160 |
Neph | -0.154 |
Token | . |
Token ID | 13 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
ˈ | +0.274 |
Redd | +0.224 |
Wan | +0.219 |
claw | +0.218 |
Neph | +0.208 |
Neg logit contributions | |
fitt | -0.256 |
slic | -0.239 |
hof | -0.231 |
leakage | -0.230 |
stamped | -0.227 |
Token |
|
Token ID | 198 |
Feature activation | +1.91e-02 |
Pos logit contributions | |
fitt | +0.011 |
slic | +0.011 |
leakage | +0.010 |
hof | +0.010 |
stamped | +0.010 |
Neg logit contributions | |
ˈ | -0.012 |
Redd | -0.010 |
Wan | -0.009 |
claw | -0.009 |
Neph | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -6.06e-03 |
Pos logit contributions | |
fitt | +0.046 |
slic | +0.043 |
leakage | +0.041 |
hof | +0.041 |
stamped | +0.040 |
Neg logit contributions | |
ˈ | -0.055 |
Redd | -0.046 |
Wan | -0.045 |
claw | -0.045 |
Neph | -0.043 |
Token | Que |
Token ID | 15681 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ˈ | +0.016 |
Redd | +0.013 |
Wan | +0.013 |
claw | +0.012 |
Neph | +0.012 |
Neg logit contributions | |
fitt | -0.017 |
slic | -0.016 |
leakage | -0.015 |
hof | -0.015 |
stamped | -0.015 |
Token | ens |
Token ID | 641 |
Feature activation | +8.89e-02 |
Pos logit contributions | |
fitt | +0.300 |
slic | +0.282 |
leakage | +0.271 |
hof | +0.270 |
stamped | +0.270 |
Neg logit contributions | |
ˈ | -0.309 |
Redd | -0.254 |
Wan | -0.247 |
claw | -0.246 |
Neph | -0.233 |
Token | land |
Token ID | 1044 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
fitt | +0.150 |
slic | +0.135 |
hof | +0.128 |
leakage | +0.127 |
stamped | +0.126 |
Neg logit contributions | |
ˈ | -0.319 |
Redd | -0.277 |
Wan | -0.272 |
claw | -0.271 |
Neph | -0.262 |
Token | � |
Token ID | 447 |
Feature activation | -5.18e-03 |
Pos logit contributions | |
fitt | +1.093 |
slic | +1.017 |
hof | +0.978 |
leakage | +0.972 |
stamped | +0.968 |
Neg logit contributions | |
ˈ | -1.369 |
Redd | -1.147 |
Wan | -1.120 |
claw | -1.112 |
Neph | -1.067 |
Token | � |
Token ID | 247 |
Feature activation | +3.73e-02 |
Pos logit contributions | |
ˈ | +0.012 |
Redd | +0.009 |
Wan | +0.009 |
claw | +0.009 |
Neph | +0.008 |
Neg logit contributions | |
fitt | -0.016 |
slic | -0.015 |
hof | -0.014 |
leakage | -0.014 |
stamped | -0.014 |
Token | s |
Token ID | 82 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
fitt | +0.088 |
slic | +0.082 |
hof | +0.079 |
leakage | +0.079 |
stamped | +0.078 |
Neg logit contributions | |
ˈ | -0.109 |
Redd | -0.091 |
Wan | -0.089 |
claw | -0.088 |
Neph | -0.084 |
Token | tropical |
Token ID | 19690 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
fitt | +0.035 |
slic | +0.033 |
hof | +0.032 |
leakage | +0.031 |
stamped | +0.031 |
Neg logit contributions | |
ˈ | -0.047 |
Redd | -0.039 |
Wan | -0.039 |
claw | -0.038 |
Neph | -0.037 |
Token | climate |
Token ID | 4258 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
ˈ | +0.036 |
Redd | +0.030 |
Wan | +0.029 |
claw | +0.029 |
Neph | +0.028 |
Neg logit contributions | |
fitt | -0.026 |
slic | -0.024 |
hof | -0.024 |
leakage | -0.023 |
stamped | -0.023 |
Token | place |
Token ID | 1295 |
Feature activation | +9.82e-02 |
Pos logit contributions | |
ˈ | +0.019 |
Redd | +0.016 |
claw | +0.016 |
Wan | +0.016 |
Neph | +0.015 |
Neg logit contributions | |
fitt | -0.013 |
slic | -0.012 |
hof | -0.012 |
leakage | -0.012 |
stamped | -0.012 |
Token | your |
Token ID | 534 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
fitt | +0.206 |
slic | +0.190 |
hof | +0.184 |
leakage | +0.182 |
stamped | +0.181 |
Neg logit contributions | |
ˈ | -0.311 |
Redd | -0.263 |
Wan | -0.259 |
claw | -0.257 |
Neph | -0.249 |
Token | seal |
Token ID | 13810 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
fitt | +0.085 |
slic | +0.078 |
hof | +0.076 |
leakage | +0.074 |
stamped | +0.074 |
Neg logit contributions | |
ˈ | -0.127 |
Redd | -0.107 |
Wan | -0.105 |
claw | -0.105 |
Neph | -0.101 |
Token | here |
Token ID | 994 |
Feature activation | -3.18e-02 |
Pos logit contributions | |
ˈ | +0.181 |
Redd | +0.150 |
claw | +0.146 |
Wan | +0.146 |
Neph | +0.140 |
Neg logit contributions | |
fitt | -0.158 |
slic | -0.147 |
hof | -0.143 |
leakage | -0.142 |
stamped | -0.141 |
Token | ... |
Token ID | 986 |
Feature activation | +4.99e-02 |
Pos logit contributions | |
ˈ | +0.096 |
Redd | +0.080 |
Wan | +0.078 |
claw | +0.078 |
Neph | +0.075 |
Neg logit contributions | |
fitt | -0.072 |
slic | -0.067 |
hof | -0.064 |
leakage | -0.064 |
stamped | -0.063 |
Token | huh |
Token ID | 24926 |
Feature activation | +4.66e-01 |
Pos logit contributions | |
fitt | +0.137 |
slic | +0.129 |
hof | +0.124 |
leakage | +0.124 |
stamped | +0.123 |
Neg logit contributions | |
ˈ | -0.127 |
Redd | -0.103 |
Wan | -0.100 |
claw | -0.100 |
Neph | -0.094 |
Token | ? |
Token ID | 30 |
Feature activation | -2.89e-02 |
Pos logit contributions | |
fitt | +1.026 |
slic | +0.951 |
hof | +0.911 |
leakage | +0.907 |
stamped | +0.904 |
Neg logit contributions | |
ˈ | -1.432 |
Redd | -1.211 |
Wan | -1.184 |
claw | -1.175 |
Neph | -1.130 |
Token | � |
Token ID | 447 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
ˈ | +0.065 |
Redd | +0.051 |
Wan | +0.050 |
claw | +0.049 |
Neph | +0.047 |
Neg logit contributions | |
fitt | -0.087 |
slic | -0.083 |
hof | -0.080 |
leakage | -0.080 |
stamped | -0.080 |
Token | � |
Token ID | 251 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
fitt | +0.435 |
slic | +0.411 |
hof | +0.398 |
leakage | +0.396 |
stamped | +0.395 |
Neg logit contributions | |
ˈ | -0.371 |
Redd | -0.298 |
Wan | -0.289 |
claw | -0.286 |
Neph | -0.271 |
Token | The |
Token ID | 383 |
Feature activation | -5.61e-02 |
Pos logit contributions | |
fitt | +0.194 |
slic | +0.183 |
leakage | +0.176 |
hof | +0.176 |
stamped | +0.174 |
Neg logit contributions | |
ˈ | -0.192 |
Redd | -0.157 |
Wan | -0.153 |
claw | -0.152 |
Neph | -0.145 |
Token | Lieutenant |
Token ID | 21586 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
ˈ | +0.175 |
Redd | +0.148 |
Wan | +0.145 |
claw | +0.144 |
Neph | +0.140 |
Neg logit contributions | |
fitt | -0.120 |
slic | -0.111 |
hof | -0.108 |
leakage | -0.106 |
stamped | -0.105 |
Token | not |
Token ID | 407 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
ˈ | +0.000 |
Redd | +0.000 |
Wan | +0.000 |
claw | +0.000 |
Neph | +0.000 |
Neg logit contributions | |
fitt | -0.000 |
slic | -0.000 |
leakage | -0.000 |
hof | -0.000 |
stamped | -0.000 |
Token | clear |
Token ID | 1598 |
Feature activation | +8.78e-02 |
Pos logit contributions | |
fitt | +0.076 |
slic | +0.070 |
hof | +0.067 |
leakage | +0.067 |
stamped | +0.066 |
Neg logit contributions | |
ˈ | -0.109 |
Redd | -0.092 |
Wan | -0.091 |
claw | -0.090 |
Neph | -0.087 |
Token | yet |
Token ID | 1865 |
Feature activation | +9.05e-02 |
Pos logit contributions | |
fitt | +0.199 |
slic | +0.185 |
hof | +0.177 |
leakage | +0.176 |
stamped | +0.175 |
Neg logit contributions | |
ˈ | -0.264 |
Redd | -0.222 |
Wan | -0.217 |
claw | -0.216 |
Neph | -0.208 |
Token | how |
Token ID | 703 |
Feature activation | +2.19e-02 |
Pos logit contributions | |
fitt | +0.208 |
slic | +0.193 |
hof | +0.185 |
leakage | +0.184 |
stamped | +0.183 |
Neg logit contributions | |
ˈ | -0.271 |
Redd | -0.226 |
Wan | -0.221 |
claw | -0.220 |
Neph | -0.211 |
Token | Tel |
Token ID | 12088 |
Feature activation | -3.92e-03 |
Pos logit contributions | |
fitt | +0.045 |
slic | +0.041 |
hof | +0.039 |
stamped | +0.039 |
leakage | +0.039 |
Neg logit contributions | |
ˈ | -0.071 |
Redd | -0.059 |
Wan | -0.059 |
claw | -0.059 |
Neph | -0.056 |
Token | stra |
Token ID | 12044 |
Feature activation | +4.60e-01 |
Pos logit contributions | |
ˈ | +0.012 |
Redd | +0.010 |
claw | +0.010 |
Wan | +0.010 |
Neph | +0.010 |
Neg logit contributions | |
fitt | -0.008 |
slic | -0.008 |
leakage | -0.007 |
stamped | -0.007 |
hof | -0.007 |
Token | � |
Token ID | 447 |
Feature activation | -8.62e-04 |
Pos logit contributions | |
fitt | +1.014 |
slic | +0.940 |
hof | +0.901 |
leakage | +0.896 |
stamped | +0.893 |
Neg logit contributions | |
ˈ | -1.415 |
Redd | -1.195 |
Wan | -1.169 |
claw | -1.161 |
Neph | -1.116 |
Token | � |
Token ID | 247 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
ˈ | +0.002 |
Redd | +0.002 |
Wan | +0.002 |
claw | +0.001 |
Neph | +0.001 |
Neg logit contributions | |
fitt | -0.003 |
slic | -0.002 |
hof | -0.002 |
leakage | -0.002 |
stamped | -0.002 |
Token | s |
Token ID | 82 |
Feature activation | -6.45e-02 |
Pos logit contributions | |
ˈ | +0.090 |
Redd | +0.072 |
claw | +0.071 |
Wan | +0.071 |
Neph | +0.067 |
Neg logit contributions | |
fitt | -0.093 |
slic | -0.088 |
leakage | -0.084 |
hof | -0.084 |
stamped | -0.083 |
Token | proposal |
Token ID | 6961 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
ˈ | +0.211 |
Redd | +0.179 |
claw | +0.176 |
Wan | +0.176 |
Neph | +0.170 |
Neg logit contributions | |
fitt | -0.128 |
slic | -0.118 |
hof | -0.114 |
stamped | -0.111 |
leakage | -0.109 |
Token | to |
Token ID | 284 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
fitt | +0.054 |
slic | +0.050 |
hof | +0.048 |
leakage | +0.047 |
stamped | +0.047 |
Neg logit contributions | |
ˈ | -0.077 |
Redd | -0.064 |
claw | -0.063 |
Wan | -0.063 |
Neph | -0.060 |
Token | weekend |
Token ID | 5041 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
fitt | +0.054 |
slic | +0.051 |
hof | +0.049 |
leakage | +0.049 |
stamped | +0.048 |
Neg logit contributions | |
ˈ | -0.066 |
Redd | -0.055 |
Wan | -0.054 |
claw | -0.053 |
Neph | -0.051 |
Token | . |
Token ID | 13 |
Feature activation | +6.18e-03 |
Pos logit contributions | |
ˈ | +0.044 |
Redd | +0.036 |
Wan | +0.035 |
claw | +0.035 |
Neph | +0.033 |
Neg logit contributions | |
fitt | -0.043 |
slic | -0.040 |
hof | -0.039 |
leakage | -0.039 |
stamped | -0.039 |
Token | Michael |
Token ID | 3899 |
Feature activation | +4.35e-02 |
Pos logit contributions | |
fitt | +0.015 |
slic | +0.014 |
leakage | +0.014 |
hof | +0.014 |
stamped | +0.014 |
Neg logit contributions | |
ˈ | -0.017 |
Redd | -0.015 |
Wan | -0.014 |
claw | -0.014 |
Neph | -0.014 |
Token | Sch |
Token ID | 3059 |
Feature activation | +2.33e-01 |
Pos logit contributions | |
fitt | +0.107 |
slic | +0.100 |
stamped | +0.096 |
hof | +0.096 |
leakage | +0.095 |
Neg logit contributions | |
ˈ | -0.121 |
Redd | -0.101 |
claw | -0.098 |
Wan | -0.098 |
Neph | -0.095 |
Token | um |
Token ID | 388 |
Feature activation | +9.61e-03 |
Pos logit contributions | |
fitt | +0.578 |
slic | +0.542 |
hof | +0.530 |
leakage | +0.522 |
stamped | +0.521 |
Neg logit contributions | |
ˈ | -0.644 |
Redd | -0.535 |
Wan | -0.522 |
claw | -0.513 |
Neph | -0.493 |
Token | acher |
Token ID | 3493 |
Feature activation | +4.57e-01 |
Pos logit contributions | |
fitt | +0.015 |
slic | +0.014 |
hof | +0.013 |
leakage | +0.013 |
stamped | +0.013 |
Neg logit contributions | |
ˈ | -0.036 |
Redd | -0.031 |
Wan | -0.030 |
claw | -0.030 |
Neph | -0.029 |
Token | 's |
Token ID | 338 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
fitt | +1.001 |
slic | +0.926 |
hof | +0.895 |
leakage | +0.890 |
stamped | +0.875 |
Neg logit contributions | |
ˈ | -1.409 |
Redd | -1.183 |
Wan | -1.159 |
claw | -1.159 |
Neph | -1.116 |
Token | Mercedes |
Token ID | 21279 |
Feature activation | +6.75e-02 |
Pos logit contributions | |
fitt | +0.035 |
slic | +0.032 |
hof | +0.032 |
leakage | +0.031 |
stamped | +0.031 |
Neg logit contributions | |
ˈ | -0.052 |
Redd | -0.044 |
Wan | -0.043 |
claw | -0.043 |
Neph | -0.042 |
Token | was |
Token ID | 373 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
fitt | +0.137 |
slic | +0.124 |
hof | +0.122 |
leakage | +0.119 |
stamped | +0.119 |
Neg logit contributions | |
ˈ | -0.216 |
Redd | -0.184 |
claw | -0.181 |
Wan | -0.181 |
Neph | -0.176 |
Token | third |
Token ID | 2368 |
Feature activation | +7.29e-03 |
Pos logit contributions | |
fitt | +0.052 |
slic | +0.048 |
hof | +0.047 |
leakage | +0.047 |
stamped | +0.046 |
Neg logit contributions | |
ˈ | -0.078 |
Redd | -0.067 |
Wan | -0.064 |
claw | -0.064 |
Neph | -0.062 |
Token | ahead |
Token ID | 4058 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
fitt | +0.018 |
slic | +0.017 |
hof | +0.016 |
leakage | +0.016 |
stamped | +0.016 |
Neg logit contributions | |
ˈ | -0.020 |
Redd | -0.016 |
claw | -0.016 |
Wan | -0.016 |
Neph | -0.016 |
Token | , |
Token ID | 11 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
ˈ | +0.179 |
Redd | +0.150 |
Wan | +0.147 |
claw | +0.146 |
Neph | +0.140 |
Neg logit contributions | |
fitt | -0.137 |
slic | -0.128 |
hof | -0.123 |
leakage | -0.122 |
stamped | -0.121 |
Token | and |
Token ID | 290 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
fitt | +0.037 |
slic | +0.034 |
hof | +0.033 |
leakage | +0.033 |
stamped | +0.033 |
Neg logit contributions | |
ˈ | -0.053 |
Redd | -0.045 |
Wan | -0.044 |
claw | -0.044 |
Neph | -0.042 |
Token | that |
Token ID | 326 |
Feature activation | +6.23e-03 |
Pos logit contributions | |
fitt | +0.067 |
slic | +0.062 |
hof | +0.060 |
leakage | +0.059 |
stamped | +0.059 |
Neg logit contributions | |
ˈ | -0.088 |
Redd | -0.074 |
Wan | -0.073 |
claw | -0.072 |
Neph | -0.070 |
Token | the |
Token ID | 262 |
Feature activation | +3.49e-02 |
Pos logit contributions | |
fitt | +0.016 |
slic | +0.015 |
hof | +0.015 |
leakage | +0.014 |
stamped | +0.014 |
Neg logit contributions | |
ˈ | -0.017 |
Redd | -0.014 |
Wan | -0.013 |
claw | -0.013 |
Neph | -0.013 |
Token | Moon |
Token ID | 6869 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
fitt | +0.086 |
slic | +0.081 |
hof | +0.078 |
leakage | +0.078 |
stamped | +0.077 |
Neg logit contributions | |
ˈ | -0.097 |
Redd | -0.081 |
Wan | -0.079 |
claw | -0.078 |
Neph | -0.075 |
Token | landing |
Token ID | 9581 |
Feature activation | +4.50e-01 |
Pos logit contributions | |
fitt | +0.031 |
slic | +0.028 |
hof | +0.027 |
leakage | +0.027 |
stamped | +0.027 |
Neg logit contributions | |
ˈ | -0.049 |
Redd | -0.041 |
claw | -0.041 |
Wan | -0.041 |
Neph | -0.040 |
Token | was |
Token ID | 373 |
Feature activation | -8.08e-04 |
Pos logit contributions | |
fitt | +0.915 |
slic | +0.843 |
hof | +0.804 |
leakage | +0.799 |
stamped | +0.793 |
Neg logit contributions | |
ˈ | -1.458 |
Redd | -1.241 |
Wan | -1.217 |
claw | -1.210 |
Neph | -1.169 |
Token | fake |
Token ID | 8390 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
ˈ | +0.003 |
Redd | +0.002 |
Wan | +0.002 |
claw | +0.002 |
Neph | +0.002 |
Neg logit contributions | |
fitt | -0.002 |
slic | -0.001 |
hof | -0.001 |
leakage | -0.001 |
stamped | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -6.67e-04 |
Pos logit contributions | |
ˈ | +0.476 |
Redd | +0.400 |
Wan | +0.391 |
claw | +0.387 |
Neph | +0.373 |
Neg logit contributions | |
fitt | -0.379 |
slic | -0.353 |
hof | -0.339 |
leakage | -0.336 |
stamped | -0.334 |
Token | Flynn |
Token ID | 14654 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ˈ | +0.002 |
Redd | +0.002 |
Wan | +0.002 |
claw | +0.002 |
Neph | +0.001 |
Neg logit contributions | |
fitt | -0.002 |
slic | -0.002 |
leakage | -0.001 |
hof | -0.001 |
stamped | -0.001 |
Token | � |
Token ID | 447 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
fitt | +0.257 |
slic | +0.239 |
hof | +0.229 |
leakage | +0.228 |
stamped | +0.226 |
Neg logit contributions | |
ˈ | -0.351 |
Redd | -0.295 |
Wan | -0.290 |
claw | -0.288 |
Neph | -0.277 |
Token | ; |
Token ID | 2162 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
ˈ | +0.076 |
Redd | +0.064 |
Wan | +0.062 |
claw | +0.061 |
Neph | +0.059 |
Neg logit contributions | |
fitt | -0.066 |
slic | -0.062 |
hof | -0.059 |
leakage | -0.059 |
stamped | -0.059 |
Token | } |
Token ID | 1782 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
fitt | +0.281 |
slic | +0.258 |
leakage | +0.244 |
hof | +0.244 |
stamped | +0.243 |
Neg logit contributions | |
ˈ | -0.487 |
Redd | -0.419 |
Wan | -0.411 |
claw | -0.407 |
Neph | -0.393 |
Token |
|
Token ID | 198 |
Feature activation | -6.87e-02 |
Pos logit contributions | |
fitt | +0.541 |
slic | +0.499 |
hof | +0.480 |
leakage | +0.473 |
stamped | +0.473 |
Neg logit contributions | |
ˈ | -0.800 |
Redd | -0.672 |
Wan | -0.660 |
claw | -0.656 |
Neph | -0.633 |
Token |
|
Token ID | 198 |
Feature activation | -7.77e-02 |
Pos logit contributions | |
ˈ | +0.199 |
Redd | +0.166 |
Wan | +0.162 |
claw | +0.161 |
Neph | +0.154 |
Neg logit contributions | |
fitt | -0.165 |
slic | -0.154 |
leakage | -0.147 |
hof | -0.147 |
stamped | -0.146 |
Token | Ass |
Token ID | 8021 |
Feature activation | +6.25e-02 |
Pos logit contributions | |
ˈ | +0.197 |
Redd | +0.161 |
Wan | +0.156 |
claw | +0.153 |
Neph | +0.142 |
Neg logit contributions | |
fitt | -0.216 |
slic | -0.203 |
leakage | -0.196 |
stamped | -0.196 |
hof | -0.195 |
Token | igning |
Token ID | 38944 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
fitt | +0.175 |
slic | +0.165 |
hof | +0.159 |
leakage | +0.159 |
stamped | +0.159 |
Neg logit contributions | |
ˈ | -0.155 |
Redd | -0.125 |
Wan | -0.121 |
claw | -0.121 |
Neph | -0.114 |
Token | D |
Token ID | 360 |
Feature activation | +4.86e-02 |
Pos logit contributions | |
fitt | +1.060 |
slic | +0.987 |
hof | +0.953 |
leakage | +0.945 |
stamped | +0.944 |
Neg logit contributions | |
ˈ | -1.303 |
Redd | -1.088 |
Wan | -1.061 |
claw | -1.053 |
Neph | -1.012 |
Token | ensity |
Token ID | 6377 |
Feature activation | +2.38e-03 |
Pos logit contributions | |
fitt | +0.134 |
slic | +0.126 |
hof | +0.123 |
leakage | +0.122 |
stamped | +0.122 |
Neg logit contributions | |
ˈ | -0.122 |
Redd | -0.100 |
Wan | -0.096 |
claw | -0.095 |
Neph | -0.091 |
Token | to |
Token ID | 284 |
Feature activation | +4.34e-02 |
Pos logit contributions | |
fitt | +0.006 |
slic | +0.006 |
hof | +0.005 |
leakage | +0.005 |
stamped | +0.005 |
Neg logit contributions | |
ˈ | -0.007 |
Redd | -0.006 |
Wan | -0.005 |
claw | -0.005 |
Neph | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +9.66e-03 |
Pos logit contributions | |
fitt | +0.107 |
slic | +0.100 |
hof | +0.097 |
leakage | +0.096 |
stamped | +0.096 |
Neg logit contributions | |
ˈ | -0.122 |
Redd | -0.101 |
Wan | -0.098 |
claw | -0.097 |
Neph | -0.094 |
Token | Grid |
Token ID | 24846 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
fitt | +0.024 |
slic | +0.023 |
hof | +0.022 |
leakage | +0.022 |
stamped | +0.022 |
Neg logit contributions | |
ˈ | -0.027 |
Redd | -0.022 |
Wan | -0.022 |
claw | -0.021 |
Neph | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | +8.54e-02 |
Pos logit contributions | |
fitt | +0.253 |
slic | +0.236 |
leakage | +0.226 |
hof | +0.225 |
stamped | +0.224 |
Neg logit contributions | |
ˈ | -0.311 |
Redd | -0.260 |
Wan | -0.253 |
claw | -0.252 |
Neph | -0.241 |
Token | re |
Token ID | 260 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
fitt | +0.226 |
slic | +0.212 |
leakage | +0.204 |
hof | +0.204 |
stamped | +0.204 |
Neg logit contributions | |
ˈ | -0.226 |
Redd | -0.185 |
Wan | -0.180 |
claw | -0.178 |
Neph | -0.170 |
Token | i |
Token ID | 72 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
fitt | +0.151 |
slic | +0.141 |
leakage | +0.136 |
hof | +0.136 |
stamped | +0.135 |
Neg logit contributions | |
ˈ | -0.171 |
Redd | -0.142 |
Wan | -0.138 |
claw | -0.137 |
Neph | -0.131 |
Token | Profile |
Token ID | 13118 |
Feature activation | +1.57e-01 |
Pos logit contributions | |
fitt | +0.368 |
slic | +0.345 |
hof | +0.332 |
leakage | +0.332 |
stamped | +0.331 |
Neg logit contributions | |
ˈ | -0.382 |
Redd | -0.314 |
Wan | -0.307 |
claw | -0.304 |
Neph | -0.289 |
Token | Blog |
Token ID | 14001 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
fitt | +0.487 |
slic | +0.461 |
hof | +0.447 |
stamped | +0.446 |
leakage | +0.446 |
Neg logit contributions | |
ˈ | -0.340 |
Redd | -0.268 |
Wan | -0.258 |
claw | -0.255 |
Neph | -0.239 |
Token | Joined |
Token ID | 16709 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
fitt | +1.048 |
slic | +0.999 |
hof | +0.974 |
leakage | +0.971 |
stamped | +0.970 |
Neg logit contributions | |
ˈ | -0.539 |
Redd | -0.397 |
Wan | -0.379 |
claw | -0.373 |
Neph | -0.344 |
Token | October |
Token ID | 3267 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
fitt | +1.141 |
slic | +1.068 |
hof | +1.029 |
leakage | +1.025 |
stamped | +1.016 |
Neg logit contributions | |
ˈ | -1.219 |
Redd | -1.003 |
Wan | -0.983 |
claw | -0.972 |
Neph | -0.933 |
Token | 2002 |
Token ID | 6244 |
Feature activation | +8.76e-03 |
Pos logit contributions | |
fitt | +0.617 |
slic | +0.579 |
hof | +0.556 |
leakage | +0.555 |
stamped | +0.552 |
Neg logit contributions | |
ˈ | -0.655 |
Redd | -0.539 |
Wan | -0.527 |
claw | -0.523 |
Neph | -0.501 |
Token | United |
Token ID | 1578 |
Feature activation | +6.16e-02 |
Pos logit contributions | |
fitt | +0.023 |
slic | +0.022 |
hof | +0.021 |
leakage | +0.021 |
stamped | +0.021 |
Neg logit contributions | |
ˈ | -0.023 |
Redd | -0.019 |
Wan | -0.018 |
claw | -0.018 |
Neph | -0.018 |
Token | States |
Token ID | 1829 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
fitt | +0.159 |
slic | +0.149 |
hof | +0.145 |
leakage | +0.143 |
stamped | +0.143 |
Neg logit contributions | |
ˈ | -0.167 |
Redd | -0.137 |
Wan | -0.133 |
claw | -0.132 |
Neph | -0.125 |
Token | 3 |
Token ID | 513 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fitt | +0.434 |
slic | +0.406 |
hof | +0.389 |
leakage | +0.388 |
stamped | +0.386 |
Neg logit contributions | |
ˈ | -0.491 |
Redd | -0.407 |
Wan | -0.397 |
claw | -0.395 |
Neph | -0.379 |
Token | button |
Token ID | 4936 |
Feature activation | +7.59e-02 |
Pos logit contributions | |
fitt | +0.212 |
slic | +0.201 |
hof | +0.194 |
leakage | +0.190 |
stamped | +0.190 |
Neg logit contributions | |
ˈ | -0.278 |
Redd | -0.234 |
Wan | -0.229 |
claw | -0.226 |
Neph | -0.218 |
Token | and |
Token ID | 290 |
Feature activation | +8.26e-02 |
Pos logit contributions | |
fitt | +0.174 |
slic | +0.163 |
hof | +0.156 |
leakage | +0.155 |
stamped | +0.154 |
Neg logit contributions | |
ˈ | -0.224 |
Redd | -0.189 |
Wan | -0.184 |
claw | -0.183 |
Neph | -0.175 |
Token | the |
Token ID | 262 |
Feature activation | +8.77e-02 |
Pos logit contributions | |
fitt | +0.173 |
slic | +0.160 |
hof | +0.155 |
leakage | +0.152 |
stamped | +0.152 |
Neg logit contributions | |
ˈ | -0.261 |
Redd | -0.221 |
Wan | -0.217 |
claw | -0.216 |
Neph | -0.207 |
Token | other |
Token ID | 584 |
Feature activation | +6.41e-02 |
Pos logit contributions | |
fitt | +0.174 |
slic | +0.161 |
hof | +0.155 |
leakage | +0.152 |
stamped | +0.152 |
Neg logit contributions | |
ˈ | -0.286 |
Redd | -0.244 |
Wan | -0.239 |
claw | -0.238 |
Neph | -0.229 |
Token | cigarette |
Token ID | 17779 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
fitt | +0.129 |
slic | +0.120 |
hof | +0.115 |
leakage | +0.113 |
stamped | +0.113 |
Neg logit contributions | |
ˈ | -0.208 |
Redd | -0.178 |
Wan | -0.174 |
claw | -0.173 |
Neph | -0.166 |
Token | lighter |
Token ID | 14871 |
Feature activation | +4.46e-01 |
Pos logit contributions | |
fitt | +0.178 |
slic | +0.161 |
hof | +0.152 |
leakage | +0.151 |
stamped | +0.150 |
Neg logit contributions | |
ˈ | -0.381 |
Redd | -0.330 |
Wan | -0.324 |
claw | -0.322 |
Neph | -0.312 |
Token | And |
Token ID | 1870 |
Feature activation | +9.70e-02 |
Pos logit contributions | |
fitt | +0.911 |
slic | +0.841 |
hof | +0.803 |
leakage | +0.797 |
stamped | +0.795 |
Neg logit contributions | |
ˈ | -1.440 |
Redd | -1.228 |
Wan | -1.203 |
claw | -1.196 |
Neph | -1.150 |
Token | here |
Token ID | 994 |
Feature activation | +4.15e-02 |
Pos logit contributions | |
fitt | +0.198 |
slic | +0.183 |
hof | +0.175 |
leakage | +0.174 |
stamped | +0.173 |
Neg logit contributions | |
ˈ | -0.310 |
Redd | -0.264 |
Wan | -0.260 |
claw | -0.260 |
Neph | -0.248 |
Token | is |
Token ID | 318 |
Feature activation | +2.13e-02 |
Pos logit contributions | |
fitt | +0.089 |
slic | +0.082 |
hof | +0.079 |
leakage | +0.078 |
stamped | +0.078 |
Neg logit contributions | |
ˈ | -0.130 |
Redd | -0.110 |
Wan | -0.108 |
claw | -0.107 |
Neph | -0.103 |
Token | the |
Token ID | 262 |
Feature activation | +9.83e-02 |
Pos logit contributions | |
fitt | +0.045 |
slic | +0.042 |
hof | +0.040 |
leakage | +0.040 |
stamped | +0.040 |
Neg logit contributions | |
ˈ | -0.067 |
Redd | -0.057 |
Wan | -0.056 |
claw | -0.055 |
Neph | -0.053 |
Token | fl |
Token ID | 781 |
Feature activation | +2.65e-01 |
Pos logit contributions | |
fitt | +0.189 |
slic | +0.176 |
hof | +0.170 |
leakage | +0.164 |
stamped | +0.164 |
Neg logit contributions | |
ˈ | -0.324 |
Redd | -0.278 |
Wan | -0.272 |
claw | -0.271 |
Neph | -0.262 |
Token | it |
Token ID | 340 |
Feature activation | -4.31e-02 |
Pos logit contributions | |
ˈ | +0.187 |
Redd | +0.153 |
Wan | +0.149 |
claw | +0.148 |
Neph | +0.141 |
Neg logit contributions | |
fitt | -0.187 |
slic | -0.176 |
hof | -0.170 |
leakage | -0.169 |
stamped | -0.169 |
Token | is |
Token ID | 318 |
Feature activation | -5.94e-02 |
Pos logit contributions | |
ˈ | +0.134 |
Redd | +0.113 |
Wan | +0.110 |
claw | +0.110 |
Neph | +0.105 |
Neg logit contributions | |
fitt | -0.094 |
slic | -0.087 |
hof | -0.083 |
leakage | -0.083 |
stamped | -0.083 |
Token | , |
Token ID | 11 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
ˈ | +0.167 |
Redd | +0.138 |
Wan | +0.135 |
claw | +0.134 |
Neph | +0.128 |
Neg logit contributions | |
fitt | -0.146 |
slic | -0.137 |
hof | -0.131 |
leakage | -0.131 |
stamped | -0.130 |
Token | without |
Token ID | 1231 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
ˈ | +0.080 |
Redd | +0.067 |
claw | +0.066 |
Wan | +0.066 |
Neph | +0.063 |
Neg logit contributions | |
fitt | -0.060 |
slic | -0.056 |
hof | -0.054 |
leakage | -0.053 |
stamped | -0.053 |
Token | further |
Token ID | 2252 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ˈ | +0.189 |
Redd | +0.161 |
Wan | +0.158 |
claw | +0.157 |
Neph | +0.151 |
Neg logit contributions | |
fitt | -0.128 |
slic | -0.119 |
hof | -0.114 |
leakage | -0.113 |
stamped | -0.112 |
Token | ado |
Token ID | 50129 |
Feature activation | +4.42e-01 |
Pos logit contributions | |
ˈ | +0.382 |
Redd | +0.312 |
Wan | +0.303 |
claw | +0.301 |
Neph | +0.287 |
Neg logit contributions | |
fitt | -0.396 |
slic | -0.373 |
hof | -0.360 |
leakage | -0.357 |
stamped | -0.357 |
Token | : |
Token ID | 25 |
Feature activation | -6.28e-02 |
Pos logit contributions | |
fitt | +1.052 |
slic | +0.979 |
hof | +0.941 |
stamped | +0.937 |
leakage | +0.936 |
Neg logit contributions | |
ˈ | -1.280 |
Redd | -1.074 |
Wan | -1.052 |
claw | -1.035 |
Neph | -0.997 |
Token | one |
Token ID | 530 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
ˈ | +0.182 |
Redd | +0.152 |
Wan | +0.149 |
claw | +0.148 |
Neph | +0.142 |
Neg logit contributions | |
fitt | -0.149 |
slic | -0.139 |
hof | -0.133 |
leakage | -0.132 |
stamped | -0.132 |
Token | man |
Token ID | 582 |
Feature activation | -6.43e-02 |
Pos logit contributions | |
fitt | +0.038 |
slic | +0.035 |
hof | +0.034 |
leakage | +0.034 |
stamped | +0.034 |
Neg logit contributions | |
ˈ | -0.040 |
Redd | -0.033 |
Wan | -0.032 |
claw | -0.032 |
Neph | -0.030 |
Token | � |
Token ID | 447 |
Feature activation | +5.95e-02 |
Pos logit contributions | |
ˈ | +0.187 |
Redd | +0.156 |
Wan | +0.152 |
claw | +0.152 |
Neph | +0.144 |
Neg logit contributions | |
fitt | -0.152 |
slic | -0.141 |
hof | -0.137 |
leakage | -0.137 |
stamped | -0.134 |
Token | � |
Token ID | 247 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
fitt | +0.179 |
slic | +0.170 |
hof | +0.164 |
leakage | +0.163 |
stamped | +0.163 |
Neg logit contributions | |
ˈ | -0.136 |
Redd | -0.107 |
Wan | -0.103 |
claw | -0.103 |
Neph | -0.097 |
Token | TB |
Token ID | 22737 |
Feature activation | +5.02e-02 |
Pos logit contributions | |
fitt | +0.043 |
slic | +0.041 |
leakage | +0.039 |
hof | +0.039 |
stamped | +0.039 |
Neg logit contributions | |
ˈ | -0.043 |
Redd | -0.035 |
Wan | -0.034 |
claw | -0.034 |
Neph | -0.032 |
Token | one |
Token ID | 505 |
Feature activation | +7.19e-02 |
Pos logit contributions | |
fitt | +0.130 |
slic | +0.122 |
hof | +0.117 |
leakage | +0.117 |
stamped | +0.117 |
Neg logit contributions | |
ˈ | -0.135 |
Redd | -0.111 |
Wan | -0.109 |
claw | -0.108 |
Neph | -0.102 |
Token | - |
Token ID | 12 |
Feature activation | +5.95e-02 |
Pos logit contributions | |
fitt | +0.195 |
slic | +0.183 |
hof | +0.177 |
leakage | +0.177 |
stamped | +0.176 |
Neg logit contributions | |
ˈ | -0.185 |
Redd | -0.151 |
Wan | -0.147 |
claw | -0.146 |
Neph | -0.138 |
Token | Profile |
Token ID | 13118 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
fitt | +0.161 |
slic | +0.151 |
hof | +0.146 |
leakage | +0.146 |
stamped | +0.145 |
Neg logit contributions | |
ˈ | -0.153 |
Redd | -0.125 |
Wan | -0.122 |
claw | -0.121 |
Neph | -0.114 |
Token | Blog |
Token ID | 14001 |
Feature activation | +3.43e-01 |
Pos logit contributions | |
fitt | +0.394 |
slic | +0.372 |
hof | +0.361 |
stamped | +0.360 |
leakage | +0.360 |
Neg logit contributions | |
ˈ | -0.299 |
Redd | -0.240 |
Wan | -0.230 |
claw | -0.228 |
Neph | -0.214 |
Token | Joined |
Token ID | 16709 |
Feature activation | +4.42e-01 |
Pos logit contributions | |
fitt | +1.200 |
slic | +1.145 |
hof | +1.115 |
leakage | +1.112 |
stamped | +1.110 |
Neg logit contributions | |
ˈ | -0.611 |
Redd | -0.447 |
Wan | -0.428 |
claw | -0.421 |
Neph | -0.388 |
Token | November |
Token ID | 3389 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
fitt | +1.121 |
slic | +1.049 |
hof | +1.010 |
leakage | +1.006 |
stamped | +1.001 |
Neg logit contributions | |
ˈ | -1.216 |
Redd | -1.003 |
Wan | -0.980 |
claw | -0.971 |
Neph | -0.930 |
Token | 2010 |
Token ID | 3050 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
fitt | +0.497 |
slic | +0.466 |
leakage | +0.447 |
hof | +0.446 |
stamped | +0.443 |
Neg logit contributions | |
ˈ | -0.519 |
Redd | -0.426 |
Wan | -0.417 |
claw | -0.415 |
Neph | -0.397 |
Token | United |
Token ID | 1578 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
fitt | +0.462 |
slic | +0.434 |
hof | +0.418 |
leakage | +0.417 |
stamped | +0.416 |
Neg logit contributions | |
ˈ | -0.460 |
Redd | -0.376 |
Wan | -0.367 |
claw | -0.363 |
Neph | -0.346 |
Token | States |
Token ID | 1829 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
fitt | +0.066 |
slic | +0.062 |
hof | +0.060 |
leakage | +0.059 |
stamped | +0.059 |
Neg logit contributions | |
ˈ | -0.068 |
Redd | -0.056 |
Wan | -0.054 |
claw | -0.054 |
Neph | -0.051 |
Token | 21 |
Token ID | 2310 |
Feature activation | -1.37e-02 |
Pos logit contributions | |
fitt | +0.459 |
slic | +0.429 |
hof | +0.412 |
leakage | +0.410 |
stamped | +0.408 |
Neg logit contributions | |
ˈ | -0.516 |
Redd | -0.428 |
Wan | -0.418 |
claw | -0.415 |
Neph | -0.399 |
Token | now |
Token ID | 783 |
Feature activation | +3.18e-02 |
Pos logit contributions | |
ˈ | +0.034 |
Redd | +0.028 |
Wan | +0.028 |
claw | +0.028 |
Neph | +0.027 |
Neg logit contributions | |
fitt | -0.021 |
slic | -0.019 |
hof | -0.019 |
leakage | -0.018 |
stamped | -0.018 |
Token | changed |
Token ID | 3421 |
Feature activation | +9.86e-02 |
Pos logit contributions | |
fitt | +0.066 |
slic | +0.061 |
hof | +0.059 |
leakage | +0.058 |
stamped | +0.057 |
Neg logit contributions | |
ˈ | -0.102 |
Redd | -0.086 |
Wan | -0.084 |
claw | -0.084 |
Neph | -0.081 |
Token | , |
Token ID | 11 |
Feature activation | +8.79e-02 |
Pos logit contributions | |
fitt | +0.250 |
slic | +0.234 |
hof | +0.225 |
leakage | +0.225 |
stamped | +0.223 |
Neg logit contributions | |
ˈ | -0.271 |
Redd | -0.223 |
Wan | -0.218 |
claw | -0.218 |
Neph | -0.206 |
Token | with |
Token ID | 351 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
fitt | +0.207 |
slic | +0.193 |
hof | +0.185 |
leakage | +0.184 |
stamped | +0.182 |
Neg logit contributions | |
ˈ | -0.258 |
Redd | -0.213 |
Wan | -0.210 |
claw | -0.209 |
Neph | -0.200 |
Token | Tel |
Token ID | 12088 |
Feature activation | +2.96e-02 |
Pos logit contributions | |
fitt | +0.080 |
slic | +0.074 |
hof | +0.071 |
leakage | +0.070 |
stamped | +0.070 |
Neg logit contributions | |
ˈ | -0.103 |
Redd | -0.086 |
Wan | -0.084 |
claw | -0.083 |
Neph | -0.081 |
Token | stra |
Token ID | 12044 |
Feature activation | +4.36e-01 |
Pos logit contributions | |
fitt | +0.063 |
slic | +0.058 |
stamped | +0.055 |
leakage | +0.055 |
hof | +0.054 |
Neg logit contributions | |
ˈ | -0.094 |
Redd | -0.079 |
claw | -0.078 |
Wan | -0.078 |
Neph | -0.074 |
Token | stating |
Token ID | 12316 |
Feature activation | -6.51e-02 |
Pos logit contributions | |
fitt | +0.955 |
slic | +0.885 |
hof | +0.847 |
leakage | +0.844 |
stamped | +0.841 |
Neg logit contributions | |
ˈ | -1.346 |
Redd | -1.139 |
Wan | -1.113 |
claw | -1.105 |
Neph | -1.063 |
Token | it |
Token ID | 340 |
Feature activation | +6.65e-02 |
Pos logit contributions | |
ˈ | +0.194 |
Redd | +0.163 |
Wan | +0.159 |
claw | +0.158 |
Neph | +0.152 |
Neg logit contributions | |
fitt | -0.150 |
slic | -0.139 |
hof | -0.134 |
leakage | -0.133 |
stamped | -0.132 |
Token | had |
Token ID | 550 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
fitt | +0.145 |
slic | +0.134 |
hof | +0.128 |
leakage | +0.128 |
stamped | +0.127 |
Neg logit contributions | |
ˈ | -0.207 |
Redd | -0.174 |
Wan | -0.171 |
claw | -0.170 |
Neph | -0.163 |
Token | sourced |
Token ID | 18229 |
Feature activation | +6.63e-02 |
Pos logit contributions | |
fitt | +0.066 |
slic | +0.061 |
hof | +0.059 |
leakage | +0.058 |
stamped | +0.057 |
Neg logit contributions | |
ˈ | -0.101 |
Redd | -0.085 |
Wan | -0.084 |
claw | -0.083 |
Neph | -0.080 |
Token | an |
Token ID | 281 |
Feature activation | +6.74e-02 |
Pos logit contributions | |
fitt | +0.143 |
slic | +0.133 |
hof | +0.130 |
stamped | +0.126 |
leakage | +0.126 |
Neg logit contributions | |
ˈ | -0.206 |
Redd | -0.173 |
Wan | -0.170 |
claw | -0.168 |
Neph | -0.164 |
Token | . |
Token ID | 13 |
Feature activation | +3.23e-02 |
Pos logit contributions | |
ˈ | +0.302 |
Redd | +0.250 |
Wan | +0.243 |
claw | +0.240 |
Neph | +0.230 |
Neg logit contributions | |
fitt | -0.286 |
slic | -0.270 |
stamped | -0.259 |
hof | -0.258 |
leakage | -0.258 |
Token | sn |
Token ID | 16184 |
Feature activation | -9.64e-02 |
Pos logit contributions | |
fitt | +0.079 |
slic | +0.074 |
leakage | +0.071 |
hof | +0.071 |
stamped | +0.070 |
Neg logit contributions | |
ˈ | -0.092 |
Redd | -0.077 |
claw | -0.075 |
Wan | -0.074 |
Neph | -0.070 |
Token | ipp |
Token ID | 3974 |
Feature activation | +2.28e-01 |
Pos logit contributions | |
ˈ | +0.325 |
Redd | +0.277 |
claw | +0.271 |
Wan | +0.271 |
Neph | +0.260 |
Neg logit contributions | |
fitt | -0.185 |
slic | -0.171 |
hof | -0.161 |
leakage | -0.160 |
stamped | -0.159 |
Token | et |
Token ID | 316 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
fitt | +0.610 |
slic | +0.573 |
leakage | +0.551 |
hof | +0.551 |
stamped | +0.550 |
Neg logit contributions | |
ˈ | -0.598 |
Redd | -0.487 |
Wan | -0.474 |
claw | -0.472 |
Neph | -0.448 |
Token | }} |
Token ID | 34949 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
fitt | +0.044 |
slic | +0.041 |
hof | +0.040 |
leakage | +0.040 |
stamped | +0.039 |
Neg logit contributions | |
ˈ | -0.041 |
Redd | -0.034 |
Wan | -0.033 |
claw | -0.032 |
Neph | -0.031 |
Token |
|
Token ID | 3556 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
fitt | +0.565 |
slic | +0.523 |
hof | +0.500 |
leakage | +0.497 |
stamped | +0.496 |
Neg logit contributions | |
ˈ | -0.797 |
Redd | -0.673 |
Wan | -0.659 |
claw | -0.655 |
Neph | -0.630 |
Token | p |
Token ID | 79 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
fitt | +1.069 |
slic | +1.000 |
leakage | +0.956 |
hof | +0.955 |
stamped | +0.951 |
Neg logit contributions | |
ˈ | -1.218 |
Redd | -0.999 |
claw | -0.974 |
Wan | -0.972 |
Neph | -0.931 |
Token | > |
Token ID | 29 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
ˈ | +0.144 |
Redd | +0.116 |
Wan | +0.112 |
claw | +0.110 |
Neph | +0.102 |
Neg logit contributions | |
fitt | -0.194 |
slic | -0.185 |
stamped | -0.179 |
hof | -0.179 |
leakage | -0.179 |
Token | |
Token ID | 7359 |
Feature activation | +3.79e-01 |
Pos logit contributions | |
fitt | +0.257 |
slic | +0.239 |
hof | +0.230 |
leakage | +0.229 |
stamped | +0.228 |
Neg logit contributions | |
ˈ | -0.329 |
Redd | -0.276 |
Wan | -0.270 |
claw | -0.267 |
Neph | -0.256 |
Token | li |
Token ID | 4528 |
Feature activation | +1.04e-01 |
Pos logit contributions | |
fitt | +0.862 |
slic | +0.801 |
hof | +0.768 |
leakage | +0.764 |
stamped | +0.762 |
Neg logit contributions | |
ˈ | -1.140 |
Redd | -0.959 |
Wan | -0.937 |
claw | -0.930 |
Neph | -0.894 |
Token | > |
Token ID | 29 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
fitt | +0.332 |
slic | +0.315 |
hof | +0.306 |
leakage | +0.305 |
stamped | +0.305 |
Neg logit contributions | |
ˈ | -0.218 |
Redd | -0.169 |
Wan | -0.162 |
claw | -0.160 |
Neph | -0.150 |
Token | Inter |
Token ID | 4225 |
Feature activation | -9.69e-02 |
Pos logit contributions | |
ˈ | +0.037 |
Redd | +0.031 |
Wan | +0.030 |
claw | +0.030 |
Neph | +0.029 |
Neg logit contributions | |
fitt | -0.025 |
slic | -0.023 |
hof | -0.022 |
stamped | -0.022 |
leakage | -0.022 |
Token | pol |
Token ID | 16104 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
ˈ | +0.251 |
Redd | +0.205 |
Wan | +0.199 |
claw | +0.197 |
Neph | +0.187 |
Neg logit contributions | |
fitt | -0.262 |
slic | -0.247 |
hof | -0.237 |
leakage | -0.237 |
stamped | -0.237 |
Token | list |
Token ID | 1351 |
Feature activation | +6.18e-04 |
Pos logit contributions | |
ˈ | +0.588 |
Redd | +0.501 |
Wan | +0.491 |
claw | +0.491 |
Neph | +0.476 |
Neg logit contributions | |
fitt | -0.342 |
slic | -0.313 |
hof | -0.301 |
stamped | -0.293 |
leakage | -0.293 |
Token | which |
Token ID | 543 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
fitt | +0.001 |
slic | +0.001 |
hof | +0.001 |
leakage | +0.001 |
stamped | +0.001 |
Neg logit contributions | |
ˈ | -0.002 |
Redd | -0.002 |
Wan | -0.002 |
claw | -0.002 |
Neph | -0.002 |
Token | Tel |
Token ID | 12088 |
Feature activation | +3.60e-02 |
Pos logit contributions | |
ˈ | +0.295 |
Redd | +0.247 |
Wan | +0.244 |
claw | +0.243 |
Neph | +0.235 |
Neg logit contributions | |
fitt | -0.197 |
slic | -0.182 |
hof | -0.174 |
leakage | -0.171 |
stamped | -0.170 |
Token | stra |
Token ID | 12044 |
Feature activation | +4.30e-01 |
Pos logit contributions | |
fitt | +0.075 |
slic | +0.069 |
leakage | +0.065 |
hof | +0.065 |
stamped | +0.065 |
Neg logit contributions | |
ˈ | -0.116 |
Redd | -0.098 |
claw | -0.096 |
Wan | -0.096 |
Neph | -0.092 |
Token | is |
Token ID | 318 |
Feature activation | -6.63e-03 |
Pos logit contributions | |
fitt | +0.936 |
slic | +0.866 |
hof | +0.834 |
leakage | +0.826 |
stamped | +0.818 |
Neg logit contributions | |
ˈ | -1.336 |
Redd | -1.121 |
Wan | -1.103 |
claw | -1.098 |
Neph | -1.056 |
Token | examining |
Token ID | 17247 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
ˈ | +0.020 |
Redd | +0.017 |
Wan | +0.016 |
claw | +0.016 |
Neph | +0.016 |
Neg logit contributions | |
fitt | -0.015 |
slic | -0.014 |
hof | -0.013 |
leakage | -0.013 |
stamped | -0.013 |
Token | is |
Token ID | 318 |
Feature activation | -3.96e-02 |
Pos logit contributions | |
fitt | +0.259 |
slic | +0.240 |
hof | +0.230 |
leakage | +0.229 |
stamped | +0.227 |
Neg logit contributions | |
ˈ | -0.367 |
Redd | -0.306 |
claw | -0.301 |
Wan | -0.300 |
Neph | -0.288 |
Token | believed |
Token ID | 4762 |
Feature activation | +8.39e-03 |
Pos logit contributions | |
ˈ | +0.121 |
Redd | +0.102 |
Wan | +0.100 |
claw | +0.099 |
Neph | +0.096 |
Neg logit contributions | |
fitt | -0.088 |
slic | -0.081 |
hof | -0.078 |
leakage | -0.077 |
stamped | -0.076 |
Token | to |
Token ID | 284 |
Feature activation | +3.76e-04 |
Pos logit contributions | |
fitt | +0.021 |
slic | +0.019 |
hof | +0.018 |
leakage | +0.018 |
stamped | +0.018 |
Neg logit contributions | |
ˈ | -0.024 |
Redd | -0.020 |
Wan | -0.019 |
claw | -0.019 |
Neph | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
fitt | +0.073 |
slic | +0.068 |
hof | +0.065 |
leakage | +0.065 |
stamped | +0.065 |
Neg logit contributions | |
ˈ | -0.080 |
Redd | -0.066 |
Wan | -0.065 |
claw | -0.064 |
Neph | -0.061 |
Token | However |
Token ID | 2102 |
Feature activation | -6.12e-02 |
Pos logit contributions | |
fitt | +0.037 |
slic | +0.035 |
leakage | +0.033 |
hof | +0.033 |
stamped | +0.033 |
Neg logit contributions | |
ˈ | -0.040 |
Redd | -0.033 |
Wan | -0.032 |
claw | -0.032 |
Neph | -0.031 |
Token | , |
Token ID | 11 |
Feature activation | +6.71e-02 |
Pos logit contributions | |
ˈ | +0.183 |
Redd | +0.154 |
Wan | +0.150 |
claw | +0.149 |
Neph | +0.143 |
Neg logit contributions | |
fitt | -0.140 |
slic | -0.130 |
hof | -0.125 |
leakage | -0.124 |
stamped | -0.124 |
Token | a |
Token ID | 257 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
fitt | +0.151 |
slic | +0.140 |
hof | +0.134 |
stamped | +0.133 |
leakage | +0.133 |
Neg logit contributions | |
ˈ | -0.203 |
Redd | -0.170 |
Wan | -0.167 |
claw | -0.166 |
Neph | -0.160 |
Token | Tel |
Token ID | 12088 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
ˈ | +0.066 |
Redd | +0.056 |
Wan | +0.055 |
claw | +0.055 |
Neph | +0.053 |
Neg logit contributions | |
fitt | -0.039 |
slic | -0.036 |
hof | -0.034 |
leakage | -0.034 |
stamped | -0.034 |
Token | stra |
Token ID | 12044 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
fitt | +0.095 |
slic | +0.089 |
hof | +0.085 |
leakage | +0.085 |
stamped | +0.085 |
Neg logit contributions | |
ˈ | -0.110 |
Redd | -0.092 |
Wan | -0.090 |
claw | -0.089 |
Neph | -0.085 |
Token | spokesperson |
Token ID | 11821 |
Feature activation | +6.47e-02 |
Pos logit contributions | |
fitt | +1.047 |
slic | +0.979 |
hof | +0.945 |
leakage | +0.934 |
stamped | +0.933 |
Neg logit contributions | |
ˈ | -1.194 |
Redd | -0.989 |
Wan | -0.968 |
claw | -0.962 |
Neph | -0.922 |
Token | today |
Token ID | 1909 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
fitt | +0.161 |
slic | +0.151 |
hof | +0.146 |
leakage | +0.145 |
stamped | +0.143 |
Neg logit contributions | |
ˈ | -0.180 |
Redd | -0.147 |
Wan | -0.144 |
claw | -0.144 |
Neph | -0.138 |
Token | said |
Token ID | 531 |
Feature activation | +8.38e-02 |
Pos logit contributions | |
ˈ | +0.040 |
Redd | +0.033 |
claw | +0.032 |
Wan | +0.032 |
Neph | +0.031 |
Neg logit contributions | |
fitt | -0.035 |
slic | -0.033 |
hof | -0.032 |
leakage | -0.031 |
stamped | -0.031 |
Token | the |
Token ID | 262 |
Feature activation | -3.78e-03 |
Pos logit contributions | |
fitt | +0.190 |
slic | +0.177 |
hof | +0.170 |
stamped | +0.168 |
leakage | +0.168 |
Neg logit contributions | |
ˈ | -0.251 |
Redd | -0.211 |
Wan | -0.207 |
claw | -0.205 |
Neph | -0.197 |
Token | tel |
Token ID | 13632 |
Feature activation | -6.51e-02 |
Pos logit contributions | |
ˈ | +0.013 |
Redd | +0.011 |
Wan | +0.011 |
claw | +0.011 |
Neph | +0.011 |
Neg logit contributions | |
fitt | -0.007 |
slic | -0.006 |
hof | -0.006 |
stamped | -0.006 |
leakage | -0.006 |
Token | from |
Token ID | 422 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ˈ | +0.074 |
Redd | +0.061 |
Wan | +0.060 |
claw | +0.060 |
Neph | +0.057 |
Neg logit contributions | |
fitt | -0.063 |
slic | -0.059 |
leakage | -0.057 |
hof | -0.056 |
stamped | -0.056 |
Token | the |
Token ID | 262 |
Feature activation | -4.01e-02 |
Pos logit contributions | |
ˈ | +0.048 |
Redd | +0.040 |
Wan | +0.039 |
claw | +0.039 |
Neph | +0.037 |
Neg logit contributions | |
fitt | -0.038 |
slic | -0.035 |
hof | -0.034 |
leakage | -0.033 |
stamped | -0.033 |
Token | Harvard |
Token ID | 11131 |
Feature activation | -8.81e-02 |
Pos logit contributions | |
ˈ | +0.101 |
Redd | +0.082 |
Wan | +0.080 |
claw | +0.079 |
Neph | +0.075 |
Neg logit contributions | |
fitt | -0.110 |
slic | -0.104 |
hof | -0.100 |
leakage | -0.100 |
stamped | -0.100 |
Token | - |
Token ID | 12 |
Feature activation | +2.21e-03 |
Pos logit contributions | |
ˈ | +0.258 |
Redd | +0.215 |
Wan | +0.210 |
claw | +0.209 |
Neph | +0.201 |
Neg logit contributions | |
fitt | -0.208 |
slic | -0.194 |
hof | -0.186 |
leakage | -0.185 |
stamped | -0.185 |
Token | Smith |
Token ID | 17919 |
Feature activation | -8.20e-02 |
Pos logit contributions | |
fitt | +0.008 |
slic | +0.007 |
leakage | +0.007 |
hof | +0.007 |
stamped | +0.007 |
Neg logit contributions | |
ˈ | -0.004 |
Redd | -0.003 |
Wan | -0.003 |
claw | -0.003 |
Neph | -0.003 |
Token | sonian |
Token ID | 35202 |
Feature activation | -5.75e-01 |
Pos logit contributions | |
ˈ | +0.252 |
Redd | +0.213 |
Wan | +0.208 |
claw | +0.207 |
Neph | +0.199 |
Neg logit contributions | |
fitt | -0.182 |
slic | -0.169 |
leakage | -0.161 |
hof | -0.161 |
stamped | -0.160 |
Token | Center |
Token ID | 3337 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
ˈ | +1.618 |
Redd | +1.338 |
Wan | +1.309 |
claw | +1.304 |
Neph | +1.253 |
Neg logit contributions | |
fitt | -1.408 |
slic | -1.321 |
hof | -1.264 |
leakage | -1.264 |
stamped | -1.258 |
Token | for |
Token ID | 329 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
ˈ | +0.090 |
Redd | +0.075 |
Wan | +0.073 |
claw | +0.072 |
Neph | +0.069 |
Neg logit contributions | |
fitt | -0.075 |
slic | -0.070 |
hof | -0.067 |
stamped | -0.067 |
leakage | -0.067 |
Token | Ast |
Token ID | 8304 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
ˈ | +0.144 |
Redd | +0.125 |
Wan | +0.123 |
claw | +0.122 |
Neph | +0.119 |
Neg logit contributions | |
fitt | -0.064 |
slic | -0.058 |
leakage | -0.054 |
hof | -0.054 |
stamped | -0.053 |
Token | roph |
Token ID | 10051 |
Feature activation | +2.88e-02 |
Pos logit contributions | |
ˈ | +0.042 |
Redd | +0.032 |
Wan | +0.031 |
claw | +0.031 |
Neph | +0.029 |
Neg logit contributions | |
fitt | -0.063 |
slic | -0.059 |
hof | -0.057 |
leakage | -0.057 |
stamped | -0.057 |
Token | ysics |
Token ID | 23154 |
Feature activation | +7.23e-02 |
Pos logit contributions | |
fitt | +0.069 |
slic | +0.064 |
hof | +0.061 |
leakage | +0.061 |
stamped | +0.061 |
Neg logit contributions | |
ˈ | -0.084 |
Redd | -0.070 |
Wan | -0.068 |
claw | -0.068 |
Neph | -0.065 |
Token | felt |
Token ID | 2936 |
Feature activation | +4.74e-02 |
Pos logit contributions | |
ˈ | +0.006 |
Redd | +0.005 |
Wan | +0.005 |
claw | +0.005 |
Neph | +0.005 |
Neg logit contributions | |
fitt | -0.004 |
slic | -0.004 |
hof | -0.003 |
leakage | -0.003 |
stamped | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
fitt | +0.112 |
slic | +0.105 |
hof | +0.101 |
leakage | +0.100 |
stamped | +0.099 |
Neg logit contributions | |
ˈ | -0.137 |
Redd | -0.115 |
Wan | -0.112 |
claw | -0.111 |
Neph | -0.107 |
Token | Syria |
Token ID | 4392 |
Feature activation | +5.45e-02 |
Pos logit contributions | |
ˈ | +0.044 |
Redd | +0.037 |
Wan | +0.036 |
claw | +0.036 |
Neph | +0.035 |
Neg logit contributions | |
fitt | -0.032 |
slic | -0.030 |
hof | -0.029 |
leakage | -0.029 |
stamped | -0.028 |
Token | and |
Token ID | 290 |
Feature activation | -1.41e-03 |
Pos logit contributions | |
fitt | +0.127 |
slic | +0.119 |
hof | +0.114 |
leakage | +0.114 |
stamped | +0.112 |
Neg logit contributions | |
ˈ | -0.161 |
Redd | -0.134 |
Wan | -0.131 |
claw | -0.130 |
Neph | -0.125 |
Token | Mes |
Token ID | 14937 |
Feature activation | +5.29e-02 |
Pos logit contributions | |
ˈ | +0.004 |
Redd | +0.003 |
claw | +0.003 |
Wan | +0.003 |
Neph | +0.003 |
Neg logit contributions | |
fitt | -0.004 |
slic | -0.003 |
hof | -0.003 |
leakage | -0.003 |
stamped | -0.003 |
Token | opot |
Token ID | 43372 |
Feature activation | -5.38e-01 |
Pos logit contributions | |
fitt | +0.169 |
slic | +0.160 |
hof | +0.156 |
leakage | +0.155 |
stamped | +0.155 |
Neg logit contributions | |
ˈ | -0.110 |
Redd | -0.085 |
Wan | -0.082 |
claw | -0.081 |
Neph | -0.076 |
Token | amia |
Token ID | 49442 |
Feature activation | -7.53e-02 |
Pos logit contributions | |
ˈ | +1.299 |
Redd | +1.037 |
Wan | +1.008 |
claw | +0.998 |
Neph | +0.944 |
Neg logit contributions | |
fitt | -1.549 |
slic | -1.465 |
leakage | -1.410 |
hof | -1.409 |
stamped | -1.406 |
Token | . |
Token ID | 13 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
ˈ | +0.207 |
Redd | +0.171 |
Wan | +0.167 |
claw | +0.166 |
Neph | +0.158 |
Neg logit contributions | |
fitt | -0.190 |
slic | -0.178 |
hof | -0.172 |
leakage | -0.171 |
stamped | -0.170 |
Token | As |
Token ID | 1081 |
Feature activation | -1.97e-02 |
Pos logit contributions | |
ˈ | +0.047 |
Redd | +0.039 |
Wan | +0.038 |
claw | +0.037 |
Neph | +0.036 |
Neg logit contributions | |
fitt | -0.041 |
slic | -0.038 |
leakage | -0.037 |
hof | -0.037 |
stamped | -0.036 |
Token | with |
Token ID | 351 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ˈ | +0.059 |
Redd | +0.049 |
Wan | +0.048 |
claw | +0.048 |
Neph | +0.046 |
Neg logit contributions | |
fitt | -0.045 |
slic | -0.042 |
hof | -0.040 |
leakage | -0.040 |
stamped | -0.040 |
Token | so |
Token ID | 523 |
Feature activation | +3.16e-03 |
Pos logit contributions | |
fitt | +0.023 |
slic | +0.022 |
hof | +0.021 |
leakage | +0.021 |
stamped | +0.020 |
Neg logit contributions | |
ˈ | -0.032 |
Redd | -0.027 |
Wan | -0.026 |
claw | -0.026 |
Neph | -0.025 |
Token | for |
Token ID | 329 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ˈ | +0.254 |
Redd | +0.212 |
Wan | +0.208 |
claw | +0.208 |
Neph | +0.199 |
Neg logit contributions | |
fitt | -0.193 |
slic | -0.179 |
hof | -0.172 |
leakage | -0.170 |
stamped | -0.170 |
Token | a |
Token ID | 257 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ˈ | +0.049 |
Redd | +0.041 |
Wan | +0.040 |
claw | +0.040 |
Neph | +0.039 |
Neg logit contributions | |
fitt | -0.036 |
slic | -0.033 |
hof | -0.032 |
leakage | -0.032 |
stamped | -0.031 |
Token | few |
Token ID | 1178 |
Feature activation | -7.31e-02 |
Pos logit contributions | |
ˈ | +0.039 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.031 |
Neg logit contributions | |
fitt | -0.028 |
slic | -0.026 |
hof | -0.025 |
leakage | -0.025 |
stamped | -0.025 |
Token | other |
Token ID | 584 |
Feature activation | -4.61e-03 |
Pos logit contributions | |
ˈ | +0.226 |
Redd | +0.191 |
Wan | +0.187 |
claw | +0.186 |
Neph | +0.179 |
Neg logit contributions | |
fitt | -0.159 |
slic | -0.147 |
hof | -0.141 |
leakage | -0.140 |
stamped | -0.140 |
Token | fr |
Token ID | 1216 |
Feature activation | -5.33e-02 |
Pos logit contributions | |
ˈ | +0.014 |
Redd | +0.012 |
Wan | +0.012 |
claw | +0.012 |
Neph | +0.011 |
Neg logit contributions | |
fitt | -0.010 |
slic | -0.009 |
hof | -0.009 |
leakage | -0.009 |
stamped | -0.009 |
Token | atern |
Token ID | 9205 |
Feature activation | -5.28e-01 |
Pos logit contributions | |
ˈ | +0.133 |
Redd | +0.107 |
Wan | +0.104 |
claw | +0.103 |
Neph | +0.098 |
Neg logit contributions | |
fitt | -0.149 |
slic | -0.140 |
hof | -0.136 |
leakage | -0.135 |
stamped | -0.135 |
Token | ities |
Token ID | 871 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
ˈ | +1.284 |
Redd | +1.035 |
claw | +0.996 |
Wan | +0.994 |
Neph | +0.946 |
Neg logit contributions | |
fitt | -1.492 |
slic | -1.428 |
hof | -1.368 |
leakage | -1.364 |
stamped | -1.357 |
Token | are |
Token ID | 389 |
Feature activation | +4.82e-02 |
Pos logit contributions | |
fitt | +0.052 |
slic | +0.049 |
hof | +0.047 |
leakage | +0.046 |
stamped | +0.046 |
Neg logit contributions | |
ˈ | -0.074 |
Redd | -0.062 |
Wan | -0.061 |
claw | -0.061 |
Neph | -0.058 |
Token | also |
Token ID | 635 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
fitt | +0.101 |
slic | +0.093 |
hof | +0.090 |
leakage | +0.088 |
stamped | +0.087 |
Neg logit contributions | |
ˈ | -0.154 |
Redd | -0.130 |
Wan | -0.128 |
claw | -0.127 |
Neph | -0.123 |
Token | in |
Token ID | 287 |
Feature activation | +4.07e-03 |
Pos logit contributions | |
fitt | +0.042 |
slic | +0.038 |
hof | +0.037 |
leakage | +0.036 |
stamped | +0.036 |
Neg logit contributions | |
ˈ | -0.067 |
Redd | -0.057 |
Wan | -0.056 |
claw | -0.055 |
Neph | -0.054 |
Token | a |
Token ID | 257 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
fitt | +0.009 |
slic | +0.008 |
hof | +0.008 |
leakage | +0.008 |
stamped | +0.008 |
Neg logit contributions | |
ˈ | -0.013 |
Redd | -0.011 |
Wan | -0.010 |
claw | -0.010 |
Neph | -0.010 |
Token | from |
Token ID | 422 |
Feature activation | -3.87e-02 |
Pos logit contributions | |
ˈ | +0.371 |
Redd | +0.309 |
Wan | +0.302 |
claw | +0.301 |
Neph | +0.288 |
Neg logit contributions | |
fitt | -0.310 |
slic | -0.289 |
leakage | -0.278 |
hof | -0.276 |
stamped | -0.275 |
Token | the |
Token ID | 262 |
Feature activation | -7.36e-02 |
Pos logit contributions | |
ˈ | +0.114 |
Redd | +0.095 |
Wan | +0.093 |
claw | +0.092 |
Neph | +0.089 |
Neg logit contributions | |
fitt | -0.091 |
slic | -0.084 |
hof | -0.081 |
leakage | -0.081 |
stamped | -0.080 |
Token | Harvard |
Token ID | 11131 |
Feature activation | -8.90e-02 |
Pos logit contributions | |
ˈ | +0.173 |
Redd | +0.137 |
Wan | +0.133 |
claw | +0.132 |
Neph | +0.126 |
Neg logit contributions | |
fitt | -0.216 |
slic | -0.204 |
hof | -0.197 |
leakage | -0.197 |
stamped | -0.196 |
Token | - |
Token ID | 12 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
ˈ | +0.254 |
Redd | +0.211 |
Wan | +0.206 |
claw | +0.204 |
Neph | +0.197 |
Neg logit contributions | |
fitt | -0.216 |
slic | -0.202 |
hof | -0.194 |
leakage | -0.193 |
stamped | -0.193 |
Token | Smith |
Token ID | 17919 |
Feature activation | -4.68e-02 |
Pos logit contributions | |
ˈ | +0.042 |
Redd | +0.031 |
Wan | +0.030 |
claw | +0.029 |
Neph | +0.027 |
Neg logit contributions | |
fitt | -0.081 |
slic | -0.077 |
leakage | -0.075 |
hof | -0.075 |
stamped | -0.075 |
Token | sonian |
Token ID | 35202 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
ˈ | +0.141 |
Redd | +0.116 |
Wan | +0.114 |
claw | +0.113 |
Neph | +0.111 |
Neg logit contributions | |
fitt | -0.108 |
slic | -0.101 |
leakage | -0.096 |
hof | -0.096 |
stamped | -0.095 |
Token | Center |
Token ID | 3337 |
Feature activation | +6.65e-03 |
Pos logit contributions | |
ˈ | +1.446 |
Redd | +1.197 |
Wan | +1.169 |
claw | +1.167 |
Neph | +1.117 |
Neg logit contributions | |
fitt | -1.268 |
slic | -1.198 |
leakage | -1.140 |
stamped | -1.139 |
hof | -1.137 |
Token | for |
Token ID | 329 |
Feature activation | -2.60e-02 |
Pos logit contributions | |
fitt | +0.016 |
slic | +0.015 |
hof | +0.015 |
stamped | +0.015 |
leakage | +0.015 |
Neg logit contributions | |
ˈ | -0.019 |
Redd | -0.016 |
Wan | -0.015 |
claw | -0.015 |
Neph | -0.014 |
Token | Ast |
Token ID | 8304 |
Feature activation | -3.32e-02 |
Pos logit contributions | |
ˈ | +0.096 |
Redd | +0.084 |
Wan | +0.083 |
claw | +0.082 |
Neph | +0.080 |
Neg logit contributions | |
fitt | -0.041 |
slic | -0.037 |
hof | -0.034 |
leakage | -0.034 |
stamped | -0.034 |
Token | roph |
Token ID | 10051 |
Feature activation | +8.09e-02 |
Pos logit contributions | |
ˈ | +0.073 |
Redd | +0.057 |
Wan | +0.055 |
claw | +0.054 |
Neph | +0.051 |
Neg logit contributions | |
fitt | -0.103 |
slic | -0.097 |
hof | -0.095 |
leakage | -0.094 |
stamped | -0.094 |
Token | ysics |
Token ID | 23154 |
Feature activation | +5.86e-02 |
Pos logit contributions | |
fitt | +0.181 |
slic | +0.168 |
hof | +0.162 |
stamped | +0.161 |
leakage | +0.161 |
Neg logit contributions | |
ˈ | -0.245 |
Redd | -0.206 |
Wan | -0.201 |
claw | -0.199 |
Neph | -0.191 |
Token | planner |
Token ID | 42351 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
fitt | +0.037 |
slic | +0.034 |
hof | +0.033 |
leakage | +0.033 |
stamped | +0.032 |
Neg logit contributions | |
ˈ | -0.059 |
Redd | -0.050 |
Wan | -0.049 |
claw | -0.049 |
Neph | -0.047 |
Token | at |
Token ID | 379 |
Feature activation | -4.62e-02 |
Pos logit contributions | |
ˈ | +0.381 |
Redd | +0.316 |
Wan | +0.308 |
claw | +0.305 |
Neph | +0.291 |
Neg logit contributions | |
fitt | -0.342 |
slic | -0.320 |
hof | -0.308 |
leakage | -0.306 |
stamped | -0.306 |
Token | NASA |
Token ID | 8884 |
Feature activation | +8.10e-03 |
Pos logit contributions | |
ˈ | +0.127 |
Redd | +0.106 |
Wan | +0.103 |
claw | +0.102 |
Neph | +0.098 |
Neg logit contributions | |
fitt | -0.116 |
slic | -0.109 |
hof | -0.105 |
leakage | -0.104 |
stamped | -0.104 |
Token | 's |
Token ID | 338 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
fitt | +0.019 |
slic | +0.018 |
hof | +0.017 |
leakage | +0.017 |
stamped | +0.017 |
Neg logit contributions | |
ˈ | -0.023 |
Redd | -0.020 |
Wan | -0.019 |
claw | -0.019 |
Neph | -0.018 |
Token | Jet |
Token ID | 19013 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
ˈ | +0.043 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.030 |
Neg logit contributions | |
fitt | -0.059 |
slic | -0.056 |
hof | -0.054 |
leakage | -0.054 |
stamped | -0.054 |
Token | Prop |
Token ID | 8772 |
Feature activation | -4.96e-01 |
Pos logit contributions | |
ˈ | +0.323 |
Redd | +0.262 |
Wan | +0.255 |
claw | +0.254 |
Neph | +0.240 |
Neg logit contributions | |
fitt | -0.367 |
slic | -0.346 |
hof | -0.333 |
leakage | -0.332 |
stamped | -0.331 |
Token | ulsion |
Token ID | 15204 |
Feature activation | -2.87e-01 |
Pos logit contributions | |
ˈ | +1.554 |
Redd | +1.318 |
Wan | +1.289 |
claw | +1.279 |
Neph | +1.230 |
Neg logit contributions | |
fitt | -1.067 |
slic | -0.987 |
hof | -0.944 |
leakage | -0.940 |
stamped | -0.938 |
Token | Laboratory |
Token ID | 18643 |
Feature activation | -9.51e-02 |
Pos logit contributions | |
ˈ | +0.808 |
Redd | +0.671 |
Wan | +0.654 |
claw | +0.649 |
Neph | +0.621 |
Neg logit contributions | |
fitt | -0.710 |
slic | -0.664 |
hof | -0.638 |
leakage | -0.636 |
stamped | -0.634 |
Token | in |
Token ID | 287 |
Feature activation | +5.05e-03 |
Pos logit contributions | |
ˈ | +0.270 |
Redd | +0.222 |
Wan | +0.218 |
claw | +0.215 |
Neph | +0.205 |
Neg logit contributions | |
fitt | -0.233 |
slic | -0.218 |
hof | -0.212 |
leakage | -0.210 |
stamped | -0.209 |
Token | Pasadena |
Token ID | 41010 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
fitt | +0.014 |
slic | +0.014 |
hof | +0.013 |
leakage | +0.013 |
stamped | +0.013 |
Neg logit contributions | |
ˈ | -0.012 |
Redd | -0.010 |
Wan | -0.010 |
claw | -0.009 |
Neph | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -6.17e-02 |
Pos logit contributions | |
ˈ | +0.322 |
Redd | +0.272 |
Wan | +0.265 |
claw | +0.262 |
Neph | +0.251 |
Neg logit contributions | |
fitt | -0.242 |
slic | -0.226 |
hof | -0.217 |
leakage | -0.216 |
stamped | -0.216 |
Token | consider |
Token ID | 2074 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
fitt | +0.074 |
slic | +0.069 |
hof | +0.066 |
leakage | +0.066 |
stamped | +0.065 |
Neg logit contributions | |
ˈ | -0.095 |
Redd | -0.079 |
claw | -0.077 |
Wan | -0.076 |
Neph | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | +2.00e-02 |
Pos logit contributions | |
fitt | +0.262 |
slic | +0.246 |
hof | +0.237 |
leakage | +0.236 |
stamped | +0.235 |
Neg logit contributions | |
ˈ | -0.278 |
Redd | -0.228 |
Wan | -0.222 |
claw | -0.221 |
Neph | -0.211 |
Token |
|
Token ID | 198 |
Feature activation | +3.62e-02 |
Pos logit contributions | |
fitt | +0.051 |
slic | +0.047 |
leakage | +0.046 |
stamped | +0.045 |
hof | +0.045 |
Neg logit contributions | |
ˈ | -0.055 |
Redd | -0.046 |
Wan | -0.045 |
claw | -0.044 |
Neph | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
fitt | +0.085 |
slic | +0.079 |
hof | +0.076 |
leakage | +0.076 |
stamped | +0.075 |
Neg logit contributions | |
ˈ | -0.106 |
Redd | -0.089 |
Wan | -0.087 |
claw | -0.086 |
Neph | -0.083 |
Token | Pl |
Token ID | 3646 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
fitt | +0.033 |
slic | +0.031 |
leakage | +0.030 |
stamped | +0.030 |
hof | +0.030 |
Neg logit contributions | |
ˈ | -0.031 |
Redd | -0.025 |
Wan | -0.025 |
claw | -0.024 |
Neph | -0.023 |
Token | ant |
Token ID | 415 |
Feature activation | -4.80e-01 |
Pos logit contributions | |
ˈ | +0.040 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.030 |
Neg logit contributions | |
fitt | -0.042 |
slic | -0.040 |
leakage | -0.038 |
hof | -0.038 |
stamped | -0.038 |
Token | ain |
Token ID | 391 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
ˈ | +1.359 |
Redd | +1.135 |
Wan | +1.107 |
claw | +1.096 |
Neph | +1.057 |
Neg logit contributions | |
fitt | -1.159 |
slic | -1.079 |
hof | -1.048 |
leakage | -1.044 |
stamped | -1.040 |
Token | Fl |
Token ID | 1610 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ˈ | +1.139 |
Redd | +0.927 |
Wan | +0.904 |
claw | +0.897 |
Neph | +0.861 |
Neg logit contributions | |
fitt | -1.146 |
slic | -1.078 |
hof | -1.046 |
leakage | -1.043 |
stamped | -1.038 |
Token | our |
Token ID | 454 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ˈ | +0.361 |
Redd | +0.295 |
Wan | +0.287 |
claw | +0.285 |
Neph | +0.271 |
Neg logit contributions | |
fitt | -0.351 |
slic | -0.331 |
leakage | -0.318 |
hof | -0.317 |
stamped | -0.316 |
Token | — |
Token ID | 960 |
Feature activation | -4.31e-02 |
Pos logit contributions | |
ˈ | +0.053 |
Redd | +0.044 |
Wan | +0.043 |
claw | +0.043 |
Neph | +0.041 |
Neg logit contributions | |
fitt | -0.047 |
slic | -0.044 |
hof | -0.043 |
leakage | -0.043 |
stamped | -0.042 |
Token | Pl |
Token ID | 3646 |
Feature activation | +1.78e-04 |
Pos logit contributions | |
ˈ | +0.113 |
Redd | +0.093 |
Wan | +0.090 |
claw | +0.089 |
Neph | +0.085 |
Neg logit contributions | |
fitt | -0.115 |
slic | -0.108 |
hof | -0.104 |
leakage | -0.104 |
stamped | -0.104 |
Token | from |
Token ID | 422 |
Feature activation | -9.53e-03 |
Pos logit contributions | |
fitt | +0.274 |
slic | +0.255 |
hof | +0.245 |
leakage | +0.243 |
stamped | +0.240 |
Neg logit contributions | |
ˈ | -0.354 |
Redd | -0.294 |
Wan | -0.290 |
claw | -0.287 |
Neph | -0.277 |
Token | the |
Token ID | 262 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
ˈ | +0.028 |
Redd | +0.023 |
Wan | +0.023 |
claw | +0.023 |
Neph | +0.022 |
Neg logit contributions | |
fitt | -0.022 |
slic | -0.021 |
hof | -0.020 |
leakage | -0.020 |
stamped | -0.020 |
Token | region |
Token ID | 3814 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
ˈ | +0.070 |
Redd | +0.057 |
Wan | +0.056 |
claw | +0.056 |
Neph | +0.054 |
Neg logit contributions | |
fitt | -0.067 |
slic | -0.063 |
hof | -0.061 |
leakage | -0.060 |
stamped | -0.060 |
Token | – |
Token ID | 784 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
ˈ | +0.368 |
Redd | +0.304 |
Wan | +0.300 |
claw | +0.299 |
Neph | +0.289 |
Neg logit contributions | |
fitt | -0.273 |
slic | -0.253 |
hof | -0.243 |
leakage | -0.242 |
stamped | -0.237 |
Token | Mes |
Token ID | 14937 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
ˈ | +0.331 |
Redd | +0.278 |
Wan | +0.272 |
claw | +0.270 |
Neph | +0.261 |
Neg logit contributions | |
fitt | -0.247 |
slic | -0.230 |
hof | -0.222 |
leakage | -0.220 |
stamped | -0.217 |
Token | opot |
Token ID | 43372 |
Feature activation | -4.79e-01 |
Pos logit contributions | |
fitt | +0.163 |
slic | +0.155 |
hof | +0.150 |
leakage | +0.150 |
stamped | +0.150 |
Neg logit contributions | |
ˈ | -0.110 |
Redd | -0.085 |
Wan | -0.082 |
claw | -0.081 |
Neph | -0.076 |
Token | am |
Token ID | 321 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
ˈ | +1.278 |
Redd | +1.048 |
Wan | +1.021 |
claw | +1.011 |
Neph | +0.965 |
Neg logit contributions | |
fitt | -1.253 |
slic | -1.177 |
hof | -1.133 |
leakage | -1.130 |
stamped | -1.127 |
Token | ian |
Token ID | 666 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
fitt | +0.279 |
slic | +0.260 |
hof | +0.250 |
leakage | +0.249 |
stamped | +0.248 |
Neg logit contributions | |
ˈ | -0.333 |
Redd | -0.279 |
Wan | -0.272 |
claw | -0.270 |
Neph | -0.258 |
Token | , |
Token ID | 11 |
Feature activation | -7.44e-02 |
Pos logit contributions | |
fitt | +0.027 |
slic | +0.025 |
hof | +0.024 |
leakage | +0.024 |
stamped | +0.024 |
Neg logit contributions | |
ˈ | -0.035 |
Redd | -0.030 |
Wan | -0.029 |
claw | -0.029 |
Neph | -0.028 |
Token | Israel |
Token ID | 2692 |
Feature activation | -3.29e-02 |
Pos logit contributions | |
ˈ | +0.203 |
Redd | +0.167 |
Wan | +0.163 |
claw | +0.161 |
Neph | +0.155 |
Neg logit contributions | |
fitt | -0.190 |
slic | -0.178 |
hof | -0.172 |
leakage | -0.171 |
stamped | -0.170 |
Token | ite |
Token ID | 578 |
Feature activation | +5.18e-02 |
Pos logit contributions | |
ˈ | +0.100 |
Redd | +0.084 |
Wan | +0.082 |
claw | +0.082 |
Neph | +0.078 |
Neg logit contributions | |
fitt | -0.074 |
slic | -0.068 |
hof | -0.066 |
leakage | -0.065 |
stamped | -0.065 |
Token | } |
Token ID | 1782 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
fitt | +0.276 |
slic | +0.256 |
hof | +0.246 |
leakage | +0.242 |
stamped | +0.242 |
Neg logit contributions | |
ˈ | -0.404 |
Redd | -0.342 |
Wan | -0.336 |
claw | -0.335 |
Neph | -0.323 |
Token | Catch |
Token ID | 25750 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
fitt | +0.255 |
slic | +0.236 |
hof | +0.228 |
leakage | +0.225 |
stamped | +0.224 |
Neg logit contributions | |
ˈ | -0.351 |
Redd | -0.295 |
Wan | -0.290 |
claw | -0.289 |
Neph | -0.278 |
Token | { |
Token ID | 1391 |
Feature activation | -6.55e-02 |
Pos logit contributions | |
ˈ | +0.290 |
Redd | +0.231 |
Wan | +0.227 |
claw | +0.226 |
Neph | +0.216 |
Neg logit contributions | |
fitt | -0.351 |
slic | -0.330 |
hof | -0.320 |
leakage | -0.318 |
stamped | -0.316 |
Token | Write |
Token ID | 19430 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
ˈ | +0.170 |
Redd | +0.140 |
Wan | +0.135 |
claw | +0.133 |
Neph | +0.126 |
Neg logit contributions | |
fitt | -0.177 |
slic | -0.167 |
leakage | -0.161 |
stamped | -0.160 |
hof | -0.159 |
Token | - |
Token ID | 12 |
Feature activation | -5.18e-02 |
Pos logit contributions | |
ˈ | +0.207 |
Redd | +0.175 |
Wan | +0.171 |
claw | +0.171 |
Neph | +0.163 |
Neg logit contributions | |
fitt | -0.154 |
slic | -0.142 |
leakage | -0.136 |
hof | -0.135 |
stamped | -0.134 |
Token | Warning |
Token ID | 20361 |
Feature activation | -4.71e-01 |
Pos logit contributions | |
ˈ | +0.098 |
Redd | +0.075 |
Wan | +0.072 |
claw | +0.070 |
Neph | +0.064 |
Neg logit contributions | |
fitt | -0.177 |
slic | -0.168 |
leakage | -0.163 |
hof | -0.163 |
stamped | -0.163 |
Token | - |
Token ID | 532 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ˈ | +1.379 |
Redd | +1.157 |
Wan | +1.136 |
claw | +1.133 |
Neph | +1.085 |
Neg logit contributions | |
fitt | -1.113 |
slic | -1.028 |
hof | -0.979 |
leakage | -0.977 |
stamped | -0.964 |
Token | Message |
Token ID | 12837 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
fitt | +0.050 |
slic | +0.047 |
leakage | +0.046 |
hof | +0.046 |
stamped | +0.045 |
Neg logit contributions | |
ˈ | -0.038 |
Redd | -0.030 |
Wan | -0.029 |
claw | -0.029 |
Neph | -0.027 |
Token | " |
Token ID | 366 |
Feature activation | -2.01e-02 |
Pos logit contributions | |
ˈ | +0.418 |
Redd | +0.345 |
Wan | +0.336 |
claw | +0.333 |
Neph | +0.318 |
Neg logit contributions | |
fitt | -0.394 |
slic | -0.369 |
hof | -0.356 |
leakage | -0.355 |
stamped | -0.354 |
Token | F |
Token ID | 37 |
Feature activation | +6.33e-02 |
Pos logit contributions | |
ˈ | +0.061 |
Redd | +0.052 |
Wan | +0.051 |
claw | +0.050 |
Neph | +0.048 |
Neg logit contributions | |
fitt | -0.045 |
slic | -0.042 |
hof | -0.040 |
leakage | -0.040 |
stamped | -0.040 |
Token | ailed |
Token ID | 6255 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
fitt | +0.112 |
slic | +0.100 |
leakage | +0.093 |
hof | +0.092 |
stamped | +0.091 |
Neg logit contributions | |
ˈ | -0.225 |
Redd | -0.195 |
Wan | -0.193 |
claw | -0.191 |
Neph | -0.183 |
Token | Active |
Token ID | 14199 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
ˈ | +0.303 |
Redd | +0.249 |
Wan | +0.245 |
claw | +0.242 |
Neph | +0.234 |
Neg logit contributions | |
fitt | -0.273 |
slic | -0.255 |
hof | -0.248 |
leakage | -0.247 |
stamped | -0.244 |
Token | Elect |
Token ID | 5903 |
Feature activation | +6.11e-03 |
Pos logit contributions | |
fitt | +0.070 |
slic | +0.066 |
hof | +0.064 |
leakage | +0.064 |
stamped | +0.063 |
Neg logit contributions | |
ˈ | -0.067 |
Redd | -0.055 |
Wan | -0.054 |
claw | -0.054 |
Neph | -0.051 |
Token | ron |
Token ID | 1313 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
fitt | +0.016 |
slic | +0.015 |
hof | +0.015 |
leakage | +0.014 |
stamped | +0.014 |
Neg logit contributions | |
ˈ | -0.016 |
Redd | -0.013 |
Wan | -0.013 |
claw | -0.013 |
Neph | -0.012 |
Token | ically |
Token ID | 1146 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
fitt | +0.060 |
slic | +0.057 |
hof | +0.055 |
leakage | +0.055 |
stamped | +0.055 |
Neg logit contributions | |
ˈ | -0.056 |
Redd | -0.045 |
Wan | -0.044 |
claw | -0.044 |
Neph | -0.042 |
Token | Sc |
Token ID | 1446 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ˈ | +0.174 |
Redd | +0.142 |
Wan | +0.139 |
claw | +0.138 |
Neph | +0.133 |
Neg logit contributions | |
fitt | -0.171 |
slic | -0.161 |
hof | -0.156 |
leakage | -0.155 |
stamped | -0.154 |
Token | anned |
Token ID | 3577 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
ˈ | +0.356 |
Redd | +0.298 |
Wan | +0.292 |
claw | +0.289 |
Neph | +0.280 |
Neg logit contributions | |
fitt | -0.272 |
slic | -0.254 |
leakage | -0.244 |
hof | -0.242 |
stamped | -0.238 |
Token | Array |
Token ID | 15690 |
Feature activation | -3.66e-03 |
Pos logit contributions | |
ˈ | +1.176 |
Redd | +0.946 |
Wan | +0.930 |
claw | +0.919 |
Neph | +0.889 |
Neg logit contributions | |
fitt | -1.289 |
slic | -1.211 |
hof | -1.176 |
leakage | -1.172 |
stamped | -1.165 |
Token | Rad |
Token ID | 5325 |
Feature activation | +4.90e-02 |
Pos logit contributions | |
ˈ | +0.010 |
Redd | +0.008 |
Wan | +0.008 |
claw | +0.008 |
Neph | +0.007 |
Neg logit contributions | |
fitt | -0.009 |
slic | -0.009 |
hof | -0.009 |
leakage | -0.009 |
stamped | -0.009 |
Token | ars |
Token ID | 945 |
Feature activation | -7.40e-02 |
Pos logit contributions | |
fitt | +0.123 |
slic | +0.115 |
hof | +0.110 |
leakage | +0.110 |
stamped | +0.110 |
Neg logit contributions | |
ˈ | -0.136 |
Redd | -0.113 |
Wan | -0.110 |
claw | -0.109 |
Neph | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | -4.28e-02 |
Pos logit contributions | |
ˈ | +0.205 |
Redd | +0.170 |
Wan | +0.167 |
claw | +0.165 |
Neph | +0.158 |
Neg logit contributions | |
fitt | -0.184 |
slic | -0.172 |
hof | -0.166 |
leakage | -0.165 |
stamped | -0.164 |
Token | 38 |
Token ID | 4353 |
Feature activation | +7.85e-02 |
Pos logit contributions | |
ˈ | +0.123 |
Redd | +0.102 |
Wan | +0.100 |
claw | +0.099 |
Neph | +0.095 |
Neg logit contributions | |
fitt | -0.103 |
slic | -0.096 |
hof | -0.093 |
leakage | -0.092 |
stamped | -0.092 |
Token | to |
Token ID | 284 |
Feature activation | -3.29e-02 |
Pos logit contributions | |
fitt | +0.152 |
slic | +0.141 |
hof | +0.136 |
leakage | +0.135 |
stamped | +0.133 |
Neg logit contributions | |
ˈ | -0.202 |
Redd | -0.169 |
Wan | -0.166 |
claw | -0.165 |
Neph | -0.158 |
Token | Donetsk |
Token ID | 31819 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
ˈ | +0.101 |
Redd | +0.086 |
Wan | +0.084 |
claw | +0.083 |
Neph | +0.080 |
Neg logit contributions | |
fitt | -0.072 |
slic | -0.067 |
hof | -0.064 |
leakage | -0.064 |
stamped | -0.064 |
Token | and |
Token ID | 290 |
Feature activation | -3.94e-02 |
Pos logit contributions | |
ˈ | +0.510 |
Redd | +0.429 |
Wan | +0.419 |
claw | +0.419 |
Neph | +0.401 |
Neg logit contributions | |
fitt | -0.381 |
slic | -0.353 |
hof | -0.338 |
leakage | -0.337 |
stamped | -0.334 |
Token | Lu |
Token ID | 6026 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
ˈ | +0.112 |
Redd | +0.094 |
Wan | +0.091 |
claw | +0.091 |
Neph | +0.087 |
Neg logit contributions | |
fitt | -0.096 |
slic | -0.089 |
hof | -0.086 |
leakage | -0.086 |
stamped | -0.085 |
Token | h |
Token ID | 71 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
fitt | +0.295 |
slic | +0.280 |
hof | +0.274 |
stamped | +0.267 |
leakage | +0.265 |
Neg logit contributions | |
ˈ | -0.332 |
Redd | -0.280 |
Wan | -0.271 |
claw | -0.262 |
Neph | -0.261 |
Token | ansk |
Token ID | 34738 |
Feature activation | -4.66e-01 |
Pos logit contributions | |
fitt | +0.106 |
slic | +0.100 |
leakage | +0.097 |
hof | +0.097 |
stamped | +0.096 |
Neg logit contributions | |
ˈ | -0.077 |
Redd | -0.061 |
Wan | -0.059 |
claw | -0.058 |
Neph | -0.054 |
Token | , |
Token ID | 11 |
Feature activation | -7.74e-02 |
Pos logit contributions | |
ˈ | +1.387 |
Redd | +1.164 |
Wan | +1.137 |
claw | +1.136 |
Neph | +1.088 |
Neg logit contributions | |
fitt | -1.065 |
slic | -0.989 |
hof | -0.949 |
leakage | -0.949 |
stamped | -0.938 |
Token | however |
Token ID | 2158 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ˈ | +0.236 |
Redd | +0.198 |
Wan | +0.194 |
claw | +0.194 |
Neph | +0.186 |
Neg logit contributions | |
fitt | -0.173 |
slic | -0.160 |
hof | -0.154 |
leakage | -0.153 |
stamped | -0.151 |
Token | , |
Token ID | 11 |
Feature activation | -4.51e-02 |
Pos logit contributions | |
ˈ | +0.414 |
Redd | +0.349 |
Wan | +0.341 |
claw | +0.339 |
Neph | +0.325 |
Neg logit contributions | |
fitt | -0.298 |
slic | -0.276 |
hof | -0.264 |
leakage | -0.263 |
stamped | -0.263 |
Token | and |
Token ID | 290 |
Feature activation | -7.16e-02 |
Pos logit contributions | |
ˈ | +0.142 |
Redd | +0.120 |
claw | +0.117 |
Wan | +0.117 |
Neph | +0.113 |
Neg logit contributions | |
fitt | -0.096 |
slic | -0.089 |
hof | -0.085 |
leakage | -0.084 |
stamped | -0.083 |
Token | the |
Token ID | 262 |
Feature activation | -6.57e-02 |
Pos logit contributions | |
ˈ | +0.219 |
Redd | +0.184 |
Wan | +0.181 |
claw | +0.180 |
Neph | +0.173 |
Neg logit contributions | |
fitt | -0.159 |
slic | -0.147 |
hof | -0.141 |
leakage | -0.140 |
stamped | -0.139 |
Token | ain |
Token ID | 391 |
Feature activation | -4.35e-01 |
Pos logit contributions | |
ˈ | +1.359 |
Redd | +1.135 |
Wan | +1.107 |
claw | +1.096 |
Neph | +1.057 |
Neg logit contributions | |
fitt | -1.159 |
slic | -1.079 |
hof | -1.048 |
leakage | -1.044 |
stamped | -1.040 |
Token | Fl |
Token ID | 1610 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ˈ | +1.139 |
Redd | +0.927 |
Wan | +0.904 |
claw | +0.897 |
Neph | +0.861 |
Neg logit contributions | |
fitt | -1.146 |
slic | -1.078 |
hof | -1.046 |
leakage | -1.043 |
stamped | -1.038 |
Token | our |
Token ID | 454 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ˈ | +0.361 |
Redd | +0.295 |
Wan | +0.287 |
claw | +0.285 |
Neph | +0.271 |
Neg logit contributions | |
fitt | -0.351 |
slic | -0.331 |
leakage | -0.318 |
hof | -0.317 |
stamped | -0.316 |
Token | — |
Token ID | 960 |
Feature activation | -4.31e-02 |
Pos logit contributions | |
ˈ | +0.053 |
Redd | +0.044 |
Wan | +0.043 |
claw | +0.043 |
Neph | +0.041 |
Neg logit contributions | |
fitt | -0.047 |
slic | -0.044 |
hof | -0.043 |
leakage | -0.043 |
stamped | -0.042 |
Token | Pl |
Token ID | 3646 |
Feature activation | +1.78e-04 |
Pos logit contributions | |
ˈ | +0.113 |
Redd | +0.093 |
Wan | +0.090 |
claw | +0.089 |
Neph | +0.085 |
Neg logit contributions | |
fitt | -0.115 |
slic | -0.108 |
hof | -0.104 |
leakage | -0.104 |
stamped | -0.104 |
Token | ant |
Token ID | 415 |
Feature activation | -4.57e-01 |
Pos logit contributions | |
fitt | +0.001 |
slic | +0.000 |
leakage | +0.000 |
hof | +0.000 |
stamped | +0.000 |
Neg logit contributions | |
ˈ | -0.000 |
Redd | -0.000 |
Wan | -0.000 |
claw | -0.000 |
Neph | -0.000 |
Token | ain |
Token ID | 391 |
Feature activation | -3.87e-01 |
Pos logit contributions | |
ˈ | +1.204 |
Redd | +0.984 |
Wan | +0.958 |
claw | +0.945 |
Neph | +0.908 |
Neg logit contributions | |
fitt | -1.206 |
slic | -1.129 |
leakage | -1.093 |
hof | -1.092 |
stamped | -1.084 |
Token | flour |
Token ID | 10601 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
ˈ | +1.170 |
Redd | +0.982 |
Wan | +0.959 |
claw | +0.953 |
Neph | +0.918 |
Neg logit contributions | |
fitt | -0.863 |
slic | -0.802 |
hof | -0.776 |
leakage | -0.769 |
stamped | -0.765 |
Token | is |
Token ID | 318 |
Feature activation | -6.51e-03 |
Pos logit contributions | |
fitt | +0.549 |
slic | +0.510 |
hof | +0.490 |
leakage | +0.487 |
stamped | +0.485 |
Neg logit contributions | |
ˈ | -0.747 |
Redd | -0.629 |
Wan | -0.615 |
claw | -0.610 |
Neph | -0.587 |
Token | quickly |
Token ID | 2952 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
ˈ | +0.020 |
Redd | +0.017 |
Wan | +0.017 |
claw | +0.016 |
Neph | +0.016 |
Neg logit contributions | |
fitt | -0.014 |
slic | -0.013 |
hof | -0.013 |
leakage | -0.013 |
stamped | -0.012 |
Token | becoming |
Token ID | 5033 |
Feature activation | -9.62e-03 |
Pos logit contributions | |
ˈ | +0.397 |
Redd | +0.335 |
claw | +0.329 |
Wan | +0.328 |
Neph | +0.316 |
Neg logit contributions | |
fitt | -0.238 |
slic | -0.217 |
hof | -0.212 |
leakage | -0.205 |
stamped | -0.199 |
Token | Penguins |
Token ID | 29755 |
Feature activation | -7.06e-02 |
Pos logit contributions | |
ˈ | +0.042 |
Redd | +0.035 |
Wan | +0.034 |
claw | +0.034 |
Neph | +0.032 |
Neg logit contributions | |
fitt | -0.040 |
slic | -0.037 |
hof | -0.036 |
leakage | -0.036 |
stamped | -0.036 |
Token | GM |
Token ID | 6951 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
ˈ | +0.210 |
Redd | +0.176 |
Wan | +0.172 |
claw | +0.172 |
Neph | +0.164 |
Neg logit contributions | |
fitt | -0.162 |
slic | -0.151 |
hof | -0.145 |
leakage | -0.144 |
stamped | -0.143 |
Token | Jim |
Token ID | 5395 |
Feature activation | +4.16e-02 |
Pos logit contributions | |
fitt | +0.294 |
slic | +0.280 |
hof | +0.271 |
leakage | +0.267 |
stamped | +0.267 |
Neg logit contributions | |
ˈ | -0.297 |
Redd | -0.244 |
Wan | -0.237 |
claw | -0.235 |
Neph | -0.224 |
Token | Rutherford |
Token ID | 49767 |
Feature activation | -2.20e-01 |
Pos logit contributions | |
fitt | +0.121 |
slic | +0.111 |
leakage | +0.110 |
hof | +0.109 |
stamped | +0.108 |
Neg logit contributions | |
ˈ | -0.100 |
Redd | -0.081 |
claw | -0.078 |
Wan | -0.078 |
Neph | -0.073 |
Token | approached |
Token ID | 10448 |
Feature activation | -1.70e-03 |
Pos logit contributions | |
ˈ | +0.669 |
Redd | +0.555 |
claw | +0.547 |
Wan | +0.544 |
Neph | +0.520 |
Neg logit contributions | |
fitt | -0.495 |
slic | -0.460 |
hof | -0.443 |
leakage | -0.441 |
stamped | -0.431 |
Token | Fle |
Token ID | 12005 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
ˈ | +0.005 |
Redd | +0.004 |
Wan | +0.004 |
claw | +0.004 |
Neph | +0.003 |
Neg logit contributions | |
fitt | -0.004 |
slic | -0.004 |
hof | -0.004 |
leakage | -0.004 |
stamped | -0.004 |
Token | ury |
Token ID | 1601 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
ˈ | +1.361 |
Redd | +1.140 |
Wan | +1.119 |
claw | +1.111 |
Neph | +1.062 |
Neg logit contributions | |
fitt | -1.043 |
slic | -0.967 |
leakage | -0.925 |
stamped | -0.918 |
hof | -0.918 |
Token | leading |
Token ID | 3756 |
Feature activation | -4.68e-02 |
Pos logit contributions | |
ˈ | +0.067 |
Redd | +0.056 |
Wan | +0.055 |
claw | +0.054 |
Neph | +0.052 |
Neg logit contributions | |
fitt | -0.056 |
slic | -0.052 |
hof | -0.050 |
leakage | -0.050 |
stamped | -0.049 |
Token | into |
Token ID | 656 |
Feature activation | +4.38e-05 |
Pos logit contributions | |
ˈ | +0.139 |
Redd | +0.117 |
Wan | +0.114 |
claw | +0.113 |
Neph | +0.109 |
Neg logit contributions | |
fitt | -0.108 |
slic | -0.100 |
hof | -0.096 |
leakage | -0.096 |
stamped | -0.095 |
Token | the |
Token ID | 262 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
fitt | +0.000 |
slic | +0.000 |
hof | +0.000 |
leakage | +0.000 |
stamped | +0.000 |
Neg logit contributions | |
ˈ | -0.000 |
Redd | -0.000 |
Wan | -0.000 |
claw | -0.000 |
Neph | -0.000 |
Token | March |
Token ID | 2805 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
ˈ | +0.047 |
Redd | +0.039 |
Wan | +0.038 |
claw | +0.038 |
Neph | +0.037 |
Neg logit contributions | |
fitt | -0.032 |
slic | -0.030 |
hof | -0.028 |
leakage | -0.028 |
stamped | -0.028 |
Token | alf |
Token ID | 1604 |
Feature activation | -9.93e-02 |
Pos logit contributions | |
ˈ | +0.096 |
Redd | +0.083 |
claw | +0.081 |
Wan | +0.081 |
Neph | +0.078 |
Neg logit contributions | |
fitt | -0.056 |
slic | -0.052 |
leakage | -0.049 |
stamped | -0.048 |
hof | -0.048 |
Token | rides |
Token ID | 17445 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
ˈ | +0.297 |
Redd | +0.248 |
claw | +0.244 |
Wan | +0.244 |
Neph | +0.234 |
Neg logit contributions | |
fitt | -0.224 |
slic | -0.207 |
hof | -0.202 |
leakage | -0.200 |
stamped | -0.197 |
Token | for |
Token ID | 329 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
ˈ | +0.349 |
Redd | +0.290 |
Wan | +0.282 |
claw | +0.281 |
Neph | +0.269 |
Neg logit contributions | |
fitt | -0.312 |
slic | -0.291 |
hof | -0.281 |
leakage | -0.280 |
stamped | -0.278 |
Token | Min |
Token ID | 1855 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
fitt | +0.045 |
slic | +0.042 |
hof | +0.040 |
leakage | +0.040 |
stamped | +0.040 |
Neg logit contributions | |
ˈ | -0.055 |
Redd | -0.046 |
Wan | -0.045 |
claw | -0.045 |
Neph | -0.043 |
Token | as |
Token ID | 292 |
Feature activation | -5.23e-02 |
Pos logit contributions | |
fitt | +0.317 |
slic | +0.298 |
hof | +0.290 |
leakage | +0.287 |
stamped | +0.287 |
Neg logit contributions | |
ˈ | -0.297 |
Redd | -0.242 |
Wan | -0.236 |
claw | -0.231 |
Neph | -0.221 |
Token | Tir |
Token ID | 39847 |
Feature activation | -4.49e-01 |
Pos logit contributions | |
ˈ | +0.133 |
Redd | +0.108 |
Wan | +0.106 |
claw | +0.104 |
Neph | +0.100 |
Neg logit contributions | |
fitt | -0.143 |
slic | -0.135 |
hof | -0.130 |
leakage | -0.129 |
stamped | -0.129 |
Token | ith |
Token ID | 342 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ˈ | +1.032 |
Redd | +0.820 |
Wan | +0.781 |
claw | +0.776 |
Neph | +0.723 |
Neg logit contributions | |
fitt | -1.351 |
slic | -1.268 |
hof | -1.247 |
leakage | -1.235 |
stamped | -1.232 |
Token | , |
Token ID | 11 |
Feature activation | -7.81e-02 |
Pos logit contributions | |
ˈ | +0.514 |
Redd | +0.427 |
claw | +0.418 |
Wan | +0.417 |
Neph | +0.401 |
Neg logit contributions | |
fitt | -0.431 |
slic | -0.402 |
leakage | -0.387 |
hof | -0.385 |
stamped | -0.381 |
Token | chief |
Token ID | 4039 |
Feature activation | -9.47e-02 |
Pos logit contributions | |
ˈ | +0.247 |
Redd | +0.210 |
Wan | +0.206 |
claw | +0.205 |
Neph | +0.199 |
Neg logit contributions | |
fitt | -0.164 |
slic | -0.151 |
hof | -0.145 |
leakage | -0.144 |
stamped | -0.143 |
Token | city |
Token ID | 1748 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
ˈ | +0.256 |
Redd | +0.211 |
Wan | +0.205 |
claw | +0.203 |
Neph | +0.194 |
Neg logit contributions | |
fitt | -0.244 |
slic | -0.229 |
hof | -0.221 |
stamped | -0.220 |
leakage | -0.219 |
Token | of |
Token ID | 286 |
Feature activation | -6.04e-02 |
Pos logit contributions | |
ˈ | +0.053 |
Redd | +0.044 |
Wan | +0.043 |
claw | +0.042 |
Neph | +0.040 |
Neg logit contributions | |
fitt | -0.053 |
slic | -0.050 |
hof | -0.048 |
leakage | -0.048 |
stamped | -0.048 |
Token | Ferguson |
Token ID | 15031 |
Feature activation | -5.64e-02 |
Pos logit contributions | |
fitt | +0.238 |
slic | +0.226 |
hof | +0.220 |
stamped | +0.219 |
leakage | +0.219 |
Neg logit contributions | |
ˈ | -0.147 |
Redd | -0.112 |
Wan | -0.108 |
claw | -0.107 |
Neph | -0.099 |
Token | versus |
Token ID | 9051 |
Feature activation | -6.55e-02 |
Pos logit contributions | |
ˈ | +0.169 |
Redd | +0.142 |
Wan | +0.139 |
claw | +0.138 |
Neph | +0.132 |
Neg logit contributions | |
fitt | -0.129 |
slic | -0.120 |
hof | -0.115 |
leakage | -0.114 |
stamped | -0.114 |
Token | Kh |
Token ID | 5311 |
Feature activation | -9.39e-02 |
Pos logit contributions | |
ˈ | +0.171 |
Redd | +0.140 |
Wan | +0.136 |
claw | +0.135 |
Neph | +0.129 |
Neg logit contributions | |
fitt | -0.175 |
slic | -0.164 |
hof | -0.159 |
leakage | -0.158 |
stamped | -0.157 |
Token | ab |
Token ID | 397 |
Feature activation | -9.10e-02 |
Pos logit contributions | |
ˈ | +0.282 |
Redd | +0.238 |
Wan | +0.232 |
claw | +0.230 |
Neph | +0.221 |
Neg logit contributions | |
fitt | -0.214 |
slic | -0.199 |
leakage | -0.192 |
hof | -0.191 |
stamped | -0.190 |
Token | ib |
Token ID | 571 |
Feature activation | +8.57e-02 |
Pos logit contributions | |
ˈ | +0.232 |
Redd | +0.188 |
Wan | +0.184 |
claw | +0.183 |
Neph | +0.172 |
Neg logit contributions | |
fitt | -0.248 |
slic | -0.234 |
leakage | -0.225 |
hof | -0.225 |
stamped | -0.223 |
Token | Nur |
Token ID | 49281 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
fitt | +0.232 |
slic | +0.219 |
hof | +0.212 |
leakage | +0.211 |
stamped | +0.210 |
Neg logit contributions | |
ˈ | -0.219 |
Redd | -0.179 |
Wan | -0.174 |
claw | -0.172 |
Neph | -0.164 |
Token | mag |
Token ID | 19726 |
Feature activation | +5.88e-02 |
Pos logit contributions | |
ˈ | +1.189 |
Redd | +0.939 |
claw | +0.930 |
Wan | +0.922 |
Neph | +0.859 |
Neg logit contributions | |
fitt | -1.173 |
slic | -1.107 |
leakage | -1.065 |
hof | -1.057 |
stamped | -1.043 |
Token | omed |
Token ID | 12657 |
Feature activation | +2.52e-02 |
Pos logit contributions | |
fitt | +0.142 |
slic | +0.133 |
hof | +0.128 |
leakage | +0.127 |
stamped | +0.127 |
Neg logit contributions | |
ˈ | -0.168 |
Redd | -0.140 |
Wan | -0.137 |
claw | -0.136 |
Neph | -0.130 |
Token | ov |
Token ID | 709 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
fitt | +0.059 |
slic | +0.056 |
leakage | +0.053 |
hof | +0.053 |
stamped | +0.052 |
Neg logit contributions | |
ˈ | -0.074 |
Redd | -0.061 |
Wan | -0.060 |
claw | -0.060 |
Neph | -0.057 |
Token | – |
Token ID | 784 |
Feature activation | -4.29e-02 |
Pos logit contributions | |
ˈ | +0.090 |
Redd | +0.075 |
Wan | +0.073 |
claw | +0.073 |
Neph | +0.070 |
Neg logit contributions | |
fitt | -0.076 |
slic | -0.071 |
hof | -0.068 |
leakage | -0.068 |
stamped | -0.068 |
Token | which |
Token ID | 543 |
Feature activation | -7.89e-02 |
Pos logit contributions | |
ˈ | +0.129 |
Redd | +0.108 |
Wan | +0.106 |
claw | +0.106 |
Neph | +0.101 |
Neg logit contributions | |
fitt | -0.097 |
slic | -0.091 |
hof | -0.087 |
leakage | -0.087 |
stamped | -0.086 |
Token |
|
Token ID | 198 |
Feature activation | -2.94e-02 |
Pos logit contributions | |
ˈ | +0.064 |
Redd | +0.054 |
Wan | +0.053 |
claw | +0.052 |
Neph | +0.050 |
Neg logit contributions | |
fitt | -0.054 |
slic | -0.050 |
leakage | -0.048 |
hof | -0.048 |
stamped | -0.047 |
Token | Google |
Token ID | 11708 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ˈ | +0.075 |
Redd | +0.061 |
Wan | +0.059 |
claw | +0.059 |
Neph | +0.056 |
Neg logit contributions | |
fitt | -0.080 |
slic | -0.075 |
hof | -0.073 |
stamped | -0.072 |
leakage | -0.072 |
Token | Scholar |
Token ID | 11713 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
fitt | +0.052 |
slic | +0.050 |
hof | +0.049 |
leakage | +0.049 |
stamped | +0.049 |
Neg logit contributions | |
ˈ | -0.015 |
Redd | -0.009 |
Wan | -0.008 |
claw | -0.008 |
Neph | -0.006 |
Token | Crossref |
Token ID | 23613 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
ˈ | +0.353 |
Redd | +0.275 |
Wan | +0.264 |
claw | +0.261 |
Neph | +0.245 |
Neg logit contributions | |
fitt | -0.522 |
slic | -0.496 |
hof | -0.482 |
leakage | -0.480 |
stamped | -0.480 |
Token | | |
Token ID | 930 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
ˈ | +0.933 |
Redd | +0.793 |
Wan | +0.771 |
claw | +0.764 |
Neph | +0.736 |
Neg logit contributions | |
fitt | -0.666 |
slic | -0.618 |
hof | -0.593 |
stamped | -0.592 |
leakage | -0.589 |
Token | ISI |
Token ID | 22048 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
fitt | +0.019 |
slic | +0.019 |
hof | +0.018 |
leakage | +0.018 |
stamped | +0.018 |
Neg logit contributions | |
ˈ | -0.010 |
Redd | -0.007 |
Wan | -0.007 |
claw | -0.007 |
Neph | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -8.08e-02 |
Pos logit contributions | |
ˈ | +1.304 |
Redd | +1.086 |
Wan | +1.064 |
claw | +1.055 |
Neph | +1.013 |
Neg logit contributions | |
fitt | -1.064 |
slic | -0.992 |
hof | -0.950 |
leakage | -0.949 |
stamped | -0.940 |
Token |
|
Token ID | 198 |
Feature activation | -7.66e-02 |
Pos logit contributions | |
ˈ | +0.233 |
Redd | +0.194 |
Wan | +0.190 |
claw | +0.189 |
Neph | +0.181 |
Neg logit contributions | |
fitt | -0.196 |
slic | -0.183 |
leakage | -0.175 |
hof | -0.174 |
stamped | -0.173 |
Token | M |
Token ID | 44 |
Feature activation | -4.29e-02 |
Pos logit contributions | |
ˈ | +0.189 |
Redd | +0.153 |
Wan | +0.149 |
claw | +0.147 |
Neph | +0.139 |
Neg logit contributions | |
fitt | -0.216 |
slic | -0.204 |
hof | -0.197 |
leakage | -0.196 |
stamped | -0.196 |
Token | ol |
Token ID | 349 |
Feature activation | -8.75e-02 |
Pos logit contributions | |
ˈ | +0.118 |
Redd | +0.097 |
Wan | +0.095 |
claw | +0.094 |
Neph | +0.090 |
Neg logit contributions | |
fitt | -0.109 |
slic | -0.102 |
hof | -0.098 |
leakage | -0.098 |
stamped | -0.098 |
Token | cho |
Token ID | 6679 |
Feature activation | -7.83e-02 |
Pos logit contributions | |
ˈ | +0.231 |
Redd | +0.187 |
Wan | +0.183 |
claw | +0.183 |
Neph | +0.173 |
Neg logit contributions | |
fitt | -0.232 |
slic | -0.219 |
leakage | -0.210 |
stamped | -0.209 |
hof | -0.208 |
Token |
|
Token ID | 198 |
Feature activation | -4.87e-02 |
Pos logit contributions | |
ˈ | +0.112 |
Redd | +0.094 |
Wan | +0.092 |
claw | +0.091 |
Neph | +0.087 |
Neg logit contributions | |
fitt | -0.093 |
slic | -0.087 |
leakage | -0.083 |
hof | -0.083 |
stamped | -0.082 |
Token | Google |
Token ID | 11708 |
Feature activation | -5.58e-03 |
Pos logit contributions | |
ˈ | +0.134 |
Redd | +0.112 |
Wan | +0.110 |
claw | +0.108 |
Neph | +0.102 |
Neg logit contributions | |
fitt | -0.125 |
slic | -0.116 |
leakage | -0.112 |
stamped | -0.111 |
hof | -0.111 |
Token | Scholar |
Token ID | 11713 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
ˈ | +0.006 |
Redd | +0.004 |
Wan | +0.003 |
claw | +0.003 |
Neph | +0.003 |
Neg logit contributions | |
fitt | -0.023 |
slic | -0.022 |
hof | -0.022 |
leakage | -0.022 |
stamped | -0.022 |
Token | Crossref |
Token ID | 23613 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
ˈ | +0.329 |
Redd | +0.255 |
Wan | +0.244 |
claw | +0.241 |
Neph | +0.224 |
Neg logit contributions | |
fitt | -0.514 |
slic | -0.490 |
hof | -0.475 |
stamped | -0.474 |
leakage | -0.473 |
Token | | |
Token ID | 930 |
Feature activation | -6.62e-03 |
Pos logit contributions | |
ˈ | +0.665 |
Redd | +0.558 |
Wan | +0.541 |
claw | +0.535 |
Neph | +0.512 |
Neg logit contributions | |
fitt | -0.586 |
slic | -0.548 |
hof | -0.528 |
stamped | -0.527 |
leakage | -0.525 |
Token | ISI |
Token ID | 22048 |
Feature activation | -4.46e-01 |
Pos logit contributions | |
ˈ | +0.012 |
Redd | +0.008 |
Wan | +0.008 |
claw | +0.008 |
Neph | +0.008 |
Neg logit contributions | |
fitt | -0.023 |
slic | -0.022 |
hof | -0.022 |
leakage | -0.022 |
stamped | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -6.85e-02 |
Pos logit contributions | |
ˈ | +1.285 |
Redd | +1.067 |
Wan | +1.047 |
claw | +1.039 |
Neph | +0.995 |
Neg logit contributions | |
fitt | -1.088 |
slic | -1.013 |
leakage | -0.970 |
hof | -0.961 |
stamped | -0.957 |
Token |
|
Token ID | 198 |
Feature activation | -7.44e-02 |
Pos logit contributions | |
ˈ | +0.198 |
Redd | +0.165 |
Wan | +0.161 |
claw | +0.161 |
Neph | +0.154 |
Neg logit contributions | |
fitt | -0.165 |
slic | -0.154 |
leakage | -0.148 |
hof | -0.147 |
stamped | -0.146 |
Token | Sal |
Token ID | 19221 |
Feature activation | +6.59e-02 |
Pos logit contributions | |
ˈ | +0.190 |
Redd | +0.155 |
Wan | +0.150 |
claw | +0.149 |
Neph | +0.141 |
Neg logit contributions | |
fitt | -0.203 |
slic | -0.191 |
hof | -0.185 |
leakage | -0.184 |
stamped | -0.184 |
Token | m |
Token ID | 76 |
Feature activation | -9.60e-02 |
Pos logit contributions | |
fitt | +0.169 |
slic | +0.158 |
leakage | +0.152 |
stamped | +0.152 |
hof | +0.151 |
Neg logit contributions | |
ˈ | -0.179 |
Redd | -0.147 |
Wan | -0.144 |
claw | -0.143 |
Neph | -0.136 |
Token | iv |
Token ID | 452 |
Feature activation | +9.47e-02 |
Pos logit contributions | |
ˈ | +0.273 |
Redd | +0.227 |
Wan | +0.221 |
claw | +0.220 |
Neph | +0.210 |
Neg logit contributions | |
fitt | -0.234 |
slic | -0.219 |
hof | -0.210 |
leakage | -0.210 |
stamped | -0.209 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
fitt | +0.030 |
slic | +0.028 |
hof | +0.027 |
leakage | +0.027 |
stamped | +0.027 |
Neg logit contributions | |
ˈ | -0.027 |
Redd | -0.022 |
Wan | -0.021 |
claw | -0.021 |
Neph | -0.020 |
Token | and |
Token ID | 392 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
ˈ | +0.338 |
Redd | +0.284 |
Wan | +0.277 |
claw | +0.275 |
Neph | +0.264 |
Neg logit contributions | |
fitt | -0.266 |
slic | -0.248 |
hof | -0.237 |
leakage | -0.237 |
stamped | -0.236 |
Token | ling |
Token ID | 1359 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
ˈ | +0.039 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.030 |
Neg logit contributions | |
fitt | -0.030 |
slic | -0.028 |
hof | -0.027 |
leakage | -0.027 |
stamped | -0.027 |
Token | 1999 |
Token ID | 7358 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
fitt | +0.425 |
slic | +0.394 |
hof | +0.381 |
stamped | +0.380 |
leakage | +0.379 |
Neg logit contributions | |
ˈ | -0.472 |
Redd | -0.393 |
Wan | -0.386 |
claw | -0.379 |
Neph | -0.358 |
Token | John |
Token ID | 1757 |
Feature activation | -3.83e-02 |
Pos logit contributions | |
ˈ | +0.055 |
Redd | +0.043 |
Wan | +0.041 |
claw | +0.040 |
Neph | +0.038 |
Neg logit contributions | |
fitt | -0.086 |
slic | -0.082 |
hof | -0.079 |
leakage | -0.079 |
stamped | -0.079 |
Token | Lith |
Token ID | 19730 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
ˈ | +0.079 |
Redd | +0.061 |
Wan | +0.058 |
claw | +0.058 |
Neph | +0.054 |
Neg logit contributions | |
fitt | -0.124 |
slic | -0.118 |
hof | -0.114 |
leakage | -0.114 |
stamped | -0.113 |
Token | gow |
Token ID | 21175 |
Feature activation | +7.14e-02 |
Pos logit contributions | |
ˈ | +1.283 |
Redd | +1.064 |
claw | +1.045 |
Wan | +1.038 |
Neph | +0.987 |
Neg logit contributions | |
fitt | -1.072 |
slic | -1.011 |
leakage | -0.953 |
stamped | -0.949 |
hof | -0.940 |
Token |
|
Token ID | 198 |
Feature activation | +3.19e-02 |
Pos logit contributions | |
fitt | +0.167 |
slic | +0.156 |
hof | +0.149 |
leakage | +0.149 |
stamped | +0.148 |
Neg logit contributions | |
ˈ | -0.210 |
Redd | -0.176 |
Wan | -0.172 |
claw | -0.170 |
Neph | -0.163 |
Token |
|
Token ID | 198 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
fitt | +0.076 |
slic | +0.071 |
leakage | +0.068 |
hof | +0.068 |
stamped | +0.067 |
Neg logit contributions | |
ˈ | -0.093 |
Redd | -0.078 |
Wan | -0.076 |
claw | -0.076 |
Neph | -0.072 |
Token | 1999 |
Token ID | 18946 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
fitt | +0.064 |
slic | +0.060 |
hof | +0.058 |
stamped | +0.058 |
leakage | +0.057 |
Neg logit contributions | |
ˈ | -0.073 |
Redd | -0.060 |
Wan | -0.059 |
claw | -0.059 |
Neph | -0.056 |
Token | Michael |
Token ID | 3899 |
Feature activation | +4.16e-02 |
Pos logit contributions | |
ˈ | +0.028 |
Redd | +0.022 |
Wan | +0.021 |
claw | +0.021 |
Neph | +0.020 |
Neg logit contributions | |
fitt | -0.043 |
slic | -0.041 |
hof | -0.039 |
leakage | -0.039 |
stamped | -0.039 |
Token | the |
Token ID | 262 |
Feature activation | -4.48e-03 |
Pos logit contributions | |
ˈ | +0.138 |
Redd | +0.116 |
claw | +0.114 |
Wan | +0.113 |
Neph | +0.108 |
Neg logit contributions | |
fitt | -0.112 |
slic | -0.105 |
hof | -0.100 |
leakage | -0.100 |
stamped | -0.100 |
Token | reign |
Token ID | 13580 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
ˈ | +0.014 |
Redd | +0.011 |
Wan | +0.011 |
claw | +0.011 |
Neph | +0.011 |
Neg logit contributions | |
fitt | -0.010 |
slic | -0.009 |
hof | -0.009 |
leakage | -0.009 |
stamped | -0.009 |
Token | of |
Token ID | 286 |
Feature activation | +8.92e-03 |
Pos logit contributions | |
ˈ | +0.067 |
Redd | +0.054 |
Wan | +0.053 |
claw | +0.052 |
Neph | +0.050 |
Neg logit contributions | |
fitt | -0.070 |
slic | -0.066 |
hof | -0.064 |
leakage | -0.064 |
stamped | -0.063 |
Token | social |
Token ID | 1919 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
fitt | +0.023 |
slic | +0.022 |
hof | +0.021 |
leakage | +0.021 |
stamped | +0.021 |
Neg logit contributions | |
ˈ | -0.024 |
Redd | -0.020 |
Wan | -0.019 |
claw | -0.019 |
Neph | -0.018 |
Token | justice |
Token ID | 5316 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
fitt | +0.341 |
slic | +0.314 |
hof | +0.305 |
leakage | +0.298 |
stamped | +0.296 |
Neg logit contributions | |
ˈ | -0.567 |
Redd | -0.485 |
Wan | -0.475 |
claw | -0.471 |
Neph | -0.457 |
Token | indo |
Token ID | 23046 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
ˈ | +0.395 |
Redd | +0.331 |
Wan | +0.322 |
claw | +0.321 |
Neph | +0.310 |
Neg logit contributions | |
fitt | -0.338 |
slic | -0.319 |
hof | -0.308 |
leakage | -0.305 |
stamped | -0.301 |
Token | ct |
Token ID | 310 |
Feature activation | -7.69e-02 |
Pos logit contributions | |
ˈ | +1.142 |
Redd | +0.925 |
Wan | +0.906 |
claw | +0.891 |
Neph | +0.847 |
Neg logit contributions | |
fitt | -1.196 |
slic | -1.139 |
leakage | -1.092 |
hof | -1.091 |
stamped | -1.077 |
Token | rin |
Token ID | 12769 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
ˈ | +0.174 |
Redd | +0.137 |
Wan | +0.132 |
claw | +0.132 |
Neph | +0.124 |
Neg logit contributions | |
fitt | -0.232 |
slic | -0.221 |
leakage | -0.213 |
stamped | -0.212 |
hof | -0.211 |
Token | ators |
Token ID | 2024 |
Feature activation | -6.82e-02 |
Pos logit contributions | |
ˈ | +0.469 |
Redd | +0.386 |
Wan | +0.378 |
claw | +0.377 |
Neph | +0.359 |
Neg logit contributions | |
fitt | -0.419 |
slic | -0.391 |
leakage | -0.377 |
hof | -0.375 |
stamped | -0.374 |
Token | , |
Token ID | 11 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
ˈ | +0.204 |
Redd | +0.172 |
Wan | +0.168 |
claw | +0.167 |
Neph | +0.161 |
Neg logit contributions | |
fitt | -0.156 |
slic | -0.145 |
hof | -0.139 |
leakage | -0.138 |
stamped | -0.137 |
Token | academics |
Token ID | 22321 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
ˈ | +0.105 |
Redd | +0.088 |
claw | +0.086 |
Wan | +0.086 |
Neph | +0.083 |
Neg logit contributions | |
fitt | -0.077 |
slic | -0.071 |
hof | -0.069 |
leakage | -0.067 |
stamped | -0.067 |
Token |
|
Token ID | 198 |
Feature activation | -8.13e-03 |
Pos logit contributions | |
fitt | +0.033 |
slic | +0.031 |
leakage | +0.029 |
hof | +0.029 |
stamped | +0.029 |
Neg logit contributions | |
ˈ | -0.040 |
Redd | -0.033 |
Wan | -0.033 |
claw | -0.032 |
Neph | -0.031 |
Token | As |
Token ID | 1722 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
ˈ | +0.019 |
Redd | +0.015 |
Wan | +0.015 |
claw | +0.015 |
Neph | +0.014 |
Neg logit contributions | |
fitt | -0.024 |
slic | -0.023 |
leakage | -0.022 |
hof | -0.022 |
stamped | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | +5.57e-03 |
Pos logit contributions | |
ˈ | +0.034 |
Redd | +0.029 |
Wan | +0.028 |
claw | +0.028 |
Neph | +0.027 |
Neg logit contributions | |
fitt | -0.026 |
slic | -0.024 |
hof | -0.023 |
leakage | -0.023 |
stamped | -0.023 |
Token | neuro |
Token ID | 7669 |
Feature activation | +7.26e-02 |
Pos logit contributions | |
fitt | +0.011 |
slic | +0.010 |
hof | +0.009 |
leakage | +0.009 |
stamped | +0.009 |
Neg logit contributions | |
ˈ | -0.019 |
Redd | -0.016 |
Wan | -0.016 |
claw | -0.016 |
Neph | -0.015 |
Token | sur |
Token ID | 11793 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
fitt | +0.167 |
slic | +0.155 |
hof | +0.149 |
leakage | +0.148 |
stamped | +0.148 |
Neg logit contributions | |
ˈ | -0.217 |
Redd | -0.182 |
Wan | -0.178 |
claw | -0.177 |
Neph | -0.170 |
Token | geon |
Token ID | 6281 |
Feature activation | -4.43e-01 |
Pos logit contributions | |
ˈ | +0.346 |
Redd | +0.280 |
Wan | +0.272 |
claw | +0.268 |
Neph | +0.255 |
Neg logit contributions | |
fitt | -0.387 |
slic | -0.365 |
hof | -0.353 |
leakage | -0.352 |
stamped | -0.351 |
Token | specializing |
Token ID | 40847 |
Feature activation | -7.96e-02 |
Pos logit contributions | |
ˈ | +1.301 |
Redd | +1.082 |
claw | +1.062 |
Wan | +1.061 |
Neph | +1.015 |
Neg logit contributions | |
fitt | -1.033 |
slic | -0.963 |
leakage | -0.927 |
hof | -0.927 |
stamped | -0.915 |
Token | in |
Token ID | 287 |
Feature activation | -6.01e-03 |
Pos logit contributions | |
ˈ | +0.217 |
Redd | +0.180 |
Wan | +0.175 |
claw | +0.173 |
Neph | +0.166 |
Neg logit contributions | |
fitt | -0.203 |
slic | -0.190 |
hof | -0.182 |
stamped | -0.182 |
leakage | -0.181 |
Token | epilepsy |
Token ID | 35325 |
Feature activation | -1.43e-02 |
Pos logit contributions | |
ˈ | +0.018 |
Redd | +0.015 |
Wan | +0.015 |
claw | +0.015 |
Neph | +0.014 |
Neg logit contributions | |
fitt | -0.014 |
slic | -0.013 |
hof | -0.012 |
leakage | -0.012 |
stamped | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +5.91e-02 |
Pos logit contributions | |
ˈ | +0.044 |
Redd | +0.037 |
Wan | +0.036 |
claw | +0.036 |
Neph | +0.034 |
Neg logit contributions | |
fitt | -0.032 |
slic | -0.030 |
hof | -0.028 |
leakage | -0.028 |
stamped | -0.028 |
Token | Chang |
Token ID | 22597 |
Feature activation | +7.96e-02 |
Pos logit contributions | |
fitt | +0.152 |
slic | +0.142 |
hof | +0.137 |
leakage | +0.137 |
stamped | +0.137 |
Neg logit contributions | |
ˈ | -0.160 |
Redd | -0.132 |
Wan | -0.129 |
claw | -0.128 |
Neph | -0.122 |
Token | Sh |
Token ID | 911 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
fitt | +0.094 |
slic | +0.089 |
hof | +0.085 |
leakage | +0.085 |
stamped | +0.085 |
Neg logit contributions | |
ˈ | -0.085 |
Redd | -0.069 |
Wan | -0.067 |
claw | -0.067 |
Neph | -0.063 |
Token | and |
Token ID | 392 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
ˈ | +0.376 |
Redd | +0.315 |
Wan | +0.307 |
claw | +0.306 |
Neph | +0.292 |
Neg logit contributions | |
fitt | -0.298 |
slic | -0.278 |
leakage | -0.265 |
hof | -0.265 |
stamped | -0.264 |
Token | ling |
Token ID | 1359 |
Feature activation | +1.54e-01 |
Pos logit contributions | |
fitt | +0.025 |
slic | +0.023 |
leakage | +0.022 |
hof | +0.022 |
stamped | +0.022 |
Neg logit contributions | |
ˈ | -0.031 |
Redd | -0.026 |
Wan | -0.026 |
claw | -0.026 |
Neph | -0.024 |
Token | 1996 |
Token ID | 8235 |
Feature activation | -4.32e-02 |
Pos logit contributions | |
fitt | +0.368 |
slic | +0.340 |
hof | +0.332 |
stamped | +0.331 |
leakage | +0.328 |
Neg logit contributions | |
ˈ | -0.446 |
Redd | -0.373 |
Wan | -0.370 |
claw | -0.359 |
Neph | -0.344 |
Token | John |
Token ID | 1757 |
Feature activation | -3.20e-02 |
Pos logit contributions | |
ˈ | +0.095 |
Redd | +0.075 |
Wan | +0.072 |
claw | +0.071 |
Neph | +0.068 |
Neg logit contributions | |
fitt | -0.133 |
slic | -0.126 |
hof | -0.122 |
leakage | -0.122 |
stamped | -0.121 |
Token | Lith |
Token ID | 19730 |
Feature activation | -4.40e-01 |
Pos logit contributions | |
ˈ | +0.087 |
Redd | +0.072 |
Wan | +0.070 |
claw | +0.069 |
Neph | +0.066 |
Neg logit contributions | |
fitt | -0.082 |
slic | -0.076 |
hof | -0.074 |
leakage | -0.073 |
stamped | -0.073 |
Token | gow |
Token ID | 21175 |
Feature activation | +1.26e-01 |
Pos logit contributions | |
ˈ | +1.266 |
Redd | +1.056 |
claw | +1.033 |
Wan | +1.032 |
Neph | +0.981 |
Neg logit contributions | |
fitt | -1.052 |
slic | -0.987 |
leakage | -0.941 |
stamped | -0.938 |
hof | -0.931 |
Token |
|
Token ID | 198 |
Feature activation | +5.15e-02 |
Pos logit contributions | |
fitt | +0.273 |
slic | +0.251 |
hof | +0.246 |
stamped | +0.244 |
leakage | +0.242 |
Neg logit contributions | |
ˈ | -0.389 |
Redd | -0.329 |
Wan | -0.327 |
claw | -0.319 |
Neph | -0.305 |
Token |
|
Token ID | 198 |
Feature activation | +4.42e-02 |
Pos logit contributions | |
fitt | +0.123 |
slic | +0.115 |
leakage | +0.109 |
hof | +0.109 |
stamped | +0.109 |
Neg logit contributions | |
ˈ | -0.150 |
Redd | -0.126 |
Wan | -0.123 |
claw | -0.122 |
Neph | -0.117 |
Token | 1996 |
Token ID | 22288 |
Feature activation | -3.23e-02 |
Pos logit contributions | |
fitt | +0.117 |
slic | +0.109 |
hof | +0.107 |
stamped | +0.106 |
leakage | +0.105 |
Neg logit contributions | |
ˈ | -0.115 |
Redd | -0.093 |
Wan | -0.092 |
claw | -0.091 |
Neph | -0.087 |
Token | Kel |
Token ID | 15150 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
ˈ | +0.084 |
Redd | +0.069 |
Wan | +0.067 |
claw | +0.066 |
Neph | +0.064 |
Neg logit contributions | |
fitt | -0.086 |
slic | -0.081 |
hof | -0.078 |
leakage | -0.078 |
stamped | -0.078 |
Token | love |
Token ID | 1842 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
fitt | +0.025 |
slic | +0.023 |
hof | +0.022 |
leakage | +0.022 |
stamped | +0.022 |
Neg logit contributions | |
ˈ | -0.038 |
Redd | -0.032 |
Wan | -0.032 |
claw | -0.031 |
Neph | -0.031 |
Token | letter |
Token ID | 3850 |
Feature activation | +8.80e-03 |
Pos logit contributions | |
fitt | +0.044 |
slic | +0.041 |
hof | +0.039 |
leakage | +0.039 |
stamped | +0.039 |
Neg logit contributions | |
ˈ | -0.071 |
Redd | -0.061 |
Wan | -0.060 |
claw | -0.059 |
Neph | -0.057 |
Token | to |
Token ID | 284 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
fitt | +0.022 |
slic | +0.021 |
hof | +0.020 |
leakage | +0.020 |
stamped | +0.020 |
Neg logit contributions | |
ˈ | -0.024 |
Redd | -0.020 |
Wan | -0.020 |
claw | -0.019 |
Neph | -0.019 |
Token | New |
Token ID | 968 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
ˈ | +0.068 |
Redd | +0.057 |
Wan | +0.055 |
claw | +0.055 |
Neph | +0.053 |
Neg logit contributions | |
fitt | -0.052 |
slic | -0.048 |
hof | -0.046 |
leakage | -0.046 |
stamped | -0.046 |
Token | York |
Token ID | 1971 |
Feature activation | +1.77e-01 |
Pos logit contributions | |
ˈ | +0.097 |
Redd | +0.078 |
Wan | +0.075 |
claw | +0.075 |
Neph | +0.071 |
Neg logit contributions | |
fitt | -0.124 |
slic | -0.118 |
hof | -0.113 |
leakage | -0.113 |
stamped | -0.112 |
Token | City |
Token ID | 2254 |
Feature activation | +3.45e-01 |
Pos logit contributions | |
fitt | +0.384 |
slic | +0.357 |
hof | +0.342 |
leakage | +0.340 |
stamped | +0.336 |
Neg logit contributions | |
ˈ | -0.548 |
Redd | -0.463 |
Wan | -0.453 |
claw | -0.451 |
Neph | -0.432 |
Token | may |
Token ID | 743 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
fitt | +0.742 |
slic | +0.688 |
hof | +0.660 |
leakage | +0.655 |
stamped | +0.648 |
Neg logit contributions | |
ˈ | -1.078 |
Redd | -0.911 |
Wan | -0.891 |
claw | -0.890 |
Neph | -0.853 |
Token | very |
Token ID | 845 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
ˈ | +0.044 |
Redd | +0.036 |
claw | +0.036 |
Wan | +0.036 |
Neph | +0.034 |
Neg logit contributions | |
fitt | -0.030 |
slic | -0.028 |
hof | -0.026 |
leakage | -0.026 |
stamped | -0.026 |
Token | well |
Token ID | 880 |
Feature activation | -4.97e-02 |
Pos logit contributions | |
fitt | +0.044 |
slic | +0.040 |
hof | +0.037 |
leakage | +0.037 |
stamped | +0.037 |
Neg logit contributions | |
ˈ | -0.104 |
Redd | -0.090 |
Wan | -0.088 |
claw | -0.088 |
Neph | -0.085 |
Token | be |
Token ID | 307 |
Feature activation | -4.40e-02 |
Pos logit contributions | |
ˈ | +0.155 |
Redd | +0.128 |
claw | +0.128 |
Wan | +0.127 |
Neph | +0.122 |
Neg logit contributions | |
fitt | -0.106 |
slic | -0.099 |
hof | -0.095 |
leakage | -0.094 |
stamped | -0.091 |
Token | his |
Token ID | 465 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
ˈ | +0.133 |
Redd | +0.112 |
Wan | +0.110 |
claw | +0.109 |
Neph | +0.105 |
Neg logit contributions | |
fitt | -0.099 |
slic | -0.092 |
hof | -0.088 |
leakage | -0.088 |
stamped | -0.086 |
Token | remote |
Token ID | 6569 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
fitt | +0.214 |
slic | +0.199 |
hof | +0.194 |
leakage | +0.192 |
stamped | +0.190 |
Neg logit contributions | |
ˈ | -0.262 |
Redd | -0.220 |
Wan | -0.213 |
claw | -0.213 |
Neph | -0.204 |
Token | control |
Token ID | 1630 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
fitt | +0.220 |
slic | +0.203 |
hof | +0.196 |
leakage | +0.193 |
stamped | +0.191 |
Neg logit contributions | |
ˈ | -0.330 |
Redd | -0.282 |
Wan | -0.276 |
claw | -0.273 |
Neph | -0.263 |
Token | cars |
Token ID | 5006 |
Feature activation | +9.50e-02 |
Pos logit contributions | |
fitt | +0.279 |
slic | +0.259 |
hof | +0.251 |
leakage | +0.249 |
stamped | +0.247 |
Neg logit contributions | |
ˈ | -0.350 |
Redd | -0.293 |
Wan | -0.286 |
claw | -0.284 |
Neph | -0.273 |
Token | 1993 |
Token ID | 9656 |
Feature activation | +2.05e-02 |
Pos logit contributions | |
fitt | +0.242 |
slic | +0.227 |
hof | +0.219 |
leakage | +0.218 |
stamped | +0.217 |
Neg logit contributions | |
ˈ | -0.259 |
Redd | -0.213 |
Wan | -0.208 |
claw | -0.206 |
Neph | -0.197 |
Token | : |
Token ID | 25 |
Feature activation | +5.97e-02 |
Pos logit contributions | |
fitt | +0.047 |
slic | +0.044 |
hof | +0.042 |
leakage | +0.042 |
stamped | +0.042 |
Neg logit contributions | |
ˈ | -0.061 |
Redd | -0.051 |
Wan | -0.050 |
claw | -0.049 |
Neph | -0.047 |
Token | Father |
Token ID | 9190 |
Feature activation | +3.05e-01 |
Pos logit contributions | |
fitt | +0.156 |
slic | +0.146 |
hof | +0.142 |
leakage | +0.141 |
stamped | +0.140 |
Neg logit contributions | |
ˈ | -0.159 |
Redd | -0.131 |
Wan | -0.128 |
claw | -0.126 |
Neph | -0.121 |
Token | buys |
Token ID | 24779 |
Feature activation | +8.39e-02 |
Pos logit contributions | |
fitt | +0.754 |
slic | +0.703 |
hof | +0.685 |
leakage | +0.679 |
stamped | +0.674 |
Neg logit contributions | |
ˈ | -0.851 |
Redd | -0.707 |
Wan | -0.688 |
claw | -0.684 |
Neph | -0.657 |
Token | him |
Token ID | 683 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
fitt | +0.209 |
slic | +0.196 |
hof | +0.190 |
leakage | +0.189 |
stamped | +0.188 |
Neg logit contributions | |
ˈ | -0.232 |
Redd | -0.192 |
Wan | -0.188 |
claw | -0.186 |
Neph | -0.178 |
Token | a |
Token ID | 257 |
Feature activation | +6.11e-02 |
Pos logit contributions | |
fitt | +0.302 |
slic | +0.280 |
hof | +0.269 |
leakage | +0.268 |
stamped | +0.267 |
Neg logit contributions | |
ˈ | -0.412 |
Redd | -0.348 |
Wan | -0.340 |
claw | -0.338 |
Neph | -0.325 |
Token | £ |
Token ID | 4248 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
fitt | +0.131 |
slic | +0.121 |
hof | +0.116 |
leakage | +0.116 |
stamped | +0.115 |
Neg logit contributions | |
ˈ | -0.191 |
Redd | -0.162 |
Wan | -0.159 |
claw | -0.158 |
Neph | -0.152 |
Token | 1 |
Token ID | 16 |
Feature activation | +7.37e-02 |
Pos logit contributions | |
ˈ | +0.349 |
Redd | +0.289 |
claw | +0.284 |
Wan | +0.284 |
Neph | +0.267 |
Neg logit contributions | |
fitt | -0.320 |
slic | -0.299 |
leakage | -0.288 |
stamped | -0.285 |
hof | -0.283 |
Token | . |
Token ID | 13 |
Feature activation | +6.72e-02 |
Pos logit contributions | |
fitt | +0.196 |
slic | +0.183 |
hof | +0.179 |
leakage | +0.176 |
stamped | +0.176 |
Neg logit contributions | |
ˈ | -0.206 |
Redd | -0.169 |
Wan | -0.163 |
claw | -0.162 |
Neph | -0.154 |
Token | Sel |
Token ID | 15300 |
Feature activation | +4.91e-02 |
Pos logit contributions | |
fitt | +0.181 |
slic | +0.170 |
hof | +0.164 |
leakage | +0.163 |
stamped | +0.163 |
Neg logit contributions | |
ˈ | -0.174 |
Redd | -0.142 |
Wan | -0.138 |
claw | -0.137 |
Neph | -0.130 |
Token | z |
Token ID | 89 |
Feature activation | -7.70e-02 |
Pos logit contributions | |
fitt | +0.128 |
slic | +0.120 |
leakage | +0.115 |
stamped | +0.115 |
hof | +0.114 |
Neg logit contributions | |
ˈ | -0.132 |
Redd | -0.108 |
Wan | -0.106 |
claw | -0.105 |
Neph | -0.100 |
Token | nick |
Token ID | 17172 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ˈ | +0.197 |
Redd | +0.159 |
Wan | +0.155 |
claw | +0.155 |
Neph | +0.146 |
Neg logit contributions | |
fitt | -0.211 |
slic | -0.198 |
hof | -0.191 |
leakage | -0.190 |
stamped | -0.190 |
Token | was |
Token ID | 373 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
ˈ | +0.446 |
Redd | +0.372 |
Wan | +0.365 |
claw | +0.364 |
Neph | +0.348 |
Neg logit contributions | |
fitt | -0.338 |
slic | -0.315 |
leakage | -0.302 |
hof | -0.300 |
stamped | -0.298 |
Token | inspired |
Token ID | 7867 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
ˈ | +0.039 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.031 |
Neg logit contributions | |
fitt | -0.027 |
slic | -0.025 |
hof | -0.024 |
leakage | -0.024 |
stamped | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | -2.73e-02 |
Pos logit contributions | |
fitt | +0.652 |
slic | +0.606 |
hof | +0.582 |
leakage | +0.579 |
stamped | +0.579 |
Neg logit contributions | |
ˈ | -0.841 |
Redd | -0.707 |
Wan | -0.691 |
claw | -0.685 |
Neph | -0.658 |
Token | in |
Token ID | 287 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ˈ | +0.080 |
Redd | +0.066 |
Wan | +0.065 |
claw | +0.065 |
Neph | +0.062 |
Neg logit contributions | |
fitt | -0.064 |
slic | -0.060 |
hof | -0.058 |
leakage | -0.058 |
stamped | -0.057 |
Token | large |
Token ID | 1588 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
fitt | +0.029 |
slic | +0.027 |
hof | +0.026 |
leakage | +0.026 |
stamped | +0.025 |
Neg logit contributions | |
ˈ | -0.039 |
Redd | -0.033 |
Wan | -0.032 |
claw | -0.032 |
Neph | -0.031 |
Token | part |
Token ID | 636 |
Feature activation | -7.59e-02 |
Pos logit contributions | |
ˈ | +0.102 |
Redd | +0.086 |
Wan | +0.084 |
claw | +0.084 |
Neph | +0.081 |
Neg logit contributions | |
fitt | -0.072 |
slic | -0.067 |
hof | -0.064 |
leakage | -0.064 |
stamped | -0.063 |
Token | , |
Token ID | 11 |
Feature activation | +3.73e-04 |
Pos logit contributions | |
ˈ | +0.233 |
Redd | +0.198 |
Wan | +0.192 |
claw | +0.191 |
Neph | +0.184 |
Neg logit contributions | |
fitt | -0.168 |
slic | -0.155 |
stamped | -0.149 |
hof | -0.148 |
leakage | -0.148 |
Token | July |
Token ID | 2901 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fitt | +0.267 |
slic | +0.251 |
hof | +0.244 |
leakage | +0.244 |
stamped | +0.243 |
Neg logit contributions | |
ˈ | -0.248 |
Redd | -0.204 |
Wan | -0.198 |
claw | -0.194 |
Neph | -0.186 |
Token | 2017 |
Token ID | 2177 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
fitt | +0.218 |
slic | +0.203 |
hof | +0.194 |
leakage | +0.192 |
stamped | +0.191 |
Neg logit contributions | |
ˈ | -0.313 |
Redd | -0.264 |
Wan | -0.259 |
claw | -0.258 |
Neph | -0.248 |
Token | , |
Token ID | 11 |
Feature activation | +7.99e-02 |
Pos logit contributions | |
fitt | +0.096 |
slic | +0.090 |
hof | +0.086 |
stamped | +0.085 |
leakage | +0.085 |
Neg logit contributions | |
ˈ | -0.124 |
Redd | -0.103 |
claw | -0.101 |
Wan | -0.101 |
Neph | -0.096 |
Token | Christopher |
Token ID | 12803 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
fitt | +0.165 |
slic | +0.154 |
hof | +0.149 |
stamped | +0.144 |
leakage | +0.143 |
Neg logit contributions | |
ˈ | -0.253 |
Redd | -0.214 |
claw | -0.211 |
Wan | -0.210 |
Neph | -0.203 |
Token | reck |
Token ID | 12482 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
ˈ | +0.093 |
Redd | +0.077 |
Wan | +0.076 |
claw | +0.075 |
Neph | +0.072 |
Neg logit contributions | |
fitt | -0.081 |
slic | -0.076 |
hof | -0.073 |
leakage | -0.073 |
stamped | -0.072 |
Token | ons |
Token ID | 684 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
fitt | +0.347 |
slic | +0.329 |
leakage | +0.320 |
stamped | +0.317 |
hof | +0.317 |
Neg logit contributions | |
ˈ | -0.276 |
Redd | -0.219 |
Wan | -0.213 |
claw | -0.210 |
Neph | -0.199 |
Token | there |
Token ID | 612 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
fitt | +0.587 |
slic | +0.546 |
hof | +0.526 |
stamped | +0.518 |
leakage | +0.516 |
Neg logit contributions | |
ˈ | -0.821 |
Redd | -0.693 |
Wan | -0.679 |
claw | -0.674 |
Neph | -0.649 |
Token | will |
Token ID | 481 |
Feature activation | +5.98e-02 |
Pos logit contributions | |
fitt | +0.054 |
slic | +0.050 |
hof | +0.048 |
leakage | +0.048 |
stamped | +0.047 |
Neg logit contributions | |
ˈ | -0.084 |
Redd | -0.071 |
Wan | -0.070 |
claw | -0.069 |
Neph | -0.067 |
Token | likely |
Token ID | 1884 |
Feature activation | +6.35e-02 |
Pos logit contributions | |
fitt | +0.130 |
slic | +0.120 |
hof | +0.115 |
leakage | +0.114 |
stamped | +0.114 |
Neg logit contributions | |
ˈ | -0.186 |
Redd | -0.158 |
Wan | -0.154 |
claw | -0.153 |
Neph | -0.147 |
Token | be |
Token ID | 307 |
Feature activation | +8.22e-03 |
Pos logit contributions | |
fitt | +0.134 |
slic | +0.124 |
hof | +0.119 |
leakage | +0.119 |
stamped | +0.118 |
Neg logit contributions | |
ˈ | -0.201 |
Redd | -0.171 |
Wan | -0.168 |
claw | -0.166 |
Neph | -0.160 |
Token | a |
Token ID | 257 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
fitt | +0.018 |
slic | +0.017 |
hof | +0.016 |
stamped | +0.016 |
leakage | +0.016 |
Neg logit contributions | |
ˈ | -0.025 |
Redd | -0.021 |
claw | -0.021 |
Wan | -0.021 |
Neph | -0.020 |
Token | cards |
Token ID | 4116 |
Feature activation | +7.60e-02 |
Pos logit contributions | |
ˈ | +0.141 |
Redd | +0.120 |
Wan | +0.117 |
claw | +0.117 |
Neph | +0.112 |
Neg logit contributions | |
fitt | -0.096 |
slic | -0.089 |
hof | -0.086 |
leakage | -0.085 |
stamped | -0.085 |
Token | and |
Token ID | 290 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
fitt | +0.161 |
slic | +0.149 |
stamped | +0.142 |
hof | +0.142 |
leakage | +0.141 |
Neg logit contributions | |
ˈ | -0.241 |
Redd | -0.205 |
Wan | -0.200 |
claw | -0.199 |
Neph | -0.192 |
Token | legitimate |
Token ID | 9829 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
ˈ | +0.039 |
Redd | +0.033 |
Wan | +0.032 |
claw | +0.032 |
Neph | +0.031 |
Neg logit contributions | |
fitt | -0.023 |
slic | -0.021 |
hof | -0.021 |
leakage | -0.020 |
stamped | -0.020 |
Token | - |
Token ID | 12 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
ˈ | +0.371 |
Redd | +0.321 |
Wan | +0.314 |
claw | +0.312 |
Neph | +0.303 |
Neg logit contributions | |
fitt | -0.199 |
slic | -0.182 |
hof | -0.177 |
leakage | -0.171 |
stamped | -0.168 |
Token | app |
Token ID | 1324 |
Feature activation | +9.51e-02 |
Pos logit contributions | |
ˈ | +0.031 |
Redd | +0.026 |
claw | +0.025 |
Wan | +0.025 |
Neph | +0.024 |
Neg logit contributions | |
fitt | -0.023 |
slic | -0.021 |
hof | -0.020 |
leakage | -0.020 |
stamped | -0.020 |
Token | earing |
Token ID | 6648 |
Feature activation | +2.80e-01 |
Pos logit contributions | |
fitt | +0.227 |
slic | +0.212 |
hof | +0.203 |
stamped | +0.202 |
leakage | +0.202 |
Neg logit contributions | |
ˈ | -0.276 |
Redd | -0.230 |
claw | -0.223 |
Wan | -0.222 |
Neph | -0.212 |
Token | front |
Token ID | 2166 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
fitt | +0.532 |
slic | +0.486 |
hof | +0.471 |
leakage | +0.462 |
stamped | +0.457 |
Neg logit contributions | |
ˈ | -0.943 |
Redd | -0.812 |
Wan | -0.792 |
claw | -0.788 |
Neph | -0.764 |
Token | companies |
Token ID | 2706 |
Feature activation | +1.33e-02 |
Pos logit contributions | |
fitt | +0.197 |
slic | +0.178 |
hof | +0.169 |
leakage | +0.167 |
stamped | +0.166 |
Neg logit contributions | |
ˈ | -0.411 |
Redd | -0.357 |
Wan | -0.350 |
claw | -0.348 |
Neph | -0.336 |
Token | . |
Token ID | 13 |
Feature activation | +1.44e-02 |
Pos logit contributions | |
fitt | +0.030 |
slic | +0.028 |
hof | +0.027 |
leakage | +0.027 |
stamped | +0.026 |
Neg logit contributions | |
ˈ | -0.040 |
Redd | -0.034 |
Wan | -0.033 |
claw | -0.033 |
Neph | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
fitt | +0.035 |
slic | +0.033 |
hof | +0.031 |
leakage | +0.031 |
stamped | +0.031 |
Neg logit contributions | |
ˈ | -0.041 |
Redd | -0.034 |
Wan | -0.033 |
claw | -0.033 |
Neph | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | +3.71e-03 |
Pos logit contributions | |
fitt | +0.051 |
slic | +0.047 |
leakage | +0.045 |
hof | +0.045 |
stamped | +0.045 |
Neg logit contributions | |
ˈ | -0.062 |
Redd | -0.051 |
Wan | -0.050 |
claw | -0.050 |
Neph | -0.048 |
Token | would |
Token ID | 561 |
Feature activation | -2.66e-02 |
Pos logit contributions | |
fitt | +0.227 |
slic | +0.212 |
hof | +0.201 |
leakage | +0.199 |
stamped | +0.197 |
Neg logit contributions | |
ˈ | -0.369 |
Redd | -0.313 |
Wan | -0.307 |
claw | -0.307 |
Neph | -0.297 |
Token | be |
Token ID | 307 |
Feature activation | -3.16e-02 |
Pos logit contributions | |
ˈ | +0.080 |
Redd | +0.066 |
claw | +0.065 |
Wan | +0.065 |
Neph | +0.063 |
Neg logit contributions | |
fitt | -0.059 |
slic | -0.056 |
hof | -0.053 |
leakage | -0.053 |
stamped | -0.052 |
Token | preserved |
Token ID | 17232 |
Feature activation | +2.34e-01 |
Pos logit contributions | |
ˈ | +0.105 |
Redd | +0.090 |
Wan | +0.088 |
claw | +0.087 |
Neph | +0.085 |
Neg logit contributions | |
fitt | -0.061 |
slic | -0.056 |
hof | -0.054 |
leakage | -0.053 |
stamped | -0.052 |
Token | as |
Token ID | 355 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
fitt | +0.593 |
slic | +0.556 |
hof | +0.536 |
leakage | +0.534 |
stamped | +0.531 |
Neg logit contributions | |
ˈ | -0.642 |
Redd | -0.529 |
Wan | -0.516 |
claw | -0.513 |
Neph | -0.490 |
Token | a |
Token ID | 257 |
Feature activation | +4.93e-03 |
Pos logit contributions | |
ˈ | +0.069 |
Redd | +0.058 |
Wan | +0.057 |
claw | +0.056 |
Neph | +0.055 |
Neg logit contributions | |
fitt | -0.048 |
slic | -0.045 |
hof | -0.043 |
leakage | -0.043 |
stamped | -0.042 |
Token | special |
Token ID | 2041 |
Feature activation | +5.81e-02 |
Pos logit contributions | |
fitt | +0.009 |
slic | +0.008 |
hof | +0.008 |
leakage | +0.008 |
stamped | +0.008 |
Neg logit contributions | |
ˈ | -0.017 |
Redd | -0.014 |
Wan | -0.014 |
claw | -0.014 |
Neph | -0.014 |
Token | Se |
Token ID | 1001 |
Feature activation | +1.70e-01 |
Pos logit contributions | |
fitt | +0.114 |
slic | +0.105 |
hof | +0.100 |
leakage | +0.099 |
stamped | +0.098 |
Neg logit contributions | |
ˈ | -0.192 |
Redd | -0.165 |
Wan | -0.161 |
claw | -0.160 |
Neph | -0.155 |
Token | gu |
Token ID | 5162 |
Feature activation | +1.10e-03 |
Pos logit contributions | |
fitt | +0.452 |
slic | +0.425 |
leakage | +0.408 |
stamped | +0.407 |
hof | +0.407 |
Neg logit contributions | |
ˈ | -0.449 |
Redd | -0.367 |
Wan | -0.357 |
claw | -0.356 |
Neph | -0.338 |
Token | in |
Token ID | 259 |
Feature activation | +9.95e-03 |
Pos logit contributions | |
fitt | +0.003 |
slic | +0.003 |
leakage | +0.002 |
hof | +0.002 |
stamped | +0.002 |
Neg logit contributions | |
ˈ | -0.003 |
Redd | -0.003 |
Wan | -0.003 |
claw | -0.002 |
Neph | -0.002 |
Token | landmark |
Token ID | 20533 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
fitt | +0.026 |
slic | +0.024 |
leakage | +0.023 |
hof | +0.023 |
stamped | +0.023 |
Neg logit contributions | |
ˈ | -0.027 |
Redd | -0.022 |
Wan | -0.021 |
claw | -0.021 |
Neph | -0.020 |
Token | for |
Token ID | 329 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
fitt | +0.379 |
slic | +0.356 |
hof | +0.343 |
leakage | +0.342 |
stamped | +0.339 |
Neg logit contributions | |
ˈ | -0.388 |
Redd | -0.318 |
Wan | -0.309 |
claw | -0.308 |
Neph | -0.293 |
Token | ers |
Token ID | 364 |
Feature activation | -1.96e-01 |
Pos logit contributions | |
ˈ | +0.461 |
Redd | +0.382 |
Wan | +0.373 |
claw | +0.370 |
Neph | +0.353 |
Neg logit contributions | |
fitt | -0.409 |
slic | -0.382 |
hof | -0.368 |
leakage | -0.367 |
stamped | -0.366 |
Token | Reading |
Token ID | 36120 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
ˈ | +0.311 |
Redd | +0.220 |
Wan | +0.209 |
claw | +0.204 |
Neph | +0.184 |
Neg logit contributions | |
fitt | -0.725 |
slic | -0.694 |
hof | -0.675 |
leakage | -0.674 |
stamped | -0.673 |
Token | 106 |
Token ID | 15696 |
Feature activation | -3.83e-03 |
Pos logit contributions | |
ˈ | +0.496 |
Redd | +0.411 |
Wan | +0.400 |
claw | +0.398 |
Neph | +0.386 |
Neg logit contributions | |
fitt | -0.456 |
slic | -0.428 |
hof | -0.411 |
leakage | -0.406 |
stamped | -0.405 |
Token | 378 |
Token ID | 30695 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
ˈ | +0.012 |
Redd | +0.010 |
Wan | +0.010 |
claw | +0.010 |
Neph | +0.009 |
Neg logit contributions | |
fitt | -0.008 |
slic | -0.008 |
hof | -0.007 |
leakage | -0.007 |
stamped | -0.007 |
Token | 46 |
Token ID | 3510 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
fitt | +0.091 |
slic | +0.084 |
hof | +0.081 |
leakage | +0.080 |
stamped | +0.080 |
Neg logit contributions | |
ˈ | -0.125 |
Redd | -0.106 |
Wan | -0.104 |
claw | -0.103 |
Neph | -0.099 |
Token | 40 |
Token ID | 2319 |
Feature activation | +2.06e-03 |
Pos logit contributions | |
fitt | +0.324 |
slic | +0.302 |
hof | +0.290 |
leakage | +0.289 |
stamped | +0.287 |
Neg logit contributions | |
ˈ | -0.372 |
Redd | -0.310 |
Wan | -0.302 |
claw | -0.300 |
Neph | -0.289 |
Token | 995 |
Token ID | 33438 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
fitt | +0.004 |
slic | +0.004 |
leakage | +0.004 |
hof | +0.004 |
stamped | +0.004 |
Neg logit contributions | |
ˈ | -0.006 |
Redd | -0.005 |
Wan | -0.005 |
claw | -0.005 |
Neph | -0.005 |
Token | 47 |
Token ID | 2857 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
fitt | +0.291 |
slic | +0.268 |
hof | +0.257 |
leakage | +0.255 |
stamped | +0.253 |
Neg logit contributions | |
ˈ | -0.406 |
Redd | -0.343 |
Wan | -0.337 |
claw | -0.336 |
Neph | -0.324 |
Token | Boost |
Token ID | 19835 |
Feature activation | +9.37e-03 |
Pos logit contributions | |
fitt | +0.269 |
slic | +0.250 |
hof | +0.241 |
leakage | +0.240 |
stamped | +0.239 |
Neg logit contributions | |
ˈ | -0.315 |
Redd | -0.262 |
Wan | -0.255 |
claw | -0.254 |
Neph | -0.245 |
Token | Serial |
Token ID | 32634 |
Feature activation | -1.54e-01 |
Pos logit contributions | |
fitt | +0.022 |
slic | +0.021 |
hof | +0.020 |
leakage | +0.020 |
stamped | +0.020 |
Neg logit contributions | |
ˈ | -0.027 |
Redd | -0.023 |
Wan | -0.022 |
claw | -0.022 |
Neph | -0.021 |
Token | ization |
Token ID | 1634 |
Feature activation | +6.68e-03 |
Pos logit contributions | |
ˈ | +0.542 |
Redd | +0.468 |
Wan | +0.460 |
claw | +0.457 |
Neph | +0.442 |
Neg logit contributions | |
fitt | -0.271 |
slic | -0.246 |
hof | -0.233 |
leakage | -0.231 |
stamped | -0.230 |
Token | a |
Token ID | 257 |
Feature activation | -8.71e-03 |
Pos logit contributions | |
ˈ | +0.143 |
Redd | +0.121 |
Wan | +0.118 |
claw | +0.118 |
Neph | +0.113 |
Neg logit contributions | |
fitt | -0.100 |
slic | -0.093 |
hof | -0.089 |
leakage | -0.087 |
stamped | -0.086 |
Token | high |
Token ID | 1029 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
ˈ | +0.030 |
Redd | +0.026 |
Wan | +0.025 |
claw | +0.025 |
Neph | +0.024 |
Neg logit contributions | |
fitt | -0.016 |
slic | -0.014 |
hof | -0.014 |
leakage | -0.014 |
stamped | -0.013 |
Token | job |
Token ID | 1693 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ˈ | +0.381 |
Redd | +0.323 |
claw | +0.320 |
Wan | +0.317 |
Neph | +0.307 |
Neg logit contributions | |
fitt | -0.222 |
slic | -0.206 |
hof | -0.198 |
stamped | -0.190 |
leakage | -0.190 |
Token | placement |
Token ID | 13127 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ˈ | +0.635 |
Redd | +0.545 |
claw | +0.538 |
Wan | +0.533 |
Neph | +0.510 |
Neg logit contributions | |
fitt | -0.336 |
slic | -0.309 |
hof | -0.293 |
leakage | -0.287 |
stamped | -0.286 |
Token | rate |
Token ID | 2494 |
Feature activation | +9.47e-02 |
Pos logit contributions | |
ˈ | +0.636 |
Redd | +0.549 |
claw | +0.540 |
Wan | +0.537 |
Neph | +0.522 |
Neg logit contributions | |
fitt | -0.304 |
slic | -0.280 |
hof | -0.265 |
leakage | -0.257 |
stamped | -0.256 |
Token | . |
Token ID | 13 |
Feature activation | +3.60e-02 |
Pos logit contributions | |
fitt | +0.231 |
slic | +0.217 |
hof | +0.208 |
leakage | +0.207 |
stamped | +0.206 |
Neg logit contributions | |
ˈ | -0.269 |
Redd | -0.223 |
Wan | -0.218 |
claw | -0.217 |
Neph | -0.207 |
Token |
|
Token ID | 198 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
fitt | +0.089 |
slic | +0.084 |
hof | +0.080 |
leakage | +0.080 |
stamped | +0.079 |
Neg logit contributions | |
ˈ | -0.102 |
Redd | -0.084 |
Wan | -0.083 |
claw | -0.082 |
Neph | -0.079 |
Token |
|
Token ID | 198 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
fitt | +0.042 |
slic | +0.039 |
leakage | +0.037 |
hof | +0.037 |
stamped | +0.037 |
Neg logit contributions | |
ˈ | -0.050 |
Redd | -0.042 |
Wan | -0.041 |
claw | -0.041 |
Neph | -0.039 |
Token | Cat |
Token ID | 21979 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
fitt | +0.028 |
slic | +0.026 |
leakage | +0.025 |
hof | +0.025 |
stamped | +0.025 |
Neg logit contributions | |
ˈ | -0.026 |
Redd | -0.021 |
Wan | -0.021 |
claw | -0.020 |
Neph | -0.019 |
Token | ast |
Token ID | 459 |
Feature activation | -3.02e-02 |
Pos logit contributions | |
fitt | +0.080 |
slic | +0.074 |
hof | +0.071 |
leakage | +0.070 |
stamped | +0.070 |
Neg logit contributions | |
ˈ | -0.121 |
Redd | -0.103 |
Wan | -0.101 |
claw | -0.100 |
Neph | -0.097 |
Token | rophic |
Token ID | 18191 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
ˈ | +0.059 |
Redd | +0.045 |
Wan | +0.043 |
claw | +0.043 |
Neph | +0.039 |
Neg logit contributions | |
fitt | -0.100 |
slic | -0.095 |
hof | -0.093 |
leakage | -0.092 |
stamped | -0.092 |
Token | ol |
Token ID | 349 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fitt | +0.065 |
slic | +0.060 |
stamped | +0.057 |
leakage | +0.057 |
hof | +0.056 |
Neg logit contributions | |
ˈ | -0.094 |
Redd | -0.079 |
claw | -0.078 |
Wan | -0.078 |
Neph | -0.074 |
Token | iy |
Token ID | 7745 |
Feature activation | -5.42e-02 |
Pos logit contributions | |
fitt | +0.292 |
slic | +0.276 |
hof | +0.267 |
leakage | +0.266 |
stamped | +0.265 |
Neg logit contributions | |
ˈ | -0.243 |
Redd | -0.195 |
Wan | -0.189 |
claw | -0.187 |
Neph | -0.178 |
Token | ub |
Token ID | 549 |
Feature activation | +5.55e-02 |
Pos logit contributions | |
ˈ | +0.147 |
Redd | +0.121 |
Wan | +0.118 |
claw | +0.117 |
Neph | +0.112 |
Neg logit contributions | |
fitt | -0.139 |
slic | -0.130 |
hof | -0.126 |
leakage | -0.125 |
stamped | -0.125 |
Token | ov |
Token ID | 709 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
fitt | +0.129 |
slic | +0.121 |
leakage | +0.115 |
hof | +0.115 |
stamped | +0.115 |
Neg logit contributions | |
ˈ | -0.164 |
Redd | -0.137 |
Wan | -0.134 |
claw | -0.134 |
Neph | -0.128 |
Token | . |
Token ID | 13 |
Feature activation | -1.96e-02 |
Pos logit contributions | |
ˈ | +0.327 |
Redd | +0.266 |
Wan | +0.261 |
claw | +0.259 |
Neph | +0.246 |
Neg logit contributions | |
fitt | -0.327 |
slic | -0.308 |
hof | -0.297 |
leakage | -0.296 |
stamped | -0.295 |
Token |
|
Token ID | 198 |
Feature activation | -8.31e-04 |
Pos logit contributions | |
ˈ | +0.055 |
Redd | +0.046 |
Wan | +0.045 |
claw | +0.044 |
Neph | +0.043 |
Neg logit contributions | |
fitt | -0.049 |
slic | -0.046 |
leakage | -0.044 |
stamped | -0.044 |
hof | -0.044 |
Token |
|
Token ID | 198 |
Feature activation | -2.71e-03 |
Pos logit contributions | |
ˈ | +0.002 |
Redd | +0.002 |
Wan | +0.002 |
claw | +0.002 |
Neph | +0.002 |
Neg logit contributions | |
fitt | -0.002 |
slic | -0.002 |
leakage | -0.002 |
hof | -0.002 |
stamped | -0.002 |
Token | Z |
Token ID | 57 |
Feature activation | -9.80e-02 |
Pos logit contributions | |
ˈ | +0.007 |
Redd | +0.006 |
Wan | +0.006 |
claw | +0.006 |
Neph | +0.005 |
Neg logit contributions | |
fitt | -0.007 |
slic | -0.007 |
leakage | -0.007 |
stamped | -0.006 |
hof | -0.006 |
Token | apor |
Token ID | 12687 |
Feature activation | +1.33e-03 |
Pos logit contributions | |
ˈ | +0.269 |
Redd | +0.221 |
claw | +0.216 |
Wan | +0.216 |
Neph | +0.204 |
Neg logit contributions | |
fitt | -0.250 |
slic | -0.235 |
leakage | -0.225 |
stamped | -0.224 |
hof | -0.222 |
Token | iz |
Token ID | 528 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
fitt | +0.003 |
slic | +0.003 |
hof | +0.003 |
leakage | +0.003 |
stamped | +0.003 |
Neg logit contributions | |
ˈ | -0.004 |
Redd | -0.003 |
Wan | -0.003 |
claw | -0.003 |
Neph | -0.003 |
Token | h |
Token ID | 71 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
ˈ | +0.419 |
Redd | +0.340 |
claw | +0.331 |
Wan | +0.331 |
Neph | +0.312 |
Neg logit contributions | |
fitt | -0.449 |
slic | -0.423 |
leakage | -0.407 |
hof | -0.405 |
stamped | -0.405 |
Token | than |
Token ID | 621 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
fitt | +0.422 |
slic | +0.396 |
hof | +0.383 |
leakage | +0.381 |
stamped | +0.379 |
Neg logit contributions | |
ˈ | -0.438 |
Redd | -0.359 |
Wan | -0.350 |
claw | -0.348 |
Neph | -0.331 |
Token | a |
Token ID | 257 |
Feature activation | -9.78e-03 |
Pos logit contributions | |
ˈ | +0.081 |
Redd | +0.066 |
Wan | +0.065 |
claw | +0.064 |
Neph | +0.062 |
Neg logit contributions | |
fitt | -0.083 |
slic | -0.078 |
hof | -0.076 |
leakage | -0.075 |
stamped | -0.075 |
Token | c |
Token ID | 269 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
ˈ | +0.030 |
Redd | +0.026 |
Wan | +0.025 |
claw | +0.025 |
Neph | +0.024 |
Neg logit contributions | |
fitt | -0.021 |
slic | -0.020 |
hof | -0.019 |
leakage | -0.019 |
stamped | -0.019 |
Token | inch |
Token ID | 8589 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
fitt | +0.180 |
slic | +0.169 |
hof | +0.164 |
leakage | +0.163 |
stamped | +0.162 |
Neg logit contributions | |
ˈ | -0.178 |
Redd | -0.145 |
Wan | -0.142 |
claw | -0.140 |
Neph | -0.134 |
Token | and |
Token ID | 290 |
Feature activation | -5.98e-03 |
Pos logit contributions | |
ˈ | +0.692 |
Redd | +0.571 |
claw | +0.560 |
Wan | +0.557 |
Neph | +0.532 |
Neg logit contributions | |
fitt | -0.605 |
slic | -0.566 |
hof | -0.547 |
leakage | -0.545 |
stamped | -0.540 |
Token | as |
Token ID | 355 |
Feature activation | -6.31e-03 |
Pos logit contributions | |
ˈ | +0.018 |
Redd | +0.016 |
Wan | +0.015 |
claw | +0.015 |
Neph | +0.015 |
Neg logit contributions | |
fitt | -0.013 |
slic | -0.012 |
hof | -0.012 |
leakage | -0.011 |
stamped | -0.011 |
Token | competitive |
Token ID | 7606 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ˈ | +0.020 |
Redd | +0.017 |
Wan | +0.016 |
claw | +0.016 |
Neph | +0.016 |
Neg logit contributions | |
fitt | -0.014 |
slic | -0.013 |
hof | -0.012 |
leakage | -0.012 |
stamped | -0.012 |
Token | as |
Token ID | 355 |
Feature activation | +3.70e-02 |
Pos logit contributions | |
fitt | +0.031 |
slic | +0.029 |
hof | +0.028 |
leakage | +0.028 |
stamped | +0.028 |
Neg logit contributions | |
ˈ | -0.036 |
Redd | -0.030 |
Wan | -0.030 |
claw | -0.029 |
Neph | -0.028 |
Token | a |
Token ID | 257 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
fitt | +0.088 |
slic | +0.082 |
hof | +0.080 |
leakage | +0.079 |
stamped | +0.078 |
Neg logit contributions | |
ˈ | -0.107 |
Redd | -0.089 |
Wan | -0.087 |
claw | -0.086 |
Neph | -0.083 |
Token | sibling |
Token ID | 33423 |
Feature activation | -4.06e-02 |
Pos logit contributions | |
fitt | +0.082 |
slic | +0.076 |
hof | +0.073 |
leakage | +0.072 |
stamped | +0.072 |
Neg logit contributions | |
ˈ | -0.123 |
Redd | -0.104 |
Wan | -0.102 |
claw | -0.101 |
Neph | -0.098 |
Token | rivalry |
Token ID | 26390 |
Feature activation | -7.42e-02 |
Pos logit contributions | |
ˈ | +0.125 |
Redd | +0.105 |
claw | +0.103 |
Wan | +0.103 |
Neph | +0.099 |
Neg logit contributions | |
fitt | -0.089 |
slic | -0.082 |
hof | -0.080 |
leakage | -0.079 |
stamped | -0.078 |
Token | After |
Token ID | 3260 |
Feature activation | +4.21e-02 |
Pos logit contributions | |
fitt | +0.099 |
slic | +0.094 |
leakage | +0.090 |
stamped | +0.089 |
hof | +0.089 |
Neg logit contributions | |
ˈ | -0.090 |
Redd | -0.074 |
Wan | -0.072 |
claw | -0.071 |
Neph | -0.066 |
Token | 1 |
Token ID | 352 |
Feature activation | +9.80e-02 |
Pos logit contributions | |
fitt | +0.089 |
slic | +0.083 |
hof | +0.079 |
stamped | +0.078 |
leakage | +0.078 |
Neg logit contributions | |
ˈ | -0.133 |
Redd | -0.111 |
claw | -0.110 |
Wan | -0.109 |
Neph | -0.105 |
Token | July |
Token ID | 2901 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fitt | +0.267 |
slic | +0.251 |
hof | +0.244 |
leakage | +0.244 |
stamped | +0.243 |
Neg logit contributions | |
ˈ | -0.248 |
Redd | -0.204 |
Wan | -0.198 |
claw | -0.194 |
Neph | -0.186 |
Token | 2017 |
Token ID | 2177 |
Feature activation | +4.17e-02 |
Pos logit contributions | |
fitt | +0.218 |
slic | +0.203 |
hof | +0.194 |
leakage | +0.192 |
stamped | +0.191 |
Neg logit contributions | |
ˈ | -0.313 |
Redd | -0.264 |
Wan | -0.259 |
claw | -0.258 |
Neph | -0.248 |
Token | , |
Token ID | 11 |
Feature activation | +7.99e-02 |
Pos logit contributions | |
fitt | +0.096 |
slic | +0.090 |
hof | +0.086 |
stamped | +0.085 |
leakage | +0.085 |
Neg logit contributions | |
ˈ | -0.124 |
Redd | -0.103 |
claw | -0.101 |
Wan | -0.101 |
Neph | -0.096 |
Token | Christopher |
Token ID | 12803 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
fitt | +0.165 |
slic | +0.154 |
hof | +0.149 |
stamped | +0.144 |
leakage | +0.143 |
Neg logit contributions | |
ˈ | -0.253 |
Redd | -0.214 |
claw | -0.211 |
Wan | -0.210 |
Neph | -0.203 |
Token | reck |
Token ID | 12482 |
Feature activation | +1.18e-01 |
Pos logit contributions | |
ˈ | +0.093 |
Redd | +0.077 |
Wan | +0.076 |
claw | +0.075 |
Neph | +0.072 |
Neg logit contributions | |
fitt | -0.081 |
slic | -0.076 |
hof | -0.073 |
leakage | -0.073 |
stamped | -0.072 |
Token | ons |
Token ID | 684 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
fitt | +0.347 |
slic | +0.329 |
leakage | +0.320 |
stamped | +0.317 |
hof | +0.317 |
Neg logit contributions | |
ˈ | -0.276 |
Redd | -0.219 |
Wan | -0.213 |
claw | -0.210 |
Neph | -0.199 |
Token | there |
Token ID | 612 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
fitt | +0.587 |
slic | +0.546 |
hof | +0.526 |
stamped | +0.518 |
leakage | +0.516 |
Neg logit contributions | |
ˈ | -0.821 |
Redd | -0.693 |
Wan | -0.679 |
claw | -0.674 |
Neph | -0.649 |
Token | will |
Token ID | 481 |
Feature activation | +5.98e-02 |
Pos logit contributions | |
fitt | +0.054 |
slic | +0.050 |
hof | +0.048 |
leakage | +0.048 |
stamped | +0.047 |
Neg logit contributions | |
ˈ | -0.084 |
Redd | -0.071 |
Wan | -0.070 |
claw | -0.069 |
Neph | -0.067 |
Token | likely |
Token ID | 1884 |
Feature activation | +6.35e-02 |
Pos logit contributions | |
fitt | +0.130 |
slic | +0.120 |
hof | +0.115 |
leakage | +0.114 |
stamped | +0.114 |
Neg logit contributions | |
ˈ | -0.186 |
Redd | -0.158 |
Wan | -0.154 |
claw | -0.153 |
Neph | -0.147 |
Token | Example |
Token ID | 16281 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
fitt | +0.111 |
slic | +0.104 |
hof | +0.100 |
leakage | +0.100 |
stamped | +0.100 |
Neg logit contributions | |
ˈ | -0.114 |
Redd | -0.094 |
claw | -0.091 |
Wan | -0.091 |
Neph | -0.086 |
Token | : |
Token ID | 25 |
Feature activation | +6.78e-02 |
Pos logit contributions | |
fitt | +0.580 |
slic | +0.541 |
hof | +0.521 |
leakage | +0.519 |
stamped | +0.517 |
Neg logit contributions | |
ˈ | -0.680 |
Redd | -0.566 |
Wan | -0.553 |
claw | -0.548 |
Neph | -0.525 |
Token | Your |
Token ID | 3406 |
Feature activation | +4.42e-02 |
Pos logit contributions | |
fitt | +0.168 |
slic | +0.157 |
hof | +0.151 |
leakage | +0.150 |
stamped | +0.150 |
Neg logit contributions | |
ˈ | -0.190 |
Redd | -0.158 |
Wan | -0.154 |
claw | -0.153 |
Neph | -0.146 |
Token | + |
Token ID | 1343 |
Feature activation | +7.40e-02 |
Pos logit contributions | |
fitt | +0.109 |
slic | +0.102 |
hof | +0.099 |
leakage | +0.098 |
stamped | +0.098 |
Neg logit contributions | |
ˈ | -0.124 |
Redd | -0.102 |
Wan | -0.100 |
claw | -0.099 |
Neph | -0.095 |
Token | 1 |
Token ID | 16 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
fitt | +0.194 |
slic | +0.182 |
hof | +0.175 |
leakage | +0.175 |
stamped | +0.174 |
Neg logit contributions | |
ˈ | -0.198 |
Redd | -0.162 |
Wan | -0.158 |
claw | -0.157 |
Neph | -0.149 |
Token | shield |
Token ID | 7614 |
Feature activation | -5.36e-02 |
Pos logit contributions | |
fitt | +0.146 |
slic | +0.136 |
hof | +0.131 |
leakage | +0.131 |
stamped | +0.130 |
Neg logit contributions | |
ˈ | -0.175 |
Redd | -0.146 |
Wan | -0.143 |
claw | -0.142 |
Neph | -0.136 |
Token | keeps |
Token ID | 7622 |
Feature activation | -3.11e-02 |
Pos logit contributions | |
ˈ | +0.164 |
Redd | +0.137 |
claw | +0.136 |
Wan | +0.135 |
Neph | +0.130 |
Neg logit contributions | |
fitt | -0.118 |
slic | -0.109 |
hof | -0.106 |
leakage | -0.104 |
stamped | -0.104 |
Token | it |
Token ID | 340 |
Feature activation | -5.25e-02 |
Pos logit contributions | |
ˈ | +0.097 |
Redd | +0.081 |
Wan | +0.080 |
claw | +0.080 |
Neph | +0.077 |
Neg logit contributions | |
fitt | -0.067 |
slic | -0.062 |
hof | -0.060 |
leakage | -0.059 |
stamped | -0.059 |
Token | � |
Token ID | 447 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
ˈ | +0.155 |
Redd | +0.130 |
Wan | +0.127 |
claw | +0.126 |
Neph | +0.121 |
Neg logit contributions | |
fitt | -0.122 |
slic | -0.113 |
hof | -0.109 |
leakage | -0.108 |
stamped | -0.108 |
Token | � |
Token ID | 247 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
fitt | +0.063 |
slic | +0.060 |
hof | +0.058 |
leakage | +0.058 |
stamped | +0.058 |
Neg logit contributions | |
ˈ | -0.049 |
Redd | -0.039 |
Wan | -0.037 |
claw | -0.037 |
Neph | -0.035 |
Token | s |
Token ID | 82 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
ˈ | +0.042 |
Redd | +0.035 |
claw | +0.034 |
Wan | +0.034 |
Neph | +0.033 |
Neg logit contributions | |
fitt | -0.036 |
slic | -0.033 |
hof | -0.032 |
leakage | -0.032 |
stamped | -0.032 |
Token | The |
Token ID | 383 |
Feature activation | -9.63e-02 |
Pos logit contributions | |
ˈ | +0.109 |
Redd | +0.090 |
Wan | +0.088 |
claw | +0.087 |
Neph | +0.084 |
Neg logit contributions | |
fitt | -0.088 |
slic | -0.082 |
hof | -0.079 |
leakage | -0.079 |
stamped | -0.078 |
Token | Verge |
Token ID | 44499 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
ˈ | +0.244 |
Redd | +0.200 |
Wan | +0.193 |
claw | +0.191 |
Neph | +0.183 |
Neg logit contributions | |
fitt | -0.265 |
slic | -0.249 |
hof | -0.240 |
leakage | -0.240 |
stamped | -0.238 |
Token | . |
Token ID | 13 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
fitt | +0.348 |
slic | +0.327 |
hof | +0.316 |
leakage | +0.315 |
stamped | +0.314 |
Neg logit contributions | |
ˈ | -0.340 |
Redd | -0.278 |
Wan | -0.272 |
claw | -0.267 |
Neph | -0.255 |
Token | Ellis |
Token ID | 21299 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
ˈ | +0.092 |
Redd | +0.076 |
Wan | +0.074 |
claw | +0.074 |
Neph | +0.071 |
Neg logit contributions | |
fitt | -0.084 |
slic | -0.079 |
leakage | -0.076 |
hof | -0.076 |
stamped | -0.075 |
Token | Hamb |
Token ID | 26175 |
Feature activation | -9.20e-02 |
Pos logit contributions | |
fitt | +0.204 |
slic | +0.191 |
leakage | +0.183 |
hof | +0.183 |
stamped | +0.182 |
Neg logit contributions | |
ˈ | -0.229 |
Redd | -0.191 |
Wan | -0.187 |
claw | -0.185 |
Neph | -0.177 |
Token | urger |
Token ID | 32650 |
Feature activation | -1.62e-01 |
Pos logit contributions | |
ˈ | +0.212 |
Redd | +0.167 |
claw | +0.163 |
Wan | +0.161 |
Neph | +0.151 |
Neg logit contributions | |
fitt | -0.274 |
slic | -0.259 |
leakage | -0.251 |
hof | -0.250 |
stamped | -0.250 |
Token | got |
Token ID | 1392 |
Feature activation | +3.42e-02 |
Pos logit contributions | |
ˈ | +0.462 |
Redd | +0.384 |
claw | +0.375 |
Wan | +0.373 |
Neph | +0.356 |
Neg logit contributions | |
fitt | -0.390 |
slic | -0.364 |
leakage | -0.350 |
hof | -0.347 |
stamped | -0.347 |
Token | to |
Token ID | 284 |
Feature activation | -3.27e-02 |
Pos logit contributions | |
fitt | +0.077 |
slic | +0.072 |
hof | +0.069 |
leakage | +0.068 |
stamped | +0.068 |
Neg logit contributions | |
ˈ | -0.104 |
Redd | -0.087 |
Wan | -0.085 |
claw | -0.085 |
Neph | -0.082 |
Token | test |
Token ID | 1332 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
ˈ | +0.101 |
Redd | +0.086 |
Wan | +0.083 |
claw | +0.083 |
Neph | +0.080 |
Neg logit contributions | |
fitt | -0.071 |
slic | -0.066 |
hof | -0.064 |
leakage | -0.063 |
stamped | -0.062 |
Token | it |
Token ID | 340 |
Feature activation | -9.04e-03 |
Pos logit contributions | |
fitt | +0.048 |
slic | +0.044 |
hof | +0.043 |
leakage | +0.042 |
stamped | +0.042 |
Neg logit contributions | |
ˈ | -0.067 |
Redd | -0.056 |
claw | -0.055 |
Wan | -0.055 |
Neph | -0.053 |
Token | out |
Token ID | 503 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
ˈ | +0.026 |
Redd | +0.022 |
claw | +0.021 |
Wan | +0.021 |
Neph | +0.020 |
Neg logit contributions | |
fitt | -0.021 |
slic | -0.020 |
hof | -0.019 |
leakage | -0.019 |
stamped | -0.019 |
Token | issued |
Token ID | 4884 |
Feature activation | -7.50e-02 |
Pos logit contributions | |
ˈ | +0.015 |
Redd | +0.012 |
claw | +0.012 |
Wan | +0.012 |
Neph | +0.012 |
Neg logit contributions | |
fitt | -0.012 |
slic | -0.011 |
hof | -0.011 |
leakage | -0.011 |
stamped | -0.010 |
Token | notices |
Token ID | 19748 |
Feature activation | -7.44e-02 |
Pos logit contributions | |
ˈ | +0.235 |
Redd | +0.201 |
Wan | +0.196 |
claw | +0.195 |
Neph | +0.188 |
Neg logit contributions | |
fitt | -0.158 |
slic | -0.146 |
hof | -0.141 |
leakage | -0.139 |
stamped | -0.137 |
Token | to |
Token ID | 284 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
ˈ | +0.211 |
Redd | +0.175 |
claw | +0.171 |
Wan | +0.171 |
Neph | +0.163 |
Neg logit contributions | |
fitt | -0.180 |
slic | -0.169 |
hof | -0.163 |
leakage | -0.161 |
stamped | -0.159 |
Token | the |
Token ID | 262 |
Feature activation | +1.98e-02 |
Pos logit contributions | |
ˈ | +0.074 |
Redd | +0.061 |
Wan | +0.060 |
claw | +0.060 |
Neph | +0.058 |
Neg logit contributions | |
fitt | -0.059 |
slic | -0.055 |
hof | -0.053 |
leakage | -0.053 |
stamped | -0.052 |
Token | Maharashtra |
Token ID | 41624 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
fitt | +0.044 |
slic | +0.042 |
hof | +0.040 |
leakage | +0.039 |
stamped | +0.039 |
Neg logit contributions | |
ˈ | -0.060 |
Redd | -0.050 |
Wan | -0.049 |
claw | -0.048 |
Neph | -0.047 |
Token | government |
Token ID | 1230 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
ˈ | +0.389 |
Redd | +0.326 |
Wan | +0.318 |
claw | +0.315 |
Neph | +0.304 |
Neg logit contributions | |
fitt | -0.319 |
slic | -0.299 |
hof | -0.289 |
leakage | -0.284 |
stamped | -0.283 |
Token | and |
Token ID | 290 |
Feature activation | +1.71e-03 |
Pos logit contributions | |
ˈ | +0.283 |
Redd | +0.237 |
claw | +0.230 |
Wan | +0.230 |
Neph | +0.220 |
Neg logit contributions | |
fitt | -0.241 |
slic | -0.226 |
hof | -0.217 |
leakage | -0.215 |
stamped | -0.213 |
Token | the |
Token ID | 262 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
fitt | +0.004 |
slic | +0.004 |
hof | +0.004 |
leakage | +0.003 |
stamped | +0.003 |
Neg logit contributions | |
ˈ | -0.005 |
Redd | -0.004 |
Wan | -0.004 |
claw | -0.004 |
Neph | -0.004 |
Token | Maharashtra |
Token ID | 41624 |
Feature activation | -1.23e-01 |
Pos logit contributions | |
fitt | +0.073 |
slic | +0.068 |
hof | +0.066 |
leakage | +0.065 |
stamped | +0.065 |
Neg logit contributions | |
ˈ | -0.088 |
Redd | -0.074 |
Wan | -0.072 |
claw | -0.071 |
Neph | -0.069 |
Token | Film |
Token ID | 13741 |
Feature activation | -1.28e-03 |
Pos logit contributions | |
ˈ | +0.339 |
Redd | +0.282 |
Wan | +0.275 |
claw | +0.272 |
Neph | +0.263 |
Neg logit contributions | |
fitt | -0.304 |
slic | -0.286 |
hof | -0.277 |
leakage | -0.272 |
stamped | -0.271 |
Token | , |
Token ID | 11 |
Feature activation | -2.80e-02 |
Pos logit contributions | |
ˈ | +0.004 |
Redd | +0.003 |
Wan | +0.003 |
claw | +0.003 |
Neph | +0.003 |
Neg logit contributions | |
fitt | -0.003 |
slic | -0.003 |
hof | -0.003 |
leakage | -0.003 |
stamped | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -2.23e-03 |
Pos logit contributions | |
ˈ | +0.069 |
Redd | +0.057 |
Wan | +0.056 |
claw | +0.056 |
Neph | +0.053 |
Neg logit contributions | |
fitt | -0.066 |
slic | -0.062 |
leakage | -0.059 |
hof | -0.059 |
stamped | -0.059 |
Token |
|
Token ID | 198 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
ˈ | +0.006 |
Redd | +0.005 |
Wan | +0.005 |
claw | +0.005 |
Neph | +0.005 |
Neg logit contributions | |
fitt | -0.005 |
slic | -0.005 |
leakage | -0.005 |
stamped | -0.005 |
hof | -0.005 |
Token | Now |
Token ID | 3844 |
Feature activation | -6.14e-02 |
Pos logit contributions | |
ˈ | +0.043 |
Redd | +0.035 |
Wan | +0.034 |
claw | +0.033 |
Neph | +0.031 |
Neg logit contributions | |
fitt | -0.047 |
slic | -0.044 |
leakage | -0.042 |
hof | -0.042 |
stamped | -0.042 |
Token | you |
Token ID | 345 |
Feature activation | +6.19e-02 |
Pos logit contributions | |
ˈ | +0.183 |
Redd | +0.151 |
Wan | +0.150 |
claw | +0.150 |
Neph | +0.144 |
Neg logit contributions | |
fitt | -0.141 |
slic | -0.130 |
hof | -0.126 |
leakage | -0.125 |
stamped | -0.124 |
Token | � |
Token ID | 447 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
fitt | +0.132 |
slic | +0.122 |
hof | +0.118 |
leakage | +0.118 |
stamped | +0.115 |
Neg logit contributions | |
ˈ | -0.194 |
Redd | -0.161 |
Wan | -0.160 |
claw | -0.160 |
Neph | -0.153 |
Token | � |
Token ID | 247 |
Feature activation | -4.06e-02 |
Pos logit contributions | |
fitt | +0.350 |
slic | +0.333 |
hof | +0.322 |
leakage | +0.321 |
stamped | +0.321 |
Neg logit contributions | |
ˈ | -0.250 |
Redd | -0.195 |
Wan | -0.188 |
claw | -0.186 |
Neph | -0.175 |
Token | re |
Token ID | 260 |
Feature activation | +2.71e-02 |
Pos logit contributions | |
ˈ | +0.099 |
Redd | +0.077 |
claw | +0.076 |
Wan | +0.075 |
Neph | +0.071 |
Neg logit contributions | |
fitt | -0.117 |
slic | -0.111 |
leakage | -0.107 |
hof | -0.106 |
stamped | -0.106 |
Token | ready |
Token ID | 3492 |
Feature activation | +2.91e-02 |
Pos logit contributions | |
fitt | +0.056 |
slic | +0.052 |
hof | +0.050 |
leakage | +0.050 |
stamped | +0.049 |
Neg logit contributions | |
ˈ | -0.086 |
Redd | -0.073 |
claw | -0.072 |
Wan | -0.072 |
Neph | -0.069 |
Token | to |
Token ID | 284 |
Feature activation | +6.19e-02 |
Pos logit contributions | |
fitt | +0.072 |
slic | +0.067 |
hof | +0.064 |
stamped | +0.064 |
leakage | +0.064 |
Neg logit contributions | |
ˈ | -0.082 |
Redd | -0.069 |
Wan | -0.067 |
claw | -0.066 |
Neph | -0.064 |
Token | � |
Token ID | 564 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
fitt | +0.135 |
slic | +0.125 |
hof | +0.122 |
leakage | +0.120 |
stamped | +0.118 |
Neg logit contributions | |
ˈ | -0.192 |
Redd | -0.160 |
claw | -0.157 |
Wan | -0.156 |
Neph | -0.151 |
Token | � |
Token ID | 250 |
Feature activation | +1.48e-02 |
Pos logit contributions | |
fitt | +0.058 |
slic | +0.055 |
hof | +0.054 |
leakage | +0.053 |
stamped | +0.053 |
Neg logit contributions | |
ˈ | -0.045 |
Redd | -0.035 |
Wan | -0.034 |
claw | -0.034 |
Neph | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
ˈ | +0.052 |
Redd | +0.043 |
Wan | +0.042 |
claw | +0.041 |
Neph | +0.040 |
Neg logit contributions | |
fitt | -0.046 |
slic | -0.043 |
leakage | -0.041 |
hof | -0.041 |
stamped | -0.041 |
Token |
|
Token ID | 198 |
Feature activation | -8.32e-03 |
Pos logit contributions | |
fitt | +0.038 |
slic | +0.035 |
leakage | +0.034 |
hof | +0.034 |
stamped | +0.033 |
Neg logit contributions | |
ˈ | -0.045 |
Redd | -0.038 |
Wan | -0.037 |
claw | -0.037 |
Neph | -0.035 |
Token | 12 |
Token ID | 1065 |
Feature activation | -4.91e-02 |
Pos logit contributions | |
ˈ | +0.023 |
Redd | +0.019 |
Wan | +0.018 |
claw | +0.018 |
Neph | +0.017 |
Neg logit contributions | |
fitt | -0.021 |
slic | -0.020 |
hof | -0.019 |
leakage | -0.019 |
stamped | -0.019 |
Token | . |
Token ID | 13 |
Feature activation | -5.02e-02 |
Pos logit contributions | |
ˈ | +0.127 |
Redd | +0.103 |
Wan | +0.101 |
claw | +0.100 |
Neph | +0.095 |
Neg logit contributions | |
fitt | -0.133 |
slic | -0.125 |
leakage | -0.120 |
hof | -0.120 |
stamped | -0.120 |
Token | Donkey |
Token ID | 43823 |
Feature activation | +9.33e-02 |
Pos logit contributions | |
ˈ | +0.132 |
Redd | +0.108 |
Wan | +0.105 |
claw | +0.104 |
Neph | +0.100 |
Neg logit contributions | |
fitt | -0.134 |
slic | -0.125 |
hof | -0.121 |
leakage | -0.120 |
stamped | -0.120 |
Token | Kong |
Token ID | 9071 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
fitt | +0.254 |
slic | +0.239 |
hof | +0.230 |
leakage | +0.230 |
stamped | +0.229 |
Neg logit contributions | |
ˈ | -0.239 |
Redd | -0.195 |
Wan | -0.189 |
claw | -0.188 |
Neph | -0.178 |
Token | Country |
Token ID | 12946 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
ˈ | +0.831 |
Redd | +0.671 |
Wan | +0.649 |
claw | +0.644 |
Neph | +0.614 |
Neg logit contributions | |
fitt | -0.959 |
slic | -0.905 |
hof | -0.873 |
leakage | -0.871 |
stamped | -0.863 |
Token | 2 |
Token ID | 362 |
Feature activation | +5.59e-02 |
Pos logit contributions | |
fitt | +0.573 |
slic | +0.534 |
hof | +0.513 |
leakage | +0.510 |
stamped | +0.507 |
Neg logit contributions | |
ˈ | -0.693 |
Redd | -0.579 |
Wan | -0.564 |
claw | -0.560 |
Neph | -0.539 |
Token | : |
Token ID | 25 |
Feature activation | +6.08e-02 |
Pos logit contributions | |
fitt | +0.131 |
slic | +0.122 |
hof | +0.117 |
leakage | +0.117 |
stamped | +0.117 |
Neg logit contributions | |
ˈ | -0.164 |
Redd | -0.137 |
Wan | -0.134 |
claw | -0.133 |
Neph | -0.128 |
Token | D |
Token ID | 360 |
Feature activation | +9.84e-02 |
Pos logit contributions | |
fitt | +0.160 |
slic | +0.150 |
hof | +0.144 |
leakage | +0.144 |
stamped | +0.143 |
Neg logit contributions | |
ˈ | -0.161 |
Redd | -0.132 |
Wan | -0.129 |
claw | -0.128 |
Neph | -0.123 |
Token | iddy |
Token ID | 34208 |
Feature activation | +5.73e-02 |
Pos logit contributions | |
fitt | +0.273 |
slic | +0.257 |
hof | +0.248 |
leakage | +0.248 |
stamped | +0.246 |
Neg logit contributions | |
ˈ | -0.247 |
Redd | -0.200 |
Wan | -0.195 |
claw | -0.193 |
Neph | -0.183 |
Token | the |
Token ID | 262 |
Feature activation | -4.48e-03 |
Pos logit contributions | |
ˈ | +0.138 |
Redd | +0.116 |
claw | +0.114 |
Wan | +0.113 |
Neph | +0.108 |
Neg logit contributions | |
fitt | -0.112 |
slic | -0.105 |
hof | -0.100 |
leakage | -0.100 |
stamped | -0.100 |
Token | reign |
Token ID | 13580 |
Feature activation | -2.59e-02 |
Pos logit contributions | |
ˈ | +0.014 |
Redd | +0.011 |
Wan | +0.011 |
claw | +0.011 |
Neph | +0.011 |
Neg logit contributions | |
fitt | -0.010 |
slic | -0.009 |
hof | -0.009 |
leakage | -0.009 |
stamped | -0.009 |
Token | of |
Token ID | 286 |
Feature activation | +8.92e-03 |
Pos logit contributions | |
ˈ | +0.067 |
Redd | +0.054 |
Wan | +0.053 |
claw | +0.052 |
Neph | +0.050 |
Neg logit contributions | |
fitt | -0.070 |
slic | -0.066 |
hof | -0.064 |
leakage | -0.064 |
stamped | -0.063 |
Token | social |
Token ID | 1919 |
Feature activation | +1.73e-01 |
Pos logit contributions | |
fitt | +0.023 |
slic | +0.022 |
hof | +0.021 |
leakage | +0.021 |
stamped | +0.021 |
Neg logit contributions | |
ˈ | -0.024 |
Redd | -0.020 |
Wan | -0.019 |
claw | -0.019 |
Neph | -0.018 |
Token | justice |
Token ID | 5316 |
Feature activation | -1.40e-01 |
Pos logit contributions | |
fitt | +0.341 |
slic | +0.314 |
hof | +0.305 |
leakage | +0.298 |
stamped | +0.296 |
Neg logit contributions | |
ˈ | -0.567 |
Redd | -0.485 |
Wan | -0.475 |
claw | -0.471 |
Neph | -0.457 |
Token | indo |
Token ID | 23046 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
ˈ | +0.395 |
Redd | +0.331 |
Wan | +0.322 |
claw | +0.321 |
Neph | +0.310 |
Neg logit contributions | |
fitt | -0.338 |
slic | -0.319 |
hof | -0.308 |
leakage | -0.305 |
stamped | -0.301 |
Token | ct |
Token ID | 310 |
Feature activation | -7.69e-02 |
Pos logit contributions | |
ˈ | +1.142 |
Redd | +0.925 |
Wan | +0.906 |
claw | +0.891 |
Neph | +0.847 |
Neg logit contributions | |
fitt | -1.196 |
slic | -1.139 |
leakage | -1.092 |
hof | -1.091 |
stamped | -1.077 |
Token | rin |
Token ID | 12769 |
Feature activation | -1.68e-01 |
Pos logit contributions | |
ˈ | +0.174 |
Redd | +0.137 |
Wan | +0.132 |
claw | +0.132 |
Neph | +0.124 |
Neg logit contributions | |
fitt | -0.232 |
slic | -0.221 |
leakage | -0.213 |
stamped | -0.212 |
hof | -0.211 |
Token | ators |
Token ID | 2024 |
Feature activation | -6.82e-02 |
Pos logit contributions | |
ˈ | +0.469 |
Redd | +0.386 |
Wan | +0.378 |
claw | +0.377 |
Neph | +0.359 |
Neg logit contributions | |
fitt | -0.419 |
slic | -0.391 |
leakage | -0.377 |
hof | -0.375 |
stamped | -0.374 |
Token | , |
Token ID | 11 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
ˈ | +0.204 |
Redd | +0.172 |
Wan | +0.168 |
claw | +0.167 |
Neph | +0.161 |
Neg logit contributions | |
fitt | -0.156 |
slic | -0.145 |
hof | -0.139 |
leakage | -0.138 |
stamped | -0.137 |
Token | academics |
Token ID | 22321 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
ˈ | +0.105 |
Redd | +0.088 |
claw | +0.086 |
Wan | +0.086 |
Neph | +0.083 |
Neg logit contributions | |
fitt | -0.077 |
slic | -0.071 |
hof | -0.069 |
leakage | -0.067 |
stamped | -0.067 |
Token |
|
Token ID | 198 |
Feature activation | -9.02e-02 |
Pos logit contributions | |
ˈ | +0.206 |
Redd | +0.172 |
Wan | +0.168 |
claw | +0.167 |
Neph | +0.160 |
Neg logit contributions | |
fitt | -0.172 |
slic | -0.161 |
leakage | -0.154 |
hof | -0.153 |
stamped | -0.152 |
Token | Capture |
Token ID | 49630 |
Feature activation | -5.38e-02 |
Pos logit contributions | |
ˈ | +0.219 |
Redd | +0.178 |
Wan | +0.172 |
claw | +0.170 |
Neph | +0.159 |
Neg logit contributions | |
fitt | -0.260 |
slic | -0.245 |
leakage | -0.238 |
hof | -0.236 |
stamped | -0.235 |
Token | unique |
Token ID | 3748 |
Feature activation | +7.54e-02 |
Pos logit contributions | |
ˈ | +0.166 |
Redd | +0.140 |
Wan | +0.137 |
claw | +0.137 |
Neph | +0.132 |
Neg logit contributions | |
fitt | -0.116 |
slic | -0.108 |
hof | -0.105 |
leakage | -0.104 |
stamped | -0.103 |
Token | monsters |
Token ID | 10963 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
fitt | +0.168 |
slic | +0.156 |
hof | +0.151 |
leakage | +0.150 |
stamped | +0.149 |
Neg logit contributions | |
ˈ | -0.228 |
Redd | -0.192 |
Wan | -0.188 |
claw | -0.187 |
Neph | -0.180 |
Token | to |
Token ID | 284 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
ˈ | +0.572 |
Redd | +0.475 |
claw | +0.468 |
Wan | +0.465 |
Neph | +0.447 |
Neg logit contributions | |
fitt | -0.454 |
slic | -0.424 |
hof | -0.409 |
leakage | -0.408 |
stamped | -0.401 |
Token | fight |
Token ID | 1907 |
Feature activation | -3.86e-01 |
Pos logit contributions | |
ˈ | +0.371 |
Redd | +0.311 |
claw | +0.306 |
Wan | +0.300 |
Neph | +0.296 |
Neg logit contributions | |
fitt | -0.255 |
slic | -0.238 |
hof | -0.232 |
leakage | -0.231 |
stamped | -0.222 |
Token | alongside |
Token ID | 7848 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
ˈ | +1.103 |
Redd | +0.915 |
claw | +0.902 |
Wan | +0.893 |
Neph | +0.865 |
Neg logit contributions | |
fitt | -0.919 |
slic | -0.856 |
leakage | -0.828 |
hof | -0.827 |
stamped | -0.815 |
Token | you |
Token ID | 345 |
Feature activation | -6.47e-02 |
Pos logit contributions | |
ˈ | +0.113 |
Redd | +0.096 |
Wan | +0.094 |
claw | +0.093 |
Neph | +0.090 |
Neg logit contributions | |
fitt | -0.083 |
slic | -0.077 |
hof | -0.074 |
leakage | -0.074 |
stamped | -0.073 |
Token |
|
Token ID | 198 |
Feature activation | -1.31e-01 |
Pos logit contributions | |
ˈ | +0.189 |
Redd | +0.158 |
Wan | +0.154 |
claw | +0.154 |
Neph | +0.148 |
Neg logit contributions | |
fitt | -0.152 |
slic | -0.142 |
hof | -0.136 |
leakage | -0.136 |
stamped | -0.135 |
Token |
|
Token ID | 198 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
ˈ | +0.376 |
Redd | +0.313 |
Wan | +0.305 |
claw | +0.304 |
Neph | +0.291 |
Neg logit contributions | |
fitt | -0.318 |
slic | -0.297 |
leakage | -0.284 |
hof | -0.282 |
stamped | -0.281 |
Token | All |
Token ID | 3237 |
Feature activation | -1.77e-01 |
Pos logit contributions | |
ˈ | +0.341 |
Redd | +0.277 |
Wan | +0.269 |
claw | +0.265 |
Neph | +0.247 |
Neg logit contributions | |
fitt | -0.414 |
slic | -0.391 |
leakage | -0.381 |
hof | -0.376 |
stamped | -0.375 |
Token | also |
Token ID | 635 |
Feature activation | +6.44e-03 |
Pos logit contributions | |
ˈ | +0.033 |
Redd | +0.027 |
claw | +0.027 |
Wan | +0.027 |
Neph | +0.026 |
Neg logit contributions | |
fitt | -0.024 |
slic | -0.023 |
hof | -0.022 |
leakage | -0.022 |
stamped | -0.021 |
Token | restrained |
Token ID | 31531 |
Feature activation | +8.10e-02 |
Pos logit contributions | |
fitt | +0.016 |
slic | +0.015 |
hof | +0.015 |
leakage | +0.014 |
stamped | +0.014 |
Neg logit contributions | |
ˈ | -0.018 |
Redd | -0.015 |
claw | -0.014 |
Wan | -0.014 |
Neph | -0.014 |
Token | Wh |
Token ID | 854 |
Feature activation | +6.28e-02 |
Pos logit contributions | |
fitt | +0.184 |
slic | +0.171 |
hof | +0.164 |
leakage | +0.162 |
stamped | +0.162 |
Neg logit contributions | |
ˈ | -0.243 |
Redd | -0.204 |
Wan | -0.200 |
claw | -0.198 |
Neph | -0.192 |
Token | ist |
Token ID | 396 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
fitt | +0.132 |
slic | +0.121 |
hof | +0.116 |
leakage | +0.115 |
stamped | +0.115 |
Neg logit contributions | |
ˈ | -0.200 |
Redd | -0.170 |
Wan | -0.167 |
claw | -0.165 |
Neph | -0.159 |
Token | ling |
Token ID | 1359 |
Feature activation | +2.58e-01 |
Pos logit contributions | |
fitt | +0.324 |
slic | +0.302 |
hof | +0.289 |
leakage | +0.288 |
stamped | +0.288 |
Neg logit contributions | |
ˈ | -0.413 |
Redd | -0.347 |
Wan | -0.339 |
claw | -0.337 |
Neph | -0.322 |
Token | Woods |
Token ID | 16483 |
Feature activation | -3.36e-01 |
Pos logit contributions | |
fitt | +0.610 |
slic | +0.569 |
hof | +0.545 |
leakage | +0.544 |
stamped | +0.541 |
Neg logit contributions | |
ˈ | -0.754 |
Redd | -0.632 |
Wan | -0.617 |
claw | -0.614 |
Neph | -0.586 |
Token | from |
Token ID | 422 |
Feature activation | -1.72e-02 |
Pos logit contributions | |
ˈ | +0.976 |
Redd | +0.814 |
Wan | +0.796 |
claw | +0.792 |
Neph | +0.758 |
Neg logit contributions | |
fitt | -0.794 |
slic | -0.743 |
hof | -0.714 |
leakage | -0.709 |
stamped | -0.707 |
Token | granting |
Token ID | 21787 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
ˈ | +0.055 |
Redd | +0.047 |
claw | +0.045 |
Wan | +0.045 |
Neph | +0.044 |
Neg logit contributions | |
fitt | -0.036 |
slic | -0.033 |
hof | -0.032 |
leakage | -0.031 |
stamped | -0.031 |
Token | admissions |
Token ID | 25349 |
Feature activation | -9.23e-02 |
Pos logit contributions | |
fitt | +0.329 |
slic | +0.304 |
hof | +0.291 |
leakage | +0.289 |
stamped | +0.288 |
Neg logit contributions | |
ˈ | -0.493 |
Redd | -0.419 |
Wan | -0.410 |
claw | -0.407 |
Neph | -0.392 |
Token | to |
Token ID | 284 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
ˈ | +0.255 |
Redd | +0.211 |
Wan | +0.206 |
claw | +0.205 |
Neph | +0.196 |
Neg logit contributions | |
fitt | -0.231 |
slic | -0.217 |
hof | -0.209 |
leakage | -0.208 |
stamped | -0.206 |
Token | students |
Token ID | 2444 |
Feature activation | -1.41e-01 |
Pos logit contributions | |
ˈ | +0.180 |
Redd | +0.152 |
Wan | +0.149 |
claw | +0.147 |
Neph | +0.143 |
Neg logit contributions | |
fitt | -0.129 |
slic | -0.121 |
hof | -0.117 |
leakage | -0.115 |
stamped | -0.114 |
Token | team |
Token ID | 1074 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
ˈ | +0.069 |
Redd | +0.059 |
Wan | +0.058 |
claw | +0.057 |
Neph | +0.056 |
Neg logit contributions | |
fitt | -0.040 |
slic | -0.037 |
hof | -0.036 |
leakage | -0.035 |
stamped | -0.035 |
Token | : |
Token ID | 25 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
ˈ | +0.304 |
Redd | +0.255 |
Wan | +0.252 |
claw | +0.248 |
Neph | +0.239 |
Neg logit contributions | |
fitt | -0.235 |
slic | -0.217 |
hof | -0.210 |
leakage | -0.210 |
stamped | -0.208 |
Token | ' |
Token ID | 705 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
ˈ | +0.070 |
Redd | +0.057 |
Wan | +0.056 |
claw | +0.056 |
Neph | +0.054 |
Neg logit contributions | |
fitt | -0.061 |
slic | -0.057 |
hof | -0.055 |
leakage | -0.055 |
stamped | -0.054 |
Token | do |
Token ID | 4598 |
Feature activation | +1.03e-01 |
Pos logit contributions | |
fitt | +0.362 |
slic | +0.340 |
leakage | +0.330 |
stamped | +0.327 |
hof | +0.326 |
Neg logit contributions | |
ˈ | -0.333 |
Redd | -0.272 |
Wan | -0.268 |
claw | -0.263 |
Neph | -0.245 |
Token | you |
Token ID | 345 |
Feature activation | -2.85e-02 |
Pos logit contributions | |
fitt | +0.221 |
slic | +0.205 |
hof | +0.197 |
leakage | +0.196 |
stamped | +0.194 |
Neg logit contributions | |
ˈ | -0.323 |
Redd | -0.271 |
Wan | -0.268 |
claw | -0.266 |
Neph | -0.255 |
Token | remember |
Token ID | 3505 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
ˈ | +0.091 |
Redd | +0.076 |
Wan | +0.076 |
claw | +0.075 |
Neph | +0.073 |
Neg logit contributions | |
fitt | -0.059 |
slic | -0.054 |
hof | -0.053 |
leakage | -0.052 |
stamped | -0.051 |
Token | ?' |
Token ID | 8348 |
Feature activation | +2.48e-02 |
Pos logit contributions | |
ˈ | +1.023 |
Redd | +0.862 |
Wan | +0.851 |
claw | +0.837 |
Neph | +0.827 |
Neg logit contributions | |
fitt | -0.744 |
slic | -0.679 |
hof | -0.673 |
leakage | -0.660 |
stamped | -0.649 |
Token | Already |
Token ID | 27511 |
Feature activation | -9.83e-02 |
Pos logit contributions | |
fitt | +0.062 |
slic | +0.058 |
hof | +0.056 |
leakage | +0.056 |
stamped | +0.055 |
Neg logit contributions | |
ˈ | -0.068 |
Redd | -0.056 |
Wan | -0.056 |
claw | -0.055 |
Neph | -0.053 |
Token | then |
Token ID | 788 |
Feature activation | +4.87e-02 |
Pos logit contributions | |
ˈ | +0.302 |
Redd | +0.256 |
Wan | +0.254 |
claw | +0.250 |
Neph | +0.244 |
Neg logit contributions | |
fitt | -0.209 |
slic | -0.193 |
hof | -0.190 |
leakage | -0.185 |
stamped | -0.181 |
Token | it |
Token ID | 340 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
fitt | +0.103 |
slic | +0.094 |
hof | +0.092 |
leakage | +0.090 |
stamped | +0.089 |
Neg logit contributions | |
ˈ | -0.152 |
Redd | -0.129 |
Wan | -0.127 |
claw | -0.126 |
Neph | -0.122 |
Token | was |
Token ID | 373 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
fitt | +0.031 |
slic | +0.029 |
hof | +0.029 |
leakage | +0.028 |
stamped | +0.027 |
Neg logit contributions | |
ˈ | -0.049 |
Redd | -0.040 |
Wan | -0.040 |
claw | -0.040 |
Neph | -0.039 |