Token | 't |
Token ID | 470 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
Where | +0.103 |
See | +0.095 |
Oh | +0.092 |
Welcome | +0.091 |
Do | +0.091 |
Neg logit contributions | |
ish | -0.140 |
Majesty | -0.124 |
ci | -0.119 |
ans | -0.112 |
majesty | -0.110 |
Token | know |
Token ID | 760 |
Feature activation | +2.96e+01 |
Pos logit contributions | |
ish | +0.196 |
Majesty | +0.175 |
ci | +0.166 |
cient | +0.161 |
majesty | +0.159 |
Neg logit contributions | |
Where | -0.120 |
Welcome | -0.108 |
See | -0.106 |
On | -0.105 |
He | -0.103 |
Token | the |
Token ID | 262 |
Feature activation | +3.35e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.157 |
ci | +0.146 |
oppy | +0.145 |
majesty | +0.143 |
Neg logit contributions | |
Where | -0.132 |
See | -0.116 |
Welcome | -0.115 |
On | -0.114 |
Oh | -0.114 |
Token | rh |
Token ID | 9529 |
Feature activation | +5.70e+01 |
Pos logit contributions | |
ish | +0.197 |
Majesty | +0.176 |
oppy | +0.164 |
majesty | +0.160 |
ci | +0.160 |
Neg logit contributions | |
Where | -0.152 |
Oh | -0.141 |
See | -0.137 |
Welcome | -0.133 |
Wow | -0.130 |
Token | in |
Token ID | 259 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
ish | +0.270 |
Majesty | +0.267 |
majesty | +0.237 |
ci | +0.222 |
oppy | +0.217 |
Neg logit contributions | |
Where | -0.308 |
Oh | -0.279 |
See | -0.279 |
Welcome | -0.274 |
For | -0.271 |
Token | oc |
Token ID | 420 |
Feature activation | +7.41e+01 |
Pos logit contributions | |
ish | +0.237 |
Majesty | +0.217 |
majesty | +0.196 |
oppy | +0.191 |
ci | +0.185 |
Neg logit contributions | |
Where | -0.220 |
See | -0.201 |
Oh | -0.200 |
Welcome | -0.197 |
On | -0.194 |
Token | eros |
Token ID | 27498 |
Feature activation | +4.12e+01 |
Pos logit contributions | |
oppy | +0.291 |
ish | +0.264 |
Majesty | +0.258 |
majesty | +0.250 |
iggle | +0.248 |
Neg logit contributions | |
Where | -0.391 |
Warning | -0.369 |
See | -0.365 |
Oh | -0.363 |
Sir | -0.348 |
Token | was |
Token ID | 373 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
ish | +0.299 |
Majesty | +0.275 |
majesty | +0.256 |
ci | +0.251 |
oppy | +0.250 |
Neg logit contributions | |
Where | -0.130 |
See | -0.112 |
Oh | -0.110 |
Welcome | -0.108 |
On | -0.108 |
Token | wild |
Token ID | 4295 |
Feature activation | +3.28e+01 |
Pos logit contributions | |
ish | +0.204 |
Majesty | +0.183 |
majesty | +0.168 |
ci | +0.167 |
oppy | +0.166 |
Neg logit contributions | |
Where | -0.128 |
See | -0.114 |
Oh | -0.111 |
On | -0.111 |
Welcome | -0.109 |
Token | . |
Token ID | 13 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
ish | +0.226 |
Majesty | +0.224 |
oppy | +0.215 |
majesty | +0.213 |
cient | +0.199 |
Neg logit contributions | |
Where | -0.101 |
Welcome | -0.089 |
Do | -0.081 |
Oh | -0.081 |
On | -0.077 |
Token | Can |
Token ID | 1680 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
ish | +0.153 |
Majesty | +0.144 |
majesty | +0.132 |
cient | +0.130 |
oppy | +0.130 |
Neg logit contributions | |
Where | -0.088 |
See | -0.078 |
Oh | -0.076 |
Warning | -0.075 |
Welcome | -0.075 |
Token | he |
Token ID | 339 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
ish | +0.312 |
Majesty | +0.280 |
majesty | +0.259 |
ci | +0.252 |
cient | +0.252 |
Neg logit contributions | |
Where | -0.159 |
On | -0.139 |
Oh | -0.139 |
Welcome | -0.138 |
See | -0.138 |
Token | would |
Token ID | 561 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
ish | +0.234 |
Majesty | +0.213 |
majesty | +0.198 |
ci | +0.196 |
oppy | +0.195 |
Neg logit contributions | |
Where | -0.112 |
On | -0.099 |
See | -0.099 |
Welcome | -0.095 |
Oh | -0.094 |
Token | take |
Token ID | 1011 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.161 |
oppy | +0.153 |
ishes | +0.150 |
ci | +0.149 |
Neg logit contributions | |
Where | -0.112 |
On | -0.112 |
He | -0.106 |
One | -0.106 |
See | -0.104 |
Token | the |
Token ID | 262 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.188 |
majesty | +0.174 |
ci | +0.172 |
cient | +0.171 |
Neg logit contributions | |
Where | -0.120 |
See | -0.109 |
Welcome | -0.105 |
Oh | -0.104 |
On | -0.102 |
Token | av |
Token ID | 1196 |
Feature activation | +6.23e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.164 |
majesty | +0.149 |
oppy | +0.147 |
ci | +0.143 |
Neg logit contributions | |
Where | -0.167 |
Oh | -0.155 |
Welcome | -0.153 |
See | -0.152 |
On | -0.149 |
Token | oc |
Token ID | 420 |
Feature activation | +7.20e+01 |
Pos logit contributions | |
Majesty | +0.359 |
majesty | +0.342 |
ish | +0.330 |
knee | +0.316 |
oppy | +0.306 |
Neg logit contributions | |
Where | -0.254 |
On | -0.248 |
One | -0.246 |
See | -0.239 |
To | -0.237 |
Token | ados |
Token ID | 22484 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
oppy | +0.263 |
ish | +0.240 |
iggle | +0.229 |
Majesty | +0.228 |
majesty | +0.226 |
Neg logit contributions | |
Where | -0.371 |
Warning | -0.361 |
See | -0.360 |
Sir | -0.356 |
Oh | -0.343 |
Token | and |
Token ID | 290 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
Majesty | +0.262 |
ish | +0.256 |
majesty | +0.243 |
oppy | +0.218 |
ci | +0.210 |
Neg logit contributions | |
Where | -0.163 |
On | -0.159 |
To | -0.150 |
For | -0.144 |
He | -0.144 |
Token | scatter |
Token ID | 41058 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
ish | +0.157 |
Majesty | +0.139 |
oppy | +0.132 |
majesty | +0.127 |
ci | +0.127 |
Neg logit contributions | |
Where | -0.118 |
See | -0.107 |
On | -0.104 |
Welcome | -0.101 |
What | -0.100 |
Token | them |
Token ID | 606 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.196 |
majesty | +0.180 |
ci | +0.178 |
oppy | +0.176 |
Neg logit contributions | |
Where | -0.125 |
See | -0.113 |
Oh | -0.110 |
Welcome | -0.109 |
On | -0.107 |
Token | around |
Token ID | 1088 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
ish | +0.195 |
Majesty | +0.186 |
majesty | +0.172 |
oppy | +0.164 |
cient | +0.163 |
Neg logit contributions | |
Where | -0.125 |
On | -0.118 |
See | -0.110 |
Welcome | -0.108 |
To | -0.107 |
Token | am |
Token ID | 716 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
ish | +0.157 |
Majesty | +0.145 |
majesty | +0.132 |
ci | +0.131 |
cient | +0.127 |
Neg logit contributions | |
Where | -0.099 |
See | -0.092 |
On | -0.090 |
Oh | -0.088 |
Welcome | -0.087 |
Token | taking |
Token ID | 2263 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.144 |
ci | +0.144 |
ishes | +0.135 |
cient | +0.134 |
Neg logit contributions | |
Where | -0.097 |
See | -0.089 |
On | -0.083 |
Welcome | -0.082 |
Oh | -0.081 |
Token | the |
Token ID | 262 |
Feature activation | +3.26e+01 |
Pos logit contributions | |
ish | +0.197 |
Majesty | +0.176 |
ci | +0.164 |
majesty | +0.161 |
oppy | +0.159 |
Neg logit contributions | |
Where | -0.131 |
See | -0.120 |
Oh | -0.116 |
Welcome | -0.116 |
To | -0.112 |
Token | rh |
Token ID | 9529 |
Feature activation | +5.14e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.158 |
oppy | +0.142 |
majesty | +0.142 |
ci | +0.134 |
Neg logit contributions | |
Where | -0.154 |
Oh | -0.147 |
Welcome | -0.145 |
On | -0.139 |
See | -0.138 |
Token | in |
Token ID | 259 |
Feature activation | +4.23e+01 |
Pos logit contributions | |
Majesty | +0.253 |
ish | +0.249 |
majesty | +0.226 |
ci | +0.211 |
oppy | +0.205 |
Neg logit contributions | |
Where | -0.260 |
Oh | -0.237 |
For | -0.235 |
He | -0.235 |
Welcome | -0.234 |
Token | oc |
Token ID | 420 |
Feature activation | +6.99e+01 |
Pos logit contributions | |
Majesty | +0.243 |
ish | +0.242 |
majesty | +0.226 |
oppy | +0.215 |
ishes | +0.200 |
Neg logit contributions | |
Where | -0.176 |
To | -0.163 |
Oh | -0.159 |
Welcome | -0.158 |
On | -0.157 |
Token | eros |
Token ID | 27498 |
Feature activation | +4.01e+01 |
Pos logit contributions | |
oppy | +0.282 |
ish | +0.252 |
Majesty | +0.250 |
majesty | +0.242 |
iggle | +0.239 |
Neg logit contributions | |
Where | -0.336 |
Warning | -0.326 |
See | -0.319 |
Oh | -0.315 |
Sir | -0.314 |
Token | to |
Token ID | 284 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
ish | +0.242 |
Majesty | +0.232 |
majesty | +0.219 |
oppy | +0.208 |
ci | +0.196 |
Neg logit contributions | |
Where | -0.159 |
To | -0.148 |
For | -0.143 |
On | -0.142 |
Welcome | -0.140 |
Token | a |
Token ID | 257 |
Feature activation | +2.78e+01 |
Pos logit contributions | |
ish | +0.174 |
Majesty | +0.149 |
ci | +0.143 |
oppy | +0.138 |
majesty | +0.137 |
Neg logit contributions | |
Where | -0.105 |
See | -0.095 |
On | -0.093 |
Welcome | -0.091 |
Oh | -0.091 |
Token | new |
Token ID | 649 |
Feature activation | +3.22e+01 |
Pos logit contributions | |
ish | +0.169 |
Majesty | +0.151 |
majesty | +0.139 |
ci | +0.138 |
oppy | +0.135 |
Neg logit contributions | |
Where | -0.122 |
See | -0.109 |
Oh | -0.109 |
On | -0.108 |
Welcome | -0.107 |
Token | home |
Token ID | 1363 |
Feature activation | +3.02e+01 |
Pos logit contributions | |
ish | +0.183 |
Majesty | +0.157 |
oppy | +0.155 |
majesty | +0.148 |
cient | +0.145 |
Neg logit contributions | |
Where | -0.150 |
On | -0.138 |
One | -0.136 |
Welcome | -0.129 |
See | -0.129 |
Token | give |
Token ID | 1577 |
Feature activation | +3.20e+01 |
Pos logit contributions | |
ish | +0.204 |
Majesty | +0.182 |
ci | +0.167 |
majesty | +0.165 |
oppy | +0.164 |
Neg logit contributions | |
Where | -0.122 |
On | -0.112 |
What | -0.109 |
See | -0.107 |
One | -0.107 |
Token | to |
Token ID | 284 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
ish | +0.220 |
Majesty | +0.216 |
majesty | +0.199 |
castle | +0.193 |
oppy | +0.191 |
Neg logit contributions | |
Where | -0.108 |
See | -0.095 |
Oh | -0.090 |
Welcome | -0.090 |
What | -0.088 |
Token | the |
Token ID | 262 |
Feature activation | +3.25e+01 |
Pos logit contributions | |
ish | +0.196 |
Majesty | +0.172 |
pp | +0.162 |
ci | +0.162 |
cient | +0.160 |
Neg logit contributions | |
Where | -0.071 |
See | -0.068 |
He | -0.060 |
On | -0.060 |
What | -0.059 |
Token | rh |
Token ID | 9529 |
Feature activation | +5.21e+01 |
Pos logit contributions | |
ish | +0.180 |
Majesty | +0.158 |
ci | +0.148 |
oppy | +0.145 |
majesty | +0.142 |
Neg logit contributions | |
Where | -0.157 |
See | -0.146 |
Oh | -0.143 |
Welcome | -0.139 |
On | -0.139 |
Token | in |
Token ID | 259 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
ish | +0.248 |
Majesty | +0.236 |
majesty | +0.209 |
ci | +0.202 |
oppy | +0.192 |
Neg logit contributions | |
Where | -0.283 |
See | -0.257 |
Oh | -0.255 |
On | -0.254 |
He | -0.254 |
Token | oc |
Token ID | 420 |
Feature activation | +6.97e+01 |
Pos logit contributions | |
ish | +0.234 |
Majesty | +0.226 |
majesty | +0.204 |
oppy | +0.195 |
ci | +0.193 |
Neg logit contributions | |
Where | -0.176 |
On | -0.163 |
To | -0.163 |
He | -0.161 |
For | -0.160 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.90e+01 |
Pos logit contributions | |
oppy | +0.266 |
ish | +0.258 |
Majesty | +0.234 |
iggle | +0.231 |
adow | +0.230 |
Neg logit contributions | |
Where | -0.365 |
Warning | -0.351 |
See | -0.340 |
Sir | -0.337 |
Oh | -0.335 |
Token | . |
Token ID | 13 |
Feature activation | +2.24e+01 |
Pos logit contributions | |
ish | +0.252 |
Majesty | +0.235 |
majesty | +0.216 |
ci | +0.211 |
oppy | +0.211 |
Neg logit contributions | |
Where | -0.138 |
On | -0.124 |
For | -0.122 |
To | -0.121 |
See | -0.120 |
Token | Lily |
Token ID | 20037 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
ish | +0.150 |
Majesty | +0.141 |
majesty | +0.129 |
cient | +0.127 |
ci | +0.126 |
Neg logit contributions | |
Where | -0.078 |
Oh | -0.068 |
See | -0.068 |
Warning | -0.066 |
Welcome | -0.066 |
Token | walked |
Token ID | 6807 |
Feature activation | +2.54e+01 |
Pos logit contributions | |
ish | +0.188 |
Majesty | +0.174 |
oppy | +0.162 |
majesty | +0.161 |
cient | +0.161 |
Neg logit contributions | |
See | -0.061 |
On | -0.061 |
Where | -0.060 |
He | -0.059 |
That | -0.056 |
Token | to |
Token ID | 284 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
ish | +0.125 |
Majesty | +0.106 |
ci | +0.098 |
cient | +0.092 |
majesty | +0.092 |
Neg logit contributions | |
Where | -0.133 |
See | -0.129 |
Warning | -0.127 |
Oh | -0.126 |
Welcome | -0.122 |
Token | quiet |
Token ID | 5897 |
Feature activation | +5.22e+01 |
Pos logit contributions | |
Where | +0.076 |
See | +0.069 |
Oh | +0.068 |
Time | +0.067 |
What | +0.067 |
Neg logit contributions | |
ish | -0.107 |
Majesty | -0.100 |
ci | -0.099 |
cient | -0.094 |
oppy | -0.093 |
Token | compared |
Token ID | 3688 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
ish | +0.387 |
Majesty | +0.347 |
oppy | +0.347 |
cient | +0.334 |
majesty | +0.324 |
Neg logit contributions | |
Where | -0.149 |
Time | -0.121 |
Welcome | -0.120 |
Oh | -0.117 |
For | -0.117 |
Token | to |
Token ID | 284 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
ish | +0.273 |
Majesty | +0.252 |
majesty | +0.230 |
oppy | +0.229 |
ci | +0.226 |
Neg logit contributions | |
Where | -0.165 |
See | -0.145 |
Oh | -0.144 |
On | -0.141 |
Welcome | -0.140 |
Token | the |
Token ID | 262 |
Feature activation | +3.54e+01 |
Pos logit contributions | |
ish | +0.183 |
Majesty | +0.162 |
majesty | +0.148 |
oppy | +0.147 |
ci | +0.147 |
Neg logit contributions | |
Where | -0.120 |
See | -0.108 |
Oh | -0.105 |
On | -0.104 |
Welcome | -0.103 |
Token | noisy |
Token ID | 31210 |
Feature activation | +4.04e+01 |
Pos logit contributions | |
ish | +0.208 |
Majesty | +0.185 |
oppy | +0.170 |
majesty | +0.168 |
ci | +0.168 |
Neg logit contributions | |
Where | -0.161 |
Oh | -0.147 |
See | -0.146 |
Welcome | -0.142 |
On | -0.141 |
Token | se |
Token ID | 384 |
Feature activation | +6.69e+01 |
Pos logit contributions | |
ish | +0.240 |
Majesty | +0.218 |
oppy | +0.208 |
cient | +0.199 |
majesty | +0.198 |
Neg logit contributions | |
Where | -0.173 |
Welcome | -0.157 |
Oh | -0.156 |
Time | -0.156 |
See | -0.156 |
Token | ag |
Token ID | 363 |
Feature activation | +4.42e+01 |
Pos logit contributions | |
ish | +0.330 |
Majesty | +0.325 |
oppy | +0.309 |
majesty | +0.299 |
opsy | +0.281 |
Neg logit contributions | |
See | -0.295 |
He | -0.288 |
Time | -0.285 |
To | -0.283 |
Where | -0.280 |
Token | ull |
Token ID | 724 |
Feature activation | +3.81e+01 |
Pos logit contributions | |
ish | +0.257 |
Majesty | +0.240 |
majesty | +0.215 |
oppy | +0.205 |
ci | +0.204 |
Neg logit contributions | |
Where | -0.198 |
See | -0.181 |
On | -0.181 |
He | -0.180 |
For | -0.178 |
Token | s |
Token ID | 82 |
Feature activation | +3.38e+01 |
Pos logit contributions | |
ish | +0.239 |
Majesty | +0.233 |
majesty | +0.215 |
oppy | +0.209 |
cient | +0.196 |
Neg logit contributions | |
Where | -0.134 |
See | -0.124 |
He | -0.122 |
On | -0.121 |
Welcome | -0.118 |
Token | outside |
Token ID | 2354 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
ish | +0.210 |
Majesty | +0.191 |
oppy | +0.175 |
majesty | +0.174 |
ci | +0.172 |
Neg logit contributions | |
Where | -0.137 |
See | -0.127 |
On | -0.123 |
Oh | -0.120 |
Welcome | -0.119 |
Token | . |
Token ID | 13 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ish | +0.230 |
Majesty | +0.211 |
majesty | +0.194 |
oppy | +0.191 |
ci | +0.190 |
Neg logit contributions | |
Where | -0.131 |
See | -0.117 |
Oh | -0.115 |
On | -0.113 |
Welcome | -0.113 |
Token | children |
Token ID | 1751 |
Feature activation | +4.57e+01 |
Pos logit contributions | |
Where | +0.087 |
See | +0.077 |
Oh | +0.076 |
On | +0.074 |
Welcome | +0.074 |
Neg logit contributions | |
ish | -0.170 |
Majesty | -0.155 |
majesty | -0.143 |
ci | -0.142 |
oppy | -0.140 |
Token | put |
Token ID | 1234 |
Feature activation | +3.48e+01 |
Pos logit contributions | |
ish | +0.304 |
Majesty | +0.280 |
majesty | +0.259 |
oppy | +0.256 |
ci | +0.250 |
Neg logit contributions | |
Where | -0.164 |
See | -0.145 |
On | -0.142 |
Welcome | -0.141 |
Oh | -0.140 |
Token | on |
Token ID | 319 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
ish | +0.227 |
Majesty | +0.224 |
majesty | +0.204 |
oppy | +0.199 |
cient | +0.195 |
Neg logit contributions | |
Where | -0.125 |
See | -0.115 |
Oh | -0.112 |
Welcome | -0.110 |
Wow | -0.108 |
Token | their |
Token ID | 511 |
Feature activation | +3.89e+01 |
Pos logit contributions | |
ish | +0.201 |
Majesty | +0.182 |
majesty | +0.166 |
ci | +0.164 |
oppy | +0.164 |
Neg logit contributions | |
Where | -0.114 |
See | -0.104 |
On | -0.102 |
Oh | -0.101 |
Welcome | -0.099 |
Token | bath |
Token ID | 7837 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
ish | +0.202 |
Majesty | +0.178 |
oppy | +0.162 |
cient | +0.160 |
majesty | +0.155 |
Neg logit contributions | |
Where | -0.191 |
Oh | -0.173 |
See | -0.172 |
Welcome | -0.171 |
On | -0.170 |
Token | ro |
Token ID | 305 |
Feature activation | +6.64e+01 |
Pos logit contributions | |
ish | +0.233 |
Majesty | +0.219 |
cient | +0.194 |
majesty | +0.189 |
oppy | +0.183 |
Neg logit contributions | |
Where | -0.170 |
To | -0.164 |
On | -0.163 |
For | -0.159 |
He | -0.152 |
Token | bes |
Token ID | 12636 |
Feature activation | +4.56e+01 |
Pos logit contributions | |
ish | +0.438 |
cient | +0.374 |
Majesty | +0.368 |
ishes | +0.352 |
oppy | +0.347 |
Neg logit contributions | |
On | -0.235 |
To | -0.224 |
Where | -0.221 |
He | -0.217 |
When | -0.213 |
Token | and |
Token ID | 290 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
ish | +0.295 |
Majesty | +0.283 |
majesty | +0.261 |
oppy | +0.249 |
ci | +0.239 |
Neg logit contributions | |
Where | -0.172 |
On | -0.161 |
Welcome | -0.152 |
See | -0.151 |
Oh | -0.151 |
Token | ran |
Token ID | 4966 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
ish | +0.183 |
Majesty | +0.170 |
majesty | +0.155 |
cient | +0.153 |
oppy | +0.150 |
Neg logit contributions | |
Where | -0.100 |
See | -0.088 |
On | -0.088 |
Welcome | -0.085 |
Oh | -0.084 |
Token | around |
Token ID | 1088 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
ish | +0.154 |
Majesty | +0.137 |
majesty | +0.123 |
ci | +0.122 |
oppy | +0.119 |
Neg logit contributions | |
Where | -0.144 |
See | -0.132 |
Oh | -0.131 |
On | -0.129 |
Welcome | -0.129 |
Token | in |
Token ID | 287 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.155 |
majesty | +0.142 |
ci | +0.139 |
oppy | +0.137 |
Neg logit contributions | |
Where | -0.110 |
See | -0.098 |
Oh | -0.097 |
On | -0.097 |
Welcome | -0.096 |
Token | When |
Token ID | 1649 |
Feature activation | +2.75e+01 |
Pos logit contributions | |
ish | +0.183 |
Majesty | +0.170 |
majesty | +0.157 |
ci | +0.155 |
oppy | +0.154 |
Neg logit contributions | |
Where | -0.080 |
See | -0.069 |
Oh | -0.069 |
On | -0.066 |
Warning | -0.066 |
Token | Daisy |
Token ID | 40355 |
Feature activation | +3.26e+01 |
Pos logit contributions | |
ish | +0.199 |
Majesty | +0.176 |
ci | +0.162 |
majesty | +0.162 |
cient | +0.161 |
Neg logit contributions | |
Where | -0.093 |
See | -0.081 |
Welcome | -0.081 |
Oh | -0.081 |
On | -0.080 |
Token | put |
Token ID | 1234 |
Feature activation | +2.86e+01 |
Pos logit contributions | |
ish | +0.227 |
Majesty | +0.212 |
majesty | +0.195 |
ci | +0.193 |
cient | +0.189 |
Neg logit contributions | |
Where | -0.108 |
See | -0.098 |
On | -0.096 |
Welcome | -0.094 |
Oh | -0.092 |
Token | the |
Token ID | 262 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
ish | +0.201 |
Majesty | +0.189 |
majesty | +0.175 |
cient | +0.171 |
ci | +0.169 |
Neg logit contributions | |
Where | -0.098 |
See | -0.087 |
Oh | -0.085 |
On | -0.081 |
Wow | -0.081 |
Token | magn |
Token ID | 7842 |
Feature activation | +4.04e+01 |
Pos logit contributions | |
ish | +0.142 |
Majesty | +0.133 |
oppy | +0.119 |
majesty | +0.118 |
ci | +0.115 |
Neg logit contributions | |
Where | -0.142 |
Oh | -0.134 |
See | -0.130 |
Welcome | -0.126 |
Wow | -0.124 |
Token | ifying |
Token ID | 4035 |
Feature activation | +6.56e+01 |
Pos logit contributions | |
ish | +0.231 |
Majesty | +0.211 |
majesty | +0.191 |
ci | +0.186 |
oppy | +0.183 |
Neg logit contributions | |
Where | -0.189 |
See | -0.173 |
Oh | -0.171 |
On | -0.169 |
Welcome | -0.169 |
Token | glass |
Token ID | 5405 |
Feature activation | +3.73e+01 |
Pos logit contributions | |
ish | +0.410 |
Majesty | +0.394 |
ci | +0.348 |
majesty | +0.346 |
cient | +0.337 |
Neg logit contributions | |
Oh | -0.268 |
Where | -0.265 |
See | -0.264 |
On | -0.257 |
To | -0.248 |
Token | down |
Token ID | 866 |
Feature activation | +3.11e+01 |
Pos logit contributions | |
Majesty | +0.206 |
ish | +0.201 |
majesty | +0.179 |
cient | +0.174 |
ci | +0.168 |
Neg logit contributions | |
Where | -0.171 |
On | -0.161 |
See | -0.160 |
Oh | -0.158 |
To | -0.158 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.143 |
majesty | +0.127 |
ci | +0.126 |
cient | +0.123 |
Neg logit contributions | |
Where | -0.165 |
See | -0.153 |
Oh | -0.151 |
On | -0.149 |
Welcome | -0.148 |
Token | the |
Token ID | 262 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
ish | +0.159 |
Majesty | +0.144 |
majesty | +0.135 |
ci | +0.132 |
cient | +0.130 |
Neg logit contributions | |
Where | -0.062 |
See | -0.053 |
Oh | -0.052 |
On | -0.051 |
Welcome | -0.051 |
Token | cater |
Token ID | 20825 |
Feature activation | +4.32e+01 |
Pos logit contributions | |
ish | +0.143 |
Majesty | +0.127 |
ci | +0.114 |
majesty | +0.113 |
oppy | +0.111 |
Neg logit contributions | |
Where | -0.135 |
Oh | -0.124 |
See | -0.124 |
Welcome | -0.120 |
Wow | -0.119 |
Token | that |
Token ID | 326 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
ish | +0.208 |
Majesty | +0.187 |
oppy | +0.176 |
cient | +0.174 |
majesty | +0.173 |
Neg logit contributions | |
Where | -0.122 |
On | -0.107 |
See | -0.107 |
Welcome | -0.106 |
Oh | -0.104 |
Token | the |
Token ID | 262 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
ish | +0.173 |
Majesty | +0.157 |
majesty | +0.144 |
ci | +0.142 |
oppy | +0.140 |
Neg logit contributions | |
Where | -0.105 |
See | -0.094 |
Oh | -0.093 |
Welcome | -0.091 |
On | -0.091 |
Token | bad |
Token ID | 2089 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
ish | +0.178 |
Majesty | +0.157 |
majesty | +0.143 |
ci | +0.143 |
oppy | +0.142 |
Neg logit contributions | |
Where | -0.141 |
Oh | -0.128 |
See | -0.128 |
Welcome | -0.125 |
On | -0.122 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.95e+01 |
Pos logit contributions | |
ish | +0.206 |
Majesty | +0.182 |
cient | +0.173 |
oppy | +0.170 |
majesty | +0.168 |
Neg logit contributions | |
Where | -0.128 |
Welcome | -0.118 |
See | -0.117 |
Oh | -0.116 |
Time | -0.116 |
Token | in |
Token ID | 259 |
Feature activation | +3.95e+01 |
Pos logit contributions | |
ish | +0.225 |
Majesty | +0.206 |
majesty | +0.180 |
ci | +0.175 |
oppy | +0.170 |
Neg logit contributions | |
Where | -0.286 |
See | -0.266 |
Oh | -0.263 |
Welcome | -0.260 |
On | -0.257 |
Token | oc |
Token ID | 420 |
Feature activation | +6.44e+01 |
Pos logit contributions | |
ish | +0.210 |
Majesty | +0.187 |
majesty | +0.168 |
ci | +0.165 |
oppy | +0.163 |
Neg logit contributions | |
Where | -0.202 |
See | -0.186 |
Oh | -0.184 |
On | -0.181 |
Welcome | -0.181 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.60e+01 |
Pos logit contributions | |
oppy | +0.238 |
ish | +0.234 |
Majesty | +0.219 |
opsy | +0.205 |
majesty | +0.202 |
Neg logit contributions | |
Where | -0.344 |
See | -0.332 |
Warning | -0.327 |
Oh | -0.322 |
Welcome | -0.311 |
Token | was |
Token ID | 373 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
ish | +0.264 |
Majesty | +0.245 |
majesty | +0.228 |
oppy | +0.223 |
ci | +0.223 |
Neg logit contributions | |
Where | -0.109 |
See | -0.095 |
Oh | -0.091 |
On | -0.090 |
Welcome | -0.090 |
Token | now |
Token ID | 783 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
ish | +0.170 |
Majesty | +0.152 |
majesty | +0.140 |
oppy | +0.139 |
ci | +0.138 |
Neg logit contributions | |
Where | -0.113 |
See | -0.103 |
On | -0.098 |
Welcome | -0.098 |
Oh | -0.097 |
Token | nice |
Token ID | 3621 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.154 |
majesty | +0.142 |
oppy | +0.140 |
cient | +0.140 |
Neg logit contributions | |
Where | -0.117 |
See | -0.108 |
On | -0.103 |
Oh | -0.102 |
Welcome | -0.102 |
Token | . |
Token ID | 13 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
ish | +0.162 |
Majesty | +0.151 |
majesty | +0.137 |
oppy | +0.136 |
cient | +0.136 |
Neg logit contributions | |
Where | -0.112 |
See | -0.100 |
Welcome | -0.099 |
Oh | -0.097 |
On | -0.096 |
Token | it |
Token ID | 340 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
ish | +0.199 |
Majesty | +0.188 |
majesty | +0.172 |
castle | +0.169 |
cient | +0.168 |
Neg logit contributions | |
Where | -0.103 |
See | -0.094 |
Oh | -0.089 |
Welcome | -0.086 |
What | -0.084 |
Token | to |
Token ID | 284 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
ish | +0.179 |
Majesty | +0.168 |
majesty | +0.152 |
cient | +0.150 |
ci | +0.150 |
Neg logit contributions | |
Where | -0.114 |
Welcome | -0.103 |
See | -0.102 |
To | -0.101 |
On | -0.101 |
Token | the |
Token ID | 262 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
ish | +0.150 |
Majesty | +0.130 |
ci | +0.122 |
majesty | +0.119 |
oppy | +0.118 |
Neg logit contributions | |
Where | -0.081 |
See | -0.073 |
Oh | -0.070 |
Welcome | -0.069 |
What | -0.068 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.64e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.139 |
ci | +0.131 |
oppy | +0.130 |
majesty | +0.127 |
Neg logit contributions | |
Where | -0.137 |
Oh | -0.124 |
See | -0.122 |
Welcome | -0.120 |
On | -0.118 |
Token | in |
Token ID | 259 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
ish | +0.217 |
Majesty | +0.205 |
majesty | +0.181 |
ci | +0.175 |
oppy | +0.167 |
Neg logit contributions | |
Where | -0.256 |
See | -0.236 |
Oh | -0.234 |
On | -0.230 |
He | -0.230 |
Token | oc |
Token ID | 420 |
Feature activation | +6.39e+01 |
Pos logit contributions | |
ish | +0.200 |
Majesty | +0.184 |
majesty | +0.168 |
oppy | +0.161 |
ci | +0.160 |
Neg logit contributions | |
Where | -0.169 |
On | -0.156 |
To | -0.152 |
For | -0.151 |
Oh | -0.151 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
oppy | +0.247 |
ish | +0.236 |
Majesty | +0.224 |
adow | +0.216 |
iggle | +0.215 |
Neg logit contributions | |
Where | -0.323 |
Warning | -0.312 |
See | -0.305 |
Sir | -0.300 |
Oh | -0.299 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
ish | +0.237 |
Majesty | +0.220 |
majesty | +0.204 |
oppy | +0.198 |
ci | +0.198 |
Neg logit contributions | |
Where | -0.118 |
On | -0.105 |
To | -0.101 |
See | -0.101 |
For | -0.101 |
Token | When |
Token ID | 1649 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
ish | +0.130 |
Majesty | +0.121 |
majesty | +0.112 |
cient | +0.109 |
oppy | +0.109 |
Neg logit contributions | |
Where | -0.074 |
Oh | -0.065 |
See | -0.064 |
Warning | -0.063 |
Time | -0.063 |
Token | he |
Token ID | 339 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.135 |
majesty | +0.124 |
ci | +0.123 |
oppy | +0.121 |
Neg logit contributions | |
Where | -0.085 |
See | -0.077 |
Oh | -0.075 |
Welcome | -0.074 |
On | -0.074 |
Token | tasted |
Token ID | 29187 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.158 |
majesty | +0.145 |
ci | +0.144 |
cient | +0.140 |
Neg logit contributions | |
Where | -0.091 |
See | -0.081 |
On | -0.079 |
Oh | -0.079 |
Welcome | -0.078 |
Token | his |
Token ID | 465 |
Feature activation | +4.47e+01 |
Pos logit contributions | |
Where | +0.076 |
See | +0.069 |
Oh | +0.068 |
Welcome | +0.067 |
What | +0.067 |
Neg logit contributions | |
ish | -0.072 |
Majesty | -0.068 |
majesty | -0.062 |
ci | -0.061 |
castle | -0.061 |
Token | head |
Token ID | 1182 |
Feature activation | +4.36e+01 |
Pos logit contributions | |
ish | +0.242 |
Majesty | +0.208 |
cient | +0.194 |
ci | +0.192 |
oppy | +0.190 |
Neg logit contributions | |
Where | -0.209 |
On | -0.190 |
Oh | -0.185 |
See | -0.184 |
He | -0.182 |
Token | out |
Token ID | 503 |
Feature activation | +4.00e+01 |
Pos logit contributions | |
ish | +0.285 |
Majesty | +0.265 |
majesty | +0.244 |
oppy | +0.240 |
cient | +0.234 |
Neg logit contributions | |
Where | -0.165 |
On | -0.148 |
See | -0.145 |
Welcome | -0.140 |
Oh | -0.139 |
Token | of |
Token ID | 286 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
ish | +0.259 |
Majesty | +0.234 |
majesty | +0.214 |
ci | +0.214 |
oppy | +0.210 |
Neg logit contributions | |
Where | -0.159 |
See | -0.143 |
Oh | -0.141 |
On | -0.140 |
Welcome | -0.138 |
Token | his |
Token ID | 465 |
Feature activation | +4.01e+01 |
Pos logit contributions | |
ish | +0.243 |
Majesty | +0.218 |
ci | +0.201 |
majesty | +0.200 |
cient | +0.200 |
Neg logit contributions | |
Where | -0.139 |
See | -0.124 |
Oh | -0.121 |
On | -0.119 |
Welcome | -0.117 |
Token | bur |
Token ID | 4356 |
Feature activation | +6.29e+01 |
Pos logit contributions | |
ish | +0.213 |
Majesty | +0.190 |
cient | +0.180 |
pp | +0.177 |
majesty | +0.168 |
Neg logit contributions | |
Where | -0.182 |
On | -0.167 |
Oh | -0.163 |
See | -0.160 |
He | -0.156 |
Token | row |
Token ID | 808 |
Feature activation | +4.65e+01 |
Pos logit contributions | |
Majesty | +0.332 |
ish | +0.309 |
majesty | +0.297 |
cient | +0.296 |
oppy | +0.278 |
Neg logit contributions | |
Where | -0.263 |
He | -0.254 |
On | -0.247 |
To | -0.230 |
One | -0.229 |
Token | and |
Token ID | 290 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
ish | +0.326 |
Majesty | +0.314 |
majesty | +0.291 |
oppy | +0.284 |
cient | +0.277 |
Neg logit contributions | |
Where | -0.139 |
On | -0.132 |
He | -0.131 |
To | -0.119 |
For | -0.117 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.59e+01 |
Pos logit contributions | |
ish | +0.191 |
Majesty | +0.168 |
cient | +0.157 |
oppy | +0.157 |
majesty | +0.155 |
Neg logit contributions | |
Where | -0.099 |
See | -0.086 |
On | -0.084 |
Oh | -0.081 |
Welcome | -0.079 |
Token | something |
Token ID | 1223 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.155 |
majesty | +0.143 |
ci | +0.142 |
oppy | +0.141 |
Neg logit contributions | |
Where | -0.103 |
See | -0.092 |
Oh | -0.089 |
On | -0.086 |
Welcome | -0.086 |
Token | new |
Token ID | 649 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.128 |
ci | +0.119 |
majesty | +0.116 |
oppy | +0.115 |
Neg logit contributions | |
Where | -0.114 |
See | -0.107 |
Warning | -0.104 |
Oh | -0.104 |
Welcome | -0.102 |
Token | you |
Token ID | 345 |
Feature activation | +3.56e+01 |
Pos logit contributions | |
Where | +0.093 |
See | +0.088 |
On | +0.086 |
Welcome | +0.085 |
Warning | +0.085 |
Neg logit contributions | |
ish | -0.123 |
Majesty | -0.109 |
majesty | -0.100 |
ci | -0.099 |
oppy | -0.098 |
Token | go |
Token ID | 467 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
ish | +0.221 |
Majesty | +0.194 |
ci | +0.185 |
majesty | +0.175 |
oppy | +0.174 |
Neg logit contributions | |
Where | -0.143 |
See | -0.132 |
Welcome | -0.132 |
On | -0.130 |
To | -0.128 |
Token | , |
Token ID | 11 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
ish | +0.195 |
Majesty | +0.176 |
majesty | +0.165 |
cient | +0.159 |
oppy | +0.158 |
Neg logit contributions | |
Where | -0.146 |
On | -0.135 |
Welcome | -0.127 |
One | -0.127 |
Do | -0.127 |
Token | my |
Token ID | 616 |
Feature activation | +3.15e+01 |
Pos logit contributions | |
ish | +0.165 |
Majesty | +0.140 |
ci | +0.137 |
cient | +0.134 |
ishes | +0.133 |
Neg logit contributions | |
Where | -0.106 |
On | -0.095 |
What | -0.093 |
Do | -0.092 |
He | -0.091 |
Token | d |
Token ID | 288 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
ish | +0.162 |
ci | +0.135 |
Majesty | +0.132 |
cient | +0.131 |
pp | +0.128 |
Neg logit contributions | |
Where | -0.151 |
Oh | -0.140 |
See | -0.138 |
On | -0.133 |
Welcome | -0.133 |
Token | arl |
Token ID | 7063 |
Feature activation | +6.29e+01 |
Pos logit contributions | |
ish | +0.218 |
ci | +0.216 |
Majesty | +0.212 |
cient | +0.190 |
gy | +0.185 |
Neg logit contributions | |
Where | -0.175 |
He | -0.168 |
To | -0.167 |
Welcome | -0.164 |
For | -0.164 |
Token | ings |
Token ID | 654 |
Feature activation | +3.34e+01 |
Pos logit contributions | |
ish | +0.317 |
ci | +0.290 |
Majesty | +0.289 |
cient | +0.266 |
oppy | +0.254 |
Neg logit contributions | |
He | -0.273 |
To | -0.269 |
See | -0.267 |
On | -0.262 |
For | -0.257 |
Token | . |
Token ID | 13 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
ish | +0.188 |
Majesty | +0.171 |
majesty | +0.153 |
ci | +0.150 |
oppy | +0.150 |
Neg logit contributions | |
Where | -0.161 |
See | -0.147 |
Oh | -0.146 |
Welcome | -0.145 |
On | -0.145 |
Token | Enjoy |
Token ID | 18179 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.145 |
majesty | +0.133 |
ci | +0.132 |
oppy | +0.130 |
Neg logit contributions | |
Where | -0.104 |
See | -0.094 |
Oh | -0.093 |
On | -0.091 |
Welcome | -0.091 |
Token | your |
Token ID | 534 |
Feature activation | +3.16e+01 |
Pos logit contributions | |
ish | +0.182 |
ci | +0.163 |
gy | +0.156 |
Majesty | +0.156 |
cient | +0.155 |
Neg logit contributions | |
Where | -0.117 |
What | -0.107 |
For | -0.106 |
To | -0.104 |
On | -0.103 |
Token | lunch |
Token ID | 9965 |
Feature activation | +3.74e+01 |
Pos logit contributions | |
ish | +0.175 |
Majesty | +0.148 |
ci | +0.145 |
cient | +0.143 |
pp | +0.139 |
Neg logit contributions | |
Where | -0.137 |
See | -0.128 |
Welcome | -0.127 |
Oh | -0.123 |
On | -0.122 |
Token | her |
Token ID | 607 |
Feature activation | +4.32e+01 |
Pos logit contributions | |
Where | +0.089 |
See | +0.079 |
Oh | +0.078 |
On | +0.077 |
Welcome | +0.077 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.125 |
majesty | -0.114 |
ci | -0.112 |
oppy | -0.111 |
Token | mom |
Token ID | 1995 |
Feature activation | +3.70e+01 |
Pos logit contributions | |
ish | +0.245 |
Majesty | +0.204 |
ci | +0.195 |
cient | +0.194 |
oppy | +0.189 |
Neg logit contributions | |
Where | -0.195 |
On | -0.174 |
Oh | -0.173 |
See | -0.172 |
Welcome | -0.163 |
Token | my |
Token ID | 1820 |
Feature activation | +3.90e+01 |
Pos logit contributions | |
ish | +0.240 |
Majesty | +0.224 |
majesty | +0.206 |
oppy | +0.202 |
ci | +0.197 |
Neg logit contributions | |
Where | -0.139 |
See | -0.126 |
On | -0.121 |
Oh | -0.120 |
Welcome | -0.119 |
Token | watched |
Token ID | 7342 |
Feature activation | +3.32e+01 |
Pos logit contributions | |
ish | +0.254 |
Majesty | +0.239 |
majesty | +0.221 |
oppy | +0.216 |
ci | +0.210 |
Neg logit contributions | |
Where | -0.138 |
See | -0.126 |
On | -0.121 |
Welcome | -0.120 |
For | -0.117 |
Token | in |
Token ID | 287 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
ish | +0.224 |
Majesty | +0.208 |
majesty | +0.196 |
oppy | +0.188 |
ci | +0.185 |
Neg logit contributions | |
Where | -0.124 |
On | -0.105 |
What | -0.105 |
Welcome | -0.104 |
Oh | -0.104 |
Token | amaz |
Token ID | 40642 |
Feature activation | +6.24e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.145 |
majesty | +0.132 |
ci | +0.131 |
oppy | +0.128 |
Neg logit contributions | |
Where | -0.115 |
See | -0.105 |
Oh | -0.104 |
Welcome | -0.102 |
On | -0.102 |
Token | ement |
Token ID | 972 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
ish | +0.431 |
Majesty | +0.404 |
oppy | +0.391 |
majesty | +0.388 |
cient | +0.377 |
Neg logit contributions | |
Where | -0.200 |
See | -0.188 |
Oh | -0.169 |
Welcome | -0.165 |
He | -0.162 |
Token | as |
Token ID | 355 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
ish | +0.240 |
Majesty | +0.226 |
majesty | +0.211 |
cient | +0.206 |
oppy | +0.205 |
Neg logit contributions | |
Where | -0.102 |
On | -0.095 |
For | -0.089 |
To | -0.086 |
When | -0.086 |
Token | the |
Token ID | 262 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.155 |
majesty | +0.142 |
ci | +0.141 |
oppy | +0.138 |
Neg logit contributions | |
Where | -0.111 |
See | -0.100 |
Oh | -0.099 |
On | -0.097 |
Welcome | -0.097 |
Token | machine |
Token ID | 4572 |
Feature activation | +3.42e+01 |
Pos logit contributions | |
ish | +0.166 |
Majesty | +0.150 |
majesty | +0.136 |
ci | +0.134 |
cient | +0.129 |
Neg logit contributions | |
Where | -0.141 |
See | -0.130 |
On | -0.128 |
Oh | -0.127 |
Warning | -0.127 |
Token | flew |
Token ID | 13112 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
ish | +0.221 |
Majesty | +0.199 |
majesty | +0.183 |
ci | +0.182 |
oppy | +0.178 |
Neg logit contributions | |
Where | -0.135 |
See | -0.122 |
Oh | -0.120 |
On | -0.118 |
Welcome | -0.117 |
Token | Everyday |
Token ID | 48154 |
Feature activation | +4.46e+01 |
Pos logit contributions | |
Where | +0.075 |
See | +0.069 |
On | +0.068 |
Welcome | +0.067 |
Oh | +0.065 |
Neg logit contributions | |
ish | -0.136 |
Majesty | -0.126 |
majesty | -0.116 |
oppy | -0.112 |
ci | -0.111 |
Token | he |
Token ID | 339 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
ish | +0.312 |
Majesty | +0.280 |
majesty | +0.259 |
ci | +0.252 |
cient | +0.252 |
Neg logit contributions | |
Where | -0.159 |
On | -0.139 |
Oh | -0.139 |
Welcome | -0.138 |
See | -0.138 |
Token | would |
Token ID | 561 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
ish | +0.234 |
Majesty | +0.213 |
majesty | +0.198 |
ci | +0.196 |
oppy | +0.195 |
Neg logit contributions | |
Where | -0.112 |
On | -0.099 |
See | -0.099 |
Welcome | -0.095 |
Oh | -0.094 |
Token | take |
Token ID | 1011 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.161 |
oppy | +0.153 |
ishes | +0.150 |
ci | +0.149 |
Neg logit contributions | |
Where | -0.112 |
On | -0.112 |
He | -0.106 |
One | -0.106 |
See | -0.104 |
Token | the |
Token ID | 262 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.188 |
majesty | +0.174 |
ci | +0.172 |
cient | +0.171 |
Neg logit contributions | |
Where | -0.120 |
See | -0.109 |
Welcome | -0.105 |
Oh | -0.104 |
On | -0.102 |
Token | av |
Token ID | 1196 |
Feature activation | +6.23e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.164 |
majesty | +0.149 |
oppy | +0.147 |
ci | +0.143 |
Neg logit contributions | |
Where | -0.167 |
Oh | -0.155 |
Welcome | -0.153 |
See | -0.152 |
On | -0.149 |
Token | oc |
Token ID | 420 |
Feature activation | +7.20e+01 |
Pos logit contributions | |
Majesty | +0.359 |
majesty | +0.342 |
ish | +0.330 |
knee | +0.316 |
oppy | +0.306 |
Neg logit contributions | |
Where | -0.254 |
On | -0.248 |
One | -0.246 |
See | -0.239 |
To | -0.237 |
Token | ados |
Token ID | 22484 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
oppy | +0.263 |
ish | +0.240 |
iggle | +0.229 |
Majesty | +0.228 |
majesty | +0.226 |
Neg logit contributions | |
Where | -0.371 |
Warning | -0.361 |
See | -0.360 |
Sir | -0.356 |
Oh | -0.343 |
Token | and |
Token ID | 290 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
Majesty | +0.262 |
ish | +0.256 |
majesty | +0.243 |
oppy | +0.218 |
ci | +0.210 |
Neg logit contributions | |
Where | -0.163 |
On | -0.159 |
To | -0.150 |
For | -0.144 |
He | -0.144 |
Token | scatter |
Token ID | 41058 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
ish | +0.157 |
Majesty | +0.139 |
oppy | +0.132 |
majesty | +0.127 |
ci | +0.127 |
Neg logit contributions | |
Where | -0.118 |
See | -0.107 |
On | -0.104 |
Welcome | -0.101 |
What | -0.100 |
Token | them |
Token ID | 606 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.196 |
majesty | +0.180 |
ci | +0.178 |
oppy | +0.176 |
Neg logit contributions | |
Where | -0.125 |
See | -0.113 |
Oh | -0.110 |
Welcome | -0.109 |
On | -0.107 |
Token | as |
Token ID | 355 |
Feature activation | +2.12e+01 |
Pos logit contributions | |
ish | +0.211 |
Majesty | +0.193 |
majesty | +0.180 |
oppy | +0.178 |
ci | +0.175 |
Neg logit contributions | |
Where | -0.103 |
On | -0.091 |
See | -0.089 |
Welcome | -0.087 |
Oh | -0.087 |
Token | he |
Token ID | 339 |
Feature activation | +2.06e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.133 |
majesty | +0.123 |
ci | +0.122 |
cient | +0.121 |
Neg logit contributions | |
Where | -0.075 |
See | -0.067 |
On | -0.065 |
Welcome | -0.064 |
Oh | -0.064 |
Token | opened |
Token ID | 4721 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
ish | +0.138 |
Majesty | +0.125 |
majesty | +0.115 |
ci | +0.114 |
oppy | +0.112 |
Neg logit contributions | |
Where | -0.077 |
See | -0.069 |
Oh | -0.068 |
Welcome | -0.067 |
On | -0.066 |
Token | the |
Token ID | 262 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
ish | +0.187 |
Majesty | +0.171 |
majesty | +0.160 |
oppy | +0.157 |
cient | +0.156 |
Neg logit contributions | |
Where | -0.101 |
See | -0.090 |
On | -0.088 |
Oh | -0.086 |
Welcome | -0.083 |
Token | ch |
Token ID | 442 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
ish | +0.157 |
Majesty | +0.141 |
majesty | +0.129 |
oppy | +0.129 |
ci | +0.129 |
Neg logit contributions | |
Where | -0.107 |
Oh | -0.097 |
See | -0.096 |
On | -0.093 |
Welcome | -0.093 |
Token | ocol |
Token ID | 4668 |
Feature activation | +6.18e+01 |
Pos logit contributions | |
ish | +0.139 |
Majesty | +0.137 |
ci | +0.136 |
cient | +0.128 |
gy | +0.122 |
Neg logit contributions | |
See | -0.187 |
Where | -0.185 |
He | -0.183 |
Time | -0.181 |
Care | -0.175 |
Token | ates |
Token ID | 689 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
ish | +0.307 |
Majesty | +0.293 |
cient | +0.262 |
ci | +0.257 |
majesty | +0.257 |
Neg logit contributions | |
Where | -0.288 |
See | -0.276 |
Warning | -0.268 |
To | -0.263 |
On | -0.262 |
Token | and |
Token ID | 290 |
Feature activation | +1.97e+01 |
Pos logit contributions | |
ish | +0.208 |
Majesty | +0.200 |
majesty | +0.187 |
oppy | +0.176 |
cient | +0.173 |
Neg logit contributions | |
Where | -0.120 |
On | -0.109 |
See | -0.102 |
Welcome | -0.102 |
Oh | -0.102 |
Token | started |
Token ID | 2067 |
Feature activation | +2.25e+01 |
Pos logit contributions | |
ish | +0.130 |
Majesty | +0.113 |
oppy | +0.107 |
cient | +0.104 |
majesty | +0.103 |
Neg logit contributions | |
Where | -0.079 |
See | -0.070 |
Oh | -0.068 |
On | -0.067 |
Who | -0.067 |
Token | eating |
Token ID | 6600 |
Feature activation | +2.58e+01 |
Pos logit contributions | |
ish | +0.140 |
Majesty | +0.121 |
oppy | +0.112 |
majesty | +0.112 |
cient | +0.109 |
Neg logit contributions | |
Where | -0.100 |
See | -0.092 |
On | -0.090 |
Welcome | -0.086 |
Time | -0.086 |
Token | them |
Token ID | 606 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
ish | +0.167 |
Majesty | +0.153 |
ci | +0.142 |
majesty | +0.141 |
oppy | +0.140 |
Neg logit contributions | |
Where | -0.103 |
See | -0.093 |
On | -0.089 |
Oh | -0.089 |
Welcome | -0.088 |
Token | giving |
Token ID | 3501 |
Feature activation | +3.09e+01 |
Pos logit contributions | |
ish | +0.167 |
Majesty | +0.137 |
ci | +0.134 |
oppy | +0.133 |
cient | +0.129 |
Neg logit contributions | |
Where | -0.121 |
See | -0.112 |
Oh | -0.107 |
What | -0.105 |
Warning | -0.104 |
Token | him |
Token ID | 683 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
ish | +0.188 |
Majesty | +0.177 |
castle | +0.166 |
majesty | +0.164 |
oppy | +0.160 |
Neg logit contributions | |
Where | -0.126 |
See | -0.116 |
Oh | -0.113 |
Welcome | -0.112 |
What | -0.108 |
Token | too |
Token ID | 1165 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
ish | +0.194 |
Majesty | +0.188 |
ci | +0.174 |
cient | +0.173 |
majesty | +0.171 |
Neg logit contributions | |
Where | -0.087 |
See | -0.074 |
For | -0.074 |
Oh | -0.072 |
What | -0.072 |
Token | many |
Token ID | 867 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
ish | +0.195 |
Majesty | +0.178 |
majesty | +0.167 |
oppy | +0.163 |
cient | +0.160 |
Neg logit contributions | |
Where | -0.093 |
Oh | -0.080 |
See | -0.078 |
Wow | -0.078 |
Warning | -0.076 |
Token | ch |
Token ID | 442 |
Feature activation | +3.79e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.155 |
ci | +0.142 |
majesty | +0.140 |
oppy | +0.139 |
Neg logit contributions | |
Where | -0.121 |
See | -0.111 |
Oh | -0.107 |
Welcome | -0.107 |
On | -0.106 |
Token | ocol |
Token ID | 4668 |
Feature activation | +6.17e+01 |
Pos logit contributions | |
ci | +0.154 |
Majesty | +0.148 |
ish | +0.144 |
cient | +0.133 |
gy | +0.127 |
Neg logit contributions | |
See | -0.182 |
He | -0.181 |
Where | -0.179 |
Welcome | -0.177 |
One | -0.176 |
Token | ates |
Token ID | 689 |
Feature activation | +3.57e+01 |
Pos logit contributions | |
ish | +0.306 |
Majesty | +0.305 |
cient | +0.276 |
majesty | +0.268 |
ci | +0.263 |
Neg logit contributions | |
Where | -0.271 |
See | -0.259 |
Warning | -0.254 |
For | -0.249 |
One | -0.248 |
Token | ." |
Token ID | 526 |
Feature activation | +1.76e+01 |
Pos logit contributions | |
ish | +0.244 |
Majesty | +0.241 |
majesty | +0.220 |
cient | +0.211 |
oppy | +0.210 |
Neg logit contributions | |
Where | -0.112 |
On | -0.098 |
For | -0.098 |
He | -0.096 |
To | -0.096 |
Token | The |
Token ID | 383 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
ish | +0.141 |
Majesty | +0.130 |
majesty | +0.121 |
ci | +0.121 |
oppy | +0.119 |
Neg logit contributions | |
Where | -0.043 |
See | -0.036 |
Oh | -0.035 |
On | -0.034 |
Welcome | -0.034 |
Token | king |
Token ID | 5822 |
Feature activation | +2.44e+01 |
Pos logit contributions | |
ish | +0.128 |
Majesty | +0.108 |
ci | +0.106 |
oppy | +0.099 |
cient | +0.098 |
Neg logit contributions | |
Where | -0.103 |
See | -0.092 |
Oh | -0.092 |
Welcome | -0.091 |
On | -0.089 |
Token | learned |
Token ID | 4499 |
Feature activation | +1.77e+01 |
Pos logit contributions | |
ish | +0.164 |
Majesty | +0.155 |
majesty | +0.141 |
cient | +0.139 |
oppy | +0.139 |
Neg logit contributions | |
Where | -0.079 |
See | -0.074 |
On | -0.073 |
He | -0.072 |
Oh | -0.069 |
Token | reward |
Token ID | 6721 |
Feature activation | +4.71e+01 |
Pos logit contributions | |
ish | +0.313 |
Majesty | +0.308 |
oppy | +0.285 |
majesty | +0.281 |
atmeal | +0.279 |
Neg logit contributions | |
Where | -0.258 |
Oh | -0.239 |
See | -0.225 |
Wow | -0.225 |
Welcome | -0.223 |
Token | . |
Token ID | 13 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
ish | +0.297 |
Majesty | +0.279 |
majesty | +0.250 |
cient | +0.243 |
oppy | +0.243 |
Neg logit contributions | |
Where | -0.191 |
See | -0.168 |
On | -0.167 |
Welcome | -0.166 |
For | -0.166 |
Token | It |
Token ID | 632 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
ish | +0.184 |
Majesty | +0.171 |
majesty | +0.157 |
ci | +0.155 |
cient | +0.154 |
Neg logit contributions | |
Where | -0.088 |
See | -0.077 |
Oh | -0.076 |
Warning | -0.074 |
On | -0.073 |
Token | was |
Token ID | 373 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
ish | +0.203 |
Majesty | +0.187 |
majesty | +0.173 |
oppy | +0.171 |
ci | +0.171 |
Neg logit contributions | |
Where | -0.084 |
See | -0.075 |
Oh | -0.071 |
On | -0.071 |
Welcome | -0.070 |
Token | ch |
Token ID | 442 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.163 |
Majesty | +0.146 |
majesty | +0.133 |
ci | +0.133 |
oppy | +0.131 |
Neg logit contributions | |
Where | -0.112 |
See | -0.101 |
Oh | -0.099 |
On | -0.098 |
Welcome | -0.097 |
Token | ocol |
Token ID | 4668 |
Feature activation | +6.11e+01 |
Pos logit contributions | |
ish | +0.122 |
Majesty | +0.122 |
ci | +0.106 |
majesty | +0.105 |
cient | +0.093 |
Neg logit contributions | |
Where | -0.213 |
See | -0.207 |
Welcome | -0.201 |
Oh | -0.200 |
On | -0.200 |
Token | ates |
Token ID | 689 |
Feature activation | +3.54e+01 |
Pos logit contributions | |
ish | +0.295 |
Majesty | +0.281 |
cient | +0.253 |
majesty | +0.248 |
ci | +0.247 |
Neg logit contributions | |
Where | -0.305 |
See | -0.292 |
Warning | -0.282 |
For | -0.272 |
One | -0.272 |
Token | and |
Token ID | 290 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
ish | +0.222 |
Majesty | +0.219 |
majesty | +0.202 |
oppy | +0.189 |
cient | +0.186 |
Neg logit contributions | |
Where | -0.127 |
On | -0.118 |
For | -0.114 |
He | -0.113 |
Welcome | -0.112 |
Token | sweets |
Token ID | 42402 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.150 |
oppy | +0.139 |
ci | +0.136 |
cient | +0.136 |
Neg logit contributions | |
Where | -0.108 |
See | -0.098 |
Oh | -0.093 |
Welcome | -0.092 |
On | -0.092 |
Token | ! |
Token ID | 0 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
ish | +0.220 |
Majesty | +0.209 |
majesty | +0.191 |
oppy | +0.188 |
cient | +0.181 |
Neg logit contributions | |
Where | -0.132 |
On | -0.120 |
See | -0.115 |
To | -0.113 |
Welcome | -0.113 |
Token |
|
Token ID | 198 |
Feature activation | +1.74e+01 |
Pos logit contributions | |
ish | +0.131 |
Majesty | +0.120 |
majesty | +0.110 |
ci | +0.109 |
oppy | +0.109 |
Neg logit contributions | |
Where | -0.073 |
See | -0.063 |
Oh | -0.063 |
On | -0.062 |
Warning | -0.061 |
Token | John |
Token ID | 1757 |
Feature activation | +5.07e+01 |
Pos logit contributions | |
Where | +0.079 |
See | +0.070 |
Oh | +0.070 |
Welcome | +0.068 |
On | +0.068 |
Neg logit contributions | |
ish | -0.138 |
Majesty | -0.125 |
ci | -0.115 |
majesty | -0.115 |
cient | -0.113 |
Token | chose |
Token ID | 7690 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
ish | +0.345 |
Majesty | +0.324 |
oppy | +0.303 |
majesty | +0.301 |
cient | +0.289 |
Neg logit contributions | |
Where | -0.167 |
See | -0.150 |
Oh | -0.141 |
Welcome | -0.140 |
On | -0.140 |
Token | some |
Token ID | 617 |
Feature activation | +3.71e+01 |
Pos logit contributions | |
ish | +0.235 |
Majesty | +0.221 |
majesty | +0.204 |
oppy | +0.203 |
cient | +0.199 |
Neg logit contributions | |
Where | -0.134 |
See | -0.118 |
Oh | -0.115 |
On | -0.114 |
Welcome | -0.111 |
Token | carrots |
Token ID | 34397 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
ish | +0.215 |
Majesty | +0.204 |
majesty | +0.182 |
ci | +0.179 |
oppy | +0.179 |
Neg logit contributions | |
Where | -0.166 |
See | -0.154 |
Oh | -0.151 |
On | -0.150 |
Welcome | -0.148 |
Token | and |
Token ID | 290 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
Majesty | +0.291 |
majesty | +0.264 |
ish | +0.263 |
oppy | +0.238 |
cient | +0.233 |
Neg logit contributions | |
Where | -0.137 |
On | -0.127 |
He | -0.126 |
For | -0.121 |
To | -0.119 |
Token | cuc |
Token ID | 38421 |
Feature activation | +6.03e+01 |
Pos logit contributions | |
ish | +0.163 |
Majesty | +0.154 |
majesty | +0.143 |
oppy | +0.140 |
cient | +0.136 |
Neg logit contributions | |
Where | -0.093 |
See | -0.083 |
On | -0.082 |
He | -0.078 |
Oh | -0.078 |
Token | umbers |
Token ID | 17024 |
Feature activation | +3.24e+01 |
Pos logit contributions | |
Majesty | +0.274 |
majesty | +0.253 |
ish | +0.246 |
ci | +0.245 |
sing | +0.239 |
Neg logit contributions | |
Where | -0.310 |
See | -0.299 |
For | -0.289 |
On | -0.289 |
He | -0.288 |
Token | to |
Token ID | 284 |
Feature activation | +2.70e+01 |
Pos logit contributions | |
ish | +0.213 |
Majesty | +0.212 |
majesty | +0.192 |
ci | +0.188 |
oppy | +0.186 |
Neg logit contributions | |
Where | -0.110 |
He | -0.097 |
See | -0.096 |
On | -0.095 |
For | -0.093 |
Token | take |
Token ID | 1011 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
ish | +0.167 |
Majesty | +0.154 |
ci | +0.144 |
majesty | +0.140 |
ig | +0.136 |
Neg logit contributions | |
Where | -0.113 |
What | -0.102 |
On | -0.101 |
One | -0.098 |
Who | -0.097 |
Token | home |
Token ID | 1363 |
Feature activation | +2.83e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.174 |
majesty | +0.161 |
ci | +0.160 |
oppy | +0.156 |
Neg logit contributions | |
Where | -0.104 |
See | -0.096 |
Welcome | -0.091 |
Oh | -0.089 |
To | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
ish | +0.201 |
Majesty | +0.200 |
majesty | +0.184 |
cient | +0.176 |
oppy | +0.171 |
Neg logit contributions | |
Where | -0.082 |
On | -0.076 |
For | -0.073 |
He | -0.071 |
To | -0.071 |
Token | . |
Token ID | 13 |
Feature activation | +2.60e+01 |
Pos logit contributions | |
ish | +0.207 |
Majesty | +0.183 |
ci | +0.169 |
majesty | +0.166 |
cient | +0.166 |
Neg logit contributions | |
Where | -0.155 |
Oh | -0.137 |
See | -0.136 |
Welcome | -0.134 |
On | -0.134 |
Token | The |
Token ID | 383 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
ish | +0.165 |
Majesty | +0.149 |
majesty | +0.137 |
ci | +0.136 |
cient | +0.134 |
Neg logit contributions | |
Where | -0.105 |
See | -0.094 |
Oh | -0.093 |
On | -0.092 |
Welcome | -0.090 |
Token | more |
Token ID | 517 |
Feature activation | +3.01e+01 |
Pos logit contributions | |
ish | +0.164 |
Majesty | +0.145 |
ci | +0.131 |
majesty | +0.131 |
oppy | +0.129 |
Neg logit contributions | |
Where | -0.145 |
See | -0.133 |
Oh | -0.133 |
Welcome | -0.130 |
On | -0.129 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
ish | +0.178 |
Majesty | +0.159 |
cient | +0.145 |
ci | +0.144 |
oppy | +0.142 |
Neg logit contributions | |
Where | -0.133 |
See | -0.124 |
Welcome | -0.121 |
On | -0.120 |
Oh | -0.119 |
Token | the |
Token ID | 262 |
Feature activation | +2.87e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.136 |
oppy | +0.126 |
majesty | +0.124 |
cient | +0.124 |
Neg logit contributions | |
Where | -0.098 |
See | -0.090 |
Welcome | -0.089 |
Oh | -0.087 |
Time | -0.085 |
Token | mer |
Token ID | 4017 |
Feature activation | +5.99e+01 |
Pos logit contributions | |
ish | +0.164 |
Majesty | +0.144 |
ci | +0.132 |
majesty | +0.131 |
oppy | +0.130 |
Neg logit contributions | |
Where | -0.136 |
Oh | -0.124 |
See | -0.123 |
Welcome | -0.120 |
On | -0.119 |
Token | rier |
Token ID | 5277 |
Feature activation | +4.50e+01 |
Pos logit contributions | |
ish | +0.185 |
atmeal | +0.160 |
oppy | +0.160 |
ci | +0.160 |
cient | +0.145 |
Neg logit contributions | |
Where | -0.340 |
Who | -0.320 |
Welcome | -0.318 |
See | -0.311 |
Wow | -0.309 |
Token | . |
Token ID | 13 |
Feature activation | +2.09e+01 |
Pos logit contributions | |
ish | +0.283 |
Majesty | +0.259 |
oppy | +0.247 |
cient | +0.239 |
ci | +0.238 |
Neg logit contributions | |
Where | -0.172 |
See | -0.155 |
Welcome | -0.149 |
Oh | -0.148 |
To | -0.148 |
Token | Come |
Token ID | 7911 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
ish | +0.131 |
Majesty | +0.124 |
majesty | +0.113 |
cient | +0.110 |
oppy | +0.110 |
Neg logit contributions | |
Where | -0.081 |
Oh | -0.071 |
On | -0.070 |
See | -0.069 |
Listen | -0.068 |
Token | to |
Token ID | 284 |
Feature activation | +2.02e+01 |
Pos logit contributions | |
ish | +0.131 |
Majesty | +0.119 |
majesty | +0.108 |
ci | +0.107 |
oppy | +0.105 |
Neg logit contributions | |
Where | -0.097 |
See | -0.088 |
Oh | -0.087 |
On | -0.086 |
Welcome | -0.085 |
Token | my |
Token ID | 616 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
ish | +0.140 |
Majesty | +0.122 |
ci | +0.116 |
majesty | +0.111 |
cient | +0.111 |
Neg logit contributions | |
Where | -0.074 |
On | -0.065 |
Welcome | -0.063 |
See | -0.063 |
What | -0.062 |
Token |
|
Token ID | 198 |
Feature activation | +2.11e+01 |
Pos logit contributions | |
ish | +0.128 |
Majesty | +0.124 |
oppy | +0.120 |
majesty | +0.117 |
adow | +0.108 |
Neg logit contributions | |
Where | -0.069 |
Oh | -0.062 |
Warning | -0.061 |
Welcome | -0.061 |
See | -0.059 |
Token | " |
Token ID | 1 |
Feature activation | +2.07e+01 |
Pos logit contributions | |
ish | +0.130 |
Majesty | +0.127 |
oppy | +0.120 |
majesty | +0.118 |
ap | +0.112 |
Neg logit contributions | |
Where | -0.062 |
Oh | -0.054 |
Warning | -0.054 |
See | -0.053 |
Welcome | -0.052 |
Token | The |
Token ID | 464 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
ish | +0.129 |
Majesty | +0.124 |
ci | +0.115 |
majesty | +0.114 |
mit | +0.112 |
Neg logit contributions | |
Warning | -0.041 |
Where | -0.036 |
On | -0.034 |
For | -0.034 |
generations | -0.034 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.43e+01 |
Pos logit contributions | |
ish | +0.152 |
Majesty | +0.133 |
ci | +0.121 |
majesty | +0.120 |
oppy | +0.119 |
Neg logit contributions | |
Where | -0.136 |
See | -0.124 |
Oh | -0.123 |
Welcome | -0.121 |
On | -0.121 |
Token | in |
Token ID | 259 |
Feature activation | +3.25e+01 |
Pos logit contributions | |
ish | +0.210 |
Majesty | +0.199 |
ci | +0.175 |
majesty | +0.174 |
oppy | +0.165 |
Neg logit contributions | |
Where | -0.244 |
See | -0.223 |
Oh | -0.222 |
Welcome | -0.217 |
He | -0.216 |
Token | oc |
Token ID | 420 |
Feature activation | +5.98e+01 |
Pos logit contributions | |
ish | +0.177 |
Majesty | +0.162 |
majesty | +0.144 |
oppy | +0.144 |
ci | +0.141 |
Neg logit contributions | |
Where | -0.151 |
See | -0.138 |
Oh | -0.136 |
On | -0.136 |
Welcome | -0.136 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
oppy | +0.231 |
ish | +0.227 |
adow | +0.212 |
iggle | +0.208 |
Majesty | +0.206 |
Neg logit contributions | |
Where | -0.311 |
Warning | -0.294 |
See | -0.285 |
Oh | -0.284 |
Sir | -0.279 |
Token | is |
Token ID | 318 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ish | +0.196 |
Majesty | +0.184 |
oppy | +0.168 |
majesty | +0.167 |
ci | +0.167 |
Neg logit contributions | |
Where | -0.107 |
See | -0.098 |
Welcome | -0.094 |
Oh | -0.093 |
On | -0.093 |
Token | in |
Token ID | 287 |
Feature activation | +2.49e+01 |
Pos logit contributions | |
ish | +0.137 |
Majesty | +0.123 |
majesty | +0.111 |
ci | +0.111 |
oppy | +0.109 |
Neg logit contributions | |
Where | -0.101 |
See | -0.092 |
Oh | -0.091 |
On | -0.090 |
Welcome | -0.089 |
Token | there |
Token ID | 612 |
Feature activation | +2.46e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.134 |
majesty | +0.122 |
ci | +0.120 |
oppy | +0.118 |
Neg logit contributions | |
Where | -0.111 |
See | -0.101 |
Oh | -0.100 |
On | -0.098 |
Welcome | -0.098 |
Token | , |
Token ID | 11 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
ish | +0.135 |
Majesty | +0.122 |
ci | +0.112 |
majesty | +0.111 |
oppy | +0.108 |
Neg logit contributions | |
Where | -0.117 |
On | -0.110 |
Oh | -0.106 |
One | -0.104 |
Welcome | -0.104 |
Token | there |
Token ID | 612 |
Feature activation | +2.81e+01 |
Pos logit contributions | |
ish | +0.141 |
Majesty | +0.123 |
majesty | +0.110 |
ci | +0.108 |
cient | +0.106 |
Neg logit contributions | |
Where | -0.150 |
See | -0.138 |
On | -0.138 |
Welcome | -0.136 |
Oh | -0.136 |
Token | was |
Token ID | 373 |
Feature activation | +2.27e+01 |
Pos logit contributions | |
ish | +0.201 |
Majesty | +0.186 |
majesty | +0.173 |
ci | +0.169 |
cient | +0.167 |
Neg logit contributions | |
Where | -0.093 |
See | -0.082 |
Oh | -0.080 |
On | -0.080 |
Welcome | -0.078 |
Token | a |
Token ID | 257 |
Feature activation | +2.47e+01 |
Pos logit contributions | |
ish | +0.141 |
Majesty | +0.129 |
majesty | +0.117 |
ci | +0.116 |
oppy | +0.114 |
Neg logit contributions | |
Where | -0.094 |
See | -0.085 |
Oh | -0.083 |
Welcome | -0.082 |
On | -0.082 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.48e+01 |
Pos logit contributions | |
ish | +0.146 |
Majesty | +0.130 |
ci | +0.118 |
majesty | +0.118 |
oppy | +0.115 |
Neg logit contributions | |
Where | -0.112 |
See | -0.102 |
Oh | -0.101 |
On | -0.100 |
Welcome | -0.099 |
Token | in |
Token ID | 259 |
Feature activation | +3.56e+01 |
Pos logit contributions | |
ish | +0.205 |
Majesty | +0.191 |
majesty | +0.169 |
ci | +0.160 |
oppy | +0.154 |
Neg logit contributions | |
Where | -0.258 |
See | -0.237 |
Oh | -0.237 |
On | -0.234 |
Welcome | -0.233 |
Token | oc |
Token ID | 420 |
Feature activation | +5.95e+01 |
Pos logit contributions | |
ish | +0.190 |
Majesty | +0.175 |
majesty | +0.157 |
ci | +0.152 |
oppy | +0.151 |
Neg logit contributions | |
Where | -0.176 |
Oh | -0.159 |
See | -0.158 |
On | -0.158 |
Welcome | -0.156 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.38e+01 |
Pos logit contributions | |
oppy | +0.252 |
ish | +0.231 |
Majesty | +0.221 |
opsy | +0.213 |
majesty | +0.208 |
Neg logit contributions | |
Where | -0.281 |
Warning | -0.275 |
Sir | -0.271 |
See | -0.265 |
Oh | -0.260 |
Token | who |
Token ID | 508 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
ish | +0.207 |
Majesty | +0.189 |
majesty | +0.173 |
ci | +0.168 |
oppy | +0.167 |
Neg logit contributions | |
Where | -0.145 |
See | -0.130 |
On | -0.128 |
Oh | -0.128 |
Welcome | -0.127 |
Token | was |
Token ID | 373 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
ish | +0.178 |
Majesty | +0.159 |
ci | +0.149 |
cient | +0.147 |
majesty | +0.146 |
Neg logit contributions | |
Where | -0.105 |
Oh | -0.094 |
See | -0.093 |
Warning | -0.091 |
Time | -0.090 |
Token | always |
Token ID | 1464 |
Feature activation | +2.59e+01 |
Pos logit contributions | |
ish | +0.168 |
Majesty | +0.152 |
majesty | +0.142 |
ci | +0.139 |
oppy | +0.139 |
Neg logit contributions | |
Where | -0.095 |
On | -0.085 |
See | -0.085 |
Oh | -0.082 |
Welcome | -0.080 |
Token | naughty |
Token ID | 45128 |
Feature activation | +2.51e+01 |
Pos logit contributions | |
ish | +0.151 |
Majesty | +0.135 |
majesty | +0.123 |
ci | +0.121 |
oppy | +0.121 |
Neg logit contributions | |
Where | -0.121 |
See | -0.110 |
Oh | -0.109 |
Welcome | -0.107 |
On | -0.107 |
Token | became |
Token ID | 2627 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.091 |
Oh | +0.084 |
See | +0.082 |
Welcome | +0.080 |
Warning | +0.080 |
Neg logit contributions | |
ish | -0.111 |
Majesty | -0.097 |
ci | -0.089 |
majesty | -0.088 |
cient | -0.086 |
Token | good |
Token ID | 922 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.093 |
Oh | +0.092 |
On | +0.091 |
Welcome | +0.090 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.120 |
majesty | -0.109 |
ci | -0.107 |
oppy | -0.106 |
Token | friends |
Token ID | 2460 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
Where | +0.117 |
See | +0.109 |
On | +0.106 |
Oh | +0.106 |
Welcome | +0.106 |
Neg logit contributions | |
ish | -0.108 |
Majesty | -0.097 |
majesty | -0.087 |
cient | -0.085 |
ci | -0.085 |
Token | . |
Token ID | 13 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.095 |
See | +0.087 |
Oh | +0.086 |
On | +0.084 |
Warning | +0.084 |
Neg logit contributions | |
ish | -0.126 |
Majesty | -0.109 |
ci | -0.102 |
majesty | -0.099 |
oppy | -0.098 |
Token | The |
Token ID | 383 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
Where | +0.119 |
Who | +0.103 |
Are | +0.102 |
Warning | +0.102 |
Time | +0.102 |
Neg logit contributions | |
ish | -0.147 |
Majesty | -0.123 |
oppy | -0.122 |
majesty | -0.120 |
cient | -0.115 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.77e+01 |
Pos logit contributions | |
Where | +0.110 |
See | +0.106 |
To | +0.104 |
Welcome | +0.103 |
Warning | +0.102 |
Neg logit contributions | |
ish | -0.111 |
Majesty | -0.092 |
knee | -0.090 |
majesty | -0.085 |
sister | -0.085 |
Token | of |
Token ID | 286 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
Where | +0.135 |
See | +0.125 |
Who | +0.123 |
Are | +0.122 |
Wow | +0.119 |
Neg logit contributions | |
ish | -0.127 |
ap | -0.105 |
ci | -0.102 |
ute | -0.100 |
oppy | -0.099 |
Token | the |
Token ID | 262 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.082 |
Oh | +0.073 |
See | +0.073 |
Welcome | +0.070 |
On | +0.070 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.131 |
majesty | -0.120 |
ci | -0.116 |
cient | -0.115 |
Token | story |
Token ID | 1621 |
Feature activation | -2.33e+01 |
Pos logit contributions | |
Where | +0.119 |
See | +0.111 |
He | +0.105 |
Oh | +0.105 |
Wow | +0.103 |
Neg logit contributions | |
ish | -0.094 |
ci | -0.073 |
Majesty | -0.073 |
cient | -0.071 |
oppy | -0.070 |
Token | is |
Token ID | 318 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
Where | +0.130 |
See | +0.122 |
Oh | +0.118 |
Welcome | +0.116 |
Who | +0.115 |
Neg logit contributions | |
ish | -0.114 |
Majesty | -0.088 |
ci | -0.086 |
oppy | -0.082 |
ap | -0.082 |
Token | that |
Token ID | 326 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
Where | +0.138 |
See | +0.127 |
Oh | +0.126 |
On | +0.125 |
Welcome | +0.124 |
Neg logit contributions | |
ish | -0.133 |
Majesty | -0.118 |
majesty | -0.105 |
ci | -0.103 |
oppy | -0.100 |
Token | after |
Token ID | 706 |
Feature activation | -2.03e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.094 |
Oh | +0.089 |
Warning | +0.088 |
Welcome | +0.087 |
Neg logit contributions | |
ish | -0.120 |
Majesty | -0.104 |
oppy | -0.095 |
ci | -0.095 |
majesty | -0.094 |
Token | . |
Token ID | 13 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
Where | +0.075 |
See | +0.067 |
On | +0.065 |
Oh | +0.065 |
Welcome | +0.064 |
Neg logit contributions | |
ish | -0.139 |
Majesty | -0.126 |
majesty | -0.115 |
ci | -0.114 |
cient | -0.113 |
Token |
|
Token ID | 198 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
Where | +0.079 |
Warning | +0.067 |
On | +0.065 |
Who | +0.064 |
Oh | +0.064 |
Neg logit contributions | |
ish | -0.171 |
Majesty | -0.149 |
oppy | -0.148 |
ci | -0.148 |
cient | -0.147 |
Token |
|
Token ID | 198 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
Where | +0.090 |
See | +0.083 |
Oh | +0.081 |
Warning | +0.080 |
Welcome | +0.079 |
Neg logit contributions | |
ish | -0.154 |
Majesty | -0.135 |
oppy | -0.131 |
cient | -0.129 |
ci | -0.128 |
Token | The |
Token ID | 464 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
Where | +0.066 |
See | +0.061 |
Warning | +0.061 |
Welcome | +0.058 |
Who | +0.058 |
Neg logit contributions | |
ish | -0.156 |
cient | -0.140 |
ci | -0.137 |
oppy | -0.135 |
opsy | -0.133 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.73e+01 |
Pos logit contributions | |
Where | +0.100 |
See | +0.092 |
Warning | +0.090 |
Who | +0.089 |
To | +0.089 |
Neg logit contributions | |
ish | -0.121 |
Majesty | -0.101 |
ci | -0.095 |
cient | -0.094 |
oppy | -0.093 |
Token | of |
Token ID | 286 |
Feature activation | -2.10e+01 |
Pos logit contributions | |
Where | +0.134 |
Who | +0.122 |
Are | +0.118 |
What | +0.118 |
See | +0.117 |
Neg logit contributions | |
ish | -0.136 |
ci | -0.109 |
oppy | -0.108 |
ap | -0.106 |
Majesty | -0.101 |
Token | the |
Token ID | 262 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
Where | +0.084 |
See | +0.075 |
Oh | +0.075 |
Welcome | +0.073 |
On | +0.073 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.125 |
majesty | -0.115 |
ci | -0.111 |
oppy | -0.110 |
Token | story |
Token ID | 1621 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
Where | +0.121 |
See | +0.109 |
Who | +0.106 |
Oh | +0.104 |
Wow | +0.101 |
Neg logit contributions | |
ish | -0.088 |
cient | -0.071 |
Majesty | -0.071 |
ci | -0.069 |
oppy | -0.067 |
Token | is |
Token ID | 318 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
Where | +0.112 |
See | +0.102 |
Oh | +0.101 |
On | +0.099 |
Welcome | +0.098 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.117 |
majesty | -0.108 |
ci | -0.106 |
cient | -0.105 |
Token | to |
Token ID | 284 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
Where | +0.125 |
On | +0.117 |
To | +0.117 |
Oh | +0.115 |
Welcome | +0.113 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.137 |
majesty | -0.121 |
ci | -0.116 |
ishes | -0.111 |
Token | feel |
Token ID | 1254 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
Where | +0.079 |
On | +0.077 |
He | +0.077 |
For | +0.072 |
To | +0.070 |
Neg logit contributions | |
ish | -0.117 |
Majesty | -0.113 |
ci | -0.103 |
cient | -0.103 |
majesty | -0.102 |
Token | good |
Token ID | 922 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
Where | +0.075 |
See | +0.067 |
Oh | +0.066 |
On | +0.065 |
Warning | +0.064 |
Neg logit contributions | |
ish | -0.140 |
Majesty | -0.127 |
majesty | -0.117 |
ci | -0.115 |
oppy | -0.114 |
Token | too |
Token ID | 1165 |
Feature activation | -1.84e+01 |
Pos logit contributions | |
Where | +0.090 |
See | +0.082 |
Oh | +0.080 |
Welcome | +0.079 |
On | +0.079 |
Neg logit contributions | |
ish | -0.126 |
Majesty | -0.115 |
majesty | -0.105 |
ci | -0.103 |
cient | -0.102 |
Token | . |
Token ID | 13 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
Where | +0.082 |
See | +0.075 |
Oh | +0.075 |
Warning | +0.072 |
Wow | +0.072 |
Neg logit contributions | |
ish | -0.112 |
Majesty | -0.100 |
majesty | -0.091 |
oppy | -0.090 |
ci | -0.089 |
Token | The |
Token ID | 383 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
Where | +0.100 |
Oh | +0.087 |
Warning | +0.085 |
See | +0.084 |
Welcome | +0.084 |
Neg logit contributions | |
ish | -0.163 |
Majesty | -0.150 |
majesty | -0.142 |
oppy | -0.134 |
cient | -0.133 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.72e+01 |
Pos logit contributions | |
Where | +0.083 |
Warning | +0.076 |
See | +0.073 |
Oh | +0.071 |
To | +0.071 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.127 |
knee | -0.122 |
majesty | -0.121 |
castle | -0.115 |
Token | of |
Token ID | 286 |
Feature activation | -2.16e+01 |
Pos logit contributions | |
Where | +0.132 |
Who | +0.118 |
See | +0.117 |
Are | +0.116 |
Oh | +0.114 |
Neg logit contributions | |
ish | -0.136 |
ci | -0.109 |
oppy | -0.108 |
ap | -0.106 |
Majesty | -0.102 |
Token | the |
Token ID | 262 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Where | +0.083 |
Oh | +0.073 |
See | +0.072 |
On | +0.070 |
Welcome | +0.070 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.136 |
majesty | -0.124 |
ci | -0.119 |
oppy | -0.119 |
Token | story |
Token ID | 1621 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
Where | +0.126 |
See | +0.117 |
Oh | +0.111 |
He | +0.109 |
On | +0.108 |
Neg logit contributions | |
ish | -0.086 |
Majesty | -0.074 |
majesty | -0.068 |
oppy | -0.066 |
collection | -0.066 |
Token | is |
Token ID | 318 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.118 |
See | +0.107 |
Oh | +0.106 |
Welcome | +0.103 |
On | +0.102 |
Neg logit contributions | |
ish | -0.128 |
Majesty | -0.109 |
majesty | -0.100 |
ci | -0.100 |
oppy | -0.098 |
Token | to |
Token ID | 284 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
Where | +0.137 |
See | +0.126 |
Oh | +0.125 |
On | +0.125 |
Welcome | +0.123 |
Neg logit contributions | |
ish | -0.135 |
Majesty | -0.121 |
majesty | -0.107 |
ci | -0.106 |
cient | -0.102 |
Token | and |
Token ID | 290 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
Where | +0.104 |
See | +0.095 |
Oh | +0.095 |
Welcome | +0.093 |
Warning | +0.093 |
Neg logit contributions | |
ish | -0.118 |
Majesty | -0.105 |
majesty | -0.095 |
ci | -0.094 |
oppy | -0.091 |
Token | they |
Token ID | 484 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.087 |
Oh | +0.087 |
Warning | +0.086 |
Welcome | +0.085 |
Neg logit contributions | |
ish | -0.151 |
Majesty | -0.135 |
ci | -0.127 |
majesty | -0.125 |
oppy | -0.123 |
Token | took |
Token ID | 1718 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
Where | +0.099 |
See | +0.089 |
Oh | +0.088 |
Welcome | +0.086 |
On | +0.086 |
Neg logit contributions | |
ish | -0.152 |
Majesty | -0.137 |
majesty | -0.125 |
ci | -0.125 |
oppy | -0.123 |
Token | a |
Token ID | 257 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
Where | +0.101 |
See | +0.091 |
Oh | +0.090 |
On | +0.089 |
Welcome | +0.088 |
Neg logit contributions | |
ish | -0.151 |
Majesty | -0.135 |
majesty | -0.123 |
ci | -0.123 |
oppy | -0.121 |
Token | nap |
Token ID | 25422 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
Where | +0.129 |
See | +0.119 |
Warning | +0.118 |
Oh | +0.117 |
Welcome | +0.114 |
Neg logit contributions | |
ish | -0.112 |
Majesty | -0.092 |
oppy | -0.088 |
majesty | -0.085 |
ci | -0.084 |
Token | . |
Token ID | 13 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
Where | +0.078 |
On | +0.067 |
See | +0.065 |
For | +0.065 |
Oh | +0.065 |
Neg logit contributions | |
ish | -0.167 |
Majesty | -0.158 |
majesty | -0.144 |
cient | -0.144 |
ci | -0.137 |
Token | They |
Token ID | 1119 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
Where | +0.114 |
Warning | +0.113 |
Oh | +0.101 |
Welcome | +0.099 |
Who | +0.097 |
Neg logit contributions | |
ish | -0.145 |
Majesty | -0.134 |
majesty | -0.128 |
cient | -0.127 |
oppy | -0.126 |
Token | were |
Token ID | 547 |
Feature activation | -2.53e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.094 |
Oh | +0.093 |
Welcome | +0.091 |
On | +0.091 |
Neg logit contributions | |
ish | -0.165 |
Majesty | -0.148 |
majesty | -0.136 |
ci | -0.136 |
oppy | -0.134 |
Token | happy |
Token ID | 3772 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
Where | +0.096 |
See | +0.088 |
On | +0.085 |
Oh | +0.084 |
Welcome | +0.083 |
Neg logit contributions | |
ish | -0.169 |
Majesty | -0.152 |
ci | -0.140 |
cient | -0.139 |
majesty | -0.139 |
Token | and |
Token ID | 290 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
Where | +0.124 |
See | +0.114 |
Oh | +0.112 |
On | +0.110 |
Welcome | +0.110 |
Neg logit contributions | |
ish | -0.147 |
Majesty | -0.131 |
majesty | -0.119 |
ci | -0.117 |
cient | -0.115 |
Token | tired |
Token ID | 10032 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
Where | +0.109 |
See | +0.099 |
Oh | +0.098 |
Welcome | +0.096 |
On | +0.096 |
Neg logit contributions | |
ish | -0.160 |
Majesty | -0.145 |
majesty | -0.131 |
ci | -0.129 |
cient | -0.127 |
Token | her |
Token ID | 607 |
Feature activation | -1.89e+01 |
Pos logit contributions | |
Where | +0.095 |
On | +0.089 |
See | +0.088 |
Warning | +0.088 |
Oh | +0.087 |
Neg logit contributions | |
ish | -0.127 |
Majesty | -0.115 |
majesty | -0.105 |
oppy | -0.105 |
ci | -0.103 |
Token | . |
Token ID | 13 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
Where | +0.078 |
On | +0.069 |
See | +0.068 |
Oh | +0.067 |
Welcome | +0.067 |
Neg logit contributions | |
ish | -0.118 |
Majesty | -0.107 |
ci | -0.098 |
majesty | -0.098 |
cient | -0.096 |
Token |
|
Token ID | 198 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
Where | +0.075 |
Warning | +0.066 |
Oh | +0.065 |
Welcome | +0.063 |
Time | +0.061 |
Neg logit contributions | |
ish | -0.175 |
Majesty | -0.165 |
majesty | -0.154 |
oppy | -0.149 |
cient | -0.148 |
Token |
|
Token ID | 198 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
Where | +0.079 |
Warning | +0.071 |
Oh | +0.071 |
See | +0.067 |
Welcome | +0.067 |
Neg logit contributions | |
ish | -0.152 |
Majesty | -0.140 |
oppy | -0.139 |
majesty | -0.135 |
cient | -0.133 |
Token | The |
Token ID | 464 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Where | +0.077 |
Warning | +0.076 |
Oh | +0.071 |
Welcome | +0.069 |
See | +0.069 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.134 |
majesty | -0.125 |
cient | -0.123 |
oppy | -0.121 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.70e+01 |
Pos logit contributions | |
Where | +0.070 |
See | +0.064 |
Warning | +0.063 |
On | +0.062 |
To | +0.061 |
Neg logit contributions | |
ish | -0.153 |
Majesty | -0.137 |
majesty | -0.127 |
oppy | -0.124 |
knee | -0.121 |
Token | of |
Token ID | 286 |
Feature activation | -2.06e+01 |
Pos logit contributions | |
Where | +0.130 |
Who | +0.116 |
See | +0.116 |
Are | +0.115 |
What | +0.113 |
Neg logit contributions | |
ish | -0.138 |
ci | -0.108 |
oppy | -0.108 |
Majesty | -0.104 |
ap | -0.102 |
Token | the |
Token ID | 262 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Where | +0.081 |
Oh | +0.072 |
See | +0.071 |
Welcome | +0.069 |
On | +0.069 |
Neg logit contributions | |
ish | -0.138 |
Majesty | -0.127 |
majesty | -0.116 |
ci | -0.112 |
cient | -0.112 |
Token | story |
Token ID | 1621 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.110 |
See | +0.100 |
Oh | +0.096 |
On | +0.095 |
Warning | +0.093 |
Neg logit contributions | |
ish | -0.104 |
Majesty | -0.091 |
oppy | -0.084 |
majesty | -0.083 |
cient | -0.079 |
Token | is |
Token ID | 318 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.117 |
See | +0.107 |
Oh | +0.106 |
Welcome | +0.103 |
On | +0.102 |
Neg logit contributions | |
ish | -0.127 |
Majesty | -0.109 |
majesty | -0.100 |
ci | -0.099 |
cient | -0.097 |
Token | that |
Token ID | 326 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
Where | +0.122 |
To | +0.114 |
On | +0.113 |
See | +0.111 |
Oh | +0.110 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.135 |
majesty | -0.120 |
ci | -0.119 |
castle | -0.112 |
Token | his |
Token ID | 465 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
Where | +0.082 |
See | +0.075 |
Oh | +0.074 |
On | +0.073 |
Welcome | +0.073 |
Neg logit contributions | |
ish | -0.119 |
Majesty | -0.107 |
majesty | -0.097 |
ci | -0.097 |
oppy | -0.095 |
Token | foot |
Token ID | 2366 |
Feature activation | -1.67e+01 |
Pos logit contributions | |
Where | +0.111 |
Oh | +0.099 |
He | +0.099 |
See | +0.098 |
What | +0.097 |
Neg logit contributions | |
ish | -0.077 |
cient | -0.073 |
Majesty | -0.071 |
pp | -0.063 |
ci | -0.062 |
Token | again |
Token ID | 757 |
Feature activation | -1.85e+01 |
Pos logit contributions | |
Where | +0.056 |
See | +0.046 |
On | +0.045 |
Oh | +0.045 |
He | +0.045 |
Neg logit contributions | |
ish | -0.116 |
Majesty | -0.114 |
majesty | -0.107 |
cient | -0.103 |
oppy | -0.101 |
Token | . |
Token ID | 13 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
Where | +0.075 |
See | +0.069 |
Oh | +0.068 |
Welcome | +0.067 |
Wow | +0.066 |
Neg logit contributions | |
ish | -0.119 |
Majesty | -0.106 |
ci | -0.098 |
majesty | -0.097 |
oppy | -0.096 |
Token | The |
Token ID | 383 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
Where | +0.105 |
Warning | +0.093 |
Oh | +0.091 |
Welcome | +0.089 |
On | +0.089 |
Neg logit contributions | |
ish | -0.157 |
Majesty | -0.142 |
majesty | -0.130 |
oppy | -0.127 |
ci | -0.127 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.69e+01 |
Pos logit contributions | |
Where | +0.087 |
Welcome | +0.082 |
See | +0.079 |
On | +0.078 |
Wow | +0.078 |
Neg logit contributions | |
ish | -0.139 |
Majesty | -0.124 |
knee | -0.122 |
majesty | -0.114 |
oppy | -0.109 |
Token | of |
Token ID | 286 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Where | +0.126 |
Who | +0.113 |
See | +0.109 |
Wow | +0.109 |
What | +0.109 |
Neg logit contributions | |
ish | -0.141 |
ci | -0.113 |
oppy | -0.110 |
Majesty | -0.107 |
ap | -0.105 |
Token | the |
Token ID | 262 |
Feature activation | -2.15e+01 |
Pos logit contributions | |
Where | +0.071 |
Oh | +0.063 |
See | +0.061 |
What | +0.061 |
That | +0.059 |
Neg logit contributions | |
ish | -0.150 |
Majesty | -0.144 |
majesty | -0.132 |
cient | -0.125 |
oppy | -0.122 |
Token | story |
Token ID | 1621 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
Where | +0.118 |
See | +0.107 |
On | +0.102 |
Oh | +0.102 |
Wow | +0.101 |
Neg logit contributions | |
ish | -0.099 |
Majesty | -0.087 |
oppy | -0.079 |
ci | -0.079 |
majesty | -0.079 |
Token | is |
Token ID | 318 |
Feature activation | -2.56e+01 |
Pos logit contributions | |
Where | +0.111 |
See | +0.100 |
Oh | +0.099 |
Welcome | +0.098 |
On | +0.097 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.116 |
ci | -0.107 |
majesty | -0.106 |
oppy | -0.104 |
Token | that |
Token ID | 326 |
Feature activation | -2.61e+01 |
Pos logit contributions | |
Where | +0.125 |
On | +0.115 |
To | +0.114 |
See | +0.114 |
Oh | +0.113 |
Neg logit contributions | |
ish | -0.140 |
Majesty | -0.131 |
majesty | -0.117 |
ci | -0.112 |
cient | -0.109 |
Token | , |
Token ID | 11 |
Feature activation | -2.02e+01 |
Pos logit contributions | |
Where | +0.102 |
Oh | +0.093 |
Welcome | +0.091 |
See | +0.091 |
That | +0.091 |
Neg logit contributions | |
ish | -0.119 |
ci | -0.107 |
Majesty | -0.106 |
ishes | -0.098 |
majesty | -0.093 |
Token | I |
Token ID | 314 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
Where | +0.092 |
See | +0.083 |
Oh | +0.083 |
Welcome | +0.082 |
On | +0.082 |
Neg logit contributions | |
ish | -0.120 |
Majesty | -0.109 |
majesty | -0.098 |
ci | -0.098 |
oppy | -0.096 |
Token | will |
Token ID | 481 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
Where | +0.104 |
See | +0.095 |
Oh | +0.093 |
On | +0.092 |
Welcome | +0.092 |
Neg logit contributions | |
ish | -0.143 |
Majesty | -0.129 |
majesty | -0.117 |
ci | -0.116 |
oppy | -0.114 |
Token | marry |
Token ID | 12479 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.104 |
See | +0.096 |
Welcome | +0.095 |
On | +0.094 |
To | +0.091 |
Neg logit contributions | |
ish | -0.142 |
Majesty | -0.123 |
ci | -0.115 |
oppy | -0.113 |
majesty | -0.110 |
Token | you |
Token ID | 345 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Where | +0.101 |
See | +0.091 |
Welcome | +0.090 |
Oh | +0.090 |
Wow | +0.088 |
Neg logit contributions | |
ish | -0.124 |
Majesty | -0.111 |
majesty | -0.099 |
ci | -0.099 |
oppy | -0.099 |
Token | !" |
Token ID | 2474 |
Feature activation | -2.68e+01 |
Pos logit contributions | |
Where | +0.092 |
On | +0.086 |
Welcome | +0.085 |
For | +0.084 |
One | +0.084 |
Neg logit contributions | |
ish | -0.124 |
Majesty | -0.111 |
majesty | -0.101 |
ci | -0.100 |
oppy | -0.099 |
Token | They |
Token ID | 1119 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.090 |
Oh | +0.089 |
Welcome | +0.087 |
On | +0.086 |
Neg logit contributions | |
ish | -0.180 |
Majesty | -0.162 |
majesty | -0.150 |
ci | -0.149 |
oppy | -0.146 |
Token | had |
Token ID | 550 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
Where | +0.101 |
See | +0.091 |
On | +0.090 |
Oh | +0.089 |
Welcome | +0.089 |
Neg logit contributions | |
ish | -0.156 |
Majesty | -0.143 |
majesty | -0.131 |
ci | -0.128 |
oppy | -0.127 |
Token | a |
Token ID | 257 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.092 |
Oh | +0.091 |
On | +0.089 |
Welcome | +0.089 |
Neg logit contributions | |
ish | -0.158 |
Majesty | -0.143 |
majesty | -0.131 |
ci | -0.130 |
oppy | -0.128 |
Token | big |
Token ID | 1263 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Where | +0.081 |
See | +0.075 |
On | +0.072 |
Oh | +0.072 |
Welcome | +0.070 |
Neg logit contributions | |
ish | -0.159 |
Majesty | -0.144 |
ci | -0.134 |
majesty | -0.132 |
cient | -0.129 |
Token | party |
Token ID | 2151 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
See | +0.080 |
Time | +0.077 |
moral | +0.077 |
Today | +0.076 |
On | +0.074 |
Neg logit contributions | |
ish | -0.115 |
Majesty | -0.108 |
cient | -0.100 |
ishes | -0.098 |
majesty | -0.097 |
Token | ?" |
Token ID | 1701 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
Where | +0.088 |
On | +0.079 |
Do | +0.079 |
Welcome | +0.078 |
Time | +0.078 |
Neg logit contributions | |
ish | -0.086 |
Majesty | -0.084 |
majesty | -0.076 |
mit | -0.070 |
cient | -0.068 |
Token | her |
Token ID | 607 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.089 |
Welcome | +0.088 |
Warning | +0.087 |
On | +0.087 |
Neg logit contributions | |
ish | -0.150 |
Majesty | -0.134 |
majesty | -0.124 |
oppy | -0.123 |
ci | -0.123 |
Token | mom |
Token ID | 1995 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
Where | +0.108 |
See | +0.099 |
Oh | +0.098 |
On | +0.097 |
Welcome | +0.096 |
Neg logit contributions | |
ish | -0.111 |
Majesty | -0.099 |
majesty | -0.088 |
ci | -0.088 |
cient | -0.086 |
Token | asked |
Token ID | 1965 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
Where | +0.079 |
See | +0.074 |
Welcome | +0.073 |
Warning | +0.073 |
Oh | +0.073 |
Neg logit contributions | |
ish | -0.149 |
Majesty | -0.126 |
ci | -0.125 |
oppy | -0.120 |
cient | -0.118 |
Token | . |
Token ID | 13 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
Where | +0.088 |
Oh | +0.075 |
Do | +0.073 |
See | +0.073 |
What | +0.073 |
Neg logit contributions | |
ish | -0.161 |
Majesty | -0.153 |
majesty | -0.142 |
ci | -0.138 |
cient | -0.134 |
Token | " |
Token ID | 366 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.093 |
Warning | +0.093 |
Welcome | +0.092 |
Oh | +0.091 |
Neg logit contributions | |
ish | -0.149 |
Majesty | -0.133 |
majesty | -0.123 |
cient | -0.122 |
oppy | -0.122 |
Token | I |
Token ID | 40 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
Where | +0.048 |
Warning | +0.042 |
See | +0.042 |
Welcome | +0.042 |
On | +0.041 |
Neg logit contributions | |
ish | -0.207 |
Majesty | -0.184 |
ci | -0.184 |
oppy | -0.178 |
cient | -0.174 |
Token | fell |
Token ID | 3214 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
Where | +0.091 |
See | +0.090 |
On | +0.086 |
Oh | +0.085 |
To | +0.084 |
Neg logit contributions | |
ish | -0.164 |
Majesty | -0.161 |
majesty | -0.144 |
castle | -0.139 |
ishes | -0.137 |
Token | off |
Token ID | 572 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Where | +0.089 |
Oh | +0.084 |
On | +0.081 |
See | +0.081 |
Welcome | +0.079 |
Neg logit contributions | |
ish | -0.145 |
Majesty | -0.139 |
majesty | -0.128 |
oppy | -0.123 |
cient | -0.122 |
Token | the |
Token ID | 262 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
Where | +0.087 |
See | +0.079 |
Oh | +0.078 |
On | +0.077 |
Welcome | +0.077 |
Neg logit contributions | |
ish | -0.138 |
Majesty | -0.126 |
majesty | -0.114 |
ci | -0.113 |
cient | -0.111 |
Token | swing |
Token ID | 9628 |
Feature activation | -2.05e+01 |
Pos logit contributions | |
Where | +0.125 |
Oh | +0.116 |
See | +0.116 |
On | +0.115 |
Welcome | +0.112 |
Neg logit contributions | |
ish | -0.099 |
Majesty | -0.085 |
ci | -0.075 |
majesty | -0.074 |
oppy | -0.074 |
Token | ran |
Token ID | 4966 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
Where | +0.104 |
Welcome | +0.097 |
See | +0.097 |
Warning | +0.095 |
On | +0.094 |
Neg logit contributions | |
ish | -0.138 |
Majesty | -0.118 |
majesty | -0.109 |
oppy | -0.109 |
ci | -0.108 |
Token | very |
Token ID | 845 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
Where | +0.120 |
See | +0.116 |
Warning | +0.113 |
Oh | +0.111 |
Welcome | +0.111 |
Neg logit contributions | |
ish | -0.124 |
Majesty | -0.104 |
majesty | -0.093 |
ci | -0.091 |
oppy | -0.090 |
Token | fast |
Token ID | 3049 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
Where | +0.070 |
See | +0.062 |
Oh | +0.060 |
Welcome | +0.060 |
Warning | +0.058 |
Neg logit contributions | |
ish | -0.161 |
Majesty | -0.145 |
majesty | -0.136 |
oppy | -0.134 |
ci | -0.134 |
Token | and |
Token ID | 290 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
Where | +0.106 |
See | +0.096 |
Oh | +0.095 |
On | +0.094 |
Welcome | +0.093 |
Neg logit contributions | |
ish | -0.140 |
Majesty | -0.126 |
majesty | -0.114 |
ci | -0.113 |
oppy | -0.112 |
Token | far |
Token ID | 1290 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
Where | +0.103 |
See | +0.094 |
Oh | +0.093 |
Warning | +0.092 |
On | +0.092 |
Neg logit contributions | |
ish | -0.143 |
Majesty | -0.128 |
majesty | -0.117 |
ci | -0.116 |
cient | -0.114 |
Token | . |
Token ID | 13 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
Where | +0.111 |
See | +0.108 |
On | +0.105 |
Warning | +0.104 |
Oh | +0.104 |
Neg logit contributions | |
ish | -0.119 |
Majesty | -0.098 |
majesty | -0.088 |
cient | -0.087 |
ci | -0.087 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.109 |
Warning | +0.101 |
Welcome | +0.099 |
See | +0.097 |
Oh | +0.097 |
Neg logit contributions | |
ish | -0.163 |
Majesty | -0.147 |
oppy | -0.138 |
majesty | -0.136 |
cient | -0.131 |
Token | and |
Token ID | 290 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
Where | +0.110 |
See | +0.101 |
Oh | +0.100 |
Welcome | +0.098 |
On | +0.098 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.116 |
majesty | -0.106 |
ci | -0.104 |
oppy | -0.103 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
Where | +0.107 |
See | +0.101 |
Warning | +0.100 |
On | +0.098 |
Oh | +0.096 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.128 |
ci | -0.119 |
majesty | -0.119 |
oppy | -0.117 |
Token | could |
Token ID | 714 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
Where | +0.104 |
Welcome | +0.096 |
See | +0.095 |
Time | +0.095 |
Warning | +0.095 |
Neg logit contributions | |
ish | -0.144 |
Majesty | -0.116 |
cient | -0.111 |
ci | -0.110 |
oppy | -0.108 |
Token | not |
Token ID | 407 |
Feature activation | -2.50e+01 |
Pos logit contributions | |
Where | +0.112 |
On | +0.102 |
See | +0.101 |
Oh | +0.099 |
Welcome | +0.095 |
Neg logit contributions | |
ish | -0.149 |
Majesty | -0.134 |
ci | -0.122 |
majesty | -0.121 |
cient | -0.119 |
Token | the |
Token ID | 262 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Oh | +0.120 |
Where | +0.120 |
Warning | +0.119 |
See | +0.119 |
Wow | +0.119 |
Neg logit contributions | |
ish | -0.108 |
Majesty | -0.098 |
ci | -0.088 |
majesty | -0.086 |
oppy | -0.085 |
Token | mechanic |
Token ID | 21600 |
Feature activation | -1.87e+01 |
Pos logit contributions | |
Where | +0.122 |
Wow | +0.117 |
On | +0.115 |
Warning | +0.115 |
Oh | +0.113 |
Neg logit contributions | |
ish | -0.095 |
Majesty | -0.085 |
knee | -0.075 |
ci | -0.073 |
majesty | -0.073 |
Token | who |
Token ID | 508 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
Where | +0.082 |
See | +0.073 |
On | +0.072 |
Welcome | +0.072 |
Oh | +0.072 |
Neg logit contributions | |
ish | -0.111 |
Majesty | -0.103 |
majesty | -0.094 |
oppy | -0.091 |
cient | -0.090 |
Token | helped |
Token ID | 4193 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
Where | +0.093 |
Oh | +0.084 |
Warning | +0.082 |
See | +0.081 |
On | +0.081 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.123 |
ci | -0.117 |
majesty | -0.114 |
cient | -0.114 |
Token | him |
Token ID | 683 |
Feature activation | -2.14e+01 |
Pos logit contributions | |
Where | +0.115 |
See | +0.107 |
Oh | +0.105 |
Welcome | +0.103 |
On | +0.102 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.121 |
ci | -0.109 |
majesty | -0.109 |
oppy | -0.107 |
Token | . |
Token ID | 13 |
Feature activation | -2.67e+01 |
Pos logit contributions | |
Where | +0.090 |
On | +0.084 |
To | +0.080 |
He | +0.079 |
See | +0.078 |
Neg logit contributions | |
ish | -0.129 |
Majesty | -0.120 |
majesty | -0.111 |
ci | -0.107 |
oppy | -0.107 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
Where | +0.125 |
Oh | +0.112 |
Warning | +0.109 |
Who | +0.107 |
Welcome | +0.107 |
Neg logit contributions | |
ish | -0.144 |
Majesty | -0.131 |
oppy | -0.125 |
cient | -0.124 |
ci | -0.121 |
Token | Once |
Token ID | 7454 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
Where | +0.097 |
Warning | +0.093 |
See | +0.091 |
Oh | +0.091 |
Who | +0.088 |
Neg logit contributions | |
ish | -0.130 |
oppy | -0.115 |
gy | -0.115 |
ci | -0.111 |
adow | -0.106 |
Token | upon |
Token ID | 2402 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.086 |
See | +0.078 |
Oh | +0.077 |
On | +0.077 |
Welcome | +0.076 |
Neg logit contributions | |
ish | -0.120 |
Majesty | -0.109 |
majesty | -0.099 |
ci | -0.098 |
cient | -0.096 |
Token | a |
Token ID | 257 |
Feature activation | -2.22e+01 |
Pos logit contributions | |
Where | +0.100 |
See | +0.092 |
Oh | +0.091 |
Warning | +0.089 |
Welcome | +0.089 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.121 |
majesty | -0.110 |
ci | -0.109 |
oppy | -0.108 |
Token | time |
Token ID | 640 |
Feature activation | -2.44e+01 |
Pos logit contributions | |
Where | +0.054 |
On | +0.050 |
See | +0.046 |
Oh | +0.045 |
One | +0.044 |
Neg logit contributions | |
ish | -0.176 |
Majesty | -0.165 |
majesty | -0.153 |
ci | -0.153 |
cient | -0.151 |
Token | looked |
Token ID | 3114 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
Where | +0.101 |
Warning | +0.097 |
Welcome | +0.096 |
See | +0.094 |
Oh | +0.093 |
Neg logit contributions | |
ish | -0.129 |
ci | -0.108 |
gy | -0.107 |
cient | -0.105 |
Majesty | -0.105 |
Token | angry |
Token ID | 7954 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
Where | +0.109 |
See | +0.100 |
Oh | +0.098 |
On | +0.097 |
Welcome | +0.096 |
Neg logit contributions | |
ish | -0.144 |
Majesty | -0.128 |
majesty | -0.116 |
ci | -0.116 |
cient | -0.113 |
Token | and |
Token ID | 290 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
Where | +0.125 |
See | +0.118 |
Oh | +0.117 |
On | +0.115 |
Welcome | +0.115 |
Neg logit contributions | |
ish | -0.118 |
Majesty | -0.098 |
ci | -0.086 |
majesty | -0.086 |
oppy | -0.083 |
Token | said |
Token ID | 531 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.089 |
Warning | +0.089 |
Oh | +0.088 |
On | +0.087 |
Neg logit contributions | |
ish | -0.144 |
Majesty | -0.129 |
cient | -0.120 |
majesty | -0.118 |
ci | -0.118 |
Token | , |
Token ID | 11 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
Where | +0.124 |
See | +0.115 |
He | +0.112 |
Are | +0.110 |
Do | +0.110 |
Neg logit contributions | |
ish | -0.139 |
Majesty | -0.125 |
ci | -0.118 |
majesty | -0.112 |
oppy | -0.107 |
Token | " |
Token ID | 366 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
Where | +0.099 |
See | +0.092 |
Oh | +0.092 |
Welcome | +0.091 |
Warning | +0.091 |
Neg logit contributions | |
ish | -0.136 |
Majesty | -0.124 |
cient | -0.114 |
majesty | -0.113 |
ci | -0.110 |
Token | Did |
Token ID | 11633 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
Where | +0.059 |
On | +0.058 |
See | +0.052 |
Welcome | +0.049 |
To | +0.048 |
Neg logit contributions | |
ish | -0.194 |
ci | -0.166 |
cient | -0.163 |
Majesty | -0.160 |
ans | -0.159 |
Token | you |
Token ID | 345 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
Where | +0.105 |
That | +0.093 |
Oh | +0.092 |
What | +0.092 |
See | +0.089 |
Neg logit contributions | |
ish | -0.162 |
Majesty | -0.148 |
majesty | -0.136 |
ci | -0.134 |
castle | -0.128 |
Token | break |
Token ID | 2270 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
Where | +0.099 |
On | +0.092 |
See | +0.089 |
To | +0.088 |
Oh | +0.088 |
Neg logit contributions | |
ish | -0.172 |
Majesty | -0.167 |
majesty | -0.151 |
ci | -0.145 |
oppy | -0.141 |
Token | my |
Token ID | 616 |
Feature activation | -2.32e+01 |
Pos logit contributions | |
Where | +0.086 |
What | +0.078 |
Oh | +0.076 |
See | +0.070 |
Wow | +0.068 |
Neg logit contributions | |
ish | -0.142 |
Majesty | -0.141 |
majesty | -0.131 |
oppy | -0.127 |
atmeal | -0.126 |
Token | window |
Token ID | 4324 |
Feature activation | -1.93e+01 |
Pos logit contributions | |
Where | +0.110 |
Oh | +0.098 |
See | +0.097 |
Wow | +0.097 |
On | +0.096 |
Neg logit contributions | |
ish | -0.124 |
Majesty | -0.121 |
majesty | -0.109 |
cient | -0.105 |
oppy | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.101 |
See | +0.093 |
Oh | +0.092 |
Welcome | +0.090 |
On | +0.090 |
Neg logit contributions | |
ish | -0.118 |
Majesty | -0.104 |
ci | -0.095 |
majesty | -0.094 |
oppy | -0.092 |
Token | played |
Token ID | 2826 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
Where | +0.079 |
See | +0.075 |
Oh | +0.069 |
Welcome | +0.069 |
Wow | +0.068 |
Neg logit contributions | |
ish | -0.161 |
Majesty | -0.149 |
majesty | -0.134 |
cient | -0.133 |
oppy | -0.133 |
Token | together |
Token ID | 1978 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
Where | +0.097 |
See | +0.088 |
On | +0.086 |
Oh | +0.084 |
For | +0.083 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.124 |
majesty | -0.114 |
ci | -0.112 |
oppy | -0.111 |
Token | every |
Token ID | 790 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.093 |
Oh | +0.091 |
On | +0.091 |
Welcome | +0.090 |
Neg logit contributions | |
ish | -0.130 |
Majesty | -0.116 |
majesty | -0.106 |
ci | -0.104 |
oppy | -0.103 |
Token | day |
Token ID | 1110 |
Feature activation | -2.19e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.101 |
Warning | +0.099 |
Oh | +0.096 |
To | +0.094 |
Neg logit contributions | |
ish | -0.114 |
Majesty | -0.093 |
ci | -0.089 |
oppy | -0.083 |
cient | -0.082 |
Token | . |
Token ID | 13 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
Where | +0.092 |
See | +0.085 |
Oh | +0.084 |
Welcome | +0.081 |
Wow | +0.081 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.120 |
ci | -0.113 |
oppy | -0.109 |
majesty | -0.109 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
Where | +0.099 |
Warning | +0.087 |
On | +0.084 |
Oh | +0.084 |
Who | +0.083 |
Neg logit contributions | |
ish | -0.171 |
Majesty | -0.146 |
ci | -0.140 |
oppy | -0.139 |
cient | -0.139 |
Token | Once |
Token ID | 7454 |
Feature activation | -1.86e+01 |
Pos logit contributions | |
Where | +0.091 |
See | +0.087 |
Warning | +0.086 |
Oh | +0.084 |
Who | +0.083 |
Neg logit contributions | |
ish | -0.139 |
oppy | -0.123 |
gy | -0.118 |
ci | -0.116 |
ap | -0.112 |
Token | upon |
Token ID | 2402 |
Feature activation | -2.23e+01 |
Pos logit contributions | |
Where | +0.077 |
On | +0.071 |
See | +0.070 |
Oh | +0.069 |
Welcome | +0.068 |
Neg logit contributions | |
ish | -0.114 |
Majesty | -0.107 |
majesty | -0.096 |
ci | -0.096 |
cient | -0.092 |
Token | a |
Token ID | 257 |
Feature activation | -2.08e+01 |
Pos logit contributions | |
Where | +0.096 |
See | +0.088 |
Oh | +0.087 |
Warning | +0.085 |
Welcome | +0.085 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.117 |
majesty | -0.107 |
ci | -0.106 |
oppy | -0.106 |
Token | time |
Token ID | 640 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
Where | +0.050 |
On | +0.046 |
See | +0.043 |
Oh | +0.042 |
One | +0.041 |
Neg logit contributions | |
ish | -0.166 |
Majesty | -0.155 |
majesty | -0.144 |
ci | -0.143 |
cient | -0.142 |
Token | and |
Token ID | 290 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Where | +0.126 |
See | +0.125 |
Welcome | +0.124 |
Warning | +0.123 |
Oh | +0.120 |
Neg logit contributions | |
ish | -0.114 |
Majesty | -0.089 |
knee | -0.083 |
oppy | -0.082 |
majesty | -0.080 |
Token | angry |
Token ID | 7954 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.092 |
On | +0.092 |
Warning | +0.091 |
Welcome | +0.089 |
Neg logit contributions | |
ish | -0.125 |
Majesty | -0.108 |
cient | -0.101 |
majesty | -0.099 |
ci | -0.099 |
Token | . |
Token ID | 13 |
Feature activation | -2.38e+01 |
Pos logit contributions | |
Where | +0.104 |
See | +0.101 |
Oh | +0.098 |
On | +0.097 |
Warning | +0.097 |
Neg logit contributions | |
ish | -0.128 |
Majesty | -0.109 |
ci | -0.097 |
majesty | -0.097 |
knee | -0.096 |
Token |
|
Token ID | 198 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Where | +0.074 |
See | +0.068 |
Welcome | +0.066 |
Warning | +0.065 |
On | +0.064 |
Neg logit contributions | |
ish | -0.162 |
Majesty | -0.147 |
oppy | -0.139 |
majesty | -0.137 |
cient | -0.137 |
Token |
|
Token ID | 198 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Where | +0.080 |
Welcome | +0.075 |
Oh | +0.073 |
Wow | +0.072 |
See | +0.072 |
Neg logit contributions | |
ish | -0.151 |
oppy | -0.144 |
Majesty | -0.137 |
majesty | -0.134 |
cient | -0.128 |
Token | " |
Token ID | 1 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.100 |
Welcome | +0.100 |
Oh | +0.097 |
Warning | +0.096 |
Neg logit contributions | |
ish | -0.137 |
oppy | -0.120 |
Majesty | -0.117 |
majesty | -0.112 |
cient | -0.108 |
Token | What |
Token ID | 2061 |
Feature activation | -2.51e+01 |
Pos logit contributions | |
Warning | +0.046 |
On | +0.045 |
Welcome | +0.045 |
To | +0.042 |
One | +0.040 |
Neg logit contributions | |
ish | -0.188 |
Majesty | -0.160 |
ishes | -0.157 |
oppy | -0.156 |
ci | -0.155 |
Token | did |
Token ID | 750 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.095 |
Oh | +0.093 |
On | +0.092 |
Welcome | +0.091 |
Neg logit contributions | |
ish | -0.158 |
Majesty | -0.141 |
majesty | -0.129 |
ci | -0.129 |
oppy | -0.127 |
Token | you |
Token ID | 345 |
Feature activation | -2.48e+01 |
Pos logit contributions | |
Where | +0.110 |
Oh | +0.099 |
See | +0.097 |
To | +0.096 |
Welcome | +0.096 |
Neg logit contributions | |
ish | -0.157 |
Majesty | -0.139 |
ci | -0.124 |
majesty | -0.123 |
cient | -0.121 |
Token | do |
Token ID | 466 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.100 |
On | +0.091 |
Oh | +0.091 |
What | +0.090 |
That | +0.089 |
Neg logit contributions | |
ish | -0.153 |
Majesty | -0.147 |
majesty | -0.136 |
ci | -0.130 |
oppy | -0.126 |
Token | ?" |
Token ID | 1701 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
Where | +0.107 |
On | +0.099 |
To | +0.098 |
What | +0.098 |
For | +0.096 |
Neg logit contributions | |
ish | -0.136 |
Majesty | -0.129 |
majesty | -0.116 |
cient | -0.111 |
ishes | -0.110 |
Token | from |
Token ID | 422 |
Feature activation | -1.98e+01 |
Pos logit contributions | |
Where | +0.051 |
On | +0.047 |
He | +0.045 |
For | +0.045 |
To | +0.044 |
Neg logit contributions | |
ish | -0.131 |
Majesty | -0.123 |
majesty | -0.114 |
cient | -0.111 |
oppy | -0.110 |
Token | now |
Token ID | 783 |
Feature activation | -2.12e+01 |
Pos logit contributions | |
Where | +0.086 |
See | +0.078 |
Oh | +0.077 |
On | +0.076 |
Welcome | +0.076 |
Neg logit contributions | |
ish | -0.121 |
Majesty | -0.109 |
majesty | -0.100 |
ci | -0.099 |
oppy | -0.097 |
Token | on |
Token ID | 319 |
Feature activation | -1.92e+01 |
Pos logit contributions | |
Where | +0.086 |
Oh | +0.080 |
See | +0.080 |
Wow | +0.079 |
Welcome | +0.078 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.117 |
ci | -0.109 |
oppy | -0.107 |
majesty | -0.106 |
Token | . |
Token ID | 13 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
Where | +0.074 |
See | +0.066 |
Oh | +0.065 |
On | +0.064 |
Welcome | +0.064 |
Neg logit contributions | |
ish | -0.128 |
Majesty | -0.116 |
majesty | -0.107 |
ci | -0.106 |
oppy | -0.104 |
Token | The |
Token ID | 383 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
Where | +0.091 |
See | +0.080 |
Oh | +0.079 |
On | +0.077 |
Welcome | +0.077 |
Neg logit contributions | |
ish | -0.168 |
Majesty | -0.152 |
oppy | -0.140 |
majesty | -0.140 |
ci | -0.139 |
Token | moral |
Token ID | 6573 |
Feature activation | -2.66e+01 |
Pos logit contributions | |
Where | +0.123 |
Warning | +0.117 |
Oh | +0.116 |
See | +0.116 |
Welcome | +0.115 |
Neg logit contributions | |
ish | -0.102 |
Majesty | -0.089 |
majesty | -0.079 |
cient | -0.076 |
ans | -0.071 |
Token | of |
Token ID | 286 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
Where | +0.119 |
Who | +0.105 |
See | +0.103 |
Oh | +0.102 |
Wow | +0.102 |
Neg logit contributions | |
ish | -0.151 |
oppy | -0.123 |
Majesty | -0.122 |
ci | -0.121 |
majesty | -0.118 |
Token | the |
Token ID | 262 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Where | +0.074 |
Oh | +0.066 |
See | +0.064 |
What | +0.062 |
Welcome | +0.062 |
Neg logit contributions | |
ish | -0.149 |
Majesty | -0.142 |
majesty | -0.130 |
cient | -0.123 |
ci | -0.122 |
Token | story |
Token ID | 1621 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
Where | +0.108 |
See | +0.098 |
Oh | +0.096 |
Wow | +0.094 |
On | +0.093 |
Neg logit contributions | |
ish | -0.108 |
Majesty | -0.095 |
majesty | -0.087 |
cient | -0.086 |
oppy | -0.084 |
Token | is |
Token ID | 318 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
Where | +0.111 |
See | +0.100 |
Oh | +0.100 |
Welcome | +0.097 |
On | +0.096 |
Neg logit contributions | |
ish | -0.131 |
Majesty | -0.113 |
majesty | -0.104 |
ci | -0.103 |
oppy | -0.102 |
Token | that |
Token ID | 326 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
Where | +0.115 |
To | +0.109 |
On | +0.107 |
For | +0.104 |
See | +0.104 |
Neg logit contributions | |
ish | -0.147 |
Majesty | -0.140 |
majesty | -0.124 |
ci | -0.121 |
castle | -0.116 |
Token | her |
Token ID | 607 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.093 |
See | +0.083 |
Oh | +0.082 |
On | +0.080 |
Welcome | +0.080 |
Neg logit contributions | |
ish | -0.152 |
Majesty | -0.139 |
majesty | -0.127 |
ci | -0.124 |
oppy | -0.124 |
Token | mom |
Token ID | 1995 |
Feature activation | -2.25e+01 |
Pos logit contributions | |
Where | +0.097 |
See | +0.089 |
Oh | +0.087 |
On | +0.085 |
Welcome | +0.085 |
Neg logit contributions | |
ish | -0.124 |
Majesty | -0.111 |
ci | -0.101 |
majesty | -0.099 |
cient | -0.098 |
Token | went |
Token ID | 1816 |
Feature activation | -2.40e+01 |
Pos logit contributions | |
Where | +0.094 |
Oh | +0.085 |
See | +0.084 |
Warning | +0.082 |
Welcome | +0.082 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.124 |
ci | -0.119 |
oppy | -0.114 |
cient | -0.114 |
Token | back |
Token ID | 736 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.138 |
See | +0.129 |
Oh | +0.128 |
Welcome | +0.126 |
On | +0.126 |
Neg logit contributions | |
ish | -0.113 |
Majesty | -0.098 |
majesty | -0.086 |
ci | -0.085 |
oppy | -0.083 |
Token | home |
Token ID | 1363 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
Where | +0.104 |
On | +0.097 |
Welcome | +0.092 |
See | +0.092 |
For | +0.091 |
Neg logit contributions | |
ish | -0.128 |
Majesty | -0.124 |
majesty | -0.111 |
cient | -0.104 |
oppy | -0.103 |
Token | . |
Token ID | 13 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
Where | +0.102 |
See | +0.093 |
On | +0.091 |
Oh | +0.091 |
Welcome | +0.089 |
Neg logit contributions | |
ish | -0.137 |
Majesty | -0.123 |
majesty | -0.111 |
ci | -0.110 |
cient | -0.108 |
Token | |
Token ID | 220 |
Feature activation | -2.07e+01 |
Pos logit contributions | |
Warning | +0.124 |
Where | +0.124 |
Time | +0.112 |
See | +0.111 |
Oh | +0.111 |
Neg logit contributions | |
ish | -0.131 |
Majesty | -0.120 |
oppy | -0.115 |
majesty | -0.114 |
cient | -0.110 |
Token |
|
Token ID | 198 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.056 |
Oh | +0.048 |
Warning | +0.047 |
Welcome | +0.046 |
Time | +0.045 |
Neg logit contributions | |
ish | -0.155 |
Majesty | -0.142 |
majesty | -0.135 |
oppy | -0.135 |
cient | -0.132 |
Token |
|
Token ID | 198 |
Feature activation | -2.57e+01 |
Pos logit contributions | |
Where | +0.089 |
Warning | +0.087 |
Oh | +0.081 |
See | +0.078 |
Welcome | +0.076 |
Neg logit contributions | |
ish | -0.146 |
oppy | -0.139 |
Majesty | -0.135 |
majesty | -0.133 |
cient | -0.132 |
Token | L |
Token ID | 43 |
Feature activation | -1.91e+01 |
Pos logit contributions | |
Warning | +0.081 |
Where | +0.072 |
See | +0.072 |
Welcome | +0.068 |
Oh | +0.067 |
Neg logit contributions | |
ish | -0.128 |
oppy | -0.122 |
Majesty | -0.119 |
cient | -0.119 |
iggle | -0.118 |
Token | ily |
Token ID | 813 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
Where | +0.069 |
See | +0.062 |
Oh | +0.061 |
On | +0.059 |
Welcome | +0.059 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.119 |
majesty | -0.110 |
ci | -0.109 |
oppy | -0.108 |
Token | but |
Token ID | 475 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
Where | +0.098 |
See | +0.089 |
Oh | +0.088 |
On | +0.086 |
Welcome | +0.085 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.121 |
majesty | -0.111 |
oppy | -0.109 |
ci | -0.109 |
Token | it |
Token ID | 340 |
Feature activation | -2.34e+01 |
Pos logit contributions | |
Where | +0.106 |
See | +0.100 |
Warning | +0.100 |
Welcome | +0.098 |
On | +0.097 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.122 |
ci | -0.115 |
oppy | -0.112 |
majesty | -0.111 |
Token | did |
Token ID | 750 |
Feature activation | -2.18e+01 |
Pos logit contributions | |
Where | +0.087 |
See | +0.078 |
Oh | +0.076 |
Welcome | +0.076 |
On | +0.075 |
Neg logit contributions | |
ish | -0.158 |
Majesty | -0.141 |
ci | -0.132 |
majesty | -0.130 |
oppy | -0.129 |
Token | not |
Token ID | 407 |
Feature activation | -2.31e+01 |
Pos logit contributions | |
Where | +0.107 |
See | +0.098 |
Oh | +0.097 |
On | +0.096 |
Welcome | +0.095 |
Neg logit contributions | |
ish | -0.122 |
Majesty | -0.109 |
majesty | -0.098 |
ci | -0.098 |
oppy | -0.095 |
Token | help |
Token ID | 1037 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.123 |
See | +0.117 |
Oh | +0.116 |
Wow | +0.112 |
Warning | +0.111 |
Neg logit contributions | |
ish | -0.119 |
Majesty | -0.102 |
majesty | -0.092 |
oppy | -0.090 |
cient | -0.088 |
Token | . |
Token ID | 13 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
See | +0.123 |
Where | +0.121 |
Oh | +0.119 |
Wow | +0.117 |
On | +0.116 |
Neg logit contributions | |
ish | -0.104 |
Majesty | -0.083 |
gy | -0.076 |
oppy | -0.075 |
cient | -0.073 |
Token | Spot |
Token ID | 15899 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
Where | +0.116 |
Warning | +0.105 |
Welcome | +0.104 |
See | +0.101 |
Oh | +0.100 |
Neg logit contributions | |
ish | -0.151 |
Majesty | -0.137 |
majesty | -0.126 |
cient | -0.123 |
oppy | -0.123 |
Token | dragged |
Token ID | 17901 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Where | +0.096 |
See | +0.087 |
Oh | +0.086 |
Welcome | +0.085 |
Warning | +0.084 |
Neg logit contributions | |
ish | -0.156 |
Majesty | -0.140 |
majesty | -0.128 |
ci | -0.128 |
oppy | -0.126 |
Token | Tommy |
Token ID | 19919 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
Where | +0.124 |
See | +0.124 |
On | +0.123 |
Today | +0.120 |
Warning | +0.120 |
Neg logit contributions | |
ish | -0.116 |
Majesty | -0.087 |
gy | -0.086 |
knee | -0.082 |
oppy | -0.079 |
Token | across |
Token ID | 1973 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
Where | +0.118 |
See | +0.109 |
Oh | +0.108 |
Welcome | +0.106 |
On | +0.106 |
Neg logit contributions | |
ish | -0.120 |
Majesty | -0.106 |
majesty | -0.095 |
ci | -0.094 |
oppy | -0.092 |
Token | the |
Token ID | 262 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.118 |
See | +0.112 |
Wow | +0.112 |
Welcome | +0.111 |
Oh | +0.111 |
Neg logit contributions | |
ish | -0.121 |
Majesty | -0.108 |
ci | -0.096 |
oppy | -0.096 |
majesty | -0.094 |
Token | prayer |
Token ID | 11443 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.099 |
See | +0.091 |
Oh | +0.089 |
Warning | +0.088 |
Welcome | +0.088 |
Neg logit contributions | |
ish | -0.121 |
Majesty | -0.108 |
majesty | -0.098 |
ci | -0.096 |
cient | -0.096 |
Token | . |
Token ID | 13 |
Feature activation | -2.39e+01 |
Pos logit contributions | |
Where | +0.108 |
See | +0.099 |
Oh | +0.098 |
On | +0.097 |
Welcome | +0.097 |
Neg logit contributions | |
ish | -0.115 |
Majesty | -0.102 |
majesty | -0.092 |
ci | -0.090 |
oppy | -0.089 |
Token | He |
Token ID | 679 |
Feature activation | -2.21e+01 |
Pos logit contributions | |
Where | +0.098 |
Warning | +0.089 |
Oh | +0.087 |
Time | +0.086 |
Welcome | +0.085 |
Neg logit contributions | |
ish | -0.144 |
Majesty | -0.121 |
cient | -0.117 |
ci | -0.114 |
gy | -0.113 |
Token | said |
Token ID | 531 |
Feature activation | -2.45e+01 |
Pos logit contributions | |
Where | +0.092 |
Oh | +0.084 |
See | +0.083 |
Warning | +0.082 |
Welcome | +0.081 |
Neg logit contributions | |
ish | -0.140 |
Majesty | -0.121 |
ci | -0.116 |
majesty | -0.112 |
oppy | -0.112 |
Token | " |
Token ID | 366 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Where | +0.116 |
See | +0.106 |
On | +0.104 |
Welcome | +0.104 |
To | +0.103 |
Neg logit contributions | |
ish | -0.143 |
Majesty | -0.122 |
ci | -0.119 |
oppy | -0.113 |
majesty | -0.109 |
Token | Dear |
Token ID | 20266 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
Warning | +0.076 |
Where | +0.073 |
See | +0.072 |
Oh | +0.065 |
On | +0.065 |
Neg logit contributions | |
ish | -0.148 |
ci | -0.133 |
atmeal | -0.124 |
Majesty | -0.123 |
cient | -0.120 |
Token | God |
Token ID | 1793 |
Feature activation | -1.99e+01 |
Pos logit contributions | |
Where | +0.135 |
See | +0.127 |
Oh | +0.124 |
On | +0.122 |
Warning | +0.121 |
Neg logit contributions | |
ish | -0.139 |
Majesty | -0.126 |
majesty | -0.113 |
ci | -0.108 |
cient | -0.108 |
Token | , |
Token ID | 11 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
Where | +0.099 |
Welcome | +0.092 |
For | +0.088 |
See | +0.088 |
On | +0.088 |
Neg logit contributions | |
ish | -0.103 |
Majesty | -0.093 |
ci | -0.086 |
majesty | -0.082 |
oppy | -0.081 |
Token | please |
Token ID | 3387 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
Where | +0.118 |
See | +0.108 |
Oh | +0.107 |
Welcome | +0.106 |
On | +0.106 |
Neg logit contributions | |
ish | -0.123 |
Majesty | -0.109 |
majesty | -0.098 |
ci | -0.097 |
oppy | -0.095 |
Token | make |
Token ID | 787 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
Where | +0.104 |
See | +0.095 |
To | +0.095 |
On | +0.095 |
Welcome | +0.092 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.115 |
ci | -0.108 |
ishes | -0.104 |
oppy | -0.103 |
Token | my |
Token ID | 616 |
Feature activation | -2.20e+01 |
Pos logit contributions | |
Where | +0.089 |
See | +0.079 |
To | +0.076 |
Time | +0.076 |
On | +0.076 |
Neg logit contributions | |
ish | -0.153 |
ci | -0.133 |
Majesty | -0.130 |
mit | -0.126 |
majesty | -0.125 |
Token | elephant |
Token ID | 20950 |
Feature activation | -1.73e+01 |
Pos logit contributions | |
Where | +0.140 |
On | +0.133 |
Time | +0.130 |
See | +0.130 |
Warning | +0.130 |
Neg logit contributions | |
ish | -0.078 |
Majesty | -0.067 |
majesty | -0.057 |
cient | -0.052 |
ci | -0.048 |
Token | again |
Token ID | 757 |
Feature activation | -2.11e+01 |
Pos logit contributions | |
Where | +0.056 |
On | +0.054 |
He | +0.052 |
For | +0.052 |
See | +0.051 |
Neg logit contributions | |
ish | -0.109 |
Majesty | -0.108 |
majesty | -0.100 |
cient | -0.098 |
oppy | -0.097 |
Token | and |
Token ID | 290 |
Feature activation | -2.29e+01 |
Pos logit contributions | |
Where | +0.089 |
On | +0.082 |
See | +0.080 |
Oh | +0.079 |
To | +0.077 |
Neg logit contributions | |
ish | -0.131 |
Majesty | -0.120 |
majesty | -0.110 |
cient | -0.106 |
oppy | -0.105 |
Token | kissed |
Token ID | 27946 |
Feature activation | -2.30e+01 |
Pos logit contributions | |
Where | +0.076 |
See | +0.070 |
Oh | +0.065 |
Welcome | +0.064 |
On | +0.063 |
Neg logit contributions | |
ish | -0.164 |
Majesty | -0.150 |
majesty | -0.138 |
cient | -0.138 |
oppy | -0.138 |
Token | it |
Token ID | 340 |
Feature activation | -2.24e+01 |
Pos logit contributions | |
Where | +0.101 |
See | +0.092 |
On | +0.092 |
Oh | +0.091 |
Warning | +0.091 |
Neg logit contributions | |
ish | -0.136 |
Majesty | -0.120 |
ci | -0.111 |
majesty | -0.108 |
cient | -0.107 |
Token | . |
Token ID | 13 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
Where | +0.103 |
Oh | +0.094 |
See | +0.094 |
Warning | +0.093 |
Welcome | +0.091 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.116 |
ci | -0.106 |
majesty | -0.105 |
oppy | -0.103 |
Token | She |
Token ID | 1375 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
Where | +0.106 |
Warning | +0.093 |
On | +0.091 |
Oh | +0.091 |
Time | +0.088 |
Neg logit contributions | |
ish | -0.166 |
Majesty | -0.157 |
majesty | -0.146 |
cient | -0.138 |
ci | -0.137 |
Token | said |
Token ID | 531 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.077 |
See | +0.072 |
On | +0.068 |
Oh | +0.067 |
That | +0.064 |
Neg logit contributions | |
ish | -0.172 |
Majesty | -0.159 |
majesty | -0.146 |
cient | -0.145 |
oppy | -0.142 |
Token | thank |
Token ID | 5875 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.103 |
Welcome | +0.098 |
That | +0.094 |
Listen | +0.093 |
Neg logit contributions | |
ish | -0.167 |
ci | -0.144 |
Majesty | -0.143 |
oppy | -0.136 |
ishes | -0.132 |
Token | you |
Token ID | 345 |
Feature activation | -2.28e+01 |
Pos logit contributions | |
Where | +0.131 |
See | +0.120 |
Oh | +0.119 |
Welcome | +0.117 |
On | +0.117 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.118 |
majesty | -0.106 |
ci | -0.101 |
oppy | -0.100 |
Token | and |
Token ID | 290 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
Where | +0.088 |
On | +0.081 |
For | +0.080 |
To | +0.080 |
Welcome | +0.080 |
Neg logit contributions | |
ish | -0.146 |
Majesty | -0.133 |
majesty | -0.122 |
cient | -0.118 |
ishes | -0.118 |
Token | learned |
Token ID | 4499 |
Feature activation | -2.41e+01 |
Pos logit contributions | |
Where | +0.098 |
Oh | +0.086 |
Time | +0.084 |
Welcome | +0.084 |
Warning | +0.080 |
Neg logit contributions | |
ish | -0.150 |
Majesty | -0.131 |
ci | -0.122 |
majesty | -0.121 |
oppy | -0.121 |
Token | that |
Token ID | 326 |
Feature activation | -2.58e+01 |
Pos logit contributions | |
Where | +0.126 |
See | +0.116 |
Oh | +0.115 |
On | +0.115 |
Welcome | +0.112 |
Neg logit contributions | |
ish | -0.129 |
Majesty | -0.114 |
majesty | -0.102 |
ci | -0.100 |
oppy | -0.099 |
Token | courage |
Token ID | 11917 |
Feature activation | -2.35e+01 |
Pos logit contributions | |
Where | +0.133 |
See | +0.123 |
Oh | +0.122 |
On | +0.120 |
Welcome | +0.119 |
Neg logit contributions | |
ish | -0.135 |
Majesty | -0.118 |
ci | -0.107 |
majesty | -0.105 |
oppy | -0.103 |
Token | is |
Token ID | 318 |
Feature activation | -2.36e+01 |
Pos logit contributions | |
Where | +0.105 |
See | +0.095 |
Oh | +0.094 |
On | +0.092 |
Welcome | +0.092 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.126 |
majesty | -0.115 |
ci | -0.114 |
oppy | -0.112 |
Token | important |
Token ID | 1593 |
Feature activation | -2.13e+01 |
Pos logit contributions | |
Where | +0.110 |
Oh | +0.107 |
Wow | +0.105 |
Warning | +0.104 |
See | +0.103 |
Neg logit contributions | |
ish | -0.129 |
Majesty | -0.114 |
majesty | -0.103 |
ci | -0.100 |
cient | -0.098 |
Token | . |
Token ID | 13 |
Feature activation | -2.65e+01 |
Pos logit contributions | |
Where | +0.089 |
See | +0.081 |
Oh | +0.080 |
On | +0.079 |
Welcome | +0.078 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.120 |
majesty | -0.110 |
ci | -0.109 |
oppy | -0.107 |
Token | They |
Token ID | 1119 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
Where | +0.096 |
On | +0.085 |
Oh | +0.079 |
Welcome | +0.078 |
Time | +0.078 |
Neg logit contributions | |
ish | -0.167 |
Majesty | -0.154 |
oppy | -0.149 |
majesty | -0.146 |
ci | -0.136 |
Token | learned |
Token ID | 4499 |
Feature activation | -2.55e+01 |
Pos logit contributions | |
Where | +0.102 |
Oh | +0.090 |
Time | +0.087 |
Welcome | +0.087 |
See | +0.084 |
Neg logit contributions | |
ish | -0.160 |
Majesty | -0.140 |
ci | -0.130 |
majesty | -0.130 |
oppy | -0.129 |
Token | that |
Token ID | 326 |
Feature activation | -2.71e+01 |
Pos logit contributions | |
Where | +0.135 |
See | +0.124 |
Oh | +0.123 |
On | +0.122 |
Welcome | +0.120 |
Neg logit contributions | |
ish | -0.134 |
Majesty | -0.119 |
majesty | -0.106 |
ci | -0.105 |
oppy | -0.103 |
Token | soccer |
Token ID | 11783 |
Feature activation | -2.27e+01 |
Pos logit contributions | |
Where | +0.136 |
See | +0.125 |
Oh | +0.125 |
On | +0.122 |
Welcome | +0.121 |
Neg logit contributions | |
ish | -0.145 |
Majesty | -0.128 |
ci | -0.116 |
majesty | -0.114 |
oppy | -0.112 |
Token | is |
Token ID | 318 |
Feature activation | -2.43e+01 |
Pos logit contributions | |
Where | +0.090 |
See | +0.082 |
Oh | +0.080 |
On | +0.079 |
Welcome | +0.078 |
Neg logit contributions | |
ish | -0.145 |
Majesty | -0.134 |
majesty | -0.122 |
ci | -0.120 |
oppy | -0.118 |
Token | . |
Token ID | 13 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
Where | +0.074 |
See | +0.066 |
Oh | +0.064 |
On | +0.064 |
Welcome | +0.063 |
Neg logit contributions | |
ish | -0.135 |
Majesty | -0.124 |
majesty | -0.114 |
ci | -0.112 |
oppy | -0.111 |
Token |
|
Token ID | 198 |
Feature activation | -2.49e+01 |
Pos logit contributions | |
Where | +0.092 |
See | +0.081 |
Oh | +0.080 |
Welcome | +0.079 |
On | +0.078 |
Neg logit contributions | |
ish | -0.173 |
Majesty | -0.157 |
majesty | -0.145 |
oppy | -0.143 |
ci | -0.143 |
Token |
|
Token ID | 198 |
Feature activation | -2.42e+01 |
Pos logit contributions | |
Where | +0.090 |
Warning | +0.088 |
Oh | +0.087 |
See | +0.079 |
Wow | +0.079 |
Neg logit contributions | |
ish | -0.123 |
oppy | -0.120 |
ap | -0.108 |
Majesty | -0.108 |
majesty | -0.107 |
Token | " |
Token ID | 1 |
Feature activation | -2.59e+01 |
Pos logit contributions | |
Where | +0.097 |
See | +0.090 |
Warning | +0.090 |
Oh | +0.089 |
Welcome | +0.084 |
Neg logit contributions | |
ish | -0.141 |
Majesty | -0.124 |
oppy | -0.119 |
majesty | -0.115 |
ci | -0.113 |
Token | Can |
Token ID | 6090 |
Feature activation | -2.46e+01 |
Pos logit contributions | |
security | +0.062 |
Warning | +0.056 |
generations | +0.055 |
On | +0.054 |
lessly | +0.052 |
Neg logit contributions | |
ish | -0.151 |
cuc | -0.132 |
atmeal | -0.129 |
Majesty | -0.129 |
ci | -0.128 |
Token | I |
Token ID | 314 |
Feature activation | -2.64e+01 |
Pos logit contributions | |
Where | +0.100 |
Do | +0.087 |
Oh | +0.087 |
There | +0.086 |
What | +0.085 |
Neg logit contributions | |
ish | -0.165 |
Majesty | -0.152 |
majesty | -0.138 |
ci | -0.134 |
ishes | -0.132 |
Token | see |
Token ID | 766 |
Feature activation | -2.37e+01 |
Pos logit contributions | |
Where | +0.116 |
On | +0.106 |
See | +0.105 |
Welcome | +0.102 |
Oh | +0.101 |
Neg logit contributions | |
ish | -0.157 |
Majesty | -0.149 |
majesty | -0.133 |
ci | -0.132 |
cient | -0.129 |
Token | it |
Token ID | 340 |
Feature activation | -2.26e+01 |
Pos logit contributions | |
Where | +0.087 |
See | +0.074 |
What | +0.073 |
Oh | +0.072 |
Welcome | +0.071 |
Neg logit contributions | |
ish | -0.159 |
Majesty | -0.151 |
majesty | -0.141 |
ci | -0.139 |
oppy | -0.137 |
Token | ?" |
Token ID | 1701 |
Feature activation | -2.54e+01 |
Pos logit contributions | |
Where | +0.111 |
On | +0.109 |
What | +0.101 |
One | +0.101 |
Do | +0.101 |
Neg logit contributions | |
Majesty | -0.118 |
ish | -0.116 |
majesty | -0.109 |
ci | -0.096 |
cient | -0.094 |
Token | Ben |
Token ID | 3932 |
Feature activation | -2.09e+01 |
Pos logit contributions | |
Where | +0.113 |
Warning | +0.104 |
See | +0.104 |
Welcome | +0.102 |
Oh | +0.102 |
Neg logit contributions | |
ish | -0.143 |
Majesty | -0.126 |
oppy | -0.120 |
majesty | -0.116 |
ci | -0.112 |
Token | asks |
Token ID | 7893 |
Feature activation | -2.47e+01 |
Pos logit contributions | |
Where | +0.089 |
See | +0.082 |
Oh | +0.081 |
Welcome | +0.079 |
On | +0.078 |
Neg logit contributions | |
ish | -0.130 |
Majesty | -0.115 |
ci | -0.105 |
majesty | -0.104 |
oppy | -0.102 |
Token | that |
Token ID | 326 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
ish | +0.208 |
Majesty | +0.187 |
oppy | +0.176 |
cient | +0.174 |
majesty | +0.173 |
Neg logit contributions | |
Where | -0.122 |
On | -0.107 |
See | -0.107 |
Welcome | -0.106 |
Oh | -0.104 |
Token | the |
Token ID | 262 |
Feature activation | +3.05e+01 |
Pos logit contributions | |
ish | +0.173 |
Majesty | +0.157 |
majesty | +0.144 |
ci | +0.142 |
oppy | +0.140 |
Neg logit contributions | |
Where | -0.105 |
See | -0.094 |
Oh | -0.093 |
Welcome | -0.091 |
On | -0.091 |
Token | bad |
Token ID | 2089 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
ish | +0.178 |
Majesty | +0.157 |
majesty | +0.143 |
ci | +0.143 |
oppy | +0.142 |
Neg logit contributions | |
Where | -0.141 |
Oh | -0.128 |
See | -0.128 |
Welcome | -0.125 |
On | -0.122 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.95e+01 |
Pos logit contributions | |
ish | +0.206 |
Majesty | +0.182 |
cient | +0.173 |
oppy | +0.170 |
majesty | +0.168 |
Neg logit contributions | |
Where | -0.128 |
Welcome | -0.118 |
See | -0.117 |
Oh | -0.116 |
Time | -0.116 |
Token | in |
Token ID | 259 |
Feature activation | +3.95e+01 |
Pos logit contributions | |
ish | +0.225 |
Majesty | +0.206 |
majesty | +0.180 |
ci | +0.175 |
oppy | +0.170 |
Neg logit contributions | |
Where | -0.286 |
See | -0.266 |
Oh | -0.263 |
Welcome | -0.260 |
On | -0.257 |
Token | oc |
Token ID | 420 |
Feature activation | +6.44e+01 |
Pos logit contributions | |
ish | +0.210 |
Majesty | +0.187 |
majesty | +0.168 |
ci | +0.165 |
oppy | +0.163 |
Neg logit contributions | |
Where | -0.202 |
See | -0.186 |
Oh | -0.184 |
On | -0.181 |
Welcome | -0.181 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.60e+01 |
Pos logit contributions | |
oppy | +0.238 |
ish | +0.234 |
Majesty | +0.219 |
opsy | +0.205 |
majesty | +0.202 |
Neg logit contributions | |
Where | -0.344 |
See | -0.332 |
Warning | -0.327 |
Oh | -0.322 |
Welcome | -0.311 |
Token | was |
Token ID | 373 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
ish | +0.264 |
Majesty | +0.245 |
majesty | +0.228 |
oppy | +0.223 |
ci | +0.223 |
Neg logit contributions | |
Where | -0.109 |
See | -0.095 |
Oh | -0.091 |
On | -0.090 |
Welcome | -0.090 |
Token | now |
Token ID | 783 |
Feature activation | +2.74e+01 |
Pos logit contributions | |
ish | +0.170 |
Majesty | +0.152 |
majesty | +0.140 |
oppy | +0.139 |
ci | +0.138 |
Neg logit contributions | |
Where | -0.113 |
See | -0.103 |
On | -0.098 |
Welcome | -0.098 |
Oh | -0.097 |
Token | nice |
Token ID | 3621 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.154 |
majesty | +0.142 |
oppy | +0.140 |
cient | +0.140 |
Neg logit contributions | |
Where | -0.117 |
See | -0.108 |
On | -0.103 |
Oh | -0.102 |
Welcome | -0.102 |
Token | . |
Token ID | 13 |
Feature activation | +1.94e+01 |
Pos logit contributions | |
ish | +0.162 |
Majesty | +0.151 |
majesty | +0.137 |
oppy | +0.136 |
cient | +0.136 |
Neg logit contributions | |
Where | -0.112 |
See | -0.100 |
Welcome | -0.099 |
Oh | -0.097 |
On | -0.096 |
Token | it |
Token ID | 340 |
Feature activation | +2.90e+01 |
Pos logit contributions | |
ish | +0.199 |
Majesty | +0.188 |
majesty | +0.172 |
castle | +0.169 |
cient | +0.168 |
Neg logit contributions | |
Where | -0.103 |
See | -0.094 |
Oh | -0.089 |
Welcome | -0.086 |
What | -0.084 |
Token | to |
Token ID | 284 |
Feature activation | +2.17e+01 |
Pos logit contributions | |
ish | +0.179 |
Majesty | +0.168 |
majesty | +0.152 |
cient | +0.150 |
ci | +0.150 |
Neg logit contributions | |
Where | -0.114 |
Welcome | -0.103 |
See | -0.102 |
To | -0.101 |
On | -0.101 |
Token | the |
Token ID | 262 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
ish | +0.150 |
Majesty | +0.130 |
ci | +0.122 |
majesty | +0.119 |
oppy | +0.118 |
Neg logit contributions | |
Where | -0.081 |
See | -0.073 |
Oh | -0.070 |
Welcome | -0.069 |
What | -0.068 |
Token | rh |
Token ID | 9529 |
Feature activation | +4.64e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.139 |
ci | +0.131 |
oppy | +0.130 |
majesty | +0.127 |
Neg logit contributions | |
Where | -0.137 |
Oh | -0.124 |
See | -0.122 |
Welcome | -0.120 |
On | -0.118 |
Token | in |
Token ID | 259 |
Feature activation | +3.66e+01 |
Pos logit contributions | |
ish | +0.217 |
Majesty | +0.205 |
majesty | +0.181 |
ci | +0.175 |
oppy | +0.167 |
Neg logit contributions | |
Where | -0.256 |
See | -0.236 |
Oh | -0.234 |
On | -0.230 |
He | -0.230 |
Token | oc |
Token ID | 420 |
Feature activation | +6.39e+01 |
Pos logit contributions | |
ish | +0.200 |
Majesty | +0.184 |
majesty | +0.168 |
oppy | +0.161 |
ci | +0.160 |
Neg logit contributions | |
Where | -0.169 |
On | -0.156 |
To | -0.152 |
For | -0.151 |
Oh | -0.151 |
Token | eros |
Token ID | 27498 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
oppy | +0.247 |
ish | +0.236 |
Majesty | +0.224 |
adow | +0.216 |
iggle | +0.215 |
Neg logit contributions | |
Where | -0.323 |
Warning | -0.312 |
See | -0.305 |
Sir | -0.300 |
Oh | -0.299 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e+01 |
Pos logit contributions | |
ish | +0.237 |
Majesty | +0.220 |
majesty | +0.204 |
oppy | +0.198 |
ci | +0.198 |
Neg logit contributions | |
Where | -0.118 |
On | -0.105 |
To | -0.101 |
See | -0.101 |
For | -0.101 |
Token | When |
Token ID | 1649 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
ish | +0.130 |
Majesty | +0.121 |
majesty | +0.112 |
cient | +0.109 |
oppy | +0.109 |
Neg logit contributions | |
Where | -0.074 |
Oh | -0.065 |
See | -0.064 |
Warning | -0.063 |
Time | -0.063 |
Token | he |
Token ID | 339 |
Feature activation | +2.50e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.135 |
majesty | +0.124 |
ci | +0.123 |
oppy | +0.121 |
Neg logit contributions | |
Where | -0.085 |
See | -0.077 |
Oh | -0.075 |
Welcome | -0.074 |
On | -0.074 |
Token | tasted |
Token ID | 29187 |
Feature activation | +2.40e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.158 |
majesty | +0.145 |
ci | +0.144 |
cient | +0.140 |
Neg logit contributions | |
Where | -0.091 |
See | -0.081 |
On | -0.079 |
Oh | -0.079 |
Welcome | -0.078 |
Token | his |
Token ID | 465 |
Feature activation | +4.47e+01 |
Pos logit contributions | |
Where | +0.076 |
See | +0.069 |
Oh | +0.068 |
Welcome | +0.067 |
What | +0.067 |
Neg logit contributions | |
ish | -0.072 |
Majesty | -0.068 |
majesty | -0.062 |
ci | -0.061 |
castle | -0.061 |
Token | head |
Token ID | 1182 |
Feature activation | +4.36e+01 |
Pos logit contributions | |
ish | +0.242 |
Majesty | +0.208 |
cient | +0.194 |
ci | +0.192 |
oppy | +0.190 |
Neg logit contributions | |
Where | -0.209 |
On | -0.190 |
Oh | -0.185 |
See | -0.184 |
He | -0.182 |
Token | out |
Token ID | 503 |
Feature activation | +4.00e+01 |
Pos logit contributions | |
ish | +0.285 |
Majesty | +0.265 |
majesty | +0.244 |
oppy | +0.240 |
cient | +0.234 |
Neg logit contributions | |
Where | -0.165 |
On | -0.148 |
See | -0.145 |
Welcome | -0.140 |
Oh | -0.139 |
Token | of |
Token ID | 286 |
Feature activation | +3.58e+01 |
Pos logit contributions | |
ish | +0.259 |
Majesty | +0.234 |
majesty | +0.214 |
ci | +0.214 |
oppy | +0.210 |
Neg logit contributions | |
Where | -0.159 |
See | -0.143 |
Oh | -0.141 |
On | -0.140 |
Welcome | -0.138 |
Token | his |
Token ID | 465 |
Feature activation | +4.01e+01 |
Pos logit contributions | |
ish | +0.243 |
Majesty | +0.218 |
ci | +0.201 |
majesty | +0.200 |
cient | +0.200 |
Neg logit contributions | |
Where | -0.139 |
See | -0.124 |
Oh | -0.121 |
On | -0.119 |
Welcome | -0.117 |
Token | bur |
Token ID | 4356 |
Feature activation | +6.29e+01 |
Pos logit contributions | |
ish | +0.213 |
Majesty | +0.190 |
cient | +0.180 |
pp | +0.177 |
majesty | +0.168 |
Neg logit contributions | |
Where | -0.182 |
On | -0.167 |
Oh | -0.163 |
See | -0.160 |
He | -0.156 |
Token | row |
Token ID | 808 |
Feature activation | +4.65e+01 |
Pos logit contributions | |
Majesty | +0.332 |
ish | +0.309 |
majesty | +0.297 |
cient | +0.296 |
oppy | +0.278 |
Neg logit contributions | |
Where | -0.263 |
He | -0.254 |
On | -0.247 |
To | -0.230 |
One | -0.229 |
Token | and |
Token ID | 290 |
Feature activation | +2.72e+01 |
Pos logit contributions | |
ish | +0.326 |
Majesty | +0.314 |
majesty | +0.291 |
oppy | +0.284 |
cient | +0.277 |
Neg logit contributions | |
Where | -0.139 |
On | -0.132 |
He | -0.131 |
To | -0.119 |
For | -0.117 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.59e+01 |
Pos logit contributions | |
ish | +0.191 |
Majesty | +0.168 |
cient | +0.157 |
oppy | +0.157 |
majesty | +0.155 |
Neg logit contributions | |
Where | -0.099 |
See | -0.086 |
On | -0.084 |
Oh | -0.081 |
Welcome | -0.079 |
Token | something |
Token ID | 1223 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.155 |
majesty | +0.143 |
ci | +0.142 |
oppy | +0.141 |
Neg logit contributions | |
Where | -0.103 |
See | -0.092 |
Oh | -0.089 |
On | -0.086 |
Welcome | -0.086 |
Token | new |
Token ID | 649 |
Feature activation | +2.84e+01 |
Pos logit contributions | |
ish | +0.149 |
Majesty | +0.128 |
ci | +0.119 |
majesty | +0.116 |
oppy | +0.115 |
Neg logit contributions | |
Where | -0.114 |
See | -0.107 |
Warning | -0.104 |
Oh | -0.104 |
Welcome | -0.102 |
Token | he |
Token ID | 339 |
Feature activation | +3.36e+01 |
Pos logit contributions | |
ish | +0.312 |
Majesty | +0.280 |
majesty | +0.259 |
ci | +0.252 |
cient | +0.252 |
Neg logit contributions | |
Where | -0.159 |
On | -0.139 |
Oh | -0.139 |
Welcome | -0.138 |
See | -0.138 |
Token | would |
Token ID | 561 |
Feature activation | +2.93e+01 |
Pos logit contributions | |
ish | +0.234 |
Majesty | +0.213 |
majesty | +0.198 |
ci | +0.196 |
oppy | +0.195 |
Neg logit contributions | |
Where | -0.112 |
On | -0.099 |
See | -0.099 |
Welcome | -0.095 |
Oh | -0.094 |
Token | take |
Token ID | 1011 |
Feature activation | +3.13e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.161 |
oppy | +0.153 |
ishes | +0.150 |
ci | +0.149 |
Neg logit contributions | |
Where | -0.112 |
On | -0.112 |
He | -0.106 |
One | -0.106 |
See | -0.104 |
Token | the |
Token ID | 262 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.188 |
majesty | +0.174 |
ci | +0.172 |
cient | +0.171 |
Neg logit contributions | |
Where | -0.120 |
See | -0.109 |
Welcome | -0.105 |
Oh | -0.104 |
On | -0.102 |
Token | av |
Token ID | 1196 |
Feature activation | +6.23e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.164 |
majesty | +0.149 |
oppy | +0.147 |
ci | +0.143 |
Neg logit contributions | |
Where | -0.167 |
Oh | -0.155 |
Welcome | -0.153 |
See | -0.152 |
On | -0.149 |
Token | oc |
Token ID | 420 |
Feature activation | +7.20e+01 |
Pos logit contributions | |
Majesty | +0.359 |
majesty | +0.342 |
ish | +0.330 |
knee | +0.316 |
oppy | +0.306 |
Neg logit contributions | |
Where | -0.254 |
On | -0.248 |
One | -0.246 |
See | -0.239 |
To | -0.237 |
Token | ados |
Token ID | 22484 |
Feature activation | +4.14e+01 |
Pos logit contributions | |
oppy | +0.263 |
ish | +0.240 |
iggle | +0.229 |
Majesty | +0.228 |
majesty | +0.226 |
Neg logit contributions | |
Where | -0.371 |
Warning | -0.361 |
See | -0.360 |
Sir | -0.356 |
Oh | -0.343 |
Token | and |
Token ID | 290 |
Feature activation | +2.62e+01 |
Pos logit contributions | |
Majesty | +0.262 |
ish | +0.256 |
majesty | +0.243 |
oppy | +0.218 |
ci | +0.210 |
Neg logit contributions | |
Where | -0.163 |
On | -0.159 |
To | -0.150 |
For | -0.144 |
He | -0.144 |
Token | scatter |
Token ID | 41058 |
Feature activation | +3.21e+01 |
Pos logit contributions | |
ish | +0.157 |
Majesty | +0.139 |
oppy | +0.132 |
majesty | +0.127 |
ci | +0.127 |
Neg logit contributions | |
Where | -0.118 |
See | -0.107 |
On | -0.104 |
Welcome | -0.101 |
What | -0.100 |
Token | them |
Token ID | 606 |
Feature activation | +3.18e+01 |
Pos logit contributions | |
ish | +0.209 |
Majesty | +0.196 |
majesty | +0.180 |
ci | +0.178 |
oppy | +0.176 |
Neg logit contributions | |
Where | -0.125 |
See | -0.113 |
Oh | -0.110 |
Welcome | -0.109 |
On | -0.107 |
Token | around |
Token ID | 1088 |
Feature activation | +2.89e+01 |
Pos logit contributions | |
ish | +0.195 |
Majesty | +0.186 |
majesty | +0.172 |
oppy | +0.164 |
cient | +0.163 |
Neg logit contributions | |
Where | -0.125 |
On | -0.118 |
See | -0.110 |
Welcome | -0.108 |
To | -0.107 |
Token | you |
Token ID | 345 |
Feature activation | +3.56e+01 |
Pos logit contributions | |
Where | +0.093 |
See | +0.088 |
On | +0.086 |
Welcome | +0.085 |
Warning | +0.085 |
Neg logit contributions | |
ish | -0.123 |
Majesty | -0.109 |
majesty | -0.100 |
ci | -0.099 |
oppy | -0.098 |
Token | go |
Token ID | 467 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
ish | +0.221 |
Majesty | +0.194 |
ci | +0.185 |
majesty | +0.175 |
oppy | +0.174 |
Neg logit contributions | |
Where | -0.143 |
See | -0.132 |
Welcome | -0.132 |
On | -0.130 |
To | -0.128 |
Token | , |
Token ID | 11 |
Feature activation | +2.57e+01 |
Pos logit contributions | |
ish | +0.195 |
Majesty | +0.176 |
majesty | +0.165 |
cient | +0.159 |
oppy | +0.158 |
Neg logit contributions | |
Where | -0.146 |
On | -0.135 |
Welcome | -0.127 |
One | -0.127 |
Do | -0.127 |
Token | my |
Token ID | 616 |
Feature activation | +3.15e+01 |
Pos logit contributions | |
ish | +0.165 |
Majesty | +0.140 |
ci | +0.137 |
cient | +0.134 |
ishes | +0.133 |
Neg logit contributions | |
Where | -0.106 |
On | -0.095 |
What | -0.093 |
Do | -0.092 |
He | -0.091 |
Token | d |
Token ID | 288 |
Feature activation | +4.18e+01 |
Pos logit contributions | |
ish | +0.162 |
ci | +0.135 |
Majesty | +0.132 |
cient | +0.131 |
pp | +0.128 |
Neg logit contributions | |
Where | -0.151 |
Oh | -0.140 |
See | -0.138 |
On | -0.133 |
Welcome | -0.133 |
Token | arl |
Token ID | 7063 |
Feature activation | +6.29e+01 |
Pos logit contributions | |
ish | +0.218 |
ci | +0.216 |
Majesty | +0.212 |
cient | +0.190 |
gy | +0.185 |
Neg logit contributions | |
Where | -0.175 |
He | -0.168 |
To | -0.167 |
Welcome | -0.164 |
For | -0.164 |
Token | ings |
Token ID | 654 |
Feature activation | +3.34e+01 |
Pos logit contributions | |
ish | +0.317 |
ci | +0.290 |
Majesty | +0.289 |
cient | +0.266 |
oppy | +0.254 |
Neg logit contributions | |
He | -0.273 |
To | -0.269 |
See | -0.267 |
On | -0.262 |
For | -0.257 |
Token | . |
Token ID | 13 |
Feature activation | +2.53e+01 |
Pos logit contributions | |
ish | +0.188 |
Majesty | +0.171 |
majesty | +0.153 |
ci | +0.150 |
oppy | +0.150 |
Neg logit contributions | |
Where | -0.161 |
See | -0.147 |
Oh | -0.146 |
Welcome | -0.145 |
On | -0.145 |
Token | Enjoy |
Token ID | 18179 |
Feature activation | +2.97e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.145 |
majesty | +0.133 |
ci | +0.132 |
oppy | +0.130 |
Neg logit contributions | |
Where | -0.104 |
See | -0.094 |
Oh | -0.093 |
On | -0.091 |
Welcome | -0.091 |
Token | your |
Token ID | 534 |
Feature activation | +3.16e+01 |
Pos logit contributions | |
ish | +0.182 |
ci | +0.163 |
gy | +0.156 |
Majesty | +0.156 |
cient | +0.155 |
Neg logit contributions | |
Where | -0.117 |
What | -0.107 |
For | -0.106 |
To | -0.104 |
On | -0.103 |
Token | lunch |
Token ID | 9965 |
Feature activation | +3.74e+01 |
Pos logit contributions | |
ish | +0.175 |
Majesty | +0.148 |
ci | +0.145 |
cient | +0.143 |
pp | +0.139 |
Neg logit contributions | |
Where | -0.137 |
See | -0.128 |
Welcome | -0.127 |
Oh | -0.123 |
On | -0.122 |
Token | 's |
Token ID | 338 |
Feature activation | +2.33e+01 |
Pos logit contributions | |
ish | +0.146 |
Majesty | +0.141 |
majesty | +0.129 |
oppy | +0.127 |
castle | +0.125 |
Neg logit contributions | |
Where | -0.080 |
See | -0.077 |
Welcome | -0.073 |
Oh | -0.072 |
That | -0.071 |
Token | too |
Token ID | 1165 |
Feature activation | +2.64e+01 |
Pos logit contributions | |
ish | +0.141 |
Majesty | +0.127 |
majesty | +0.116 |
ci | +0.115 |
oppy | +0.113 |
Neg logit contributions | |
Where | -0.103 |
See | -0.093 |
Oh | -0.092 |
On | -0.091 |
Welcome | -0.090 |
Token | big |
Token ID | 1263 |
Feature activation | +2.65e+01 |
Pos logit contributions | |
ish | +0.163 |
Majesty | +0.145 |
majesty | +0.133 |
ci | +0.133 |
oppy | +0.131 |
Neg logit contributions | |
Where | -0.114 |
See | -0.103 |
Oh | -0.101 |
Welcome | -0.099 |
Warning | -0.098 |
Token | for |
Token ID | 329 |
Feature activation | +2.20e+01 |
Pos logit contributions | |
ish | +0.161 |
Majesty | +0.150 |
oppy | +0.141 |
majesty | +0.138 |
ci | +0.136 |
Neg logit contributions | |
Where | -0.109 |
Welcome | -0.099 |
On | -0.097 |
See | -0.096 |
Do | -0.095 |
Token | your |
Token ID | 534 |
Feature activation | +2.69e+01 |
Pos logit contributions | |
ish | +0.117 |
Majesty | +0.103 |
majesty | +0.092 |
ci | +0.092 |
oppy | +0.089 |
Neg logit contributions | |
Where | -0.114 |
See | -0.105 |
Oh | -0.104 |
On | -0.102 |
Welcome | -0.102 |
Token | bag |
Token ID | 6131 |
Feature activation | +3.27e+01 |
Pos logit contributions | |
ish | +0.144 |
Majesty | +0.122 |
ci | +0.115 |
cient | +0.115 |
pp | +0.114 |
Neg logit contributions | |
Where | -0.132 |
On | -0.117 |
Oh | -0.116 |
See | -0.114 |
Welcome | -0.114 |
Token | ." |
Token ID | 526 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
ish | +0.192 |
Majesty | +0.188 |
majesty | +0.168 |
oppy | +0.157 |
ci | +0.152 |
Neg logit contributions | |
Where | -0.136 |
On | -0.132 |
He | -0.126 |
To | -0.125 |
For | -0.124 |
Token |
|
Token ID | 198 |
Feature activation | +1.51e+01 |
Pos logit contributions | |
ish | +0.126 |
Majesty | +0.117 |
majesty | +0.109 |
ci | +0.108 |
oppy | +0.107 |
Neg logit contributions | |
Where | -0.047 |
See | -0.040 |
Oh | -0.039 |
Welcome | -0.038 |
On | -0.038 |
Token |
|
Token ID | 198 |
Feature activation | +1.52e+01 |
Pos logit contributions | |
ish | +0.101 |
Majesty | +0.094 |
oppy | +0.093 |
majesty | +0.089 |
cient | +0.088 |
Neg logit contributions | |
Where | -0.046 |
Oh | -0.039 |
Warning | -0.039 |
See | -0.039 |
Welcome | -0.039 |
Token | Ben |
Token ID | 11696 |
Feature activation | +1.98e+01 |
Pos logit contributions | |
ish | +0.103 |
Majesty | +0.098 |
oppy | +0.093 |
majesty | +0.091 |
ci | +0.090 |
Neg logit contributions | |
Where | -0.043 |
See | -0.038 |
Welcome | -0.037 |
Oh | -0.037 |
Warning | -0.036 |
Token | looked |
Token ID | 3114 |
Feature activation | +1.84e+01 |
Pos logit contributions | |
ish | +0.137 |
Majesty | +0.129 |
majesty | +0.119 |
oppy | +0.115 |
cient | +0.114 |
Neg logit contributions | |
Where | -0.066 |
On | -0.062 |
See | -0.060 |
That | -0.057 |
Oh | -0.057 |
Token | day |
Token ID | 1110 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
Where | +0.087 |
See | +0.077 |
Oh | +0.075 |
On | +0.074 |
Welcome | +0.074 |
Neg logit contributions | |
ish | -0.132 |
Majesty | -0.119 |
majesty | -0.110 |
ci | -0.109 |
cient | -0.107 |
Token | cleaning |
Token ID | 12724 |
Feature activation | +3.96e+01 |
Pos logit contributions | |
ish | +0.224 |
Majesty | +0.199 |
cient | +0.181 |
ci | +0.179 |
majesty | +0.179 |
Neg logit contributions | |
Where | -0.151 |
On | -0.143 |
See | -0.140 |
Welcome | -0.138 |
To | -0.138 |
Token | and |
Token ID | 290 |
Feature activation | +2.41e+01 |
Pos logit contributions | |
ish | +0.242 |
Majesty | +0.228 |
cient | +0.222 |
majesty | +0.215 |
oppy | +0.202 |
Neg logit contributions | |
Where | -0.152 |
What | -0.137 |
Oh | -0.134 |
For | -0.134 |
On | -0.132 |
Token | fixing |
Token ID | 18682 |
Feature activation | +3.06e+01 |
Pos logit contributions | |
ish | +0.170 |
Majesty | +0.147 |
cient | +0.141 |
oppy | +0.138 |
ans | +0.138 |
Neg logit contributions | |
Where | -0.085 |
See | -0.078 |
Time | -0.073 |
On | -0.073 |
Are | -0.072 |
Token | the |
Token ID | 262 |
Feature activation | +3.30e+01 |
Pos logit contributions | |
ish | +0.201 |
Majesty | +0.186 |
majesty | +0.172 |
cient | +0.171 |
oppy | +0.169 |
Neg logit contributions | |
Where | -0.119 |
See | -0.104 |
Oh | -0.103 |
What | -0.100 |
On | -0.099 |
Token | wardrobe |
Token ID | 35593 |
Feature activation | +3.82e+01 |
Pos logit contributions | |
ish | +0.180 |
Majesty | +0.159 |
oppy | +0.147 |
majesty | +0.144 |
ci | +0.143 |
Neg logit contributions | |
Where | -0.165 |
Oh | -0.152 |
See | -0.147 |
Welcome | -0.143 |
On | -0.143 |
Token | so |
Token ID | 523 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
ish | +0.263 |
Majesty | +0.243 |
majesty | +0.226 |
oppy | +0.223 |
cient | +0.214 |
Neg logit contributions | |
Where | -0.136 |
On | -0.121 |
See | -0.116 |
To | -0.115 |
For | -0.114 |
Token | it |
Token ID | 340 |
Feature activation | +2.66e+01 |
Pos logit contributions | |
ish | +0.132 |
Majesty | +0.119 |
majesty | +0.109 |
ci | +0.109 |
oppy | +0.107 |
Neg logit contributions | |
Where | -0.081 |
See | -0.073 |
Oh | -0.072 |
On | -0.071 |
Welcome | -0.071 |
Token | looked |
Token ID | 3114 |
Feature activation | +2.95e+01 |
Pos logit contributions | |
ish | +0.182 |
Majesty | +0.169 |
majesty | +0.156 |
oppy | +0.152 |
cient | +0.151 |
Neg logit contributions | |
Where | -0.092 |
See | -0.084 |
On | -0.080 |
Oh | -0.080 |
To | -0.079 |
Token | nice |
Token ID | 3621 |
Feature activation | +3.00e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.164 |
majesty | +0.150 |
ci | +0.150 |
oppy | +0.148 |
Neg logit contributions | |
Where | -0.127 |
See | -0.115 |
Oh | -0.113 |
On | -0.113 |
Welcome | -0.111 |
Token | . |
Token ID | 13 |
Feature activation | +1.86e+01 |
Pos logit contributions | |
ish | +0.199 |
Majesty | +0.190 |
oppy | +0.177 |
majesty | +0.176 |
cient | +0.173 |
Neg logit contributions | |
Where | -0.110 |
On | -0.093 |
Welcome | -0.093 |
See | -0.092 |
Oh | -0.091 |
Token | time |
Token ID | 640 |
Feature activation | +2.76e+01 |
Pos logit contributions | |
ish | +0.292 |
ci | +0.271 |
Majesty | +0.271 |
cient | +0.268 |
ishes | +0.261 |
Neg logit contributions | |
One | -0.042 |
On | -0.038 |
Where | -0.035 |
Time | -0.033 |
Today | -0.027 |
Token | , |
Token ID | 11 |
Feature activation | +2.56e+01 |
Pos logit contributions | |
ish | +0.166 |
Majesty | +0.147 |
ci | +0.137 |
majesty | +0.134 |
cient | +0.131 |
Neg logit contributions | |
Where | -0.126 |
On | -0.118 |
Welcome | -0.116 |
See | -0.114 |
Time | -0.113 |
Token | there |
Token ID | 612 |
Feature activation | +2.61e+01 |
Pos logit contributions | |
ish | +0.198 |
Majesty | +0.179 |
majesty | +0.170 |
ci | +0.165 |
oppy | +0.164 |
Neg logit contributions | |
Where | -0.080 |
Oh | -0.068 |
See | -0.066 |
On | -0.066 |
Welcome | -0.066 |
Token | was |
Token ID | 373 |
Feature activation | +2.43e+01 |
Pos logit contributions | |
ish | +0.184 |
Majesty | +0.165 |
ci | +0.153 |
majesty | +0.153 |
oppy | +0.152 |
Neg logit contributions | |
Where | -0.088 |
See | -0.078 |
Oh | -0.077 |
Welcome | -0.075 |
On | -0.074 |
Token | an |
Token ID | 281 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
ish | +0.160 |
Majesty | +0.144 |
majesty | +0.132 |
ci | +0.131 |
oppy | +0.129 |
Neg logit contributions | |
Where | -0.096 |
See | -0.086 |
Oh | -0.085 |
On | -0.084 |
Welcome | -0.083 |
Token | old |
Token ID | 1468 |
Feature activation | +3.68e+01 |
Pos logit contributions | |
ish | +0.172 |
Majesty | +0.166 |
majesty | +0.162 |
oppy | +0.158 |
pp | +0.154 |
Neg logit contributions | |
Where | -0.102 |
On | -0.091 |
One | -0.089 |
Welcome | -0.089 |
moral | -0.089 |
Token | man |
Token ID | 582 |
Feature activation | +3.17e+01 |
Pos logit contributions | |
ish | +0.249 |
Majesty | +0.228 |
ishes | +0.217 |
oppy | +0.215 |
cient | +0.212 |
Neg logit contributions | |
Where | -0.108 |
Oh | -0.098 |
Wow | -0.097 |
He | -0.096 |
On | -0.096 |
Token | . |
Token ID | 13 |
Feature activation | +1.90e+01 |
Pos logit contributions | |
ish | +0.202 |
Majesty | +0.193 |
majesty | +0.178 |
oppy | +0.168 |
cient | +0.165 |
Neg logit contributions | |
Where | -0.127 |
On | -0.112 |
Welcome | -0.108 |
See | -0.108 |
Oh | -0.107 |
Token | He |
Token ID | 679 |
Feature activation | +2.18e+01 |
Pos logit contributions | |
ish | +0.132 |
Majesty | +0.123 |
majesty | +0.114 |
cient | +0.113 |
ci | +0.112 |
Neg logit contributions | |
Where | -0.062 |
See | -0.053 |
Oh | -0.053 |
Warning | -0.051 |
Time | -0.051 |
Token | loved |
Token ID | 6151 |
Feature activation | +2.26e+01 |
Pos logit contributions | |
ish | +0.148 |
Majesty | +0.135 |
ci | +0.125 |
majesty | +0.124 |
cient | +0.122 |
Neg logit contributions | |
Where | -0.078 |
See | -0.069 |
Oh | -0.069 |
Welcome | -0.067 |
Warning | -0.066 |
Token | to |
Token ID | 284 |
Feature activation | +2.01e+01 |
Pos logit contributions | |
ish | +0.144 |
Majesty | +0.127 |
oppy | +0.120 |
majesty | +0.116 |
ci | +0.115 |
Neg logit contributions | |
Where | -0.099 |
See | -0.088 |
Welcome | -0.087 |
On | -0.085 |
Oh | -0.085 |
Token | a |
Token ID | 257 |
Feature activation | +2.94e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.171 |
ci | +0.157 |
majesty | +0.157 |
oppy | +0.156 |
Neg logit contributions | |
Where | -0.110 |
See | -0.098 |
Oh | -0.096 |
Welcome | -0.093 |
What | -0.090 |
Token | new |
Token ID | 649 |
Feature activation | +3.40e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.162 |
ci | +0.150 |
majesty | +0.147 |
oppy | +0.146 |
Neg logit contributions | |
Where | -0.127 |
See | -0.116 |
Oh | -0.114 |
On | -0.112 |
Welcome | -0.111 |
Token | home |
Token ID | 1363 |
Feature activation | +3.17e+01 |
Pos logit contributions | |
ish | +0.194 |
Majesty | +0.173 |
oppy | +0.168 |
cient | +0.165 |
majesty | +0.159 |
Neg logit contributions | |
Where | -0.148 |
See | -0.138 |
Oh | -0.134 |
On | -0.133 |
Welcome | -0.132 |
Token | . |
Token ID | 13 |
Feature activation | +2.23e+01 |
Pos logit contributions | |
ish | +0.228 |
Majesty | +0.216 |
majesty | +0.198 |
oppy | +0.196 |
cient | +0.192 |
Neg logit contributions | |
Where | -0.100 |
On | -0.088 |
For | -0.084 |
Welcome | -0.083 |
To | -0.083 |
Token | The |
Token ID | 383 |
Feature activation | +2.67e+01 |
Pos logit contributions | |
ish | +0.152 |
Majesty | +0.144 |
majesty | +0.133 |
oppy | +0.131 |
cient | +0.130 |
Neg logit contributions | |
Where | -0.072 |
Oh | -0.061 |
See | -0.061 |
Warning | -0.061 |
Listen | -0.060 |
Token | navy |
Token ID | 23956 |
Feature activation | +3.52e+01 |
Pos logit contributions | |
ish | +0.147 |
Majesty | +0.130 |
ci | +0.118 |
majesty | +0.117 |
oppy | +0.115 |
Neg logit contributions | |
Where | -0.132 |
See | -0.120 |
Oh | -0.120 |
Welcome | -0.118 |
On | -0.117 |
Token | was |
Token ID | 373 |
Feature activation | +2.38e+01 |
Pos logit contributions | |
ish | +0.199 |
Majesty | +0.179 |
oppy | +0.162 |
majesty | +0.161 |
cient | +0.155 |
Neg logit contributions | |
Where | -0.156 |
See | -0.145 |
Oh | -0.140 |
Welcome | -0.139 |
On | -0.138 |
Token | happy |
Token ID | 3772 |
Feature activation | +2.36e+01 |
Pos logit contributions | |
ish | +0.147 |
Majesty | +0.131 |
majesty | +0.120 |
ci | +0.119 |
oppy | +0.118 |
Neg logit contributions | |
Where | -0.104 |
See | -0.094 |
Oh | -0.092 |
On | -0.092 |
Welcome | -0.091 |
Token | and |
Token ID | 290 |
Feature activation | +2.05e+01 |
Pos logit contributions | |
ish | +0.145 |
Majesty | +0.132 |
cient | +0.121 |
majesty | +0.121 |
oppy | +0.117 |
Neg logit contributions | |
Where | -0.105 |
See | -0.094 |
On | -0.092 |
Oh | -0.091 |
Welcome | -0.090 |
Token | the |
Token ID | 262 |
Feature activation | +2.52e+01 |
Pos logit contributions | |
ish | +0.138 |
Majesty | +0.123 |
majesty | +0.112 |
oppy | +0.111 |
cient | +0.109 |
Neg logit contributions | |
Where | -0.078 |
See | -0.072 |
Welcome | -0.070 |
Oh | -0.069 |
On | -0.068 |
Token | water |
Token ID | 1660 |
Feature activation | +2.91e+01 |
Pos logit contributions | |
ish | +0.138 |
Majesty | +0.124 |
majesty | +0.111 |
ci | +0.110 |
oppy | +0.107 |
Neg logit contributions | |
Where | -0.125 |
See | -0.115 |
Oh | -0.114 |
On | -0.113 |
Welcome | -0.112 |
Token | � |
Token ID | 129 |
Feature activation | +3.91e+01 |
Pos logit contributions | |
ish | +0.386 |
Majesty | +0.347 |
ci | +0.329 |
ishes | +0.326 |
cient | +0.324 |
Neg logit contributions | |
Where | -0.074 |
See | -0.064 |
On | -0.061 |
Oh | -0.057 |
To | -0.056 |
Token | � |
Token ID | 241 |
Feature activation | +3.71e+01 |
Pos logit contributions | |
ish | +0.206 |
Majesty | +0.182 |
majesty | +0.163 |
ci | +0.161 |
oppy | +0.158 |
Neg logit contributions | |
Where | -0.202 |
See | -0.187 |
Oh | -0.185 |
On | -0.182 |
Welcome | -0.182 |
Token | But |
Token ID | 1537 |
Feature activation | +2.71e+01 |
Pos logit contributions | |
ish | +0.280 |
Majesty | +0.260 |
ci | +0.245 |
majesty | +0.241 |
oppy | +0.238 |
Neg logit contributions | |
Where | -0.084 |
See | -0.068 |
Warning | -0.068 |
Welcome | -0.066 |
Oh | -0.064 |
Token | why |
Token ID | 1521 |
Feature activation | +3.04e+01 |
Pos logit contributions | |
ish | +0.171 |
Majesty | +0.150 |
cient | +0.140 |
majesty | +0.140 |
oppy | +0.138 |
Neg logit contributions | |
Where | -0.114 |
What | -0.100 |
Oh | -0.098 |
See | -0.098 |
On | -0.098 |
Token | ? |
Token ID | 30 |
Feature activation | +2.55e+01 |
Pos logit contributions | |
ish | +0.181 |
Majesty | +0.162 |
ci | +0.146 |
majesty | +0.144 |
cient | +0.143 |
Neg logit contributions | |
Where | -0.130 |
On | -0.123 |
See | -0.122 |
That | -0.119 |
Oh | -0.118 |
Token | â |
Token ID | 22940 |
Feature activation | +3.45e+01 |
Pos logit contributions | |
ish | +0.169 |
Majesty | +0.155 |
majesty | +0.141 |
ci | +0.140 |
oppy | +0.139 |
Neg logit contributions | |
Where | -0.093 |
See | -0.082 |
Oh | -0.082 |
On | -0.080 |
Welcome | -0.079 |
Token | € |
Token ID | 26391 |
Feature activation | +3.37e+01 |
Pos logit contributions | |
ish | +0.186 |
Majesty | +0.165 |
majesty | +0.149 |
ci | +0.145 |
oppy | +0.144 |
Neg logit contributions | |
Where | -0.174 |
See | -0.161 |
Oh | -0.160 |
On | -0.157 |
Welcome | -0.157 |
Token |
|
Token ID | 198 |
Feature activation | +2.04e+01 |
Pos logit contributions | |
ish | +0.250 |
Majesty | +0.219 |
ci | +0.206 |
majesty | +0.203 |
ishes | +0.202 |
Neg logit contributions | |
Where | -0.104 |
See | -0.096 |
On | -0.095 |
To | -0.090 |
Oh | -0.089 |
Token |
|
Token ID | 198 |
Feature activation | +1.92e+01 |
Pos logit contributions | |
ish | +0.127 |
Majesty | +0.124 |
oppy | +0.121 |
majesty | +0.114 |
ci | +0.110 |
Neg logit contributions | |
Where | -0.059 |
Oh | -0.050 |
Warning | -0.050 |
Welcome | -0.049 |
Wow | -0.048 |
Token | Her |
Token ID | 9360 |
Feature activation | +2.77e+01 |
Pos logit contributions | |
ish | +0.121 |
Majesty | +0.118 |
oppy | +0.112 |
majesty | +0.108 |
ci | +0.106 |
Neg logit contributions | |
Where | -0.053 |
Warning | -0.046 |
Oh | -0.045 |
Welcome | -0.044 |
See | -0.044 |
Token | mum |
Token ID | 25682 |
Feature activation | +2.45e+01 |
Pos logit contributions | |
ish | +0.151 |
Majesty | +0.126 |
ci | +0.118 |
cient | +0.117 |
ishes | +0.116 |
Neg logit contributions | |
Where | -0.136 |
See | -0.124 |
On | -0.124 |
Oh | -0.122 |
To | -0.118 |
Token | a |
Token ID | 257 |
Feature activation | +1.32e+01 |
Pos logit contributions | |
ish | +0.080 |
Majesty | +0.072 |
majesty | +0.066 |
oppy | +0.065 |
ci | +0.065 |
Neg logit contributions | |
Where | -0.058 |
See | -0.053 |
Oh | -0.053 |
Warning | -0.052 |
Welcome | -0.052 |
Token | time |
Token ID | 640 |
Feature activation | +9.17e+00 |
Pos logit contributions | |
ish | +0.108 |
Majesty | +0.102 |
ci | +0.096 |
cient | +0.095 |
majesty | +0.095 |
Neg logit contributions | |
Where | -0.027 |
On | -0.026 |
One | -0.024 |
See | -0.023 |
Time | -0.023 |
Token | , |
Token ID | 11 |
Feature activation | +1.00e+01 |
Pos logit contributions | |
ish | +0.053 |
Majesty | +0.050 |
ci | +0.046 |
majesty | +0.044 |
ishes | +0.044 |
Neg logit contributions | |
Where | -0.041 |
On | -0.040 |
One | -0.039 |
Welcome | -0.038 |
Oh | -0.037 |
Token | there |
Token ID | 612 |
Feature activation | +1.10e+01 |
Pos logit contributions | |
ish | +0.064 |
Majesty | +0.058 |
majesty | +0.053 |
ci | +0.053 |
oppy | +0.052 |
Neg logit contributions | |
Where | -0.040 |
See | -0.036 |
Oh | -0.036 |
Welcome | -0.035 |
On | -0.035 |
Token | was |
Token ID | 373 |
Feature activation | +9.86e+00 |
Pos logit contributions | |
ish | +0.078 |
Majesty | +0.070 |
ci | +0.065 |
majesty | +0.065 |
oppy | +0.065 |
Neg logit contributions | |
Where | -0.036 |
See | -0.032 |
Oh | -0.031 |
Welcome | -0.030 |
On | -0.030 |
Token | a |
Token ID | 257 |
Feature activation | +1.21e+01 |
Pos logit contributions | |
ish | +0.069 |
Majesty | +0.063 |
majesty | +0.058 |
ci | +0.058 |
cient | +0.057 |
Neg logit contributions | |
Where | -0.036 |
See | -0.032 |
Oh | -0.032 |
On | -0.031 |
Welcome | -0.031 |
Token | little |
Token ID | 1310 |
Feature activation | +1.65e+01 |
Pos logit contributions | |
ish | +0.075 |
Majesty | +0.068 |
ci | +0.064 |
majesty | +0.062 |
cient | +0.061 |
Neg logit contributions | |
Where | -0.051 |
Oh | -0.045 |
See | -0.045 |
On | -0.045 |
Welcome | -0.044 |
Token | bird |
Token ID | 6512 |
Feature activation | +1.48e+01 |
Pos logit contributions | |
Majesty | +0.120 |
ish | +0.109 |
majesty | +0.108 |
ric | +0.103 |
urg | +0.102 |
Neg logit contributions | |
Wow | -0.044 |
Oh | -0.043 |
Welcome | -0.042 |
Where | -0.042 |
Time | -0.036 |
Token | named |
Token ID | 3706 |
Feature activation | +1.02e+01 |
Pos logit contributions | |
Majesty | +0.094 |
ish | +0.090 |
majesty | +0.086 |
ishes | +0.075 |
oppy | +0.075 |
Neg logit contributions | |
Where | -0.059 |
One | -0.054 |
On | -0.054 |
To | -0.052 |
Do | -0.051 |
Token | Tweet |
Token ID | 18752 |
Feature activation | +1.66e+01 |
Pos logit contributions | |
ish | +0.063 |
Majesty | +0.058 |
majesty | +0.053 |
ci | +0.053 |
oppy | +0.050 |
Neg logit contributions | |
Where | -0.044 |
See | -0.040 |
Oh | -0.039 |
Welcome | -0.039 |
On | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | +5.09e+00 |
Pos logit contributions | |
ish | +0.070 |
Majesty | +0.068 |
majesty | +0.059 |
ci | +0.054 |
cient | +0.052 |
Neg logit contributions | |
Where | -0.098 |
On | -0.092 |
One | -0.091 |
He | -0.090 |
See | -0.088 |
Token | , |
Token ID | 11 |
Feature activation | +8.01e+00 |
Pos logit contributions | |
ish | +0.095 |
Majesty | +0.085 |
majesty | +0.078 |
oppy | +0.077 |
cient | +0.076 |
Neg logit contributions | |
Where | -0.067 |
On | -0.062 |
See | -0.060 |
Welcome | -0.058 |
Oh | -0.058 |
Token | and |
Token ID | 290 |
Feature activation | +8.09e+00 |
Pos logit contributions | |
ish | +0.050 |
Majesty | +0.044 |
oppy | +0.041 |
majesty | +0.041 |
cient | +0.040 |
Neg logit contributions | |
Where | -0.036 |
On | -0.032 |
See | -0.032 |
Oh | -0.031 |
Welcome | -0.031 |
Token | saw |
Token ID | 2497 |
Feature activation | +7.28e+00 |
Pos logit contributions | |
ish | +0.055 |
Majesty | +0.050 |
majesty | +0.046 |
cient | +0.045 |
oppy | +0.045 |
Neg logit contributions | |
Where | -0.031 |
See | -0.027 |
On | -0.027 |
Oh | -0.026 |
Welcome | -0.026 |
Token | a |
Token ID | 257 |
Feature activation | +9.13e+00 |
Pos logit contributions | |
ish | +0.051 |
Majesty | +0.046 |
majesty | +0.043 |
ci | +0.042 |
oppy | +0.042 |
Neg logit contributions | |
Where | -0.026 |
See | -0.023 |
Oh | -0.022 |
What | -0.021 |
On | -0.021 |
Token | big |
Token ID | 1263 |
Feature activation | +1.41e+01 |
Pos logit contributions | |
ish | +0.052 |
Majesty | +0.048 |
majesty | +0.043 |
ci | +0.042 |
oppy | +0.042 |
Neg logit contributions | |
Where | -0.042 |
See | -0.038 |
Warning | -0.038 |
Oh | -0.038 |
Welcome | -0.037 |
Token | surprise |
Token ID | 5975 |
Feature activation | +1.04e+01 |
Pos logit contributions | |
ish | +0.076 |
Majesty | +0.069 |
cient | +0.063 |
ci | +0.062 |
majesty | +0.061 |
Neg logit contributions | |
Where | -0.068 |
Oh | -0.062 |
See | -0.062 |
On | -0.061 |
Wow | -0.061 |
Token | waiting |
Token ID | 4953 |
Feature activation | +9.63e+00 |
Pos logit contributions | |
ish | +0.054 |
Majesty | +0.045 |
ci | +0.043 |
castle | +0.041 |
oppy | +0.041 |
Neg logit contributions | |
Where | -0.052 |
See | -0.051 |
Oh | -0.049 |
Warning | -0.049 |
Wow | -0.049 |
Token | for |
Token ID | 329 |
Feature activation | +8.28e+00 |
Pos logit contributions | |
ish | +0.051 |
Majesty | +0.045 |
cient | +0.040 |
majesty | +0.040 |
oppy | +0.040 |
Neg logit contributions | |
Where | -0.050 |
On | -0.046 |
Oh | -0.045 |
See | -0.045 |
Welcome | -0.045 |
Token | her |
Token ID | 607 |
Feature activation | +9.87e+00 |
Pos logit contributions | |
ish | +0.037 |
Majesty | +0.035 |
oppy | +0.032 |
majesty | +0.031 |
ci | +0.029 |
Neg logit contributions | |
Where | -0.043 |
See | -0.042 |
Oh | -0.041 |
Wow | -0.041 |
On | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | +3.26e+00 |
Pos logit contributions | |
ish | +0.061 |
Majesty | +0.055 |
majesty | +0.050 |
ci | +0.050 |
cient | +0.049 |
Neg logit contributions | |
Where | -0.042 |
See | -0.037 |
Oh | -0.037 |
On | -0.037 |
Welcome | -0.036 |
Token | On |
Token ID | 1550 |
Feature activation | +8.14e+00 |
Pos logit contributions | |
ish | +0.018 |
Majesty | +0.017 |
oppy | +0.017 |
majesty | +0.016 |
ipp | +0.015 |
Neg logit contributions | |
Where | -0.013 |
Warning | -0.012 |
Listen | -0.012 |
Welcome | -0.012 |
Time | -0.012 |
Token | fish |
Token ID | 5916 |
Feature activation | +1.72e+01 |
Pos logit contributions | |
ish | +0.073 |
Majesty | +0.065 |
ci | +0.061 |
cient | +0.058 |
majesty | +0.058 |
Neg logit contributions | |
Where | -0.080 |
Oh | -0.072 |
See | -0.072 |
Welcome | -0.071 |
Wow | -0.070 |
Token | said |
Token ID | 531 |
Feature activation | +8.79e+00 |
Pos logit contributions | |
ish | +0.114 |
Majesty | +0.108 |
majesty | +0.099 |
oppy | +0.096 |
ci | +0.095 |
Neg logit contributions | |
Where | -0.063 |
See | -0.058 |
On | -0.056 |
Oh | -0.054 |
Welcome | -0.052 |
Token | ," |
Token ID | 553 |
Feature activation | +8.97e+00 |
Pos logit contributions | |
ish | +0.052 |
Majesty | +0.045 |
ci | +0.044 |
oppy | +0.041 |
ishes | +0.041 |
Neg logit contributions | |
Where | -0.041 |
See | -0.038 |
He | -0.036 |
Welcome | -0.036 |
Are | -0.035 |
Token | There |
Token ID | 1318 |
Feature activation | +9.85e+00 |
Pos logit contributions | |
ish | +0.064 |
Majesty | +0.058 |
ci | +0.055 |
cient | +0.055 |
majesty | +0.053 |
Neg logit contributions | |
Where | -0.024 |
On | -0.021 |
Warning | -0.021 |
Time | -0.021 |
Welcome | -0.021 |
Token | you |
Token ID | 345 |
Feature activation | +8.58e+00 |
Pos logit contributions | |
ish | +0.067 |
Majesty | +0.056 |
ci | +0.055 |
cient | +0.053 |
oppy | +0.053 |
Neg logit contributions | |
Where | -0.038 |
Welcome | -0.033 |
Oh | -0.033 |
See | -0.032 |
On | -0.032 |
Token | go |
Token ID | 467 |
Feature activation | +8.90e+00 |
Pos logit contributions | |
ish | +0.051 |
Majesty | +0.050 |
majesty | +0.045 |
ci | +0.043 |
oppy | +0.042 |
Neg logit contributions | |
Where | -0.034 |
On | -0.032 |
See | -0.032 |
To | -0.031 |
Oh | -0.031 |
Token | !" |
Token ID | 2474 |
Feature activation | +6.77e+00 |
Pos logit contributions | |
ish | +0.055 |
Majesty | +0.051 |
majesty | +0.047 |
oppy | +0.046 |
cient | +0.044 |
Neg logit contributions | |
Where | -0.038 |
On | -0.034 |
See | -0.033 |
Oh | -0.033 |
Welcome | -0.033 |
Token |
|
Token ID | 198 |
Feature activation | +6.45e+00 |
Pos logit contributions | |
ish | +0.048 |
Majesty | +0.043 |
oppy | +0.041 |
cient | +0.041 |
ci | +0.041 |
Neg logit contributions | |
Where | -0.020 |
Time | -0.016 |
Welcome | -0.016 |
Warning | -0.016 |
On | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +6.46e+00 |
Pos logit contributions | |
ish | +0.041 |
oppy | +0.038 |
Majesty | +0.038 |
majesty | +0.036 |
opsy | +0.035 |
Neg logit contributions | |
Where | -0.020 |
Welcome | -0.017 |
Warning | -0.017 |
Oh | -0.017 |
Wow | -0.016 |
Token | The |
Token ID | 464 |
Feature activation | +1.33e+01 |
Pos logit contributions | |
ish | +0.042 |
Majesty | +0.041 |
oppy | +0.038 |
majesty | +0.038 |
opsy | +0.036 |
Neg logit contributions | |
Where | -0.017 |
Welcome | -0.014 |
Warning | -0.014 |
Oh | -0.014 |
Wow | -0.013 |
Token | little |
Token ID | 1310 |
Feature activation | +1.63e+01 |
Pos logit contributions | |
ish | +0.063 |
Majesty | +0.054 |
ci | +0.049 |
majesty | +0.048 |
cient | +0.047 |
Neg logit contributions | |
Where | -0.078 |
See | -0.071 |
Oh | -0.071 |
Welcome | -0.070 |
On | -0.069 |
Token | my |
Token ID | 1820 |
Feature activation | +1.14e+01 |
Pos logit contributions | |
ish | +0.063 |
Majesty | +0.059 |
majesty | +0.054 |
oppy | +0.051 |
ci | +0.051 |
Neg logit contributions | |
Where | -0.044 |
On | -0.039 |
Oh | -0.039 |
See | -0.039 |
Welcome | -0.038 |
Token | 's |
Token ID | 338 |
Feature activation | +8.99e+00 |
Pos logit contributions | |
ish | +0.070 |
Majesty | +0.066 |
majesty | +0.061 |
oppy | +0.059 |
cient | +0.058 |
Neg logit contributions | |
Where | -0.047 |
On | -0.043 |
He | -0.042 |
See | -0.041 |
Oh | -0.040 |
Token | ears |
Token ID | 11368 |
Feature activation | +9.71e+00 |
Pos logit contributions | |
ish | +0.051 |
Majesty | +0.045 |
oppy | +0.041 |
majesty | +0.041 |
cient | +0.040 |
Neg logit contributions | |
Where | -0.042 |
On | -0.037 |
Oh | -0.037 |
See | -0.036 |
Welcome | -0.036 |
Token | hurt |
Token ID | 5938 |
Feature activation | +8.39e+00 |
Pos logit contributions | |
ish | +0.057 |
Majesty | +0.052 |
majesty | +0.048 |
ci | +0.047 |
oppy | +0.046 |
Neg logit contributions | |
Where | -0.044 |
See | -0.040 |
On | -0.039 |
Oh | -0.039 |
Welcome | -0.039 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e+00 |
Pos logit contributions | |
ish | +0.053 |
Majesty | +0.047 |
ci | +0.043 |
majesty | +0.043 |
oppy | +0.042 |
Neg logit contributions | |
Where | -0.035 |
See | -0.032 |
Oh | -0.031 |
On | -0.031 |
Welcome | -0.031 |
Token | He |
Token ID | 679 |
Feature activation | +4.13e+00 |
Pos logit contributions | |
ish | +0.010 |
Majesty | +0.008 |
cient | +0.008 |
ci | +0.007 |
majesty | +0.007 |
Neg logit contributions | |
Where | -0.010 |
Welcome | -0.009 |
Warning | -0.009 |
Time | -0.009 |
Oh | -0.009 |
Token | covered |
Token ID | 5017 |
Feature activation | +7.79e+00 |
Pos logit contributions | |
ish | +0.025 |
Majesty | +0.021 |
ci | +0.020 |
cient | +0.019 |
majesty | +0.019 |
Neg logit contributions | |
Where | -0.019 |
Welcome | -0.018 |
See | -0.017 |
Oh | -0.017 |
Warning | -0.017 |
Token | his |
Token ID | 465 |
Feature activation | +7.47e+00 |
Pos logit contributions | |
ish | +0.056 |
Majesty | +0.052 |
majesty | +0.049 |
oppy | +0.048 |
ci | +0.047 |
Neg logit contributions | |
Where | -0.027 |
Oh | -0.023 |
See | -0.023 |
What | -0.022 |
Wow | -0.022 |
Token | ears |
Token ID | 11368 |
Feature activation | +8.00e+00 |
Pos logit contributions | |
ish | +0.039 |
Majesty | +0.036 |
oppy | +0.033 |
cient | +0.033 |
pp | +0.033 |
Neg logit contributions | |
Where | -0.033 |
On | -0.030 |
Oh | -0.029 |
He | -0.029 |
See | -0.029 |
Token | with |
Token ID | 351 |
Feature activation | +4.25e+00 |
Pos logit contributions | |
ish | +0.049 |
Majesty | +0.046 |
majesty | +0.042 |
oppy | +0.041 |
cient | +0.040 |
Neg logit contributions | |
Where | -0.034 |
On | -0.031 |
See | -0.031 |
Oh | -0.030 |
He | -0.029 |
Token | his |
Token ID | 465 |
Feature activation | +7.03e+00 |
Pos logit contributions | |
ish | +0.027 |
Majesty | +0.024 |
majesty | +0.022 |
ci | +0.022 |
oppy | +0.021 |
Neg logit contributions | |
Where | -0.018 |
See | -0.016 |
Oh | -0.016 |
On | -0.016 |
Welcome | -0.016 |
Token | But |
Token ID | 887 |
Feature activation | +4.96e+00 |
Pos logit contributions | |
ish | +0.035 |
Majesty | +0.032 |
majesty | +0.030 |
ci | +0.029 |
oppy | +0.029 |
Neg logit contributions | |
Where | -0.024 |
See | -0.022 |
On | -0.022 |
Oh | -0.022 |
Welcome | -0.021 |
Token | be |
Token ID | 307 |
Feature activation | +6.56e+00 |
Pos logit contributions | |
ish | +0.031 |
Majesty | +0.027 |
ci | +0.025 |
majesty | +0.025 |
cient | +0.025 |
Neg logit contributions | |
Where | -0.021 |
See | -0.019 |
What | -0.019 |
Oh | -0.019 |
On | -0.018 |
Token | careful |
Token ID | 8161 |
Feature activation | +8.44e+00 |
Pos logit contributions | |
ish | +0.034 |
Majesty | +0.030 |
majesty | +0.027 |
ci | +0.026 |
oppy | +0.026 |
Neg logit contributions | |
Where | -0.035 |
See | -0.032 |
Oh | -0.032 |
Welcome | -0.032 |
Warning | -0.031 |
Token | , |
Token ID | 11 |
Feature activation | +7.34e+00 |
Pos logit contributions | |
ish | +0.062 |
Majesty | +0.061 |
cient | +0.056 |
majesty | +0.055 |
oppy | +0.053 |
Neg logit contributions | |
Where | -0.024 |
One | -0.021 |
He | -0.021 |
On | -0.021 |
Time | -0.020 |
Token | it |
Token ID | 340 |
Feature activation | +6.98e+00 |
Pos logit contributions | |
ish | +0.049 |
Majesty | +0.045 |
cient | +0.042 |
ci | +0.041 |
majesty | +0.041 |
Neg logit contributions | |
Where | -0.028 |
Oh | -0.024 |
See | -0.024 |
What | -0.023 |
Do | -0.023 |
Token | 's |
Token ID | 338 |
Feature activation | +6.13e+00 |
Pos logit contributions | |
ish | +0.044 |
Majesty | +0.042 |
majesty | +0.038 |
ci | +0.037 |
oppy | +0.037 |
Neg logit contributions | |
Where | -0.025 |
See | -0.024 |
On | -0.023 |
To | -0.023 |
Oh | -0.022 |
Token | very |
Token ID | 845 |
Feature activation | +8.60e+00 |
Pos logit contributions | |
ish | +0.037 |
Majesty | +0.034 |
majesty | +0.031 |
ci | +0.031 |
cient | +0.030 |
Neg logit contributions | |
Where | -0.027 |
See | -0.024 |
Oh | -0.024 |
On | -0.024 |
Welcome | -0.023 |
Token | heavy |
Token ID | 4334 |
Feature activation | +9.70e+00 |
Pos logit contributions | |
ish | +0.055 |
Majesty | +0.050 |
ci | +0.046 |
majesty | +0.045 |
cient | +0.045 |
Neg logit contributions | |
Where | -0.034 |
See | -0.031 |
On | -0.031 |
Oh | -0.030 |
Welcome | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
ish | +0.067 |
Majesty | +0.064 |
majesty | +0.059 |
cient | +0.059 |
oppy | +0.058 |
Neg logit contributions | |
Where | -0.031 |
On | -0.027 |
Welcome | -0.025 |
For | -0.025 |
Do | -0.025 |
Token | You |
Token ID | 921 |
Feature activation | +3.01e+00 |
Pos logit contributions | |
ish | +0.024 |
Majesty | +0.022 |
majesty | +0.020 |
oppy | +0.019 |
ci | +0.019 |
Neg logit contributions | |
Where | -0.015 |
See | -0.014 |
On | -0.014 |
Oh | -0.013 |
Welcome | -0.013 |
Token | don |
Token ID | 836 |
Feature activation | +6.00e+00 |
Pos logit contributions | |
ish | +0.020 |
Majesty | +0.019 |
majesty | +0.017 |
ci | +0.017 |
cient | +0.016 |
Neg logit contributions | |
Where | -0.011 |
See | -0.010 |
On | -0.010 |
To | -0.009 |
Oh | -0.009 |
Token | When |
Token ID | 1649 |
Feature activation | -9.72e+00 |
Pos logit contributions | |
Where | +0.038 |
See | +0.034 |
On | +0.034 |
Oh | +0.034 |
Welcome | +0.033 |
Neg logit contributions | |
ish | -0.058 |
Majesty | -0.053 |
majesty | -0.049 |
ci | -0.048 |
oppy | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | -8.08e+00 |
Pos logit contributions | |
Where | +0.048 |
See | +0.044 |
Oh | +0.044 |
Welcome | +0.043 |
On | +0.043 |
Neg logit contributions | |
ish | -0.054 |
Majesty | -0.048 |
majesty | -0.043 |
ci | -0.043 |
oppy | -0.042 |
Token | law |
Token ID | 1099 |
Feature activation | -4.57e+00 |
Pos logit contributions | |
Where | +0.042 |
See | +0.039 |
On | +0.038 |
Oh | +0.038 |
Welcome | +0.037 |
Neg logit contributions | |
ish | -0.043 |
Majesty | -0.037 |
majesty | -0.034 |
ci | -0.033 |
cient | -0.033 |
Token | changes |
Token ID | 2458 |
Feature activation | -6.82e+00 |
Pos logit contributions | |
Where | +0.023 |
See | +0.021 |
Oh | +0.021 |
Welcome | +0.021 |
On | +0.021 |
Neg logit contributions | |
ish | -0.025 |
Majesty | -0.022 |
majesty | -0.020 |
ci | -0.019 |
oppy | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -9.14e+00 |
Pos logit contributions | |
Where | +0.028 |
See | +0.026 |
Welcome | +0.025 |
On | +0.025 |
To | +0.025 |
Neg logit contributions | |
ish | -0.039 |
Majesty | -0.038 |
majesty | -0.034 |
ci | -0.033 |
oppy | -0.032 |
Token | we |
Token ID | 356 |
Feature activation | -1.15e+01 |
Pos logit contributions | |
Where | +0.040 |
See | +0.036 |
On | +0.035 |
Oh | +0.035 |
Welcome | +0.035 |
Neg logit contributions | |
ish | -0.057 |
Majesty | -0.051 |
oppy | -0.047 |
ci | -0.047 |
majesty | -0.046 |
Token | can |
Token ID | 460 |
Feature activation | -1.09e+01 |
Pos logit contributions | |
Where | +0.045 |
See | +0.041 |
On | +0.040 |
Welcome | +0.039 |
Oh | +0.039 |
Neg logit contributions | |
ish | -0.073 |
Majesty | -0.068 |
ci | -0.062 |
majesty | -0.061 |
oppy | -0.059 |
Token | play |
Token ID | 711 |
Feature activation | -9.06e+00 |
Pos logit contributions | |
One | +0.041 |
On | +0.041 |
Where | +0.041 |
See | +0.038 |
To | +0.037 |
Neg logit contributions | |
ish | -0.070 |
Majesty | -0.063 |
ishes | -0.058 |
majesty | -0.058 |
ci | -0.057 |
Token | with |
Token ID | 351 |
Feature activation | -8.40e+00 |
Pos logit contributions | |
Where | +0.039 |
See | +0.034 |
On | +0.034 |
Oh | +0.033 |
Welcome | +0.033 |
Neg logit contributions | |
ish | -0.057 |
Majesty | -0.051 |
majesty | -0.047 |
ci | -0.047 |
oppy | -0.046 |
Token | water |
Token ID | 1660 |
Feature activation | -6.95e+00 |
Pos logit contributions | |
Where | +0.034 |
See | +0.031 |
Oh | +0.030 |
Welcome | +0.029 |
On | +0.029 |
Neg logit contributions | |
ish | -0.053 |
Majesty | -0.049 |
majesty | -0.044 |
ci | -0.044 |
oppy | -0.043 |
Token | again |
Token ID | 757 |
Feature activation | -6.90e+00 |
Pos logit contributions | |
Where | +0.026 |
Welcome | +0.023 |
On | +0.023 |
For | +0.023 |
To | +0.023 |
Neg logit contributions | |
ish | -0.044 |
Majesty | -0.043 |
majesty | -0.038 |
oppy | -0.038 |
ci | -0.037 |
Token | it |
Token ID | 340 |
Feature activation | -5.96e+00 |
Pos logit contributions | |
Where | +0.024 |
See | +0.021 |
Oh | +0.021 |
That | +0.021 |
Welcome | +0.020 |
Neg logit contributions | |
ish | -0.049 |
Majesty | -0.044 |
oppy | -0.041 |
ci | -0.040 |
majesty | -0.040 |
Token | 's |
Token ID | 338 |
Feature activation | -5.86e+00 |
Pos logit contributions | |
Where | +0.019 |
See | +0.019 |
That | +0.018 |
Oh | +0.018 |
To | +0.017 |
Neg logit contributions | |
Majesty | -0.037 |
ish | -0.037 |
majesty | -0.034 |
oppy | -0.032 |
castle | -0.032 |
Token | mine |
Token ID | 6164 |
Feature activation | -5.61e+00 |
Pos logit contributions | |
Where | +0.031 |
Oh | +0.028 |
See | +0.028 |
On | +0.028 |
Welcome | +0.028 |
Neg logit contributions | |
ish | -0.030 |
Majesty | -0.027 |
majesty | -0.024 |
ci | -0.024 |
cient | -0.023 |
Token | now |
Token ID | 783 |
Feature activation | -5.77e+00 |
Pos logit contributions | |
Where | +0.024 |
On | +0.022 |
He | +0.021 |
For | +0.020 |
Oh | +0.020 |
Neg logit contributions | |
ish | -0.033 |
Majesty | -0.031 |
cient | -0.029 |
oppy | -0.028 |
majesty | -0.028 |
Token | !" |
Token ID | 2474 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
Where | +0.027 |
On | +0.025 |
See | +0.024 |
Welcome | +0.024 |
Oh | +0.024 |
Neg logit contributions | |
ish | -0.032 |
Majesty | -0.029 |
oppy | -0.026 |
ci | -0.026 |
majesty | -0.026 |
Token | Lily |
Token ID | 20037 |
Feature activation | -5.79e+00 |
Pos logit contributions | |
Where | +0.045 |
Warning | +0.041 |
Welcome | +0.041 |
See | +0.040 |
Time | +0.039 |
Neg logit contributions | |
ish | -0.056 |
Majesty | -0.051 |
ci | -0.047 |
majesty | -0.047 |
oppy | -0.047 |
Token | said |
Token ID | 531 |
Feature activation | -9.94e+00 |
Pos logit contributions | |
Where | +0.020 |
See | +0.018 |
Oh | +0.017 |
On | +0.017 |
Welcome | +0.017 |
Neg logit contributions | |
ish | -0.041 |
Majesty | -0.037 |
majesty | -0.034 |
ci | -0.034 |
oppy | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | -1.01e+01 |
Pos logit contributions | |
Where | +0.031 |
On | +0.026 |
See | +0.026 |
Oh | +0.025 |
Welcome | +0.025 |
Neg logit contributions | |
ish | -0.072 |
Majesty | -0.068 |
majesty | -0.063 |
cient | -0.061 |
oppy | -0.060 |
Token | " |
Token ID | 366 |
Feature activation | -1.02e+01 |
Pos logit contributions | |
Where | +0.042 |
Welcome | +0.037 |
Warning | +0.037 |
Time | +0.036 |
See | +0.036 |
Neg logit contributions | |
ish | -0.057 |
Majesty | -0.053 |
cient | -0.049 |
majesty | -0.049 |
ci | -0.047 |
Token | It |
Token ID | 1026 |
Feature activation | -8.37e+00 |
Pos logit contributions | |
Where | +0.019 |
See | +0.018 |
Welcome | +0.018 |
On | +0.018 |
Time | +0.018 |
Neg logit contributions | |
ish | -0.072 |
Majesty | -0.064 |
ci | -0.063 |
knee | -0.061 |
cient | -0.060 |
Token | 's |
Token ID | 338 |
Feature activation | -7.78e+00 |
Pos logit contributions | |
Where | +0.035 |
See | +0.032 |
Oh | +0.031 |
Welcome | +0.031 |
On | +0.030 |
Neg logit contributions | |
ish | -0.049 |
Majesty | -0.047 |
majesty | -0.043 |
oppy | -0.042 |
ci | -0.041 |
Token | it |
Token ID | 340 |
Feature activation | -5.18e+00 |
Pos logit contributions | |
Where | +0.026 |
See | +0.023 |
Oh | +0.023 |
Warning | +0.023 |
Welcome | +0.023 |
Neg logit contributions | |
ish | -0.037 |
Majesty | -0.034 |
majesty | -0.031 |
oppy | -0.030 |
ci | -0.030 |
Token | was |
Token ID | 373 |
Feature activation | -4.99e+00 |
Pos logit contributions | |
Where | +0.017 |
See | +0.015 |
Oh | +0.015 |
On | +0.014 |
Welcome | +0.014 |
Neg logit contributions | |
ish | -0.037 |
Majesty | -0.035 |
majesty | -0.032 |
ci | -0.031 |
cient | -0.031 |
Token | completely |
Token ID | 3190 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
Where | +0.023 |
See | +0.021 |
Warning | +0.021 |
Oh | +0.020 |
Welcome | +0.020 |
Neg logit contributions | |
ish | -0.029 |
Majesty | -0.026 |
majesty | -0.024 |
oppy | -0.023 |
ci | -0.023 |
Token | full |
Token ID | 1336 |
Feature activation | -3.31e+00 |
Pos logit contributions | |
Where | +0.007 |
See | +0.006 |
Oh | +0.006 |
On | +0.006 |
Welcome | +0.006 |
Neg logit contributions | |
ish | -0.008 |
Majesty | -0.008 |
majesty | -0.007 |
ci | -0.007 |
oppy | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -9.48e+00 |
Pos logit contributions | |
Where | +0.013 |
See | +0.012 |
Oh | +0.011 |
On | +0.011 |
Welcome | +0.011 |
Neg logit contributions | |
ish | -0.022 |
Majesty | -0.019 |
majesty | -0.018 |
ci | -0.018 |
oppy | -0.017 |
Token | |
Token ID | 220 |
Feature activation | -3.48e+00 |
Pos logit contributions | |
Where | +0.032 |
Warning | +0.028 |
Oh | +0.027 |
Time | +0.026 |
Welcome | +0.026 |
Neg logit contributions | |
ish | -0.063 |
Majesty | -0.058 |
cient | -0.055 |
oppy | -0.054 |
ci | -0.053 |
Token |
|
Token ID | 198 |
Feature activation | -9.53e+00 |
Pos logit contributions | |
Where | +0.010 |
Welcome | +0.009 |
Oh | +0.009 |
Warning | +0.009 |
See | +0.009 |
Neg logit contributions | |
ish | -0.024 |
Majesty | -0.022 |
oppy | -0.021 |
majesty | -0.020 |
cient | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | -9.13e+00 |
Pos logit contributions | |
Where | +0.035 |
Warning | +0.032 |
See | +0.032 |
Oh | +0.032 |
Welcome | +0.031 |
Neg logit contributions | |
ish | -0.052 |
oppy | -0.047 |
Majesty | -0.045 |
cient | -0.044 |
ci | -0.044 |
Token | The |
Token ID | 464 |
Feature activation | -5.41e+00 |
Pos logit contributions | |
Warning | +0.024 |
See | +0.024 |
Where | +0.023 |
Oh | +0.022 |
Welcome | +0.021 |
Neg logit contributions | |
ish | -0.051 |
Majesty | -0.049 |
cient | -0.049 |
ap | -0.046 |
ci | -0.046 |
Token | woman |
Token ID | 2415 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
Where | +0.025 |
See | +0.023 |
Oh | +0.023 |
Welcome | +0.022 |
Warning | +0.022 |
Neg logit contributions | |
ish | -0.031 |
Majesty | -0.028 |
majesty | -0.026 |
ci | -0.025 |
cient | -0.025 |
Token | always |
Token ID | 1464 |
Feature activation | -8.68e+00 |
Pos logit contributions | |
Where | +0.010 |
See | +0.009 |
On | +0.009 |
Oh | +0.008 |
That | +0.008 |
Neg logit contributions | |
ish | -0.024 |
Majesty | -0.024 |
majesty | -0.022 |
oppy | -0.021 |
cient | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | -8.37e+00 |
Pos logit contributions | |
Where | +0.005 |
Oh | +0.005 |
Welcome | +0.005 |
Warning | +0.004 |
See | +0.004 |
Neg logit contributions | |
ish | -0.014 |
Majesty | -0.012 |
oppy | -0.012 |
majesty | -0.011 |
cient | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -8.11e+00 |
Pos logit contributions | |
Where | +0.029 |
Warning | +0.026 |
Oh | +0.026 |
Welcome | +0.026 |
See | +0.025 |
Neg logit contributions | |
ish | -0.049 |
Majesty | -0.045 |
oppy | -0.044 |
majesty | -0.042 |
cient | -0.041 |
Token | He |
Token ID | 1544 |
Feature activation | -5.44e+00 |
Pos logit contributions | |
Warning | +0.021 |
Where | +0.021 |
See | +0.021 |
Welcome | +0.020 |
Oh | +0.020 |
Neg logit contributions | |
ish | -0.049 |
Majesty | -0.047 |
majesty | -0.043 |
cient | -0.042 |
ci | -0.042 |
Token | started |
Token ID | 2067 |
Feature activation | -6.38e+00 |
Pos logit contributions | |
Where | +0.020 |
See | +0.018 |
Oh | +0.018 |
On | +0.018 |
Welcome | +0.018 |
Neg logit contributions | |
ish | -0.037 |
Majesty | -0.033 |
majesty | -0.031 |
ci | -0.030 |
oppy | -0.030 |
Token | to |
Token ID | 284 |
Feature activation | -6.47e+00 |
Pos logit contributions | |
Where | +0.030 |
On | +0.027 |
See | +0.027 |
Oh | +0.026 |
Welcome | +0.026 |
Neg logit contributions | |
ish | -0.038 |
Majesty | -0.034 |
majesty | -0.031 |
oppy | -0.030 |
ci | -0.030 |
Token | t |
Token ID | 256 |
Feature activation | -5.87e-01 |
Pos logit contributions | |
Where | +0.026 |
On | +0.026 |
Who | +0.025 |
What | +0.024 |
Warning | +0.023 |
Neg logit contributions | |
ish | -0.040 |
Majesty | -0.036 |
majesty | -0.035 |
oppy | -0.033 |
cient | -0.032 |
Token | inker |
Token ID | 24275 |
Feature activation | -2.24e+00 |
Pos logit contributions | |
Where | +0.003 |
See | +0.003 |
Oh | +0.003 |
On | +0.003 |
Welcome | +0.003 |
Neg logit contributions | |
ish | -0.003 |
Majesty | -0.003 |
majesty | -0.002 |
ci | -0.002 |
cient | -0.002 |
Token | with |
Token ID | 351 |
Feature activation | -6.60e+00 |
Pos logit contributions | |
Where | +0.010 |
On | +0.009 |
See | +0.008 |
Welcome | +0.008 |
To | +0.008 |
Neg logit contributions | |
ish | -0.014 |
Majesty | -0.012 |
majesty | -0.012 |
oppy | -0.011 |
ci | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | -6.49e+00 |
Pos logit contributions | |
Where | +0.027 |
See | +0.024 |
Oh | +0.024 |
On | +0.023 |
Welcome | +0.023 |
Neg logit contributions | |
ish | -0.043 |
Majesty | -0.039 |
majesty | -0.035 |
ci | -0.035 |
oppy | -0.034 |
Token | and |
Token ID | 290 |
Feature activation | -7.63e+00 |
Pos logit contributions | |
Where | +0.034 |
See | +0.031 |
Oh | +0.031 |
Welcome | +0.031 |
Wow | +0.030 |
Neg logit contributions | |
ish | -0.035 |
Majesty | -0.030 |
ci | -0.027 |
majesty | -0.027 |
oppy | -0.026 |
Token | try |
Token ID | 1949 |
Feature activation | -8.96e+00 |
Pos logit contributions | |
Where | +0.029 |
See | +0.026 |
On | +0.025 |
Oh | +0.025 |
Welcome | +0.025 |
Neg logit contributions | |
ish | -0.051 |
Majesty | -0.046 |
majesty | -0.043 |
oppy | -0.042 |
ci | -0.042 |
Token |
|
Token ID | 198 |
Feature activation | -5.08e+00 |
Pos logit contributions | |
Where | +0.011 |
Warning | +0.010 |
Welcome | +0.009 |
Oh | +0.009 |
See | +0.009 |
Neg logit contributions | |
ish | -0.024 |
Majesty | -0.022 |
majesty | -0.021 |
oppy | -0.020 |
cient | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | -5.21e+00 |
Pos logit contributions | |
Where | +0.015 |
Oh | +0.013 |
Welcome | +0.013 |
See | +0.013 |
Warning | +0.012 |
Neg logit contributions | |
ish | -0.035 |
Majesty | -0.033 |
oppy | -0.031 |
majesty | -0.031 |
cient | -0.030 |
Token | They |
Token ID | 2990 |
Feature activation | -2.71e+00 |
Pos logit contributions | |
Where | +0.015 |
Welcome | +0.013 |
See | +0.013 |
Oh | +0.013 |
Warning | +0.012 |
Neg logit contributions | |
ish | -0.036 |
Majesty | -0.033 |
majesty | -0.032 |
oppy | -0.031 |
castle | -0.030 |
Token | get |
Token ID | 651 |
Feature activation | -2.98e+00 |
Pos logit contributions | |
On | +0.011 |
Where | +0.011 |
See | +0.010 |
He | +0.010 |
Warning | +0.010 |
Neg logit contributions | |
ish | -0.016 |
Majesty | -0.015 |
ci | -0.014 |
majesty | -0.013 |
cient | -0.013 |
Token | up |
Token ID | 510 |
Feature activation | -8.49e-01 |
Pos logit contributions | |
Where | +0.015 |
See | +0.013 |
Oh | +0.013 |
Welcome | +0.013 |
On | +0.013 |
Neg logit contributions | |
ish | -0.016 |
Majesty | -0.015 |
majesty | -0.014 |
oppy | -0.013 |
cient | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | -1.95e+00 |
Pos logit contributions | |
Where | +0.004 |
See | +0.004 |
Oh | +0.004 |
Welcome | +0.004 |
Wow | +0.004 |
Neg logit contributions | |
ish | -0.004 |
Majesty | -0.004 |
ci | -0.004 |
majesty | -0.003 |
oppy | -0.003 |
Token | walk |
Token ID | 2513 |
Feature activation | -6.12e-01 |
Pos logit contributions | |
Where | +0.009 |
On | +0.008 |
See | +0.007 |
What | +0.007 |
Who | +0.007 |
Neg logit contributions | |
ish | -0.011 |
Majesty | -0.011 |
majesty | -0.010 |
cient | -0.010 |
oppy | -0.010 |
Token | back |
Token ID | 736 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
Where | +0.003 |
See | +0.003 |
Oh | +0.003 |
Welcome | +0.003 |
On | +0.003 |
Neg logit contributions | |
ish | -0.003 |
Majesty | -0.003 |
ci | -0.002 |
majesty | -0.002 |
oppy | -0.002 |
Token | down |
Token ID | 866 |
Feature activation | -7.23e-01 |
Pos logit contributions | |
Where | +0.008 |
On | +0.008 |
See | +0.008 |
Oh | +0.008 |
Welcome | +0.007 |
Neg logit contributions | |
ish | -0.009 |
Majesty | -0.008 |
majesty | -0.008 |
cient | -0.007 |
ci | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +7.77e-01 |
Pos logit contributions | |
Where | +0.004 |
See | +0.004 |
Wow | +0.004 |
Listen | +0.004 |
Oh | +0.004 |
Neg logit contributions | |
ish | -0.003 |
ap | -0.002 |
Majesty | -0.002 |
ci | -0.002 |
oppy | -0.002 |
Token | hill |
Token ID | 12788 |
Feature activation | +2.87e+00 |
Pos logit contributions | |
ish | +0.004 |
Majesty | +0.003 |
majesty | +0.003 |
ci | +0.003 |
oppy | +0.003 |
Neg logit contributions | |
Where | -0.005 |
See | -0.004 |
Oh | -0.004 |
Welcome | -0.004 |
Warning | -0.004 |