Token | ition |
Token ID | 653 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
scribe | +0.036 |
results | +0.035 |
adem | +0.035 |
inen | +0.035 |
rior | +0.034 |
Neg logit contributions | |
ellen | -0.034 |
Developer | -0.032 |
rite | -0.031 |
taboola | -0.031 |
aux | -0.030 |
Token | Team |
Token ID | 4816 |
Feature activation | +4.88e-01 |
Pos logit contributions | |
scribe | +0.234 |
results | +0.229 |
adem | +0.228 |
inen | +0.225 |
rior | +0.220 |
Neg logit contributions | |
ellen | -0.251 |
Developer | -0.239 |
taboola | -0.234 |
rite | -0.233 |
yip | -0.224 |
Token |
|
Token ID | 198 |
Feature activation | +3.01e-02 |
Pos logit contributions | |
scribe | +0.109 |
results | +0.107 |
adem | +0.105 |
inen | +0.104 |
rior | +0.101 |
Neg logit contributions | |
ellen | -0.120 |
Developer | -0.115 |
rite | -0.112 |
taboola | -0.112 |
aux | -0.108 |
Token |
|
Token ID | 198 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.006 |
adem | +0.006 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.007 |
rite | -0.007 |
taboola | -0.007 |
yip | -0.007 |
Token | War |
Token ID | 13195 |
Feature activation | -3.97e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.011 |
rite | +0.011 |
taboola | +0.011 |
aux | +0.011 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.006 |
Token | � |
Token ID | 447 |
Feature activation | -7.96e-03 |
Pos logit contributions | |
scribe | +0.325 |
results | +0.318 |
adem | +0.316 |
inen | +0.312 |
rior | +0.308 |
Neg logit contributions | |
ellen | -0.325 |
Developer | -0.308 |
taboola | -0.302 |
rite | -0.299 |
yip | -0.290 |
Token | � |
Token ID | 247 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | Less |
Token ID | 12892 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
rite | -0.004 |
taboola | -0.004 |
yip | -0.003 |
Token | on |
Token ID | 261 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
scribe | +0.009 |
results | +0.009 |
adem | +0.009 |
inen | +0.009 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.006 |
rite | -0.006 |
taboola | -0.006 |
aux | -0.006 |
Token | vs |
Token ID | 3691 |
Feature activation | +1.98e-01 |
Pos logit contributions | |
ellen | +0.065 |
Developer | +0.062 |
rite | +0.061 |
taboola | +0.061 |
yip | +0.059 |
Neg logit contributions | |
scribe | -0.061 |
results | -0.060 |
adem | -0.060 |
inen | -0.059 |
rior | -0.057 |
Token | answered |
Token ID | 9373 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.018 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.021 |
Developer | -0.020 |
rite | -0.020 |
taboola | -0.020 |
yip | -0.019 |
Token | — |
Token ID | 851 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | Golden |
Token ID | 8407 |
Feature activation | -1.90e-01 |
Pos logit contributions | |
scribe | +0.031 |
results | +0.030 |
adem | +0.030 |
inen | +0.030 |
rior | +0.029 |
Neg logit contributions | |
ellen | -0.033 |
Developer | -0.031 |
rite | -0.030 |
taboola | -0.030 |
yip | -0.029 |
Token | State |
Token ID | 9012 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
ellen | +0.047 |
Developer | +0.045 |
rite | +0.044 |
taboola | +0.044 |
aux | +0.043 |
Neg logit contributions | |
scribe | -0.041 |
results | -0.041 |
adem | -0.040 |
inen | -0.040 |
rior | -0.039 |
Token | War |
Token ID | 13195 |
Feature activation | -5.66e-02 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.030 |
rite | +0.029 |
taboola | +0.029 |
aux | +0.028 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.024 |
adem | -0.024 |
inen | -0.023 |
rior | -0.023 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ellen | +0.025 |
Developer | +0.025 |
rite | +0.024 |
taboola | +0.024 |
aux | +0.024 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.000 |
Token | (@ |
Token ID | 4275 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
scribe | +0.237 |
results | +0.232 |
adem | +0.228 |
inen | +0.224 |
rior | +0.217 |
Neg logit contributions | |
ellen | -0.411 |
Developer | -0.395 |
rite | -0.390 |
taboola | -0.389 |
yip | -0.377 |
Token | war |
Token ID | 5767 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
scribe | +0.187 |
results | +0.184 |
adem | +0.182 |
inen | +0.180 |
rior | +0.176 |
Neg logit contributions | |
ellen | -0.161 |
Developer | -0.152 |
rite | -0.149 |
taboola | -0.148 |
aux | -0.142 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.004 |
adem | +0.004 |
inen | +0.003 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.088 |
Developer | -0.085 |
rite | -0.085 |
taboola | -0.085 |
aux | -0.083 |
Token | ) |
Token ID | 8 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
scribe | +0.289 |
results | +0.282 |
adem | +0.279 |
inen | +0.276 |
rior | +0.267 |
Neg logit contributions | |
ellen | -0.356 |
Developer | -0.340 |
rite | -0.334 |
taboola | -0.334 |
aux | -0.322 |
Token | September |
Token ID | 2693 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.009 |
adem | +0.009 |
inen | +0.009 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.011 |
Developer | -0.011 |
rite | -0.011 |
taboola | -0.011 |
yip | -0.010 |
Token | State |
Token ID | 9012 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
ellen | +0.047 |
Developer | +0.045 |
rite | +0.044 |
taboola | +0.044 |
aux | +0.043 |
Neg logit contributions | |
scribe | -0.041 |
results | -0.041 |
adem | -0.040 |
inen | -0.040 |
rior | -0.039 |
Token | War |
Token ID | 13195 |
Feature activation | -5.66e-02 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.030 |
rite | +0.029 |
taboola | +0.029 |
aux | +0.028 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.024 |
adem | -0.024 |
inen | -0.023 |
rior | -0.023 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.39e+00 |
Pos logit contributions | |
ellen | +0.025 |
Developer | +0.025 |
rite | +0.024 |
taboola | +0.024 |
aux | +0.024 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.000 |
Token | (@ |
Token ID | 4275 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
scribe | +0.237 |
results | +0.232 |
adem | +0.228 |
inen | +0.224 |
rior | +0.217 |
Neg logit contributions | |
ellen | -0.411 |
Developer | -0.395 |
rite | -0.390 |
taboola | -0.389 |
yip | -0.377 |
Token | war |
Token ID | 5767 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
scribe | +0.187 |
results | +0.184 |
adem | +0.182 |
inen | +0.180 |
rior | +0.176 |
Neg logit contributions | |
ellen | -0.161 |
Developer | -0.152 |
rite | -0.149 |
taboola | -0.148 |
aux | -0.142 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.38e+00 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.004 |
adem | +0.004 |
inen | +0.003 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.088 |
Developer | -0.085 |
rite | -0.085 |
taboola | -0.085 |
aux | -0.083 |
Token | ) |
Token ID | 8 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
scribe | +0.289 |
results | +0.282 |
adem | +0.279 |
inen | +0.276 |
rior | +0.267 |
Neg logit contributions | |
ellen | -0.356 |
Developer | -0.340 |
rite | -0.334 |
taboola | -0.334 |
aux | -0.322 |
Token | September |
Token ID | 2693 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.009 |
adem | +0.009 |
inen | +0.009 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.011 |
Developer | -0.011 |
rite | -0.011 |
taboola | -0.011 |
yip | -0.010 |
Token | 24 |
Token ID | 1987 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
scribe | +0.027 |
results | +0.027 |
inen | +0.026 |
adem | +0.026 |
rior | +0.025 |
Neg logit contributions | |
ellen | -0.035 |
Developer | -0.033 |
rite | -0.033 |
taboola | -0.033 |
yip | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
scribe | +0.048 |
results | +0.047 |
adem | +0.046 |
inen | +0.046 |
rior | +0.045 |
Neg logit contributions | |
ellen | -0.067 |
Developer | -0.064 |
rite | -0.063 |
taboola | -0.062 |
yip | -0.062 |
Token | 2016 |
Token ID | 1584 |
Feature activation | -2.66e-01 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
yip | -0.000 |
Token | @ |
Token ID | 2488 |
Feature activation | -4.48e-01 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.017 |
inen | +0.016 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.018 |
Developer | -0.017 |
rite | -0.016 |
taboola | -0.016 |
aux | -0.016 |
Token | Gl |
Token ID | 9861 |
Feature activation | +2.01e-01 |
Pos logit contributions | |
ellen | +0.111 |
Developer | +0.106 |
rite | +0.104 |
taboola | +0.103 |
aux | +0.100 |
Neg logit contributions | |
scribe | -0.099 |
results | -0.097 |
adem | -0.096 |
inen | -0.095 |
rior | -0.092 |
Token | as |
Token ID | 292 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
scribe | +0.042 |
results | +0.041 |
adem | +0.041 |
inen | +0.040 |
rior | +0.039 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.050 |
taboola | -0.049 |
rite | -0.049 |
yip | -0.047 |
Token | gow |
Token ID | 21175 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
scribe | +0.029 |
results | +0.028 |
adem | +0.028 |
inen | +0.027 |
rior | +0.026 |
Neg logit contributions | |
ellen | -0.038 |
Developer | -0.036 |
taboola | -0.036 |
rite | -0.036 |
yip | -0.035 |
Token | War |
Token ID | 13195 |
Feature activation | -7.83e-02 |
Pos logit contributions | |
scribe | +0.035 |
results | +0.034 |
adem | +0.034 |
inen | +0.034 |
rior | +0.033 |
Neg logit contributions | |
ellen | -0.031 |
Developer | -0.029 |
rite | -0.029 |
taboola | -0.029 |
aux | -0.027 |
Token | riors |
Token ID | 8657 |
Feature activation | +1.35e+00 |
Pos logit contributions | |
ellen | +0.036 |
Developer | +0.035 |
taboola | +0.035 |
rite | +0.035 |
yip | +0.034 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
rior | -0.000 |
adem | -0.000 |
riors | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
scribe | +0.301 |
results | +0.296 |
adem | +0.293 |
inen | +0.289 |
rior | +0.282 |
Neg logit contributions | |
ellen | -0.331 |
Developer | -0.316 |
rite | -0.310 |
taboola | -0.309 |
aux | -0.298 |
Token | Glasgow |
Token ID | 23995 |
Feature activation | +1.92e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.003 |
rior | -0.003 |
Token | Warriors |
Token ID | 12090 |
Feature activation | +4.62e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.006 |
rite | -0.006 |
taboola | -0.006 |
yip | -0.005 |
Token | appearances |
Token ID | 11057 |
Feature activation | +3.99e-01 |
Pos logit contributions | |
scribe | +0.102 |
results | +0.100 |
adem | +0.099 |
inen | +0.098 |
rior | +0.095 |
Neg logit contributions | |
ellen | -0.115 |
Developer | -0.110 |
rite | -0.107 |
taboola | -0.107 |
yip | -0.104 |
Token | and |
Token ID | 290 |
Feature activation | -3.69e-02 |
Pos logit contributions | |
scribe | +0.092 |
results | +0.090 |
adem | +0.089 |
inen | +0.088 |
rior | +0.086 |
Neg logit contributions | |
ellen | -0.096 |
Developer | -0.091 |
rite | -0.089 |
taboola | -0.089 |
yip | -0.087 |
Token | repeat |
Token ID | 44754 |
Feature activation | -2.55e-01 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | =" |
Token ID | 2625 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
ellen | +0.044 |
Developer | +0.041 |
taboola | +0.040 |
rite | +0.040 |
yip | +0.038 |
Neg logit contributions | |
scribe | -0.076 |
results | -0.075 |
adem | -0.074 |
inen | -0.073 |
rior | -0.072 |
Token | phone |
Token ID | 4862 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
ellen | +0.051 |
Developer | +0.048 |
rite | +0.047 |
taboola | +0.047 |
aux | +0.045 |
Neg logit contributions | |
scribe | -0.078 |
results | -0.077 |
adem | -0.076 |
inen | -0.076 |
rior | -0.074 |
Token | in |
Token ID | 287 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
ellen | +0.086 |
Developer | +0.082 |
rite | +0.081 |
taboola | +0.080 |
aux | +0.077 |
Neg logit contributions | |
scribe | -0.077 |
results | -0.076 |
adem | -0.075 |
inen | -0.074 |
rior | -0.073 |
Token | phones |
Token ID | 9512 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.006 |
rite | -0.006 |
taboola | -0.006 |
aux | -0.006 |
Token | "> |
Token ID | 5320 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
ellen | +0.144 |
Developer | +0.140 |
rite | +0.139 |
taboola | +0.138 |
aux | +0.136 |
Neg logit contributions | |
scribe | -0.021 |
results | -0.020 |
adem | -0.019 |
inen | -0.018 |
rior | -0.016 |
Token | < |
Token ID | 1279 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
scribe | +0.255 |
results | +0.250 |
adem | +0.246 |
inen | +0.243 |
rior | +0.236 |
Neg logit contributions | |
ellen | -0.365 |
Developer | -0.349 |
rite | -0.344 |
taboola | -0.343 |
yip | -0.331 |
Token | span |
Token ID | 12626 |
Feature activation | +1.37e-02 |
Pos logit contributions | |
scribe | +0.104 |
results | +0.103 |
adem | +0.102 |
inen | +0.101 |
rior | +0.098 |
Neg logit contributions | |
ellen | -0.102 |
Developer | -0.096 |
rite | -0.095 |
taboola | -0.094 |
aux | -0.091 |
Token | ng |
Token ID | 23370 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | - |
Token ID | 12 |
Feature activation | +4.29e-02 |
Pos logit contributions | |
scribe | +0.051 |
results | +0.050 |
adem | +0.049 |
inen | +0.048 |
rior | +0.047 |
Neg logit contributions | |
ellen | -0.063 |
Developer | -0.060 |
taboola | -0.058 |
rite | -0.058 |
yip | -0.057 |
Token | bind |
Token ID | 21653 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.010 |
taboola | -0.009 |
rite | -0.009 |
yip | -0.009 |
Token | controller |
Token ID | 36500 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
taboola | +0.003 |
rite | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | =" |
Token ID | 2625 |
Feature activation | -2.71e-01 |
Pos logit contributions | |
ellen | +0.022 |
Developer | +0.021 |
taboola | +0.021 |
rite | +0.021 |
yip | +0.020 |
Neg logit contributions | |
scribe | -0.026 |
results | -0.026 |
adem | -0.025 |
inen | -0.025 |
rior | -0.024 |
Token | Phone |
Token ID | 6132 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
ellen | +0.063 |
Developer | +0.059 |
rite | +0.058 |
taboola | +0.058 |
yip | +0.056 |
Neg logit contributions | |
scribe | -0.064 |
results | -0.063 |
adem | -0.062 |
inen | -0.062 |
rior | -0.060 |
Token | List |
Token ID | 8053 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
aux | -0.003 |
Token | Ctrl |
Token ID | 40069 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
scribe | +0.041 |
results | +0.040 |
adem | +0.040 |
inen | +0.039 |
rior | +0.038 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.050 |
rite | -0.049 |
taboola | -0.049 |
aux | -0.047 |
Token | "> |
Token ID | 5320 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
ellen | +0.067 |
Developer | +0.065 |
rite | +0.064 |
taboola | +0.064 |
aux | +0.063 |
Neg logit contributions | |
scribe | -0.023 |
results | -0.023 |
adem | -0.022 |
inen | -0.022 |
rior | -0.021 |
Token | < |
Token ID | 1279 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
scribe | +0.197 |
results | +0.193 |
adem | +0.187 |
inen | +0.183 |
rior | +0.178 |
Neg logit contributions | |
ellen | -0.424 |
Developer | -0.406 |
rite | -0.401 |
taboola | -0.401 |
yip | -0.391 |
Token | ul |
Token ID | 377 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
scribe | +0.100 |
results | +0.099 |
adem | +0.097 |
inen | +0.096 |
rior | +0.094 |
Neg logit contributions | |
ellen | -0.103 |
Developer | -0.098 |
rite | -0.096 |
taboola | -0.096 |
yip | -0.092 |
Token | > |
Token ID | 29 |
Feature activation | +3.77e-02 |
Pos logit contributions | |
scribe | +0.047 |
results | +0.047 |
adem | +0.046 |
inen | +0.045 |
rior | +0.044 |
Neg logit contributions | |
ellen | -0.053 |
Developer | -0.051 |
rite | -0.050 |
taboola | -0.050 |
aux | -0.048 |
Token | < |
Token ID | 1279 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.012 |
rite | -0.012 |
taboola | -0.012 |
yip | -0.011 |
Token | li |
Token ID | 4528 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
scribe | +0.125 |
results | +0.124 |
adem | +0.122 |
inen | +0.121 |
rior | +0.118 |
Neg logit contributions | |
ellen | -0.087 |
Developer | -0.082 |
rite | -0.080 |
taboola | -0.079 |
yip | -0.076 |
Token | controller |
Token ID | 36500 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
yip | -0.005 |
Token | =" |
Token ID | 2625 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.015 |
rite | +0.015 |
taboola | +0.015 |
aux | +0.014 |
Neg logit contributions | |
scribe | -0.030 |
results | -0.030 |
adem | -0.030 |
inen | -0.029 |
rior | -0.029 |
Token | Phone |
Token ID | 6132 |
Feature activation | +3.97e-02 |
Pos logit contributions | |
ellen | +0.058 |
Developer | +0.055 |
rite | +0.054 |
taboola | +0.054 |
aux | +0.052 |
Neg logit contributions | |
scribe | -0.065 |
results | -0.064 |
adem | -0.063 |
inen | -0.062 |
rior | -0.061 |
Token | List |
Token ID | 8053 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.010 |
rite | -0.010 |
taboola | -0.010 |
aux | -0.009 |
Token | Ctrl |
Token ID | 40069 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
scribe | +0.049 |
results | +0.048 |
adem | +0.048 |
inen | +0.047 |
rior | +0.046 |
Neg logit contributions | |
ellen | -0.043 |
Developer | -0.041 |
rite | -0.040 |
taboola | -0.040 |
aux | -0.038 |
Token | "> |
Token ID | 5320 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
ellen | +0.064 |
Developer | +0.062 |
rite | +0.062 |
taboola | +0.061 |
aux | +0.060 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.009 |
adem | -0.009 |
inen | -0.008 |
rior | -0.007 |
Token | < |
Token ID | 1279 |
Feature activation | +4.34e-01 |
Pos logit contributions | |
scribe | +0.195 |
results | +0.190 |
adem | +0.187 |
inen | +0.183 |
rior | +0.176 |
Neg logit contributions | |
ellen | -0.423 |
Developer | -0.408 |
rite | -0.402 |
taboola | -0.401 |
aux | -0.390 |
Token | ul |
Token ID | 377 |
Feature activation | +2.40e-01 |
Pos logit contributions | |
scribe | +0.087 |
results | +0.085 |
adem | +0.084 |
inen | +0.083 |
rior | +0.080 |
Neg logit contributions | |
ellen | -0.116 |
Developer | -0.111 |
rite | -0.110 |
taboola | -0.109 |
aux | -0.105 |
Token | > |
Token ID | 29 |
Feature activation | +7.62e-02 |
Pos logit contributions | |
scribe | +0.054 |
results | +0.053 |
adem | +0.052 |
inen | +0.052 |
rior | +0.050 |
Neg logit contributions | |
ellen | -0.059 |
Developer | -0.056 |
rite | -0.055 |
taboola | -0.055 |
aux | -0.053 |
Token | < |
Token ID | 1279 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
scribe | +0.011 |
results | +0.011 |
adem | +0.011 |
inen | +0.011 |
rior | +0.010 |
Neg logit contributions | |
ellen | -0.024 |
Developer | -0.023 |
rite | -0.023 |
taboola | -0.023 |
aux | -0.022 |
Token | li |
Token ID | 4528 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
scribe | +0.128 |
results | +0.126 |
adem | +0.125 |
inen | +0.124 |
rior | +0.121 |
Neg logit contributions | |
ellen | -0.086 |
Developer | -0.081 |
rite | -0.079 |
taboola | -0.078 |
aux | -0.074 |
Token | repeat |
Token ID | 44754 |
Feature activation | -2.59e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
taboola | +0.002 |
rite | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | =" |
Token ID | 2625 |
Feature activation | -2.81e-01 |
Pos logit contributions | |
ellen | +0.045 |
Developer | +0.042 |
taboola | +0.041 |
rite | +0.040 |
yip | +0.038 |
Neg logit contributions | |
scribe | -0.076 |
results | -0.075 |
adem | -0.075 |
inen | -0.074 |
rior | -0.073 |
Token | phone |
Token ID | 4862 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ellen | +0.064 |
Developer | +0.061 |
rite | +0.060 |
taboola | +0.060 |
aux | +0.057 |
Neg logit contributions | |
scribe | -0.067 |
results | -0.066 |
adem | -0.065 |
inen | -0.065 |
rior | -0.063 |
Token | in |
Token ID | 287 |
Feature activation | -6.69e-03 |
Pos logit contributions | |
ellen | +0.089 |
Developer | +0.085 |
rite | +0.083 |
taboola | +0.083 |
aux | +0.080 |
Neg logit contributions | |
scribe | -0.076 |
results | -0.075 |
adem | -0.074 |
inen | -0.073 |
rior | -0.071 |
Token | phones |
Token ID | 9512 |
Feature activation | -3.54e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.001 |
rior | -0.001 |
Token | "> |
Token ID | 5320 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
ellen | +0.103 |
Developer | +0.099 |
rite | +0.098 |
taboola | +0.097 |
yip | +0.095 |
Neg logit contributions | |
scribe | -0.063 |
results | -0.061 |
adem | -0.060 |
inen | -0.059 |
rior | -0.057 |
Token | {{ |
Token ID | 22935 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
scribe | +0.205 |
results | +0.202 |
adem | +0.195 |
inen | +0.193 |
rior | +0.185 |
Neg logit contributions | |
ellen | -0.414 |
Developer | -0.396 |
rite | -0.391 |
taboola | -0.390 |
yip | -0.380 |
Token | phone |
Token ID | 3072 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
scribe | +0.088 |
results | +0.086 |
adem | +0.086 |
inen | +0.085 |
rior | +0.083 |
Neg logit contributions | |
ellen | -0.072 |
Developer | -0.068 |
rite | -0.067 |
taboola | -0.066 |
aux | -0.063 |
Token | . |
Token ID | 13 |
Feature activation | -4.41e-03 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.033 |
rite | +0.032 |
taboola | +0.032 |
yip | +0.031 |
Neg logit contributions | |
scribe | -0.028 |
results | -0.027 |
adem | -0.027 |
inen | -0.027 |
rior | -0.026 |
Token | name |
Token ID | 3672 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | }} |
Token ID | 34949 |
Feature activation | +2.62e-01 |
Pos logit contributions | |
ellen | +0.025 |
Developer | +0.024 |
rite | +0.024 |
taboola | +0.024 |
yip | +0.023 |
Neg logit contributions | |
scribe | -0.019 |
results | -0.018 |
adem | -0.018 |
inen | -0.018 |
rior | -0.017 |
Token | phone |
Token ID | 4862 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ellen | +0.053 |
Developer | +0.050 |
rite | +0.049 |
taboola | +0.048 |
aux | +0.046 |
Neg logit contributions | |
scribe | -0.080 |
results | -0.079 |
adem | -0.079 |
inen | -0.078 |
rior | -0.076 |
Token | . |
Token ID | 13 |
Feature activation | -6.38e-03 |
Pos logit contributions | |
ellen | +0.092 |
Developer | +0.089 |
rite | +0.087 |
taboola | +0.087 |
aux | +0.084 |
Neg logit contributions | |
scribe | -0.072 |
results | -0.071 |
adem | -0.070 |
inen | -0.069 |
rior | -0.067 |
Token | sn |
Token ID | 16184 |
Feature activation | -2.77e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | ipp |
Token ID | 3974 |
Feature activation | +3.95e-01 |
Pos logit contributions | |
ellen | +0.092 |
Developer | +0.090 |
taboola | +0.089 |
rite | +0.088 |
yip | +0.086 |
Neg logit contributions | |
scribe | -0.037 |
results | -0.036 |
adem | -0.036 |
inen | -0.035 |
rior | -0.033 |
Token | et |
Token ID | 316 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
scribe | +0.099 |
results | +0.097 |
adem | +0.097 |
inen | +0.095 |
rior | +0.093 |
Neg logit contributions | |
ellen | -0.085 |
Developer | -0.083 |
taboola | -0.081 |
rite | -0.080 |
yip | -0.076 |
Token | "> |
Token ID | 5320 |
Feature activation | +1.32e+00 |
Pos logit contributions | |
ellen | +0.051 |
Developer | +0.049 |
rite | +0.048 |
taboola | +0.048 |
aux | +0.047 |
Neg logit contributions | |
scribe | -0.016 |
results | -0.016 |
adem | -0.015 |
inen | -0.015 |
rior | -0.014 |
Token | Optional |
Token ID | 30719 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
scribe | +0.228 |
results | +0.223 |
adem | +0.219 |
inen | +0.216 |
rior | +0.208 |
Neg logit contributions | |
ellen | -0.388 |
Developer | -0.373 |
rite | -0.367 |
taboola | -0.367 |
yip | -0.355 |
Token | : |
Token ID | 25 |
Feature activation | -6.03e-02 |
Pos logit contributions | |
scribe | +0.054 |
results | +0.053 |
adem | +0.052 |
inen | +0.052 |
rior | +0.050 |
Neg logit contributions | |
ellen | -0.074 |
Developer | -0.071 |
taboola | -0.070 |
rite | -0.070 |
yip | -0.067 |
Token | visually |
Token ID | 22632 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ellen | +0.015 |
Developer | +0.014 |
taboola | +0.014 |
rite | +0.014 |
yip | +0.013 |
Neg logit contributions | |
scribe | -0.013 |
results | -0.013 |
adem | -0.013 |
inen | -0.013 |
rior | -0.012 |
Token | pleasing |
Token ID | 28790 |
Feature activation | -4.45e-01 |
Pos logit contributions | |
scribe | +0.028 |
results | +0.027 |
adem | +0.027 |
inen | +0.027 |
rior | +0.026 |
Neg logit contributions | |
ellen | -0.026 |
Developer | -0.025 |
rite | -0.025 |
taboola | -0.025 |
yip | -0.024 |
Token | placeholder |
Token ID | 46076 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
ellen | +0.115 |
Developer | +0.110 |
rite | +0.108 |
taboola | +0.108 |
yip | +0.104 |
Neg logit contributions | |
scribe | -0.093 |
results | -0.091 |
adem | -0.090 |
inen | -0.089 |
rior | -0.087 |
Token | omm |
Token ID | 2002 |
Feature activation | +4.63e-01 |
Pos logit contributions | |
ellen | +0.127 |
Developer | +0.122 |
rite | +0.119 |
taboola | +0.119 |
aux | +0.114 |
Neg logit contributions | |
scribe | -0.115 |
results | -0.113 |
adem | -0.112 |
inen | -0.110 |
rior | -0.107 |
Token | i |
Token ID | 72 |
Feature activation | -2.21e-03 |
Pos logit contributions | |
scribe | +0.108 |
results | +0.105 |
adem | +0.105 |
inen | +0.104 |
rior | +0.101 |
Neg logit contributions | |
ellen | -0.109 |
Developer | -0.104 |
taboola | -0.103 |
rite | -0.102 |
yip | -0.098 |
Token | L |
Token ID | 406 |
Feature activation | +1.75e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.000 |
aux | +0.000 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | ä |
Token ID | 11033 |
Feature activation | +3.60e-03 |
Pos logit contributions | |
scribe | +0.039 |
results | +0.038 |
adem | +0.038 |
inen | +0.037 |
rior | +0.036 |
Neg logit contributions | |
ellen | -0.043 |
Developer | -0.041 |
rite | -0.040 |
taboola | -0.040 |
yip | -0.039 |
Token | nt |
Token ID | 429 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | inen |
Token ID | 42326 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
ellen | +0.120 |
Developer | +0.114 |
rite | +0.112 |
taboola | +0.112 |
aux | +0.108 |
Neg logit contributions | |
scribe | -0.102 |
results | -0.100 |
adem | -0.099 |
inen | -0.097 |
rior | -0.095 |
Token | , |
Token ID | 11 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
scribe | +0.280 |
results | +0.274 |
adem | +0.272 |
inen | +0.270 |
rior | +0.261 |
Neg logit contributions | |
ellen | -0.334 |
Developer | -0.320 |
taboola | -0.314 |
rite | -0.314 |
yip | -0.302 |
Token | Sus |
Token ID | 8932 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.005 |
taboola | -0.005 |
rite | -0.005 |
yip | -0.005 |
Token | anna |
Token ID | 7697 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
scribe | +0.054 |
results | +0.053 |
adem | +0.052 |
inen | +0.052 |
rior | +0.050 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.049 |
rite | -0.048 |
taboola | -0.048 |
aux | -0.046 |
Token | Ha |
Token ID | 9398 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
ellen | +0.042 |
Developer | +0.040 |
rite | +0.039 |
taboola | +0.039 |
yip | +0.038 |
Neg logit contributions | |
scribe | -0.039 |
results | -0.038 |
adem | -0.038 |
inen | -0.038 |
rior | -0.037 |
Token | av |
Token ID | 615 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
scribe | +0.051 |
results | +0.050 |
adem | +0.049 |
inen | +0.049 |
rior | +0.048 |
Neg logit contributions | |
ellen | -0.050 |
Developer | -0.048 |
rite | -0.047 |
taboola | -0.046 |
aux | -0.045 |
Token | ully |
Token ID | 2132 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
scribe | +0.052 |
results | +0.051 |
adem | +0.050 |
inen | +0.050 |
rior | +0.048 |
Neg logit contributions | |
ellen | -0.060 |
Developer | -0.057 |
taboola | -0.056 |
rite | -0.056 |
yip | -0.054 |
Token | / |
Token ID | 14 |
Feature activation | +9.27e-02 |
Pos logit contributions | |
scribe | +0.048 |
results | +0.047 |
adem | +0.046 |
inen | +0.046 |
rior | +0.045 |
Neg logit contributions | |
ellen | -0.054 |
Developer | -0.051 |
taboola | -0.050 |
rite | -0.050 |
yip | -0.048 |
Token | Vict |
Token ID | 21944 |
Feature activation | +1.50e-01 |
Pos logit contributions | |
scribe | +0.024 |
results | +0.024 |
adem | +0.023 |
inen | +0.023 |
rior | +0.023 |
Neg logit contributions | |
ellen | -0.020 |
Developer | -0.018 |
taboola | -0.018 |
rite | -0.018 |
yip | -0.017 |
Token | im |
Token ID | 320 |
Feature activation | +2.18e-01 |
Pos logit contributions | |
scribe | +0.028 |
results | +0.027 |
adem | +0.027 |
inen | +0.027 |
rior | +0.026 |
Neg logit contributions | |
ellen | -0.042 |
Developer | -0.041 |
rite | -0.040 |
taboola | -0.040 |
yip | -0.038 |
Token | Question |
Token ID | 18233 |
Feature activation | +5.90e-02 |
Pos logit contributions | |
scribe | +0.046 |
results | +0.045 |
adem | +0.045 |
inen | +0.044 |
rior | +0.043 |
Neg logit contributions | |
ellen | -0.056 |
Developer | -0.053 |
taboola | -0.052 |
rite | -0.052 |
yip | -0.050 |
Token | naire |
Token ID | 24042 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.024 |
Developer | -0.023 |
rite | -0.023 |
taboola | -0.023 |
aux | -0.023 |
Token | [ |
Token ID | 685 |
Feature activation | -2.24e-01 |
Pos logit contributions | |
scribe | +0.278 |
results | +0.273 |
adem | +0.270 |
inen | +0.267 |
rior | +0.259 |
Neg logit contributions | |
ellen | -0.321 |
Developer | -0.307 |
rite | -0.301 |
taboola | -0.300 |
yip | -0.289 |
Token | M |
Token ID | 44 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
ellen | +0.051 |
Developer | +0.049 |
taboola | +0.048 |
rite | +0.048 |
yip | +0.046 |
Neg logit contributions | |
scribe | -0.054 |
results | -0.053 |
adem | -0.052 |
inen | -0.052 |
rior | -0.050 |
Token | imeo |
Token ID | 47776 |
Feature activation | -5.93e-03 |
Pos logit contributions | |
scribe | +0.029 |
results | +0.029 |
adem | +0.028 |
inen | +0.028 |
rior | +0.027 |
Neg logit contributions | |
ellen | -0.032 |
Developer | -0.031 |
rite | -0.030 |
taboola | -0.030 |
aux | -0.029 |
Token | ]. |
Token ID | 4083 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.001 |
Token | Ber |
Token ID | 4312 |
Feature activation | +3.20e-01 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.032 |
rite | +0.032 |
taboola | +0.032 |
yip | +0.031 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.028 |
adem | -0.028 |
inen | -0.028 |
rior | -0.027 |
Token | not |
Token ID | 407 |
Feature activation | +7.00e-02 |
Pos logit contributions | |
ellen | +0.007 |
Developer | +0.007 |
rite | +0.007 |
taboola | +0.007 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token | - |
Token ID | 12 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
scribe | +0.016 |
results | +0.016 |
adem | +0.015 |
inen | +0.015 |
rior | +0.015 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.016 |
taboola | -0.016 |
yip | -0.015 |
Token | so |
Token ID | 568 |
Feature activation | +2.29e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | - |
Token ID | 12 |
Feature activation | +1.01e-05 |
Pos logit contributions | |
scribe | +0.051 |
results | +0.050 |
adem | +0.049 |
inen | +0.049 |
rior | +0.048 |
Neg logit contributions | |
ellen | -0.056 |
Developer | -0.054 |
rite | -0.053 |
taboola | -0.053 |
aux | -0.051 |
Token | sub |
Token ID | 7266 |
Feature activation | -1.59e-03 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
aux | -0.000 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | emotions |
Token ID | 10825 |
Feature activation | +9.81e-02 |
Pos logit contributions | |
scribe | +0.295 |
results | +0.290 |
adem | +0.287 |
inen | +0.284 |
rior | +0.277 |
Neg logit contributions | |
ellen | -0.298 |
Developer | -0.283 |
rite | -0.278 |
taboola | -0.277 |
yip | -0.266 |
Token | Robert |
Token ID | 5199 |
Feature activation | +3.34e-01 |
Pos logit contributions | |
scribe | +0.023 |
results | +0.023 |
adem | +0.022 |
inen | +0.022 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.023 |
Developer | -0.022 |
rite | -0.021 |
taboola | -0.021 |
aux | -0.020 |
Token | Black |
Token ID | 2619 |
Feature activation | +2.15e-01 |
Pos logit contributions | |
scribe | +0.075 |
results | +0.073 |
adem | +0.073 |
inen | +0.072 |
rior | +0.070 |
Neg logit contributions | |
ellen | -0.082 |
Developer | -0.078 |
rite | -0.076 |
taboola | -0.076 |
aux | -0.073 |
Token | and |
Token ID | 290 |
Feature activation | -2.96e-04 |
Pos logit contributions | |
scribe | +0.048 |
results | +0.047 |
adem | +0.047 |
inen | +0.046 |
rior | +0.045 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.050 |
rite | -0.049 |
taboola | -0.049 |
yip | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | -9.81e-03 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | Eco |
Token ID | 38719 |
Feature activation | -6.51e-02 |
Pos logit contributions | |
scribe | +0.033 |
results | +0.032 |
adem | +0.032 |
inen | +0.032 |
rior | +0.031 |
Neg logit contributions | |
ellen | -0.030 |
Developer | -0.028 |
taboola | -0.028 |
rite | -0.027 |
yip | -0.027 |
Token | Boost |
Token ID | 45686 |
Feature activation | -4.13e-01 |
Pos logit contributions | |
ellen | +0.010 |
Developer | +0.009 |
taboola | +0.009 |
rite | +0.009 |
yip | +0.009 |
Neg logit contributions | |
scribe | -0.020 |
results | -0.020 |
adem | -0.020 |
inen | -0.019 |
rior | -0.019 |
Token | proved |
Token ID | 8302 |
Feature activation | -3.00e-01 |
Pos logit contributions | |
ellen | +0.091 |
Developer | +0.087 |
taboola | +0.085 |
rite | +0.084 |
yip | +0.082 |
Neg logit contributions | |
scribe | -0.102 |
results | -0.101 |
adem | -0.099 |
inen | -0.098 |
rior | -0.096 |
Token | its |
Token ID | 663 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
ellen | +0.073 |
Developer | +0.070 |
taboola | +0.068 |
rite | +0.068 |
yip | +0.066 |
Neg logit contributions | |
scribe | -0.068 |
results | -0.067 |
adem | -0.066 |
inen | -0.065 |
rior | -0.063 |
Token | met |
Token ID | 1138 |
Feature activation | -4.91e-02 |
Pos logit contributions | |
ellen | +0.036 |
Developer | +0.034 |
rite | +0.033 |
taboola | +0.033 |
yip | +0.032 |
Neg logit contributions | |
scribe | -0.039 |
results | -0.039 |
adem | -0.038 |
inen | -0.038 |
rior | -0.037 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.017 |
rite | +0.016 |
taboola | +0.016 |
yip | +0.016 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.005 |
rior | -0.005 |
Token | off |
Token ID | 572 |
Feature activation | -1.96e-01 |
Pos logit contributions | |
scribe | +0.268 |
results | +0.264 |
adem | +0.261 |
inen | +0.258 |
rior | +0.251 |
Neg logit contributions | |
ellen | -0.321 |
Developer | -0.307 |
taboola | -0.302 |
rite | -0.301 |
yip | -0.291 |
Token | - |
Token ID | 12 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ellen | +0.050 |
Developer | +0.047 |
rite | +0.047 |
taboola | +0.046 |
yip | +0.045 |
Neg logit contributions | |
scribe | -0.042 |
results | -0.041 |
adem | -0.041 |
inen | -0.040 |
rior | -0.039 |
Token | road |
Token ID | 6344 |
Feature activation | +3.28e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | – |
Token ID | 784 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
scribe | +0.070 |
results | +0.069 |
adem | +0.068 |
inen | +0.067 |
rior | +0.066 |
Neg logit contributions | |
ellen | -0.084 |
Developer | -0.080 |
taboola | -0.078 |
rite | -0.078 |
yip | -0.076 |
Token | racing |
Token ID | 11717 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.006 |
taboola | -0.005 |
rite | -0.005 |
yip | -0.005 |
Token | level |
Token ID | 1241 |
Feature activation | +1.59e-01 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
taboola | -0.004 |
rite | -0.004 |
yip | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
scribe | +0.036 |
results | +0.036 |
adem | +0.035 |
inen | +0.035 |
rior | +0.034 |
Neg logit contributions | |
ellen | -0.038 |
Developer | -0.036 |
taboola | -0.036 |
rite | -0.035 |
yip | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | -1.07e-03 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +4.65e-03 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | ST |
Token ID | 2257 |
Feature activation | -9.32e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | ORY |
Token ID | 15513 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
ellen | +0.036 |
Developer | +0.035 |
rite | +0.035 |
taboola | +0.035 |
aux | +0.034 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.006 |
rior | -0.006 |
Token | : |
Token ID | 25 |
Feature activation | -3.48e-02 |
Pos logit contributions | |
scribe | +0.278 |
results | +0.273 |
inen | +0.268 |
adem | +0.268 |
rior | +0.261 |
Neg logit contributions | |
ellen | -0.308 |
Developer | -0.292 |
rite | -0.289 |
taboola | -0.287 |
yip | -0.281 |
Token | Treasury |
Token ID | 13419 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.008 |
rite | +0.008 |
taboola | +0.008 |
yip | +0.008 |
Neg logit contributions | |
scribe | -0.008 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | will |
Token ID | 481 |
Feature activation | +6.21e-02 |
Pos logit contributions | |
ellen | +0.042 |
Developer | +0.040 |
rite | +0.039 |
taboola | +0.039 |
aux | +0.038 |
Neg logit contributions | |
scribe | -0.036 |
results | -0.036 |
adem | -0.035 |
inen | -0.035 |
rior | -0.034 |
Token | run |
Token ID | 1057 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.016 |
adem | +0.016 |
inen | +0.016 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.012 |
rite | -0.012 |
taboola | -0.012 |
yip | -0.011 |
Token | out |
Token ID | 503 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
ellen | +0.118 |
Developer | +0.112 |
rite | +0.110 |
taboola | +0.110 |
aux | +0.106 |
Neg logit contributions | |
scribe | -0.110 |
results | -0.108 |
adem | -0.106 |
inen | -0.105 |
rior | -0.102 |
Token | she |
Token ID | 673 |
Feature activation | +8.81e-02 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.007 |
adem | +0.007 |
inen | +0.007 |
rior | +0.007 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.008 |
rite | -0.008 |
taboola | -0.008 |
aux | -0.007 |
Token | reported |
Token ID | 2098 |
Feature activation | +6.85e-03 |
Pos logit contributions | |
scribe | +0.020 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.021 |
Developer | -0.020 |
rite | -0.020 |
taboola | -0.020 |
yip | -0.019 |
Token | that |
Token ID | 326 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.002 |
Token | had |
Token ID | 550 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.019 |
Developer | -0.018 |
rite | -0.018 |
taboola | -0.018 |
aux | -0.017 |
Token | sequ |
Token ID | 4726 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | enced |
Token ID | 5864 |
Feature activation | +5.18e-01 |
Pos logit contributions | |
scribe | +0.169 |
results | +0.164 |
adem | +0.161 |
inen | +0.160 |
rior | +0.149 |
Neg logit contributions | |
ellen | -0.413 |
Developer | -0.403 |
taboola | -0.399 |
rite | -0.396 |
yip | -0.389 |
Token | proteins |
Token ID | 15568 |
Feature activation | -5.06e-03 |
Pos logit contributions | |
scribe | +0.114 |
results | +0.112 |
adem | +0.111 |
inen | +0.109 |
rior | +0.106 |
Neg logit contributions | |
ellen | -0.129 |
Developer | -0.123 |
taboola | -0.120 |
rite | -0.120 |
yip | -0.116 |
Token | in |
Token ID | 287 |
Feature activation | -4.64e-03 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
taboola | +0.001 |
rite | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +3.23e-03 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | dinosaur |
Token ID | 28257 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | Journal |
Token ID | 4913 |
Feature activation | +1.83e-01 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
rite | -0.004 |
taboola | -0.004 |
yip | -0.004 |
Token | � |
Token ID | 447 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
scribe | +0.041 |
results | +0.040 |
adem | +0.039 |
inen | +0.039 |
rior | +0.038 |
Neg logit contributions | |
ellen | -0.045 |
Developer | -0.043 |
rite | -0.042 |
taboola | -0.042 |
yip | -0.041 |
Token | � |
Token ID | 247 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
ellen | +0.008 |
Developer | +0.008 |
rite | +0.008 |
taboola | +0.007 |
yip | +0.007 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
inen | -0.007 |
adem | -0.007 |
rior | -0.007 |
Token | s |
Token ID | 82 |
Feature activation | -4.42e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | Yar |
Token ID | 45184 |
Feature activation | +2.82e-02 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.010 |
rite | +0.010 |
taboola | +0.010 |
yip | +0.010 |
Neg logit contributions | |
scribe | -0.010 |
results | -0.010 |
adem | -0.010 |
inen | -0.010 |
rior | -0.009 |
Token | oslav |
Token ID | 26388 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.009 |
rite | -0.009 |
taboola | -0.009 |
yip | -0.008 |
Token | Tro |
Token ID | 8498 |
Feature activation | +2.03e-01 |
Pos logit contributions | |
scribe | +0.281 |
results | +0.276 |
adem | +0.273 |
inen | +0.271 |
rior | +0.264 |
Neg logit contributions | |
ellen | -0.302 |
Developer | -0.290 |
taboola | -0.285 |
rite | -0.284 |
yip | -0.272 |
Token | f |
Token ID | 69 |
Feature activation | +8.93e-02 |
Pos logit contributions | |
scribe | +0.044 |
results | +0.043 |
adem | +0.043 |
inen | +0.042 |
rior | +0.041 |
Neg logit contributions | |
ellen | -0.051 |
Developer | -0.049 |
rite | -0.048 |
taboola | -0.048 |
aux | -0.046 |
Token | imov |
Token ID | 44273 |
Feature activation | +4.24e-01 |
Pos logit contributions | |
scribe | +0.015 |
results | +0.014 |
adem | +0.014 |
inen | +0.014 |
rior | +0.014 |
Neg logit contributions | |
ellen | -0.027 |
Developer | -0.026 |
rite | -0.026 |
taboola | -0.026 |
yip | -0.025 |
Token | reports |
Token ID | 3136 |
Feature activation | -4.49e-02 |
Pos logit contributions | |
scribe | +0.096 |
results | +0.095 |
adem | +0.094 |
inen | +0.093 |
rior | +0.091 |
Neg logit contributions | |
ellen | -0.102 |
Developer | -0.097 |
rite | -0.095 |
taboola | -0.095 |
yip | -0.091 |
Token | this |
Token ID | 428 |
Feature activation | -8.40e-02 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.011 |
rite | +0.011 |
taboola | +0.011 |
aux | +0.010 |
Neg logit contributions | |
scribe | -0.010 |
results | -0.009 |
adem | -0.009 |
inen | -0.009 |
rior | -0.009 |
Token | into |
Token ID | 656 |
Feature activation | +1.68e-01 |
Pos logit contributions | |
ellen | +0.086 |
Developer | +0.082 |
rite | +0.081 |
taboola | +0.081 |
yip | +0.078 |
Neg logit contributions | |
scribe | -0.063 |
results | -0.062 |
adem | -0.061 |
inen | -0.061 |
rior | -0.059 |
Token | beat |
Token ID | 4405 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
scribe | +0.037 |
results | +0.036 |
adem | +0.036 |
inen | +0.035 |
rior | +0.034 |
Neg logit contributions | |
ellen | -0.042 |
Developer | -0.040 |
rite | -0.039 |
taboola | -0.039 |
yip | -0.038 |
Token | ings |
Token ID | 654 |
Feature activation | +4.53e-01 |
Pos logit contributions | |
ellen | +0.059 |
Developer | +0.057 |
rite | +0.056 |
taboola | +0.056 |
yip | +0.055 |
Neg logit contributions | |
scribe | -0.021 |
results | -0.020 |
adem | -0.020 |
inen | -0.020 |
rior | -0.019 |
Token | in |
Token ID | 287 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
scribe | +0.101 |
results | +0.100 |
adem | +0.098 |
inen | +0.098 |
rior | +0.095 |
Neg logit contributions | |
ellen | -0.111 |
Developer | -0.106 |
taboola | -0.103 |
rite | -0.103 |
yip | -0.099 |
Token | Yar |
Token ID | 45184 |
Feature activation | +3.13e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | oslav |
Token ID | 26388 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.013 |
Developer | -0.013 |
rite | -0.013 |
taboola | -0.013 |
yip | -0.013 |
Token | l |
Token ID | 75 |
Feature activation | +2.52e-01 |
Pos logit contributions | |
scribe | +0.235 |
results | +0.230 |
adem | +0.227 |
inen | +0.224 |
rior | +0.217 |
Neg logit contributions | |
ellen | -0.348 |
Developer | -0.335 |
taboola | -0.329 |
rite | -0.328 |
yip | -0.318 |
Token | Colony |
Token ID | 34480 |
Feature activation | -2.78e-01 |
Pos logit contributions | |
scribe | +0.053 |
results | +0.052 |
adem | +0.051 |
inen | +0.050 |
rior | +0.049 |
Neg logit contributions | |
ellen | -0.065 |
Developer | -0.062 |
rite | -0.061 |
taboola | -0.061 |
yip | -0.059 |
Token | No |
Token ID | 1400 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
ellen | +0.071 |
Developer | +0.068 |
rite | +0.067 |
taboola | +0.067 |
yip | +0.064 |
Neg logit contributions | |
scribe | -0.059 |
results | -0.058 |
adem | -0.057 |
inen | -0.056 |
rior | -0.055 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
ellen | +0.046 |
Developer | +0.044 |
rite | +0.043 |
taboola | +0.043 |
aux | +0.041 |
Neg logit contributions | |
scribe | -0.041 |
results | -0.040 |
adem | -0.040 |
inen | -0.039 |
rior | -0.038 |
Token | — |
Token ID | 851 |
Feature activation | +9.07e-02 |
Pos logit contributions | |
ellen | +0.037 |
Developer | +0.035 |
rite | +0.034 |
taboola | +0.034 |
yip | +0.033 |
Neg logit contributions | |
scribe | -0.030 |
results | -0.030 |
adem | -0.029 |
inen | -0.029 |
rior | -0.028 |
Token | / |
Token ID | 14 |
Feature activation | +8.22e-02 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.008 |
rite | +0.008 |
taboola | +0.008 |
aux | +0.008 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | 08 |
Token ID | 2919 |
Feature activation | -1.11e-02 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.019 |
Developer | -0.018 |
rite | -0.018 |
taboola | -0.018 |
yip | -0.017 |
Token | / |
Token ID | 14 |
Feature activation | +7.95e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | the |
Token ID | 1169 |
Feature activation | +3.29e-01 |
Pos logit contributions | |
scribe | +0.018 |
results | +0.018 |
adem | +0.017 |
inen | +0.017 |
rior | +0.017 |
Neg logit contributions | |
ellen | -0.019 |
Developer | -0.019 |
rite | -0.018 |
taboola | -0.018 |
yip | -0.017 |
Token | - |
Token ID | 12 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
scribe | +0.072 |
results | +0.071 |
adem | +0.070 |
inen | +0.070 |
rior | +0.068 |
Neg logit contributions | |
ellen | -0.081 |
Developer | -0.078 |
rite | -0.076 |
taboola | -0.076 |
aux | -0.073 |
Token | moon |
Token ID | 22977 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
aux | +0.004 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.004 |
rior | -0.004 |
Token | - |
Token ID | 12 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
scribe | +0.265 |
results | +0.260 |
adem | +0.257 |
inen | +0.253 |
rior | +0.247 |
Neg logit contributions | |
ellen | -0.318 |
Developer | -0.304 |
rite | -0.298 |
taboola | -0.297 |
yip | -0.287 |
Token | still |
Token ID | 24219 |
Feature activation | -3.17e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
taboola | +0.003 |
rite | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | - |
Token ID | 12 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ellen | +0.078 |
Developer | +0.074 |
rite | +0.073 |
taboola | +0.073 |
aux | +0.070 |
Neg logit contributions | |
scribe | -0.071 |
results | -0.069 |
adem | -0.069 |
inen | -0.068 |
rior | -0.066 |
Token | h |
Token ID | 71 |
Feature activation | -4.12e-01 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | angs |
Token ID | 27725 |
Feature activation | +1.15e-01 |
Pos logit contributions | |
ellen | +0.099 |
Developer | +0.094 |
rite | +0.093 |
taboola | +0.092 |
aux | +0.089 |
Neg logit contributions | |
scribe | -0.094 |
results | -0.092 |
adem | -0.090 |
inen | -0.089 |
rior | -0.088 |
Token | prison |
Token ID | 3770 |
Feature activation | +2.54e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.010 |
rite | -0.009 |
taboola | -0.009 |
aux | -0.009 |
Token | officers |
Token ID | 3790 |
Feature activation | +3.83e-01 |
Pos logit contributions | |
scribe | +0.042 |
results | +0.041 |
adem | +0.041 |
inen | +0.040 |
rior | +0.039 |
Neg logit contributions | |
ellen | -0.077 |
Developer | -0.074 |
rite | -0.072 |
taboola | -0.072 |
yip | -0.070 |
Token | in |
Token ID | 287 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
scribe | +0.083 |
results | +0.081 |
adem | +0.080 |
inen | +0.080 |
rior | +0.077 |
Neg logit contributions | |
ellen | -0.096 |
Developer | -0.092 |
rite | -0.090 |
taboola | -0.090 |
yip | -0.087 |
Token | a |
Token ID | 257 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
aux | +0.005 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.004 |
Token | Yar |
Token ID | 45184 |
Feature activation | +3.95e-03 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | oslav |
Token ID | 26388 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | l |
Token ID | 75 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
scribe | +0.244 |
results | +0.239 |
adem | +0.236 |
inen | +0.233 |
rior | +0.226 |
Neg logit contributions | |
ellen | -0.337 |
Developer | -0.323 |
rite | -0.317 |
taboola | -0.317 |
yip | -0.306 |
Token | prison |
Token ID | 3770 |
Feature activation | +2.70e-01 |
Pos logit contributions | |
scribe | +0.055 |
results | +0.054 |
adem | +0.053 |
inen | +0.052 |
rior | +0.051 |
Neg logit contributions | |
ellen | -0.062 |
Developer | -0.060 |
rite | -0.058 |
taboola | -0.058 |
yip | -0.056 |
Token | colony |
Token ID | 18815 |
Feature activation | -4.74e-01 |
Pos logit contributions | |
scribe | +0.059 |
results | +0.058 |
adem | +0.058 |
inen | +0.057 |
rior | +0.055 |
Neg logit contributions | |
ellen | -0.067 |
Developer | -0.064 |
rite | -0.063 |
taboola | -0.063 |
yip | -0.060 |
Token | . |
Token ID | 13 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
ellen | +0.119 |
Developer | +0.114 |
rite | +0.112 |
taboola | +0.112 |
yip | +0.107 |
Neg logit contributions | |
scribe | -0.102 |
results | -0.101 |
adem | -0.100 |
inen | -0.098 |
rior | -0.096 |
Token | On |
Token ID | 1550 |
Feature activation | -5.79e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | none |
Token ID | 4844 |
Feature activation | +2.02e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.002 |
taboola | -0.002 |
yip | -0.002 |
Token | - |
Token ID | 12 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
scribe | +0.045 |
results | +0.043 |
adem | +0.043 |
inen | +0.043 |
rior | +0.042 |
Neg logit contributions | |
ellen | -0.050 |
Developer | -0.048 |
rite | -0.047 |
taboola | -0.046 |
yip | -0.044 |
Token | too |
Token ID | 18820 |
Feature activation | -5.61e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | - |
Token ID | 12 |
Feature activation | +8.08e-03 |
Pos logit contributions | |
ellen | +0.014 |
Developer | +0.013 |
rite | +0.013 |
taboola | +0.013 |
aux | +0.013 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.011 |
Token | sub |
Token ID | 7266 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | tle |
Token ID | 7100 |
Feature activation | +1.23e+00 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
aux | +0.004 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | dig |
Token ID | 3100 |
Feature activation | +6.05e-02 |
Pos logit contributions | |
scribe | +0.279 |
results | +0.272 |
adem | +0.270 |
inen | +0.268 |
rior | +0.261 |
Neg logit contributions | |
ellen | -0.300 |
Developer | -0.286 |
rite | -0.280 |
taboola | -0.280 |
yip | -0.268 |
Token | at |
Token ID | 379 |
Feature activation | +9.73e-02 |
Pos logit contributions | |
scribe | +0.012 |
results | +0.012 |
adem | +0.011 |
inen | +0.011 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.016 |
Developer | -0.016 |
taboola | -0.016 |
rite | -0.015 |
yip | -0.015 |
Token | Lever |
Token ID | 42365 |
Feature activation | -4.87e-02 |
Pos logit contributions | |
scribe | +0.021 |
results | +0.021 |
adem | +0.021 |
inen | +0.021 |
rior | +0.020 |
Neg logit contributions | |
ellen | -0.024 |
Developer | -0.023 |
rite | -0.023 |
taboola | -0.023 |
yip | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
ellen | +0.013 |
Developer | +0.012 |
rite | +0.012 |
taboola | +0.012 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.010 |
results | -0.010 |
adem | -0.010 |
inen | -0.010 |
rior | -0.009 |
Token | possibly |
Token ID | 5457 |
Feature activation | -7.70e-01 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
taboola | +0.004 |
rite | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | les |
Token ID | 10287 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
rite | -0.004 |
taboola | -0.004 |
aux | -0.004 |
Token | Cors |
Token ID | 26978 |
Feature activation | -3.91e-01 |
Pos logit contributions | |
ellen | +0.010 |
Developer | +0.010 |
rite | +0.010 |
taboola | +0.010 |
aux | +0.009 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.009 |
adem | -0.009 |
inen | -0.009 |
rior | -0.009 |
Token | aires |
Token ID | 17693 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ellen | +0.088 |
Developer | +0.084 |
rite | +0.082 |
taboola | +0.082 |
yip | +0.078 |
Neg logit contributions | |
scribe | -0.095 |
results | -0.093 |
adem | -0.092 |
inen | -0.091 |
rior | -0.089 |
Token | l |
Token ID | 300 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
ellen | +0.051 |
Developer | +0.049 |
rite | +0.048 |
taboola | +0.048 |
aux | +0.046 |
Neg logit contributions | |
scribe | -0.046 |
results | -0.045 |
adem | -0.045 |
inen | -0.044 |
rior | -0.043 |
Token | oy |
Token ID | 726 |
Feature activation | -2.43e-01 |
Pos logit contributions | |
scribe | +0.051 |
results | +0.051 |
adem | +0.051 |
inen | +0.050 |
rior | +0.049 |
Neg logit contributions | |
ellen | -0.045 |
Developer | -0.043 |
taboola | -0.042 |
rite | -0.042 |
yip | -0.040 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
ellen | +0.056 |
Developer | +0.053 |
rite | +0.052 |
taboola | +0.052 |
aux | +0.050 |
Neg logit contributions | |
scribe | -0.058 |
results | -0.057 |
adem | -0.056 |
inen | -0.056 |
rior | -0.054 |
Token | rest |
Token ID | 1334 |
Feature activation | -3.78e-01 |
Pos logit contributions | |
ellen | +0.358 |
Developer | +0.341 |
rite | +0.336 |
taboola | +0.333 |
aux | +0.323 |
Neg logit contributions | |
scribe | -0.320 |
results | -0.315 |
adem | -0.311 |
inen | -0.307 |
rior | -0.299 |
Token | ants |
Token ID | 1187 |
Feature activation | +4.43e-01 |
Pos logit contributions | |
ellen | +0.094 |
Developer | +0.090 |
rite | +0.088 |
taboola | +0.088 |
yip | +0.085 |
Neg logit contributions | |
scribe | -0.083 |
results | -0.081 |
adem | -0.081 |
inen | -0.079 |
rior | -0.077 |
Token | . |
Token ID | 13 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
scribe | +0.096 |
results | +0.095 |
adem | +0.094 |
inen | +0.092 |
rior | +0.090 |
Neg logit contributions | |
ellen | -0.111 |
Developer | -0.106 |
rite | -0.104 |
taboola | -0.104 |
aux | -0.100 |
Token | Par |
Token ID | 10044 |
Feature activation | -2.67e-01 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.006 |
rite | +0.006 |
taboola | +0.006 |
yip | +0.005 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token | le |
Token ID | 443 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
ellen | +0.068 |
Developer | +0.065 |
rite | +0.064 |
taboola | +0.063 |
aux | +0.061 |
Neg logit contributions | |
scribe | -0.057 |
results | -0.056 |
adem | -0.055 |
inen | -0.055 |
rior | -0.053 |
Token | Bre |
Token ID | 3719 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
scribe | +0.064 |
results | +0.062 |
adem | +0.062 |
inen | +0.061 |
rior | +0.059 |
Neg logit contributions | |
ellen | -0.071 |
Developer | -0.068 |
taboola | -0.067 |
rite | -0.066 |
yip | -0.064 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
ellen | +0.077 |
Developer | +0.072 |
taboola | +0.069 |
rite | +0.068 |
yip | +0.063 |
Neg logit contributions | |
scribe | -0.187 |
results | -0.185 |
adem | -0.184 |
inen | -0.183 |
rior | -0.179 |
Token | ( |
Token ID | 357 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
ellen | +0.351 |
Developer | +0.336 |
rite | +0.329 |
taboola | +0.329 |
yip | +0.316 |
Neg logit contributions | |
scribe | -0.318 |
results | -0.311 |
adem | -0.309 |
inen | -0.306 |
rior | -0.297 |
Token | the |
Token ID | 1169 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.017 |
inen | +0.017 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.016 |
taboola | -0.016 |
yip | -0.015 |
Token | Bre |
Token ID | 3719 |
Feature activation | -5.64e-01 |
Pos logit contributions | |
scribe | +0.072 |
results | +0.071 |
adem | +0.070 |
inen | +0.069 |
rior | +0.067 |
Neg logit contributions | |
ellen | -0.083 |
Developer | -0.080 |
rite | -0.078 |
taboola | -0.078 |
yip | -0.075 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.010 |
rite | +0.008 |
taboola | +0.007 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.247 |
results | -0.245 |
adem | -0.244 |
inen | -0.242 |
rior | -0.239 |
Token | - |
Token ID | 12 |
Feature activation | -3.58e-03 |
Pos logit contributions | |
ellen | +0.364 |
Developer | +0.349 |
rite | +0.342 |
taboola | +0.342 |
yip | +0.328 |
Neg logit contributions | |
scribe | -0.310 |
results | -0.304 |
adem | -0.302 |
inen | -0.298 |
rior | -0.290 |
Token | L |
Token ID | 43 |
Feature activation | +1.43e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
taboola | +0.001 |
rite | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | ott |
Token ID | 1252 |
Feature activation | +4.38e-01 |
Pos logit contributions | |
scribe | +0.027 |
results | +0.027 |
adem | +0.026 |
inen | +0.026 |
rior | +0.025 |
Neg logit contributions | |
ellen | -0.040 |
Developer | -0.038 |
rite | -0.038 |
taboola | -0.038 |
aux | -0.036 |
Token | Leadership |
Token ID | 26935 |
Feature activation | -1.15e-01 |
Pos logit contributions | |
scribe | +0.098 |
results | +0.096 |
adem | +0.096 |
inen | +0.095 |
rior | +0.092 |
Neg logit contributions | |
ellen | -0.107 |
Developer | -0.102 |
rite | -0.100 |
taboola | -0.100 |
yip | -0.096 |
Token | Group |
Token ID | 4912 |
Feature activation | -3.24e-01 |
Pos logit contributions | |
ellen | +0.030 |
Developer | +0.029 |
rite | +0.028 |
taboola | +0.028 |
yip | +0.027 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.023 |
adem | -0.023 |
inen | -0.023 |
rior | -0.022 |
Token | L |
Token ID | 406 |
Feature activation | +1.87e-01 |
Pos logit contributions | |
ellen | +0.136 |
Developer | +0.129 |
rite | +0.126 |
taboola | +0.125 |
aux | +0.120 |
Neg logit contributions | |
scribe | -0.152 |
results | -0.150 |
adem | -0.149 |
inen | -0.147 |
rior | -0.144 |
Token | ott |
Token ID | 1252 |
Feature activation | +4.49e-01 |
Pos logit contributions | |
scribe | +0.036 |
results | +0.036 |
adem | +0.035 |
inen | +0.034 |
rior | +0.033 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.049 |
rite | -0.048 |
taboola | -0.048 |
aux | -0.047 |
Token | and |
Token ID | 290 |
Feature activation | -2.41e-02 |
Pos logit contributions | |
scribe | +0.104 |
results | +0.102 |
adem | +0.101 |
inen | +0.100 |
rior | +0.097 |
Neg logit contributions | |
ellen | -0.106 |
Developer | -0.101 |
rite | -0.099 |
taboola | -0.099 |
aux | -0.095 |
Token | John |
Token ID | 1757 |
Feature activation | +2.88e-01 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.006 |
taboola | +0.006 |
rite | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.005 |
Token | Bre |
Token ID | 3719 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
scribe | +0.064 |
results | +0.062 |
adem | +0.062 |
inen | +0.061 |
rior | +0.059 |
Neg logit contributions | |
ellen | -0.071 |
Developer | -0.068 |
taboola | -0.067 |
rite | -0.066 |
yip | -0.064 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
ellen | +0.077 |
Developer | +0.072 |
taboola | +0.069 |
rite | +0.068 |
yip | +0.063 |
Neg logit contributions | |
scribe | -0.187 |
results | -0.185 |
adem | -0.184 |
inen | -0.183 |
rior | -0.179 |
Token | ( |
Token ID | 357 |
Feature activation | +7.30e-02 |
Pos logit contributions | |
ellen | +0.351 |
Developer | +0.336 |
rite | +0.329 |
taboola | +0.329 |
yip | +0.316 |
Neg logit contributions | |
scribe | -0.318 |
results | -0.311 |
adem | -0.309 |
inen | -0.306 |
rior | -0.297 |
Token | the |
Token ID | 1169 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.017 |
inen | +0.017 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.016 |
taboola | -0.016 |
yip | -0.015 |
Token | Bre |
Token ID | 3719 |
Feature activation | -5.64e-01 |
Pos logit contributions | |
scribe | +0.072 |
results | +0.071 |
adem | +0.070 |
inen | +0.069 |
rior | +0.067 |
Neg logit contributions | |
ellen | -0.083 |
Developer | -0.080 |
rite | -0.078 |
taboola | -0.078 |
yip | -0.075 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.010 |
rite | +0.008 |
taboola | +0.007 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.247 |
results | -0.245 |
adem | -0.244 |
inen | -0.242 |
rior | -0.239 |
Token | - |
Token ID | 12 |
Feature activation | -3.58e-03 |
Pos logit contributions | |
ellen | +0.364 |
Developer | +0.349 |
rite | +0.342 |
taboola | +0.342 |
yip | +0.328 |
Neg logit contributions | |
scribe | -0.310 |
results | -0.304 |
adem | -0.302 |
inen | -0.298 |
rior | -0.290 |
Token | s |
Token ID | 82 |
Feature activation | -4.37e-02 |
Pos logit contributions | |
ellen | +0.079 |
Developer | +0.075 |
taboola | +0.073 |
rite | +0.073 |
yip | +0.070 |
Neg logit contributions | |
scribe | -0.094 |
results | -0.092 |
adem | -0.091 |
inen | -0.090 |
rior | -0.088 |
Token | aux |
Token ID | 27506 |
Feature activation | -4.86e-01 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.010 |
rite | +0.010 |
taboola | +0.010 |
aux | +0.010 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.009 |
adem | -0.009 |
inen | -0.009 |
rior | -0.009 |
Token | v |
Token ID | 410 |
Feature activation | +4.42e-02 |
Pos logit contributions | |
ellen | +0.120 |
Developer | +0.115 |
rite | +0.113 |
taboola | +0.112 |
aux | +0.108 |
Neg logit contributions | |
scribe | -0.107 |
results | -0.105 |
adem | -0.104 |
inen | -0.103 |
rior | -0.100 |
Token | ais |
Token ID | 15152 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.011 |
Developer | -0.010 |
rite | -0.010 |
taboola | -0.010 |
aux | -0.010 |
Token | se |
Token ID | 325 |
Feature activation | +2.53e-02 |
Pos logit contributions | |
scribe | +0.049 |
results | +0.048 |
adem | +0.048 |
inen | +0.047 |
rior | +0.046 |
Neg logit contributions | |
ellen | -0.062 |
Developer | -0.059 |
rite | -0.058 |
taboola | -0.058 |
aux | -0.056 |
Token | aux |
Token ID | 14644 |
Feature activation | -1.43e+00 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.006 |
adem | +0.006 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
aux | -0.005 |
Token | f |
Token ID | 277 |
Feature activation | -6.75e-02 |
Pos logit contributions | |
ellen | +0.356 |
Developer | +0.340 |
rite | +0.334 |
taboola | +0.332 |
aux | +0.322 |
Neg logit contributions | |
scribe | -0.312 |
results | -0.306 |
adem | -0.303 |
inen | -0.299 |
rior | -0.290 |
Token | é |
Token ID | 2634 |
Feature activation | -1.38e-01 |
Pos logit contributions | |
ellen | +0.014 |
Developer | +0.013 |
taboola | +0.013 |
rite | +0.013 |
yip | +0.012 |
Neg logit contributions | |
scribe | -0.017 |
results | -0.017 |
adem | -0.017 |
inen | -0.017 |
rior | -0.017 |
Token | d |
Token ID | 67 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
ellen | +0.033 |
Developer | +0.032 |
rite | +0.031 |
taboola | +0.031 |
aux | +0.030 |
Neg logit contributions | |
scribe | -0.031 |
results | -0.031 |
adem | -0.030 |
inen | -0.030 |
rior | -0.029 |
Token | é |
Token ID | 2634 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.029 |
rite | +0.029 |
taboola | +0.029 |
aux | +0.028 |
Neg logit contributions | |
scribe | -0.022 |
results | -0.021 |
adem | -0.021 |
inen | -0.021 |
rior | -0.020 |
Token | ra |
Token ID | 430 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
ellen | +0.038 |
Developer | +0.037 |
rite | +0.036 |
taboola | +0.036 |
aux | +0.035 |
Neg logit contributions | |
scribe | -0.033 |
results | -0.032 |
adem | -0.032 |
inen | -0.031 |
rior | -0.030 |
Token | receiver |
Token ID | 9733 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
ellen | +0.112 |
Developer | +0.107 |
taboola | +0.105 |
rite | +0.105 |
yip | +0.101 |
Neg logit contributions | |
scribe | -0.112 |
results | -0.110 |
adem | -0.108 |
inen | -0.107 |
rior | -0.105 |
Token | with |
Token ID | 351 |
Feature activation | +4.94e-02 |
Pos logit contributions | |
scribe | +0.036 |
results | +0.035 |
adem | +0.035 |
inen | +0.035 |
rior | +0.034 |
Neg logit contributions | |
ellen | -0.040 |
Developer | -0.038 |
taboola | -0.037 |
rite | -0.037 |
yip | -0.036 |
Token | an |
Token ID | 281 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.010 |
Neg logit contributions | |
ellen | -0.013 |
Developer | -0.012 |
taboola | -0.012 |
rite | -0.012 |
yip | -0.011 |
Token | internal |
Token ID | 5387 |
Feature activation | -9.30e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.002 |
Token | fer |
Token ID | 11354 |
Feature activation | +2.73e-02 |
Pos logit contributions | |
ellen | +0.021 |
Developer | +0.020 |
taboola | +0.019 |
rite | +0.019 |
yip | +0.018 |
Neg logit contributions | |
scribe | -0.023 |
results | -0.023 |
adem | -0.022 |
inen | -0.022 |
rior | -0.022 |
Token | rite |
Token ID | 6525 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
scribe | +0.012 |
results | +0.012 |
adem | +0.012 |
inen | +0.011 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.000 |
yip | -0.000 |
Token | rod |
Token ID | 15299 |
Feature activation | +7.09e-02 |
Pos logit contributions | |
ellen | +0.307 |
Developer | +0.292 |
taboola | +0.285 |
rite | +0.284 |
yip | +0.273 |
Neg logit contributions | |
scribe | -0.350 |
results | -0.344 |
adem | -0.341 |
inen | -0.338 |
rior | -0.329 |
Token | antenna |
Token ID | 20509 |
Feature activation | -3.56e-01 |
Pos logit contributions | |
scribe | +0.016 |
results | +0.015 |
adem | +0.015 |
inen | +0.015 |
rior | +0.015 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.017 |
taboola | -0.016 |
rite | -0.016 |
yip | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -2.71e-02 |
Pos logit contributions | |
ellen | +0.087 |
Developer | +0.083 |
taboola | +0.082 |
rite | +0.081 |
yip | +0.078 |
Neg logit contributions | |
scribe | -0.080 |
results | -0.078 |
adem | -0.077 |
inen | -0.076 |
rior | -0.074 |
Token | start |
Token ID | 923 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.006 |
taboola | +0.006 |
rite | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token | moving |
Token ID | 3867 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.032 |
rite | +0.031 |
taboola | +0.031 |
yip | +0.030 |
Neg logit contributions | |
scribe | -0.031 |
results | -0.030 |
adem | -0.030 |
inen | -0.029 |
rior | -0.029 |
Token | 11 |
Token ID | 1367 |
Feature activation | -1.29e-01 |
Pos logit contributions | |
ellen | +0.041 |
Developer | +0.039 |
rite | +0.039 |
taboola | +0.038 |
yip | +0.038 |
Neg logit contributions | |
scribe | -0.034 |
results | -0.033 |
adem | -0.033 |
inen | -0.033 |
rior | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | -2.31e-03 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.032 |
rite | +0.032 |
taboola | +0.031 |
aux | +0.030 |
Neg logit contributions | |
scribe | -0.027 |
results | -0.026 |
adem | -0.026 |
inen | -0.026 |
rior | -0.025 |
Token | 2000 |
Token ID | 4751 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.000 |
taboola | +0.000 |
rite | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
inen | -0.001 |
adem | -0.001 |
rior | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ellen | +0.040 |
Developer | +0.038 |
rite | +0.037 |
taboola | +0.037 |
aux | +0.036 |
Neg logit contributions | |
scribe | -0.035 |
results | -0.034 |
adem | -0.034 |
inen | -0.034 |
rior | -0.033 |
Token |
|
Token ID | 198 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | Developer |
Token ID | 45351 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | : |
Token ID | 25 |
Feature activation | -4.53e-02 |
Pos logit contributions | |
ellen | +0.303 |
Developer | +0.291 |
rite | +0.282 |
taboola | +0.280 |
aux | +0.268 |
Neg logit contributions | |
scribe | -0.318 |
results | -0.313 |
adem | -0.309 |
inen | -0.307 |
rior | -0.297 |
Token | Relic |
Token ID | 43437 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.009 |
rite | +0.009 |
taboola | +0.009 |
aux | +0.008 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.012 |
inen | -0.011 |
rior | -0.011 |
Token | Entertainment |
Token ID | 11058 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
ellen | +0.029 |
Developer | +0.028 |
rite | +0.028 |
taboola | +0.027 |
aux | +0.027 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.024 |
adem | -0.023 |
inen | -0.023 |
rior | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
ellen | +0.008 |
Developer | +0.008 |
rite | +0.007 |
taboola | +0.007 |
aux | +0.007 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | -2.19e-02 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | says |
Token ID | 1139 |
Feature activation | +7.75e-02 |
Pos logit contributions | |
ellen | +0.024 |
Developer | +0.023 |
rite | +0.023 |
taboola | +0.023 |
aux | +0.022 |
Neg logit contributions | |
scribe | -0.023 |
results | -0.022 |
adem | -0.022 |
inen | -0.022 |
rior | -0.021 |
Token | that |
Token ID | 326 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.018 |
adem | +0.018 |
inen | +0.018 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.018 |
Developer | -0.017 |
rite | -0.016 |
taboola | -0.016 |
aux | -0.016 |
Token | everyone |
Token ID | 2506 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | -3.34e-03 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | H |
Token ID | 367 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | abling |
Token ID | 11716 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.030 |
rite | +0.029 |
taboola | +0.029 |
aux | +0.028 |
Neg logit contributions | |
scribe | -0.025 |
results | -0.025 |
adem | -0.024 |
inen | -0.024 |
rior | -0.023 |
Token | bo |
Token ID | 2127 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ellen | +0.291 |
Developer | +0.277 |
rite | +0.272 |
taboola | +0.271 |
aux | +0.260 |
Neg logit contributions | |
scribe | -0.298 |
results | -0.293 |
adem | -0.290 |
inen | -0.287 |
rior | -0.280 |
Token | does |
Token ID | 857 |
Feature activation | -3.31e-02 |
Pos logit contributions | |
ellen | +0.028 |
Developer | +0.027 |
rite | +0.026 |
taboola | +0.026 |
aux | +0.025 |
Neg logit contributions | |
scribe | -0.028 |
results | -0.027 |
adem | -0.027 |
inen | -0.026 |
rior | -0.026 |
Token | it |
Token ID | 340 |
Feature activation | -6.68e-02 |
Pos logit contributions | |
ellen | +0.008 |
Developer | +0.008 |
rite | +0.008 |
taboola | +0.008 |
aux | +0.007 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | this |
Token ID | 428 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.016 |
rite | +0.016 |
taboola | +0.016 |
yip | +0.015 |
Neg logit contributions | |
scribe | -0.014 |
results | -0.014 |
adem | -0.014 |
inen | -0.014 |
rior | -0.013 |
Token | way |
Token ID | 835 |
Feature activation | -6.09e-02 |
Pos logit contributions | |
ellen | +0.022 |
Developer | +0.021 |
rite | +0.021 |
taboola | +0.021 |
yip | +0.020 |
Neg logit contributions | |
scribe | -0.026 |
results | -0.025 |
adem | -0.025 |
inen | -0.025 |
rior | -0.024 |
Token | s |
Token ID | 82 |
Feature activation | -5.71e-02 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.010 |
rite | +0.010 |
taboola | +0.010 |
yip | +0.010 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.009 |
adem | -0.009 |
inen | -0.009 |
rior | -0.009 |
Token | idy |
Token ID | 19325 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.012 |
rite | +0.011 |
taboola | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.015 |
results | -0.014 |
adem | -0.014 |
inen | -0.014 |
rior | -0.014 |
Token | - |
Token ID | 12 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.030 |
rite | +0.029 |
taboola | +0.029 |
yip | +0.028 |
Neg logit contributions | |
scribe | -0.027 |
results | -0.026 |
adem | -0.026 |
inen | -0.026 |
rior | -0.025 |
Token | for |
Token ID | 1640 |
Feature activation | +2.89e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | - |
Token ID | 12 |
Feature activation | -2.69e-02 |
Pos logit contributions | |
scribe | +0.064 |
results | +0.062 |
adem | +0.062 |
inen | +0.061 |
rior | +0.059 |
Neg logit contributions | |
ellen | -0.072 |
Developer | -0.068 |
rite | -0.067 |
taboola | -0.067 |
aux | -0.065 |
Token | larg |
Token ID | 15521 |
Feature activation | -1.25e+00 |
Pos logit contributions | |
ellen | +0.007 |
Developer | +0.007 |
rite | +0.006 |
taboola | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.005 |
Token | er |
Token ID | 263 |
Feature activation | -2.39e-01 |
Pos logit contributions | |
ellen | +0.245 |
Developer | +0.231 |
rite | +0.225 |
taboola | +0.225 |
yip | +0.214 |
Neg logit contributions | |
scribe | -0.339 |
results | -0.334 |
adem | -0.331 |
inen | -0.328 |
rior | -0.321 |
Token | - |
Token ID | 12 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ellen | +0.059 |
Developer | +0.057 |
rite | +0.056 |
taboola | +0.055 |
aux | +0.053 |
Neg logit contributions | |
scribe | -0.053 |
results | -0.052 |
adem | -0.051 |
inen | -0.050 |
rior | -0.049 |
Token | blocks |
Token ID | 27372 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | / |
Token ID | 14 |
Feature activation | +7.20e-02 |
Pos logit contributions | |
scribe | +0.026 |
results | +0.026 |
adem | +0.026 |
inen | +0.025 |
rior | +0.025 |
Neg logit contributions | |
ellen | -0.031 |
Developer | -0.030 |
rite | -0.029 |
taboola | -0.029 |
yip | -0.028 |
Token | ) |
Token ID | 1267 |
Feature activation | +4.94e-02 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.016 |
adem | +0.016 |
inen | +0.016 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.016 |
taboola | -0.016 |
yip | -0.015 |
Token | PNG |
Token ID | 36182 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
results | +0.026 |
scribe | +0.026 |
inen | +0.025 |
adem | +0.024 |
imize | +0.022 |
Neg logit contributions | |
ellen | -0.083 |
Developer | -0.080 |
rite | -0.080 |
yip | -0.079 |
taboola | -0.079 |
Token | larger |
Token ID | 4025 |
Feature activation | -3.22e-01 |
Pos logit contributions | |
scribe | +0.149 |
inen | +0.146 |
results | +0.146 |
adem | +0.144 |
rior | +0.141 |
Neg logit contributions | |
ellen | -0.096 |
Developer | -0.091 |
rite | -0.089 |
taboola | -0.088 |
yip | -0.086 |
Token | image |
Token ID | 2939 |
Feature activation | +6.13e-02 |
Pos logit contributions | |
ellen | +0.087 |
Developer | +0.084 |
taboola | +0.082 |
rite | +0.082 |
yip | +0.081 |
Neg logit contributions | |
scribe | -0.064 |
results | -0.063 |
adem | -0.062 |
inen | -0.061 |
rior | -0.059 |
Token |
|
Token ID | 198 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
scribe | +0.013 |
results | +0.013 |
adem | +0.012 |
inen | +0.012 |
rior | +0.012 |
Neg logit contributions | |
ellen | -0.016 |
Developer | -0.015 |
rite | -0.015 |
taboola | -0.015 |
yip | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +2.01e-06 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
rite | -0.004 |
taboola | -0.004 |
yip | -0.004 |
Token | larg |
Token ID | 15521 |
Feature activation | -1.23e+00 |
Token | er |
Token ID | 263 |
Feature activation | -2.47e-01 |
Pos logit contributions | |
ellen | +0.252 |
Developer | +0.239 |
rite | +0.232 |
taboola | +0.231 |
yip | +0.224 |
Neg logit contributions | |
scribe | -0.325 |
results | -0.320 |
adem | -0.318 |
inen | -0.315 |
rior | -0.307 |
Token | image |
Token ID | 2939 |
Feature activation | +8.60e-02 |
Pos logit contributions | |
ellen | +0.067 |
Developer | +0.065 |
rite | +0.063 |
taboola | +0.062 |
yip | +0.062 |
Neg logit contributions | |
scribe | -0.049 |
results | -0.048 |
adem | -0.047 |
inen | -0.047 |
rior | -0.045 |
Token | T |
Token ID | 309 |
Feature activation | -5.39e-01 |
Pos logit contributions | |
results | +0.024 |
scribe | +0.024 |
adem | +0.024 |
rior | +0.023 |
inen | +0.023 |
Neg logit contributions | |
ellen | -0.016 |
Developer | -0.015 |
rite | -0.015 |
yip | -0.015 |
taboola | -0.014 |
Token | IFF |
Token ID | 29267 |
Feature activation | +4.98e-01 |
Pos logit contributions | |
ellen | +0.169 |
Developer | +0.164 |
taboola | +0.160 |
rite | +0.160 |
yip | +0.158 |
Neg logit contributions | |
scribe | -0.083 |
results | -0.081 |
adem | -0.079 |
inen | -0.079 |
rior | -0.075 |
Token | original |
Token ID | 2656 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
results | +0.118 |
scribe | +0.118 |
adem | +0.115 |
imize | +0.115 |
rior | +0.114 |
Neg logit contributions | |
ellen | -0.111 |
taboola | -0.109 |
Developer | -0.109 |
yip | -0.106 |
rite | -0.104 |
Token | 10 |
Token ID | 940 |
Feature activation | -1.10e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
yip | -0.002 |
Token | brewers |
Token ID | 36669 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ellen | +0.024 |
Developer | +0.023 |
rite | +0.023 |
taboola | +0.023 |
aux | +0.022 |
Neg logit contributions | |
scribe | -0.027 |
results | -0.027 |
adem | -0.026 |
inen | -0.026 |
rior | -0.026 |
Token | now |
Token ID | 783 |
Feature activation | -8.81e-02 |
Pos logit contributions | |
ellen | +0.026 |
Developer | +0.025 |
rite | +0.024 |
taboola | +0.024 |
aux | +0.023 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.023 |
adem | -0.023 |
inen | -0.023 |
rior | -0.022 |
Token | in |
Token ID | 287 |
Feature activation | +9.03e-03 |
Pos logit contributions | |
ellen | +0.022 |
Developer | +0.021 |
rite | +0.021 |
taboola | +0.021 |
aux | +0.020 |
Neg logit contributions | |
scribe | -0.019 |
results | -0.019 |
adem | -0.018 |
inen | -0.018 |
rior | -0.018 |
Token | H |
Token ID | 367 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | abling |
Token ID | 11716 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
aux | +0.004 |
Neg logit contributions | |
scribe | -0.042 |
results | -0.042 |
adem | -0.041 |
inen | -0.041 |
rior | -0.041 |
Token | bo |
Token ID | 2127 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
ellen | +0.273 |
Developer | +0.260 |
rite | +0.255 |
taboola | +0.254 |
aux | +0.244 |
Neg logit contributions | |
scribe | -0.299 |
results | -0.295 |
adem | -0.293 |
inen | -0.290 |
rior | -0.282 |
Token | , |
Token ID | 11 |
Feature activation | +5.69e-03 |
Pos logit contributions | |
ellen | +0.035 |
Developer | +0.033 |
rite | +0.033 |
taboola | +0.032 |
aux | +0.031 |
Neg logit contributions | |
scribe | -0.028 |
results | -0.028 |
adem | -0.028 |
inen | -0.027 |
rior | -0.027 |
Token | he |
Token ID | 339 |
Feature activation | -5.04e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | says |
Token ID | 1139 |
Feature activation | +8.92e-02 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.011 |
rite | +0.011 |
taboola | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.011 |
adem | -0.011 |
inen | -0.011 |
rior | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | +3.07e-03 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.018 |
inen | +0.018 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.023 |
Developer | -0.022 |
rite | -0.021 |
taboola | -0.021 |
aux | -0.021 |
Token | b |
Token ID | 65 |
Feature activation | -1.48e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | rough |
Token ID | 740 |
Feature activation | +2.77e-01 |
Pos logit contributions | |
ellen | +0.041 |
Developer | +0.040 |
taboola | +0.039 |
rite | +0.038 |
yip | +0.037 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.028 |
adem | -0.027 |
inen | -0.027 |
rior | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | -4.48e-03 |
Pos logit contributions | |
scribe | +0.062 |
results | +0.061 |
adem | +0.061 |
inen | +0.060 |
rior | +0.059 |
Neg logit contributions | |
ellen | -0.067 |
Developer | -0.064 |
rite | -0.063 |
taboola | -0.063 |
yip | -0.061 |
Token | Ros |
Token ID | 10018 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | cos |
Token ID | 6966 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
ellen | +0.048 |
Developer | +0.046 |
taboola | +0.045 |
rite | +0.045 |
yip | +0.044 |
Neg logit contributions | |
scribe | -0.046 |
results | -0.046 |
adem | -0.045 |
inen | -0.045 |
rior | -0.043 |
Token | mos |
Token ID | 16785 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.011 |
taboola | +0.011 |
rite | +0.010 |
yip | +0.010 |
Neg logit contributions | |
scribe | -0.036 |
results | -0.035 |
adem | -0.035 |
inen | -0.035 |
rior | -0.034 |
Token | cos |
Token ID | 8615 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ellen | +0.301 |
Developer | +0.287 |
rite | +0.282 |
taboola | +0.282 |
yip | +0.271 |
Neg logit contributions | |
scribe | -0.262 |
results | -0.258 |
adem | -0.255 |
inen | -0.252 |
rior | -0.246 |
Token | mon |
Token ID | 2144 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
ellen | +0.060 |
Developer | +0.057 |
rite | +0.056 |
taboola | +0.056 |
aux | +0.054 |
Neg logit contributions | |
scribe | -0.048 |
results | -0.047 |
adem | -0.046 |
inen | -0.045 |
rior | -0.044 |
Token | auts |
Token ID | 17712 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
scribe | +0.056 |
adem | +0.055 |
results | +0.055 |
inen | +0.054 |
rior | +0.053 |
Neg logit contributions | |
ellen | -0.045 |
Developer | -0.042 |
taboola | -0.042 |
rite | -0.042 |
yip | -0.040 |
Token | Sergey |
Token ID | 36106 |
Feature activation | +8.61e-02 |
Pos logit contributions | |
ellen | +0.072 |
Developer | +0.070 |
taboola | +0.068 |
rite | +0.068 |
yip | +0.066 |
Neg logit contributions | |
scribe | -0.066 |
results | -0.065 |
adem | -0.065 |
inen | -0.064 |
rior | -0.062 |
Token | Ry |
Token ID | 11089 |
Feature activation | -4.54e-01 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.021 |
Developer | -0.020 |
taboola | -0.020 |
rite | -0.019 |
yip | -0.019 |
Token | was |
Token ID | 373 |
Feature activation | +3.38e-02 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.029 |
rite | +0.029 |
taboola | +0.029 |
aux | +0.028 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.029 |
adem | -0.029 |
inen | -0.028 |
rior | -0.027 |
Token | dressed |
Token ID | 12049 |
Feature activation | +9.34e-03 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.007 |
adem | +0.007 |
inen | +0.007 |
rior | +0.007 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.008 |
taboola | -0.008 |
rite | -0.008 |
yip | -0.008 |
Token | in |
Token ID | 287 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | shin |
Token ID | 40465 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | ig |
Token ID | 328 |
Feature activation | -6.42e-02 |
Pos logit contributions | |
scribe | +0.040 |
results | +0.040 |
adem | +0.039 |
inen | +0.039 |
rior | +0.038 |
Neg logit contributions | |
ellen | -0.040 |
Developer | -0.038 |
taboola | -0.038 |
rite | -0.038 |
yip | -0.036 |
Token | ami |
Token ID | 6277 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.004 |
taboola | +0.004 |
rite | +0.004 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.025 |
results | -0.025 |
adem | -0.025 |
inen | -0.025 |
rior | -0.024 |
Token | robes |
Token ID | 32970 |
Feature activation | +2.77e-01 |
Pos logit contributions | |
ellen | +0.303 |
Developer | +0.290 |
rite | +0.284 |
taboola | +0.284 |
yip | +0.274 |
Neg logit contributions | |
scribe | -0.252 |
results | -0.247 |
adem | -0.245 |
inen | -0.242 |
rior | -0.235 |
Token | , |
Token ID | 11 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
scribe | +0.057 |
results | +0.056 |
adem | +0.056 |
inen | +0.055 |
rior | +0.053 |
Neg logit contributions | |
ellen | -0.072 |
Developer | -0.069 |
rite | -0.068 |
taboola | -0.068 |
yip | -0.065 |
Token | with |
Token ID | 351 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
taboola | +0.003 |
rite | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | that |
Token ID | 326 |
Feature activation | -1.28e-02 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.006 |
taboola | -0.006 |
rite | -0.006 |
aux | -0.006 |
Token | figure |
Token ID | 3785 |
Feature activation | -5.13e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | meet |
Token ID | 1826 |
Feature activation | -1.33e-01 |
Pos logit contributions | |
scribe | +0.098 |
results | +0.096 |
adem | +0.095 |
inen | +0.095 |
rior | +0.093 |
Neg logit contributions | |
ellen | -0.088 |
Developer | -0.084 |
taboola | -0.082 |
rite | -0.082 |
yip | -0.079 |
Token | the |
Token ID | 262 |
Feature activation | -5.47e-04 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.032 |
rite | +0.032 |
taboola | +0.032 |
yip | +0.031 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.028 |
adem | -0.028 |
inen | -0.027 |
rior | -0.027 |
Token | Turtles |
Token ID | 44356 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
aux | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | on |
Token ID | 319 |
Feature activation | +6.18e-03 |
Pos logit contributions | |
scribe | +0.085 |
results | +0.084 |
adem | +0.083 |
inen | +0.082 |
rior | +0.080 |
Neg logit contributions | |
ellen | -0.095 |
Developer | -0.091 |
taboola | -0.089 |
rite | -0.089 |
yip | -0.086 |
Token | the |
Token ID | 262 |
Feature activation | +4.19e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | rooft |
Token ID | 27291 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.009 |
inen | +0.009 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.009 |
taboola | -0.009 |
rite | -0.009 |
yip | -0.009 |
Token | ops |
Token ID | 2840 |
Feature activation | +1.30e-01 |
Pos logit contributions | |
ellen | +0.320 |
Developer | +0.308 |
rite | +0.302 |
taboola | +0.302 |
yip | +0.292 |
Neg logit contributions | |
scribe | -0.224 |
results | -0.220 |
adem | -0.217 |
inen | -0.214 |
rior | -0.207 |
Token | to |
Token ID | 284 |
Feature activation | +3.59e-02 |
Pos logit contributions | |
scribe | +0.030 |
results | +0.029 |
adem | +0.029 |
inen | +0.028 |
rior | +0.028 |
Neg logit contributions | |
ellen | -0.032 |
Developer | -0.030 |
taboola | -0.030 |
rite | -0.029 |
yip | -0.028 |
Token | duel |
Token ID | 24662 |
Feature activation | -1.00e-01 |
Pos logit contributions | |
scribe | +0.009 |
results | +0.009 |
adem | +0.009 |
inen | +0.009 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.007 |
taboola | -0.007 |
rite | -0.007 |
yip | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ellen | +0.027 |
Developer | +0.026 |
taboola | +0.026 |
rite | +0.026 |
aux | +0.025 |
Neg logit contributions | |
scribe | -0.020 |
results | -0.019 |
adem | -0.019 |
inen | -0.019 |
rior | -0.018 |
Token | the |
Token ID | 262 |
Feature activation | +3.59e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | going |
Token ID | 1016 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.016 |
rite | +0.016 |
taboola | +0.016 |
aux | +0.015 |
Neg logit contributions | |
scribe | -0.015 |
results | -0.014 |
adem | -0.014 |
inen | -0.014 |
rior | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -1.96e-03 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | pit |
Token ID | 6028 |
Feature activation | -4.39e-02 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
taboola | +0.000 |
rite | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.011 |
rite | +0.010 |
taboola | +0.010 |
aux | +0.010 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.009 |
adem | -0.009 |
inen | -0.009 |
rior | -0.009 |
Token | city |
Token ID | 1748 |
Feature activation | -3.24e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | ordinance |
Token ID | 19784 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ellen | +0.072 |
Developer | +0.068 |
taboola | +0.067 |
rite | +0.067 |
aux | +0.064 |
Neg logit contributions | |
scribe | -0.079 |
results | -0.078 |
adem | -0.077 |
inen | -0.076 |
rior | -0.075 |
Token | against |
Token ID | 1028 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
ellen | +0.246 |
Developer | +0.233 |
rite | +0.228 |
taboola | +0.227 |
aux | +0.217 |
Neg logit contributions | |
scribe | -0.296 |
results | -0.291 |
adem | -0.289 |
inen | -0.285 |
rior | -0.279 |
Token | human |
Token ID | 1692 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
ellen | +0.052 |
Developer | +0.050 |
taboola | +0.049 |
rite | +0.049 |
yip | +0.047 |
Neg logit contributions | |
scribe | -0.041 |
results | -0.041 |
adem | -0.040 |
inen | -0.040 |
rior | -0.039 |
Token | rights |
Token ID | 2489 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ellen | +0.026 |
Developer | +0.025 |
rite | +0.024 |
taboola | +0.024 |
aux | +0.023 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.029 |
adem | -0.029 |
inen | -0.028 |
rior | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | -8.95e-03 |
Pos logit contributions | |
ellen | +0.053 |
Developer | +0.051 |
rite | +0.050 |
taboola | +0.050 |
yip | +0.048 |
Neg logit contributions | |
scribe | -0.043 |
results | -0.043 |
adem | -0.042 |
inen | -0.042 |
rior | -0.041 |
Token | I |
Token ID | 314 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | City |
Token ID | 2254 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | Council |
Token ID | 4281 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
ellen | +0.071 |
Developer | +0.068 |
rite | +0.066 |
taboola | +0.066 |
aux | +0.063 |
Neg logit contributions | |
scribe | -0.074 |
results | -0.073 |
adem | -0.072 |
inen | -0.071 |
rior | -0.069 |
Token | to |
Token ID | 284 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | pass |
Token ID | 1208 |
Feature activation | -3.68e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
taboola | +0.003 |
rite | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | an |
Token ID | 281 |
Feature activation | -7.21e-04 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.009 |
rite | +0.009 |
taboola | +0.009 |
yip | +0.009 |
Neg logit contributions | |
scribe | -0.008 |
results | -0.008 |
adem | -0.008 |
inen | -0.008 |
rior | -0.007 |
Token | ordinance |
Token ID | 19784 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
yip | +0.000 |
taboola | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | that |
Token ID | 326 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
ellen | +0.278 |
Developer | +0.265 |
rite | +0.260 |
taboola | +0.258 |
yip | +0.251 |
Neg logit contributions | |
scribe | -0.262 |
results | -0.257 |
adem | -0.256 |
inen | -0.253 |
rior | -0.247 |
Token | would |
Token ID | 561 |
Feature activation | +8.55e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | require |
Token ID | 2421 |
Feature activation | +3.72e-02 |
Pos logit contributions | |
scribe | +0.021 |
results | +0.020 |
adem | +0.020 |
inen | +0.020 |
rior | +0.019 |
Neg logit contributions | |
ellen | -0.019 |
Developer | -0.019 |
taboola | -0.018 |
rite | -0.018 |
yip | -0.017 |
Token | such |
Token ID | 884 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.009 |
rite | -0.008 |
taboola | -0.008 |
yip | -0.008 |
Token | agreements |
Token ID | 11704 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
scribe | +0.031 |
results | +0.031 |
adem | +0.031 |
inen | +0.030 |
rior | +0.030 |
Neg logit contributions | |
ellen | -0.032 |
Developer | -0.030 |
rite | -0.029 |
taboola | -0.029 |
yip | -0.028 |
Token | an |
Token ID | 272 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
ellen | +0.071 |
Developer | +0.069 |
taboola | +0.068 |
rite | +0.067 |
yip | +0.065 |
Neg logit contributions | |
scribe | -0.064 |
adem | -0.063 |
results | -0.063 |
inen | -0.063 |
rior | -0.061 |
Token | said |
Token ID | 531 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.018 |
Developer | -0.017 |
rite | -0.017 |
taboola | -0.017 |
yip | -0.016 |
Token | . |
Token ID | 13 |
Feature activation | -4.78e-04 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +2.63e-05 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
aux | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -8.91e-03 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
yip | -0.000 |
Token | AIR |
Token ID | 42149 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | describes |
Token ID | 8477 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
ellen | +0.278 |
Developer | +0.265 |
rite | +0.260 |
taboola | +0.259 |
aux | +0.249 |
Neg logit contributions | |
scribe | -0.263 |
results | -0.258 |
adem | -0.256 |
inen | -0.253 |
rior | -0.246 |
Token | its |
Token ID | 663 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
scribe | +0.065 |
results | +0.063 |
adem | +0.063 |
inen | +0.062 |
rior | +0.060 |
Neg logit contributions | |
ellen | -0.101 |
Developer | -0.098 |
rite | -0.096 |
taboola | -0.096 |
yip | -0.093 |
Token | practice |
Token ID | 3357 |
Feature activation | +3.47e-01 |
Pos logit contributions | |
ellen | +0.038 |
Developer | +0.036 |
taboola | +0.035 |
rite | +0.035 |
yip | +0.034 |
Neg logit contributions | |
scribe | -0.041 |
results | -0.041 |
adem | -0.040 |
inen | -0.040 |
rior | -0.039 |
Token | in |
Token ID | 287 |
Feature activation | -5.79e-03 |
Pos logit contributions | |
scribe | +0.079 |
results | +0.077 |
adem | +0.077 |
inen | +0.076 |
rior | +0.074 |
Neg logit contributions | |
ellen | -0.083 |
Developer | -0.080 |
rite | -0.078 |
taboola | -0.078 |
yip | -0.075 |
Token | this |
Token ID | 428 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | way |
Token ID | 835 |
Feature activation | -8.28e-02 |
Pos logit contributions | |
ellen | +0.024 |
Developer | +0.022 |
taboola | +0.022 |
rite | +0.022 |
yip | +0.021 |
Neg logit contributions | |
scribe | -0.025 |
results | -0.024 |
adem | -0.024 |
inen | -0.024 |
rior | -0.023 |
Token | : |
Token ID | 25 |
Feature activation | -4.95e-02 |
Pos logit contributions | |
ellen | +0.020 |
Developer | +0.019 |
rite | +0.019 |
taboola | +0.019 |
yip | +0.018 |
Neg logit contributions | |
scribe | -0.019 |
results | -0.018 |
adem | -0.018 |
inen | -0.018 |
rior | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.012 |
rite | +0.012 |
taboola | +0.012 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.011 |
results | -0.011 |
adem | -0.010 |
inen | -0.010 |
rior | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.006 |
rite | +0.006 |
taboola | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.005 |
Token | " |
Token ID | 1 |
Feature activation | +7.01e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | AIR |
Token ID | 42149 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.016 |
inen | +0.016 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.016 |
Developer | -0.015 |
rite | -0.015 |
taboola | -0.015 |
yip | -0.014 |
Token | � |
Token ID | 447 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
ellen | +0.276 |
Developer | +0.263 |
rite | +0.258 |
taboola | +0.257 |
aux | +0.247 |
Neg logit contributions | |
scribe | -0.265 |
results | -0.260 |
adem | -0.257 |
inen | -0.254 |
rior | -0.248 |
Token | � |
Token ID | 247 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.006 |
rite | +0.006 |
taboola | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token | s |
Token ID | 82 |
Feature activation | -5.19e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.005 |
Token | Health |
Token ID | 3893 |
Feature activation | +7.09e-02 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.011 |
rite | +0.011 |
taboola | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -3.29e-02 |
Pos logit contributions | |
scribe | +0.016 |
results | +0.016 |
adem | +0.015 |
inen | +0.015 |
rior | +0.015 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.017 |
rite | -0.016 |
taboola | -0.016 |
aux | -0.016 |
Token | Houston |
Token ID | 6995 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | already |
Token ID | 1541 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.008 |
rite | +0.008 |
taboola | +0.008 |
yip | +0.008 |
Neg logit contributions | |
scribe | -0.008 |
results | -0.008 |
adem | -0.008 |
inen | -0.007 |
rior | -0.007 |
Token | has |
Token ID | 468 |
Feature activation | -7.03e-03 |
Pos logit contributions | |
scribe | +0.024 |
results | +0.023 |
adem | +0.023 |
inen | +0.023 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.025 |
Developer | -0.024 |
rite | -0.024 |
taboola | -0.024 |
aux | -0.023 |
Token | a |
Token ID | 257 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
taboola | +0.002 |
rite | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | local |
Token ID | 1957 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | ordinance |
Token ID | 19784 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
ellen | +0.040 |
Developer | +0.037 |
taboola | +0.036 |
rite | +0.036 |
yip | +0.035 |
Neg logit contributions | |
scribe | -0.059 |
results | -0.058 |
adem | -0.058 |
inen | -0.057 |
rior | -0.056 |
Token | barring |
Token ID | 34928 |
Feature activation | +4.92e-01 |
Pos logit contributions | |
ellen | +0.277 |
Developer | +0.265 |
rite | +0.259 |
taboola | +0.259 |
yip | +0.249 |
Neg logit contributions | |
scribe | -0.261 |
results | -0.256 |
adem | -0.254 |
inen | -0.251 |
rior | -0.245 |
Token | men |
Token ID | 1450 |
Feature activation | +8.65e-02 |
Pos logit contributions | |
scribe | +0.106 |
results | +0.104 |
adem | +0.104 |
inen | +0.102 |
rior | +0.099 |
Neg logit contributions | |
ellen | -0.124 |
Developer | -0.118 |
rite | -0.116 |
taboola | -0.116 |
yip | -0.112 |
Token | from |
Token ID | 422 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
scribe | +0.021 |
results | +0.020 |
adem | +0.020 |
inen | +0.020 |
rior | +0.020 |
Neg logit contributions | |
ellen | -0.020 |
Developer | -0.019 |
rite | -0.018 |
taboola | -0.018 |
yip | -0.018 |
Token | entering |
Token ID | 8218 |
Feature activation | +6.76e-01 |
Pos logit contributions | |
ellen | +0.035 |
Developer | +0.033 |
rite | +0.033 |
taboola | +0.033 |
yip | +0.032 |
Neg logit contributions | |
scribe | -0.030 |
results | -0.030 |
adem | -0.029 |
inen | -0.029 |
rior | -0.028 |
Token | women |
Token ID | 1466 |
Feature activation | +7.50e-02 |
Pos logit contributions | |
scribe | +0.137 |
results | +0.133 |
adem | +0.133 |
inen | +0.131 |
rior | +0.127 |
Neg logit contributions | |
ellen | -0.180 |
Developer | -0.173 |
rite | -0.169 |
taboola | -0.169 |
yip | -0.164 |
Token |
|
Token ID | 198 |
Feature activation | -3.19e-03 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | J |
Token ID | 41 |
Feature activation | -3.82e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | oshi |
Token ID | 13704 |
Feature activation | +5.43e-01 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.012 |
rite | +0.011 |
taboola | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +1.87e-03 |
Pos logit contributions | |
scribe | +0.120 |
results | +0.118 |
adem | +0.117 |
inen | +0.116 |
rior | +0.113 |
Neg logit contributions | |
ellen | -0.133 |
Developer | -0.128 |
rite | -0.125 |
taboola | -0.125 |
yip | -0.121 |
Token | Ok |
Token ID | 6762 |
Feature activation | -2.99e-01 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
yip | -0.000 |
Token | ami |
Token ID | 6277 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
ellen | +0.069 |
Developer | +0.066 |
taboola | +0.064 |
rite | +0.064 |
yip | +0.061 |
Neg logit contributions | |
scribe | -0.070 |
adem | -0.070 |
results | -0.069 |
inen | -0.068 |
rior | -0.067 |
Token | and |
Token ID | 290 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
ellen | +0.285 |
Developer | +0.273 |
rite | +0.268 |
taboola | +0.267 |
yip | +0.258 |
Neg logit contributions | |
scribe | -0.250 |
results | -0.245 |
adem | -0.243 |
inen | -0.241 |
rior | -0.234 |
Token | Islam |
Token ID | 3449 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
aux | +0.005 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.005 |
Token | b |
Token ID | 65 |
Feature activation | -1.30e-01 |
Pos logit contributions | |
scribe | +0.086 |
results | +0.085 |
adem | +0.084 |
inen | +0.083 |
rior | +0.081 |
Neg logit contributions | |
ellen | -0.090 |
Developer | -0.086 |
rite | -0.084 |
taboola | -0.084 |
aux | -0.081 |
Token | oul |
Token ID | 2852 |
Feature activation | +3.37e-01 |
Pos logit contributions | |
ellen | +0.031 |
Developer | +0.030 |
rite | +0.029 |
taboola | +0.029 |
yip | +0.028 |
Neg logit contributions | |
scribe | -0.030 |
results | -0.029 |
adem | -0.029 |
inen | -0.029 |
rior | -0.028 |
Token | i |
Token ID | 72 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
scribe | +0.080 |
results | +0.078 |
adem | +0.078 |
inen | +0.078 |
rior | +0.076 |
Neg logit contributions | |
ellen | -0.077 |
Developer | -0.074 |
rite | -0.073 |
taboola | -0.072 |
yip | -0.069 |
Token | Fact |
Token ID | 29054 |
Feature activation | -1.39e-01 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
taboola | -0.004 |
rite | -0.004 |
yip | -0.004 |
Token | in |
Token ID | 287 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
ellen | +0.036 |
Developer | +0.034 |
rite | +0.033 |
taboola | +0.033 |
aux | +0.032 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.029 |
adem | -0.028 |
inen | -0.028 |
rior | -0.027 |
Token | March |
Token ID | 2805 |
Feature activation | -6.28e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.016 |
rite | +0.016 |
taboola | +0.016 |
yip | +0.015 |
Neg logit contributions | |
scribe | -0.013 |
results | -0.013 |
adem | -0.012 |
inen | -0.012 |
rior | -0.012 |
Token | " |
Token ID | 366 |
Feature activation | -3.18e-02 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
rite | -0.004 |
taboola | -0.004 |
yip | -0.004 |
Token | AIR |
Token ID | 42149 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
ellen | +0.007 |
Developer | +0.007 |
rite | +0.007 |
taboola | +0.007 |
yip | +0.007 |
Neg logit contributions | |
scribe | -0.008 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | is |
Token ID | 318 |
Feature activation | -2.26e-03 |
Pos logit contributions | |
ellen | +0.268 |
Developer | +0.255 |
rite | +0.250 |
taboola | +0.249 |
yip | +0.239 |
Neg logit contributions | |
scribe | -0.268 |
results | -0.264 |
adem | -0.261 |
inen | -0.258 |
rior | -0.252 |
Token | a |
Token ID | 257 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
taboola | +0.001 |
rite | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | non |
Token ID | 1729 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.006 |
adem | +0.006 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.007 |
taboola | -0.007 |
rite | -0.007 |
yip | -0.007 |
Token | - |
Token ID | 12 |
Feature activation | +1.87e-02 |
Pos logit contributions | |
scribe | +0.042 |
results | +0.042 |
adem | +0.041 |
inen | +0.041 |
rior | +0.040 |
Neg logit contributions | |
ellen | -0.047 |
Developer | -0.045 |
rite | -0.044 |
taboola | -0.044 |
aux | -0.042 |
Token | partisan |
Token ID | 28226 |
Feature activation | +5.76e-01 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
aux | -0.005 |
Token | ] |
Token ID | 2361 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
scribe | +0.038 |
results | +0.038 |
inen | +0.037 |
adem | +0.037 |
rior | +0.036 |
Neg logit contributions | |
ellen | -0.027 |
Developer | -0.025 |
taboola | -0.025 |
rite | -0.024 |
yip | -0.024 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
ellen | +0.047 |
Developer | +0.045 |
rite | +0.044 |
taboola | +0.044 |
yip | +0.042 |
Neg logit contributions | |
scribe | -0.040 |
results | -0.039 |
adem | -0.039 |
inen | -0.038 |
rior | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | Various |
Token ID | 40009 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
yip | -0.002 |
Token | sound |
Token ID | 2128 |
Feature activation | -8.01e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.004 |
rite | +0.004 |
taboola | +0.004 |
yip | +0.004 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | tracks |
Token ID | 46074 |
Feature activation | +7.05e-01 |
Pos logit contributions | |
ellen | +0.029 |
Developer | +0.028 |
rite | +0.028 |
taboola | +0.028 |
yip | +0.027 |
Neg logit contributions | |
scribe | -0.009 |
results | -0.008 |
adem | -0.008 |
inen | -0.008 |
rior | -0.007 |
Token | have |
Token ID | 423 |
Feature activation | +2.87e-02 |
Pos logit contributions | |
scribe | +0.169 |
results | +0.166 |
adem | +0.165 |
inen | +0.164 |
rior | +0.158 |
Neg logit contributions | |
ellen | -0.161 |
Developer | -0.152 |
taboola | -0.149 |
rite | -0.149 |
yip | -0.144 |
Token | been |
Token ID | 587 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.007 |
adem | +0.007 |
inen | +0.007 |
rior | +0.007 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.006 |
rite | -0.006 |
taboola | -0.006 |
yip | -0.006 |
Token | released |
Token ID | 2716 |
Feature activation | +5.94e-01 |
Pos logit contributions | |
ellen | +0.014 |
Developer | +0.013 |
taboola | +0.013 |
rite | +0.013 |
yip | +0.013 |
Neg logit contributions | |
scribe | -0.010 |
results | -0.010 |
adem | -0.010 |
inen | -0.010 |
rior | -0.009 |
Token | featuring |
Token ID | 9593 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
scribe | +0.135 |
results | +0.133 |
adem | +0.132 |
inen | +0.130 |
rior | +0.127 |
Neg logit contributions | |
ellen | -0.142 |
Developer | -0.136 |
rite | -0.133 |
taboola | -0.133 |
yip | -0.128 |
Token | music |
Token ID | 2647 |
Feature activation | -2.32e-01 |
Pos logit contributions | |
scribe | +0.050 |
results | +0.049 |
adem | +0.048 |
inen | +0.048 |
rior | +0.047 |
Neg logit contributions | |
ellen | -0.055 |
Developer | -0.053 |
rite | -0.052 |
taboola | -0.051 |
yip | -0.050 |
Token | requires |
Token ID | 4433 |
Feature activation | -3.46e-03 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.012 |
taboola | +0.012 |
rite | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.012 |
adem | -0.012 |
results | -0.012 |
inen | -0.012 |
rior | -0.011 |
Token | JavaScript |
Token ID | 11933 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
ellen | +0.001 |
taboola | +0.001 |
Developer | +0.001 |
yip | +0.001 |
rite | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -7.29e-03 |
Pos logit contributions | |
ellen | +0.046 |
Developer | +0.044 |
taboola | +0.043 |
rite | +0.043 |
yip | +0.042 |
Neg logit contributions | |
scribe | -0.044 |
results | -0.043 |
adem | -0.042 |
inen | -0.042 |
rior | -0.041 |
Token | play |
Token ID | 711 |
Feature activation | -6.04e-02 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
ellen | +0.016 |
Developer | +0.015 |
rite | +0.015 |
taboola | +0.015 |
yip | +0.014 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.012 |
Token | See |
Token ID | 4091 |
Feature activation | +6.99e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.004 |
Token | map |
Token ID | 3975 |
Feature activation | +2.75e-01 |
Pos logit contributions | |
results | +0.151 |
scribe | +0.151 |
adem | +0.148 |
inen | +0.143 |
rior | +0.138 |
Neg logit contributions | |
ellen | -0.176 |
Developer | -0.168 |
taboola | -0.166 |
rite | -0.166 |
yip | -0.162 |
Token | of |
Token ID | 286 |
Feature activation | +2.96e-03 |
Pos logit contributions | |
scribe | +0.059 |
results | +0.058 |
adem | +0.057 |
inen | +0.056 |
rior | +0.055 |
Neg logit contributions | |
ellen | -0.070 |
Developer | -0.066 |
rite | -0.066 |
taboola | -0.065 |
yip | -0.063 |
Token | affected |
Token ID | 5676 |
Feature activation | +4.01e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
aux | -0.001 |
Token | area |
Token ID | 1989 |
Feature activation | -2.49e-01 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.009 |
inen | +0.009 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.009 |
taboola | -0.008 |
rite | -0.008 |
yip | -0.008 |
Token | Russia |
Token ID | 3284 |
Feature activation | +1.61e-01 |
Pos logit contributions | |
ellen | +0.063 |
Developer | +0.061 |
rite | +0.060 |
taboola | +0.059 |
yip | +0.057 |
Neg logit contributions | |
scribe | -0.053 |
results | -0.052 |
adem | -0.052 |
inen | -0.051 |
rior | -0.050 |
Token | the |
Token ID | 262 |
Feature activation | -5.01e-03 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.006 |
Developer | -0.006 |
rite | -0.006 |
taboola | -0.006 |
yip | -0.006 |
Token | most |
Token ID | 749 |
Feature activation | +2.61e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
taboola | +0.001 |
rite | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | anti |
Token ID | 3098 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
scribe | +0.057 |
results | +0.056 |
adem | +0.056 |
inen | +0.055 |
rior | +0.053 |
Neg logit contributions | |
ellen | -0.065 |
Developer | -0.062 |
taboola | -0.061 |
rite | -0.061 |
yip | -0.059 |
Token | - |
Token ID | 12 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
ellen | +0.038 |
Developer | +0.037 |
rite | +0.036 |
taboola | +0.036 |
aux | +0.035 |
Neg logit contributions | |
scribe | -0.035 |
results | -0.035 |
adem | -0.034 |
inen | -0.034 |
rior | -0.033 |
Token | gun |
Token ID | 7145 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | president |
Token ID | 1893 |
Feature activation | +6.88e-01 |
Pos logit contributions | |
ellen | +0.069 |
Developer | +0.067 |
rite | +0.067 |
taboola | +0.066 |
yip | +0.065 |
Neg logit contributions | |
scribe | -0.019 |
results | -0.018 |
adem | -0.017 |
inen | -0.017 |
rior | -0.015 |
Token | in |
Token ID | 287 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
scribe | +0.148 |
results | +0.145 |
adem | +0.144 |
inen | +0.142 |
rior | +0.138 |
Neg logit contributions | |
ellen | -0.174 |
Developer | -0.166 |
rite | -0.163 |
taboola | -0.163 |
aux | -0.157 |
Token | American |
Token ID | 1605 |
Feature activation | -2.63e-01 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | history |
Token ID | 2106 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
ellen | +0.059 |
Developer | +0.056 |
rite | +0.055 |
taboola | +0.054 |
aux | +0.052 |
Neg logit contributions | |
scribe | -0.064 |
results | -0.063 |
adem | -0.062 |
inen | -0.062 |
rior | -0.060 |
Token | . |
Token ID | 13 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
ellen | +0.026 |
Developer | +0.025 |
rite | +0.025 |
taboola | +0.024 |
yip | +0.024 |
Neg logit contributions | |
scribe | -0.023 |
results | -0.023 |
adem | -0.022 |
inen | -0.022 |
rior | -0.022 |
Token | Senator |
Token ID | 8962 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | -7.50e-02 |
Pos logit contributions | |
scribe | +0.012 |
results | +0.012 |
adem | +0.011 |
inen | +0.011 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.015 |
Developer | -0.015 |
rite | -0.014 |
taboola | -0.014 |
aux | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +5.08e-02 |
Pos logit contributions | |
ellen | +0.018 |
Developer | +0.018 |
rite | +0.017 |
taboola | +0.017 |
yip | +0.017 |
Neg logit contributions | |
scribe | -0.017 |
results | -0.016 |
adem | -0.016 |
inen | -0.016 |
rior | -0.016 |
Token | only |
Token ID | 691 |
Feature activation | -7.70e-02 |
Pos logit contributions | |
scribe | +0.012 |
results | +0.011 |
adem | +0.011 |
inen | +0.011 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.012 |
rite | -0.011 |
taboola | -0.011 |
yip | -0.011 |
Token | half |
Token ID | 2063 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
ellen | +0.019 |
Developer | +0.018 |
rite | +0.018 |
taboola | +0.018 |
yip | +0.017 |
Neg logit contributions | |
scribe | -0.017 |
results | -0.017 |
adem | -0.017 |
inen | -0.017 |
rior | -0.016 |
Token | - |
Token ID | 12 |
Feature activation | +6.51e-03 |
Pos logit contributions | |
ellen | +0.092 |
Developer | +0.087 |
rite | +0.086 |
taboola | +0.086 |
aux | +0.083 |
Neg logit contributions | |
scribe | -0.073 |
results | -0.072 |
adem | -0.071 |
inen | -0.070 |
rior | -0.068 |
Token | true |
Token ID | 7942 |
Feature activation | +7.82e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
aux | -0.002 |
Token | at |
Token ID | 379 |
Feature activation | +9.68e-02 |
Pos logit contributions | |
scribe | +0.166 |
results | +0.163 |
adem | +0.161 |
inen | +0.159 |
rior | +0.155 |
Neg logit contributions | |
ellen | -0.199 |
Developer | -0.191 |
rite | -0.187 |
taboola | -0.187 |
aux | -0.180 |
Token | best |
Token ID | 1266 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
scribe | +0.023 |
results | +0.023 |
adem | +0.022 |
inen | +0.022 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.022 |
Developer | -0.021 |
rite | -0.021 |
taboola | -0.021 |
yip | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | -8.09e-03 |
Pos logit contributions | |
ellen | +0.026 |
Developer | +0.025 |
rite | +0.025 |
taboola | +0.025 |
aux | +0.024 |
Neg logit contributions | |
scribe | -0.022 |
results | -0.022 |
adem | -0.021 |
inen | -0.021 |
rior | -0.021 |
Token | Let |
Token ID | 5756 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | 's |
Token ID | 338 |
Feature activation | +6.28e-02 |
Pos logit contributions | |
scribe | +0.031 |
results | +0.030 |
adem | +0.030 |
inen | +0.029 |
rior | +0.028 |
Neg logit contributions | |
ellen | -0.041 |
Developer | -0.039 |
rite | -0.038 |
taboola | -0.038 |
aux | -0.037 |
Token | Clinton |
Token ID | 2605 |
Feature activation | -1.12e-01 |
Pos logit contributions | |
ellen | +0.065 |
Developer | +0.063 |
taboola | +0.061 |
rite | +0.061 |
yip | +0.059 |
Neg logit contributions | |
scribe | -0.069 |
results | -0.069 |
adem | -0.068 |
inen | -0.067 |
rior | -0.066 |
Token | , |
Token ID | 11 |
Feature activation | -5.91e-04 |
Pos logit contributions | |
ellen | +0.028 |
Developer | +0.027 |
rite | +0.027 |
taboola | +0.027 |
yip | +0.026 |
Neg logit contributions | |
scribe | -0.024 |
results | -0.024 |
adem | -0.024 |
inen | -0.023 |
rior | -0.023 |
Token | Mary |
Token ID | 5335 |
Feature activation | -3.82e-01 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
taboola | +0.000 |
rite | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | Anne |
Token ID | 15397 |
Feature activation | -2.33e-01 |
Pos logit contributions | |
ellen | +0.088 |
Developer | +0.085 |
taboola | +0.083 |
rite | +0.082 |
yip | +0.079 |
Neg logit contributions | |
scribe | -0.090 |
results | -0.088 |
adem | -0.087 |
inen | -0.087 |
rior | -0.085 |
Token | N |
Token ID | 399 |
Feature activation | -3.53e-01 |
Pos logit contributions | |
ellen | +0.057 |
Developer | +0.055 |
taboola | +0.054 |
rite | +0.054 |
yip | +0.052 |
Neg logit contributions | |
scribe | -0.051 |
results | -0.051 |
adem | -0.050 |
inen | -0.049 |
rior | -0.048 |
Token | oland |
Token ID | 23573 |
Feature activation | +7.52e-01 |
Pos logit contributions | |
ellen | +0.087 |
Developer | +0.082 |
rite | +0.081 |
taboola | +0.081 |
aux | +0.078 |
Neg logit contributions | |
scribe | -0.079 |
results | -0.077 |
adem | -0.077 |
inen | -0.076 |
rior | -0.074 |
Token | of |
Token ID | 286 |
Feature activation | +4.56e-04 |
Pos logit contributions | |
scribe | +0.166 |
results | +0.163 |
adem | +0.162 |
inen | +0.161 |
rior | +0.155 |
Neg logit contributions | |
ellen | -0.185 |
Developer | -0.178 |
taboola | -0.174 |
rite | -0.173 |
yip | -0.167 |
Token | Richmond |
Token ID | 16940 |
Feature activation | +1.53e-01 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
aux | -0.000 |
Token | chose |
Token ID | 7690 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
scribe | +0.033 |
results | +0.032 |
adem | +0.032 |
inen | +0.032 |
rior | +0.031 |
Neg logit contributions | |
ellen | -0.039 |
Developer | -0.037 |
rite | -0.036 |
taboola | -0.036 |
yip | -0.035 |
Token | , |
Token ID | 11 |
Feature activation | +5.71e-03 |
Pos logit contributions | |
ellen | +0.026 |
Developer | +0.025 |
taboola | +0.024 |
rite | +0.024 |
yip | +0.024 |
Neg logit contributions | |
scribe | -0.023 |
results | -0.023 |
adem | -0.023 |
inen | -0.023 |
rior | -0.022 |
Token | instead |
Token ID | 2427 |
Feature activation | -4.97e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | be |
Token ID | 307 |
Feature activation | +6.74e-03 |
Pos logit contributions | |
scribe | +0.013 |
results | +0.013 |
adem | +0.013 |
inen | +0.013 |
rior | +0.013 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.011 |
taboola | -0.011 |
rite | -0.011 |
yip | -0.010 |
Token | at |
Token ID | 379 |
Feature activation | +1.20e-01 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +2.98e-02 |
Pos logit contributions | |
scribe | +0.026 |
results | +0.026 |
adem | +0.025 |
inen | +0.025 |
rior | +0.024 |
Neg logit contributions | |
ellen | -0.030 |
Developer | -0.029 |
taboola | -0.028 |
rite | -0.028 |
yip | -0.027 |
Token | certain |
Token ID | 1728 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.007 |
adem | +0.007 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.007 |
taboola | -0.007 |
rite | -0.007 |
yip | -0.007 |
Token | metal |
Token ID | 6147 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
scribe | +0.124 |
results | +0.122 |
adem | +0.121 |
inen | +0.119 |
rior | +0.117 |
Neg logit contributions | |
ellen | -0.133 |
Developer | -0.127 |
taboola | -0.125 |
rite | -0.124 |
yip | -0.120 |
Token | level |
Token ID | 1241 |
Feature activation | +1.85e-01 |
Pos logit contributions | |
ellen | +0.072 |
Developer | +0.069 |
rite | +0.068 |
taboola | +0.067 |
aux | +0.065 |
Neg logit contributions | |
scribe | -0.066 |
results | -0.065 |
adem | -0.065 |
inen | -0.064 |
rior | -0.062 |
Token | ." |
Token ID | 526 |
Feature activation | +2.60e-01 |
Pos logit contributions | |
scribe | +0.040 |
results | +0.039 |
adem | +0.039 |
inen | +0.038 |
rior | +0.037 |
Neg logit contributions | |
ellen | -0.047 |
Developer | -0.045 |
rite | -0.044 |
taboola | -0.044 |
yip | -0.042 |
Token |
|
Token ID | 198 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
scribe | +0.055 |
results | +0.054 |
adem | +0.054 |
inen | +0.053 |
rior | +0.052 |
Neg logit contributions | |
ellen | -0.066 |
Developer | -0.063 |
rite | -0.062 |
taboola | -0.062 |
yip | -0.060 |
Token |
|
Token ID | 198 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | The |
Token ID | 464 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.004 |
rite | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | nonpartisan |
Token ID | 42157 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
ellen | +0.007 |
Developer | +0.007 |
taboola | +0.007 |
rite | +0.007 |
yip | +0.007 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
scribe | +0.009 |
results | +0.009 |
adem | +0.009 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.010 |
rite | -0.010 |
taboola | -0.010 |
aux | -0.009 |
Token | Fed |
Token ID | 10169 |
Feature activation | -7.86e-01 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.006 |
adem | +0.006 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.006 |
taboola | -0.006 |
rite | -0.006 |
yip | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -8.76e-03 |
Pos logit contributions | |
ellen | +0.187 |
Developer | +0.179 |
rite | +0.175 |
taboola | +0.175 |
yip | +0.168 |
Neg logit contributions | |
scribe | -0.180 |
results | -0.177 |
adem | -0.175 |
inen | -0.173 |
rior | -0.169 |
Token | politicians |
Token ID | 7602 |
Feature activation | -4.70e-02 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | in |
Token ID | 287 |
Feature activation | -1.12e-03 |
Pos logit contributions | |
ellen | +0.011 |
Developer | +0.010 |
taboola | +0.010 |
rite | +0.010 |
yip | +0.010 |
Neg logit contributions | |
scribe | -0.011 |
results | -0.011 |
adem | -0.011 |
inen | -0.011 |
rior | -0.011 |
Token | D |
Token ID | 360 |
Feature activation | +2.13e-01 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +4.25e-03 |
Pos logit contributions | |
scribe | +0.044 |
results | +0.043 |
adem | +0.043 |
inen | +0.042 |
rior | +0.041 |
Neg logit contributions | |
ellen | -0.055 |
Developer | -0.053 |
rite | -0.052 |
taboola | -0.052 |
yip | -0.051 |
Token | C |
Token ID | 34 |
Feature activation | +1.56e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
scribe | +0.033 |
results | +0.032 |
adem | +0.032 |
inen | +0.032 |
rior | +0.031 |
Neg logit contributions | |
ellen | -0.040 |
Developer | -0.038 |
rite | -0.038 |
taboola | -0.037 |
yip | -0.036 |
Token | rolled |
Token ID | 11686 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | out |
Token ID | 503 |
Feature activation | -6.45e-03 |
Pos logit contributions | |
scribe | +0.041 |
results | +0.041 |
adem | +0.040 |
inen | +0.040 |
rior | +0.039 |
Neg logit contributions | |
ellen | -0.048 |
Developer | -0.046 |
rite | -0.045 |
taboola | -0.045 |
aux | -0.043 |
Token | She |
Token ID | 1375 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
ellen | +0.009 |
Developer | +0.009 |
rite | +0.009 |
taboola | +0.009 |
yip | +0.009 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | keeps |
Token ID | 7622 |
Feature activation | +3.25e-02 |
Pos logit contributions | |
scribe | +0.023 |
results | +0.023 |
adem | +0.022 |
inen | +0.022 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.024 |
Developer | -0.023 |
rite | -0.023 |
taboola | -0.023 |
yip | -0.022 |
Token | going |
Token ID | 1016 |
Feature activation | +4.91e-02 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.007 |
adem | +0.007 |
inen | +0.007 |
rior | +0.007 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.008 |
rite | -0.007 |
taboola | -0.007 |
yip | -0.007 |
Token | back |
Token ID | 736 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.010 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.012 |
rite | -0.012 |
taboola | -0.012 |
yip | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
ellen | +0.012 |
Developer | +0.012 |
rite | +0.011 |
taboola | +0.011 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.011 |
inen | -0.011 |
rior | -0.011 |
Token | So |
Token ID | 1406 |
Feature activation | +8.39e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | I |
Token ID | 314 |
Feature activation | -1.30e-03 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.018 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.020 |
Developer | -0.019 |
rite | -0.019 |
taboola | -0.019 |
yip | -0.018 |
Token | think |
Token ID | 892 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
yip | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | they |
Token ID | 484 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
ellen | +0.050 |
Developer | +0.048 |
taboola | +0.047 |
rite | +0.047 |
yip | +0.045 |
Neg logit contributions | |
scribe | -0.048 |
results | -0.048 |
adem | -0.047 |
inen | -0.047 |
rior | -0.045 |
Token | � |
Token ID | 447 |
Feature activation | -2.11e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | � |
Token ID | 247 |
Feature activation | -2.55e-03 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
yip | +0.005 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.004 |
Token | q |
Token ID | 80 |
Feature activation | +2.68e-01 |
Pos logit contributions | |
ellen | +0.086 |
Developer | +0.082 |
rite | +0.080 |
taboola | +0.080 |
yip | +0.077 |
Neg logit contributions | |
scribe | -0.079 |
results | -0.077 |
adem | -0.076 |
inen | -0.076 |
rior | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | +5.46e-04 |
Pos logit contributions | |
scribe | +0.058 |
results | +0.057 |
adem | +0.057 |
inen | +0.056 |
rior | +0.055 |
Neg logit contributions | |
ellen | -0.067 |
Developer | -0.064 |
rite | -0.063 |
taboola | -0.063 |
yip | -0.061 |
Token | 1 |
Token ID | 352 |
Feature activation | -1.63e-01 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
taboola | -0.000 |
rite | -0.000 |
yip | -0.000 |
Token | ): |
Token ID | 2599 |
Feature activation | -1.36e-01 |
Pos logit contributions | |
ellen | +0.041 |
Developer | +0.040 |
rite | +0.039 |
taboola | +0.039 |
yip | +0.037 |
Neg logit contributions | |
scribe | -0.035 |
results | -0.034 |
adem | -0.034 |
inen | -0.033 |
rior | -0.033 |
Token |
|
Token ID | 198 |
Feature activation | +2.03e-02 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.033 |
taboola | +0.032 |
rite | +0.032 |
yip | +0.031 |
Neg logit contributions | |
scribe | -0.029 |
results | -0.029 |
adem | -0.028 |
inen | -0.028 |
rior | -0.027 |
Token |
|
Token ID | 198 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
yip | -0.005 |
Token | the |
Token ID | 1169 |
Feature activation | +3.23e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | radi |
Token ID | 19772 |
Feature activation | +4.00e-01 |
Pos logit contributions | |
scribe | +0.075 |
results | +0.074 |
adem | +0.073 |
inen | +0.073 |
rior | +0.071 |
Neg logit contributions | |
ellen | -0.075 |
Developer | -0.072 |
taboola | -0.071 |
rite | -0.070 |
yip | -0.068 |
Token | ative |
Token ID | 876 |
Feature activation | -3.61e-01 |
Pos logit contributions | |
scribe | +0.097 |
results | +0.096 |
inen | +0.096 |
adem | +0.096 |
rior | +0.092 |
Neg logit contributions | |
ellen | -0.089 |
Developer | -0.085 |
rite | -0.084 |
taboola | -0.083 |
yip | -0.081 |
Token | forcing |
Token ID | 10833 |
Feature activation | -4.08e-01 |
Pos logit contributions | |
ellen | +0.070 |
Developer | +0.067 |
rite | +0.065 |
taboola | +0.065 |
yip | +0.062 |
Neg logit contributions | |
scribe | -0.098 |
results | -0.097 |
inen | -0.096 |
adem | -0.096 |
rior | -0.093 |
Token | Δ |
Token ID | 37455 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
ellen | +0.098 |
Developer | +0.094 |
rite | +0.092 |
taboola | +0.092 |
yip | +0.089 |
Neg logit contributions | |
scribe | -0.092 |
results | -0.091 |
adem | -0.089 |
inen | -0.089 |
rior | -0.087 |
Token | - |
Token ID | 532 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | Skip |
Token ID | 32214 |
Feature activation | -2.26e-01 |
Pos logit contributions | |
ellen | +0.039 |
Developer | +0.037 |
rite | +0.037 |
taboola | +0.037 |
aux | +0.035 |
Neg logit contributions | |
scribe | -0.038 |
results | -0.037 |
adem | -0.037 |
inen | -0.036 |
rior | -0.035 |
Token | Bay |
Token ID | 4696 |
Feature activation | +5.99e-02 |
Pos logit contributions | |
ellen | +0.055 |
Developer | +0.053 |
rite | +0.052 |
taboola | +0.051 |
aux | +0.049 |
Neg logit contributions | |
scribe | -0.051 |
results | -0.050 |
adem | -0.049 |
inen | -0.049 |
rior | -0.047 |
Token | less |
Token ID | 1203 |
Feature activation | -6.79e-01 |
Pos logit contributions | |
scribe | +0.019 |
results | +0.019 |
adem | +0.019 |
inen | +0.019 |
rior | +0.018 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.008 |
rite | -0.008 |
taboola | -0.008 |
yip | -0.007 |
Token | (@ |
Token ID | 4275 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
ellen | +0.192 |
Developer | +0.184 |
rite | +0.181 |
taboola | +0.180 |
aux | +0.175 |
Neg logit contributions | |
scribe | -0.126 |
results | -0.123 |
adem | -0.122 |
inen | -0.120 |
rior | -0.116 |
Token | Real |
Token ID | 15633 |
Feature activation | +9.44e-02 |
Pos logit contributions | |
scribe | +0.174 |
results | +0.171 |
adem | +0.169 |
inen | +0.167 |
rior | +0.163 |
Neg logit contributions | |
ellen | -0.174 |
Developer | -0.165 |
rite | -0.162 |
taboola | -0.162 |
yip | -0.156 |
Token | Skip |
Token ID | 50232 |
Feature activation | +2.11e-01 |
Pos logit contributions | |
scribe | +0.021 |
results | +0.021 |
adem | +0.021 |
inen | +0.021 |
rior | +0.020 |
Neg logit contributions | |
ellen | -0.023 |
Developer | -0.022 |
rite | -0.021 |
taboola | -0.021 |
yip | -0.020 |
Token | Bay |
Token ID | 15262 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
scribe | +0.047 |
results | +0.046 |
adem | +0.046 |
inen | +0.045 |
rior | +0.044 |
Neg logit contributions | |
ellen | -0.052 |
Developer | -0.049 |
rite | -0.048 |
taboola | -0.048 |
aux | -0.047 |
Token | less |
Token ID | 1203 |
Feature activation | -7.09e-01 |
Pos logit contributions | |
scribe | +0.101 |
results | +0.099 |
adem | +0.098 |
inen | +0.097 |
rior | +0.096 |
Neg logit contributions | |
ellen | -0.048 |
Developer | -0.044 |
rite | -0.043 |
taboola | -0.043 |
yip | -0.040 |
Token | ) |
Token ID | 8 |
Feature activation | +8.02e-02 |
Pos logit contributions | |
ellen | +0.181 |
Developer | +0.173 |
rite | +0.169 |
taboola | +0.168 |
aux | +0.163 |
Neg logit contributions | |
scribe | -0.151 |
results | -0.148 |
adem | -0.147 |
inen | -0.145 |
rior | -0.140 |
Token | January |
Token ID | 3269 |
Feature activation | +6.26e-02 |
Pos logit contributions | |
scribe | +0.018 |
results | +0.017 |
adem | +0.017 |
inen | +0.017 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.020 |
Developer | -0.019 |
rite | -0.019 |
taboola | -0.019 |
yip | -0.018 |
Token | : |
Token ID | 25 |
Feature activation | -3.33e-02 |
Pos logit contributions | |
scribe | +0.051 |
results | +0.050 |
adem | +0.049 |
inen | +0.049 |
rior | +0.047 |
Neg logit contributions | |
ellen | -0.062 |
Developer | -0.059 |
rite | -0.058 |
taboola | -0.058 |
yip | -0.056 |
Token | The |
Token ID | 383 |
Feature activation | +3.70e-02 |
Pos logit contributions | |
ellen | +0.008 |
Developer | +0.008 |
taboola | +0.008 |
rite | +0.008 |
yip | +0.008 |
Neg logit contributions | |
scribe | -0.007 |
results | -0.007 |
adem | -0.007 |
inen | -0.007 |
rior | -0.007 |
Token | fear |
Token ID | 3252 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.009 |
taboola | -0.008 |
rite | -0.008 |
yip | -0.008 |
Token | of |
Token ID | 286 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
ellen | +0.025 |
Developer | +0.024 |
taboola | +0.023 |
rite | +0.023 |
aux | +0.022 |
Neg logit contributions | |
scribe | -0.025 |
results | -0.025 |
adem | -0.024 |
inen | -0.024 |
rior | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | +7.33e-03 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
taboola | -0.005 |
rite | -0.005 |
aux | -0.004 |
Token | unknown |
Token ID | 6439 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -6.38e-03 |
Pos logit contributions | |
ellen | +0.072 |
Developer | +0.069 |
taboola | +0.068 |
rite | +0.068 |
yip | +0.065 |
Neg logit contributions | |
scribe | -0.067 |
results | -0.066 |
adem | -0.065 |
inen | -0.064 |
rior | -0.063 |
Token |
|
Token ID | 198 |
Feature activation | +6.43e-03 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
taboola | -0.002 |
rite | -0.002 |
yip | -0.002 |
Token | What |
Token ID | 2061 |
Feature activation | -1.49e-02 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | Eid |
Token ID | 31022 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
taboola | +0.003 |
rite | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | we |
Token ID | 356 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
ellen | +0.044 |
Developer | +0.042 |
rite | +0.041 |
taboola | +0.041 |
yip | +0.039 |
Neg logit contributions | |
scribe | -0.039 |
results | -0.038 |
adem | -0.038 |
inen | -0.037 |
rior | -0.036 |
Token | head |
Token ID | 1182 |
Feature activation | +6.97e-01 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.004 |
results | -0.004 |
adem | -0.004 |
inen | -0.004 |
rior | -0.003 |
Token | towards |
Token ID | 3371 |
Feature activation | -1.34e-01 |
Pos logit contributions | |
scribe | +0.139 |
results | +0.136 |
adem | +0.134 |
inen | +0.133 |
rior | +0.129 |
Neg logit contributions | |
ellen | -0.187 |
Developer | -0.180 |
rite | -0.177 |
taboola | -0.176 |
aux | -0.170 |
Token | the |
Token ID | 262 |
Feature activation | +1.74e-02 |
Pos logit contributions | |
ellen | +0.035 |
Developer | +0.034 |
rite | +0.033 |
taboola | +0.033 |
aux | +0.032 |
Neg logit contributions | |
scribe | -0.028 |
results | -0.027 |
adem | -0.027 |
inen | -0.027 |
rior | -0.026 |
Token | Libyan |
Token ID | 28661 |
Feature activation | +4.18e-01 |
Pos logit contributions | |
scribe | +0.004 |
results | +0.004 |
adem | +0.004 |
inen | +0.004 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
taboola | -0.004 |
rite | -0.004 |
yip | -0.004 |
Token | war |
Token ID | 1175 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
scribe | +0.095 |
results | +0.093 |
adem | +0.093 |
inen | +0.091 |
rior | +0.089 |
Neg logit contributions | |
ellen | -0.101 |
Developer | -0.096 |
rite | -0.094 |
taboola | -0.094 |
yip | -0.090 |
Token | , |
Token ID | 11 |
Feature activation | +5.79e-03 |
Pos logit contributions | |
ellen | +0.044 |
Developer | +0.042 |
rite | +0.042 |
taboola | +0.042 |
aux | +0.040 |
Neg logit contributions | |
scribe | -0.036 |
results | -0.036 |
adem | -0.035 |
inen | -0.035 |
rior | -0.034 |
Token | the |
Token ID | 262 |
Feature activation | +4.41e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | French |
Token ID | 4141 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
scribe | +0.011 |
results | +0.011 |
adem | +0.011 |
inen | +0.011 |
rior | +0.010 |
Neg logit contributions | |
ellen | -0.010 |
Developer | -0.009 |
rite | -0.009 |
taboola | -0.009 |
yip | -0.009 |
Token | Total |
Token ID | 7472 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
ellen | +0.034 |
Developer | +0.032 |
rite | +0.031 |
taboola | +0.031 |
yip | +0.030 |
Neg logit contributions | |
scribe | -0.040 |
results | -0.040 |
adem | -0.039 |
inen | -0.039 |
rior | -0.038 |
Token | have |
Token ID | 423 |
Feature activation | +6.71e-02 |
Pos logit contributions | |
scribe | +0.133 |
results | +0.131 |
adem | +0.129 |
inen | +0.128 |
rior | +0.124 |
Neg logit contributions | |
ellen | -0.138 |
Developer | -0.131 |
rite | -0.129 |
taboola | -0.129 |
yip | -0.123 |
Token | Rated |
Token ID | 49949 |
Feature activation | +9.90e-02 |
Pos logit contributions | |
ellen | +0.046 |
Developer | +0.044 |
rite | +0.043 |
taboola | +0.043 |
yip | +0.041 |
Neg logit contributions | |
scribe | -0.039 |
results | -0.038 |
adem | -0.038 |
inen | -0.038 |
rior | -0.036 |
Token | : |
Token ID | 25 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
scribe | +0.023 |
results | +0.023 |
adem | +0.023 |
inen | +0.022 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.023 |
Developer | -0.022 |
rite | -0.022 |
taboola | -0.022 |
yip | -0.021 |
Token | Everyone |
Token ID | 11075 |
Feature activation | -2.07e-01 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
yip | +0.005 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
ellen | +0.053 |
Developer | +0.050 |
taboola | +0.049 |
rite | +0.049 |
yip | +0.048 |
Neg logit contributions | |
scribe | -0.044 |
results | -0.044 |
adem | -0.043 |
inen | -0.043 |
rior | -0.041 |
Token |
|
Token ID | 198 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | H |
Token ID | 39 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | omew |
Token ID | 28030 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
ellen | +0.035 |
Developer | +0.033 |
rite | +0.032 |
taboola | +0.032 |
aux | +0.030 |
Neg logit contributions | |
scribe | -0.047 |
results | -0.047 |
adem | -0.046 |
inen | -0.046 |
rior | -0.045 |
Token | orld |
Token ID | 1764 |
Feature activation | +4.14e-01 |
Pos logit contributions | |
ellen | +0.036 |
Developer | +0.034 |
taboola | +0.034 |
rite | +0.034 |
yip | +0.033 |
Neg logit contributions | |
scribe | -0.017 |
results | -0.017 |
adem | -0.017 |
inen | -0.016 |
rior | -0.016 |
Token | is |
Token ID | 318 |
Feature activation | -1.36e-02 |
Pos logit contributions | |
scribe | +0.095 |
results | +0.094 |
adem | +0.093 |
inen | +0.092 |
rior | +0.089 |
Neg logit contributions | |
ellen | -0.098 |
Developer | -0.094 |
rite | -0.092 |
taboola | -0.092 |
aux | -0.088 |
Token | a |
Token ID | 257 |
Feature activation | +9.90e-04 |
Pos logit contributions | |
ellen | +0.004 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
yip | +0.003 |
Neg logit contributions | |
scribe | -0.003 |
results | -0.003 |
adem | -0.003 |
inen | -0.003 |
rior | -0.003 |
Token | real |
Token ID | 1103 |
Feature activation | -7.14e-02 |
Pos logit contributions | |
scribe | +0.000 |
results | +0.000 |
adem | +0.000 |
inen | +0.000 |
rior | +0.000 |
Neg logit contributions | |
ellen | -0.000 |
Developer | -0.000 |
rite | -0.000 |
taboola | -0.000 |
yip | -0.000 |
Token | case |
Token ID | 1339 |
Feature activation | -5.20e-02 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
yip | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -2.18e-02 |
Pos logit contributions | |
ellen | +0.013 |
Developer | +0.012 |
rite | +0.012 |
taboola | +0.012 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.011 |
adem | -0.011 |
inen | -0.011 |
rior | -0.011 |
Token | � |
Token ID | 447 |
Feature activation | -2.26e-02 |
Pos logit contributions | |
ellen | +0.005 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
yip | +0.005 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
adem | -0.005 |
inen | -0.005 |
rior | -0.004 |
Token | � |
Token ID | 251 |
Feature activation | -7.72e-03 |
Pos logit contributions | |
ellen | +0.006 |
Developer | +0.005 |
rite | +0.005 |
taboola | +0.005 |
yip | +0.005 |
Neg logit contributions | |
scribe | -0.005 |
results | -0.005 |
inen | -0.005 |
adem | -0.005 |
rior | -0.005 |
Token | B |
Token ID | 347 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
rite | +0.002 |
taboola | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | amber |
Token ID | 7789 |
Feature activation | -2.58e-01 |
Pos logit contributions | |
scribe | +0.063 |
results | +0.062 |
adem | +0.062 |
inen | +0.061 |
rior | +0.060 |
Neg logit contributions | |
ellen | -0.042 |
Developer | -0.040 |
rite | -0.039 |
taboola | -0.039 |
yip | -0.037 |
Token | ger |
Token ID | 1362 |
Feature activation | +7.07e-02 |
Pos logit contributions | |
ellen | +0.066 |
Developer | +0.063 |
rite | +0.062 |
taboola | +0.062 |
yip | +0.060 |
Neg logit contributions | |
scribe | -0.055 |
results | -0.054 |
adem | -0.053 |
inen | -0.053 |
rior | -0.051 |
Token | said |
Token ID | 531 |
Feature activation | -1.49e-03 |
Pos logit contributions | |
scribe | +0.016 |
results | +0.016 |
adem | +0.016 |
inen | +0.016 |
rior | +0.015 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.016 |
taboola | -0.016 |
yip | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | -4.99e-03 |
Pos logit contributions | |
ellen | +0.000 |
Developer | +0.000 |
rite | +0.000 |
taboola | +0.000 |
aux | +0.000 |
Neg logit contributions | |
scribe | -0.000 |
results | -0.000 |
adem | -0.000 |
inen | -0.000 |
rior | -0.000 |
Token | � |
Token ID | 564 |
Feature activation | +7.16e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | � |
Token ID | 250 |
Feature activation | -5.19e-02 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.017 |
inen | +0.016 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.015 |
taboola | -0.015 |
yip | -0.015 |
Token | : |
Token ID | 25 |
Feature activation | -5.79e-02 |
Pos logit contributions | |
ellen | +0.047 |
Developer | +0.045 |
rite | +0.044 |
taboola | +0.044 |
aux | +0.042 |
Neg logit contributions | |
scribe | -0.046 |
results | -0.045 |
adem | -0.045 |
inen | -0.044 |
rior | -0.043 |
Token | Harvard |
Token ID | 11131 |
Feature activation | +3.12e-02 |
Pos logit contributions | |
ellen | +0.015 |
Developer | +0.014 |
rite | +0.014 |
taboola | +0.014 |
yip | +0.014 |
Neg logit contributions | |
scribe | -0.012 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.011 |
Token | University |
Token ID | 2059 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
scribe | +0.007 |
results | +0.007 |
adem | +0.007 |
inen | +0.007 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.007 |
rite | -0.007 |
taboola | -0.007 |
yip | -0.007 |
Token | Press |
Token ID | 4332 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ellen | +0.003 |
Developer | +0.003 |
rite | +0.003 |
taboola | +0.003 |
aux | +0.003 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | ; |
Token ID | 26 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
ellen | +0.030 |
Developer | +0.029 |
rite | +0.028 |
taboola | +0.028 |
aux | +0.027 |
Neg logit contributions | |
scribe | -0.028 |
results | -0.027 |
adem | -0.027 |
inen | -0.027 |
rior | -0.026 |
Token | 2005 |
Token ID | 5075 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.008 |
Developer | -0.008 |
rite | -0.008 |
taboola | -0.008 |
yip | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | -2.71e-02 |
Pos logit contributions | |
ellen | +0.029 |
Developer | +0.028 |
rite | +0.028 |
taboola | +0.028 |
yip | +0.027 |
Neg logit contributions | |
scribe | -0.022 |
results | -0.021 |
adem | -0.021 |
inen | -0.021 |
rior | -0.020 |
Token | Alexander |
Token ID | 10009 |
Feature activation | +9.77e-02 |
Pos logit contributions | |
ellen | +0.007 |
Developer | +0.006 |
rite | +0.006 |
taboola | +0.006 |
yip | +0.006 |
Neg logit contributions | |
scribe | -0.006 |
results | -0.006 |
adem | -0.006 |
inen | -0.006 |
rior | -0.006 |
Token | J |
Token ID | 449 |
Feature activation | -3.29e-01 |
Pos logit contributions | |
scribe | +0.023 |
results | +0.023 |
adem | +0.023 |
inen | +0.023 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.022 |
Developer | -0.021 |
taboola | -0.021 |
rite | -0.021 |
yip | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | +4.23e-03 |
Pos logit contributions | |
ellen | +0.083 |
Developer | +0.080 |
rite | +0.078 |
taboola | +0.078 |
aux | +0.075 |
Neg logit contributions | |
scribe | -0.071 |
results | -0.069 |
adem | -0.069 |
inen | -0.068 |
rior | -0.066 |
Token | K |
Token ID | 509 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
taboola | -0.001 |
rite | -0.001 |
yip | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
scribe | +0.011 |
results | +0.011 |
adem | +0.011 |
inen | +0.011 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.014 |
Developer | -0.014 |
taboola | -0.013 |
rite | -0.013 |
yip | -0.013 |
Token | 8 |
Token ID | 807 |
Feature activation | -7.63e-03 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | 80 |
Token ID | 1795 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
ellen | +0.002 |
Developer | +0.002 |
taboola | +0.002 |
rite | +0.002 |
yip | +0.002 |
Neg logit contributions | |
scribe | -0.002 |
results | -0.002 |
adem | -0.002 |
inen | -0.002 |
rior | -0.002 |
Token | hp |
Token ID | 24831 |
Feature activation | -5.35e-02 |
Pos logit contributions | |
ellen | +0.069 |
Developer | +0.066 |
taboola | +0.064 |
rite | +0.064 |
yip | +0.062 |
Neg logit contributions | |
scribe | -0.068 |
results | -0.066 |
adem | -0.066 |
inen | -0.065 |
rior | -0.064 |
Token | twin |
Token ID | 15203 |
Feature activation | -9.51e-02 |
Pos logit contributions | |
ellen | +0.013 |
Developer | +0.012 |
taboola | +0.012 |
rite | +0.012 |
yip | +0.011 |
Neg logit contributions | |
scribe | -0.013 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.012 |
Token | turbo |
Token ID | 29292 |
Feature activation | -8.99e-01 |
Pos logit contributions | |
ellen | +0.019 |
Developer | +0.018 |
taboola | +0.018 |
rite | +0.018 |
yip | +0.017 |
Neg logit contributions | |
scribe | -0.025 |
results | -0.025 |
adem | -0.024 |
inen | -0.024 |
rior | -0.024 |
Token | V |
Token ID | 569 |
Feature activation | +5.28e-02 |
Pos logit contributions | |
ellen | +0.213 |
Developer | +0.203 |
taboola | +0.198 |
rite | +0.198 |
yip | +0.191 |
Neg logit contributions | |
scribe | -0.208 |
results | -0.204 |
adem | -0.202 |
inen | -0.200 |
rior | -0.195 |
Token | 12 |
Token ID | 1065 |
Feature activation | -7.84e-02 |
Pos logit contributions | |
scribe | +0.013 |
results | +0.012 |
adem | +0.012 |
inen | +0.012 |
rior | +0.012 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.011 |
taboola | -0.011 |
rite | -0.011 |
yip | -0.011 |
Token | engine |
Token ID | 3113 |
Feature activation | -6.77e-02 |
Pos logit contributions | |
ellen | +0.019 |
Developer | +0.018 |
taboola | +0.017 |
rite | +0.017 |
yip | +0.017 |
Neg logit contributions | |
scribe | -0.018 |
results | -0.018 |
adem | -0.018 |
inen | -0.017 |
rior | -0.017 |
Token | , |
Token ID | 11 |
Feature activation | +2.69e-03 |
Pos logit contributions | |
ellen | +0.017 |
Developer | +0.016 |
rite | +0.016 |
taboola | +0.016 |
yip | +0.016 |
Neg logit contributions | |
scribe | -0.015 |
results | -0.014 |
adem | -0.014 |
inen | -0.014 |
rior | -0.014 |
Token | that |
Token ID | 326 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
scribe | +0.001 |
results | +0.001 |
adem | +0.001 |
inen | +0.001 |
rior | +0.001 |
Neg logit contributions | |
ellen | -0.001 |
Developer | -0.001 |
rite | -0.001 |
taboola | -0.001 |
yip | -0.001 |
Token | pol |
Token ID | 16104 |
Feature activation | +4.48e-02 |
Pos logit contributions | |
scribe | +0.012 |
results | +0.012 |
adem | +0.012 |
inen | +0.012 |
rior | +0.011 |
Neg logit contributions | |
ellen | -0.018 |
Developer | -0.017 |
rite | -0.017 |
taboola | -0.017 |
aux | -0.016 |
Token | blacklist |
Token ID | 38810 |
Feature activation | +3.51e-01 |
Pos logit contributions | |
scribe | +0.008 |
results | +0.008 |
adem | +0.008 |
inen | +0.008 |
rior | +0.007 |
Neg logit contributions | |
ellen | -0.013 |
Developer | -0.012 |
rite | -0.012 |
taboola | -0.012 |
yip | -0.012 |
Token | rather |
Token ID | 2138 |
Feature activation | -3.97e-01 |
Pos logit contributions | |
scribe | +0.078 |
results | +0.077 |
adem | +0.075 |
inen | +0.075 |
rior | +0.073 |
Neg logit contributions | |
ellen | -0.086 |
Developer | -0.082 |
rite | -0.081 |
taboola | -0.080 |
yip | -0.078 |
Token | than |
Token ID | 621 |
Feature activation | +9.68e-02 |
Pos logit contributions | |
ellen | +0.112 |
Developer | +0.107 |
taboola | +0.106 |
rite | +0.105 |
yip | +0.102 |
Neg logit contributions | |
scribe | -0.074 |
results | -0.073 |
adem | -0.071 |
inen | -0.071 |
rior | -0.069 |
Token | one |
Token ID | 530 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
scribe | +0.020 |
results | +0.020 |
adem | +0.020 |
inen | +0.020 |
rior | +0.019 |
Neg logit contributions | |
ellen | -0.025 |
Developer | -0.024 |
taboola | -0.023 |
rite | -0.023 |
yip | -0.022 |
Token | sourced |
Token ID | 18229 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
scribe | +0.043 |
results | +0.043 |
adem | +0.042 |
inen | +0.042 |
rior | +0.041 |
Neg logit contributions | |
ellen | -0.044 |
Developer | -0.042 |
rite | -0.041 |
taboola | -0.041 |
yip | -0.040 |
Token | from |
Token ID | 422 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
ellen | +0.240 |
Developer | +0.228 |
rite | +0.223 |
taboola | +0.223 |
yip | +0.215 |
Neg logit contributions | |
scribe | -0.232 |
results | -0.228 |
adem | -0.226 |
inen | -0.223 |
rior | -0.218 |
Token | AC |
Token ID | 7125 |
Feature activation | -3.59e-03 |
Pos logit contributions | |
ellen | +0.041 |
Developer | +0.040 |
rite | +0.039 |
taboola | +0.039 |
yip | +0.037 |
Neg logit contributions | |
scribe | -0.033 |
results | -0.032 |
adem | -0.032 |
inen | -0.031 |
rior | -0.031 |
Token | MA |
Token ID | 5673 |
Feature activation | +3.80e-01 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
aux | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | will |
Token ID | 481 |
Feature activation | +5.17e-02 |
Pos logit contributions | |
scribe | +0.084 |
results | +0.083 |
adem | +0.082 |
inen | +0.081 |
rior | +0.079 |
Neg logit contributions | |
ellen | -0.093 |
Developer | -0.089 |
rite | -0.087 |
taboola | -0.087 |
yip | -0.084 |
Token | affect |
Token ID | 2689 |
Feature activation | +2.55e-01 |
Pos logit contributions | |
scribe | +0.013 |
results | +0.012 |
adem | +0.012 |
inen | +0.012 |
rior | +0.012 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.011 |
rite | -0.011 |
taboola | -0.011 |
yip | -0.010 |
Token | Rest |
Token ID | 8324 |
Feature activation | -3.37e-01 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.005 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
yip | -0.005 |
Token | art |
Token ID | 433 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
ellen | +0.076 |
Developer | +0.072 |
taboola | +0.071 |
rite | +0.070 |
yip | +0.067 |
Neg logit contributions | |
scribe | -0.082 |
results | -0.080 |
adem | -0.080 |
inen | -0.079 |
rior | -0.077 |
Token | Network |
Token ID | 7311 |
Feature activation | +3.72e-01 |
Pos logit contributions | |
ellen | +0.039 |
Developer | +0.037 |
rite | +0.037 |
taboola | +0.036 |
aux | +0.035 |
Neg logit contributions | |
scribe | -0.035 |
results | -0.034 |
adem | -0.034 |
inen | -0.033 |
rior | -0.032 |
Token | Manager |
Token ID | 9142 |
Feature activation | +2.59e-01 |
Pos logit contributions | |
scribe | +0.076 |
results | +0.075 |
adem | +0.074 |
inen | +0.073 |
rior | +0.071 |
Neg logit contributions | |
ellen | -0.098 |
Developer | -0.093 |
taboola | -0.092 |
rite | -0.092 |
yip | -0.089 |
Token | at |
Token ID | 379 |
Feature activation | +8.56e-02 |
Pos logit contributions | |
scribe | +0.056 |
results | +0.055 |
adem | +0.054 |
inen | +0.054 |
rior | +0.052 |
Neg logit contributions | |
ellen | -0.065 |
Developer | -0.062 |
rite | -0.061 |
taboola | -0.061 |
yip | -0.059 |
Token | boot |
Token ID | 6297 |
Feature activation | -7.68e-01 |
Pos logit contributions | |
scribe | +0.024 |
results | +0.024 |
adem | +0.023 |
inen | +0.023 |
rior | +0.022 |
Neg logit contributions | |
ellen | -0.016 |
Developer | -0.015 |
rite | -0.015 |
taboola | -0.015 |
yip | -0.014 |
Token | up |
Token ID | 510 |
Feature activation | +6.77e-02 |
Pos logit contributions | |
ellen | +0.183 |
Developer | +0.174 |
rite | +0.171 |
taboola | +0.171 |
aux | +0.164 |
Neg logit contributions | |
scribe | -0.176 |
results | -0.173 |
adem | -0.171 |
inen | -0.170 |
rior | -0.165 |
Token |
|
Token ID | 198 |
Feature activation | -3.59e-03 |
Pos logit contributions | |
scribe | +0.015 |
results | +0.015 |
adem | +0.015 |
inen | +0.015 |
rior | +0.014 |
Neg logit contributions | |
ellen | -0.017 |
Developer | -0.016 |
rite | -0.015 |
taboola | -0.015 |
aux | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -4.09e-03 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | So |
Token ID | 2396 |
Feature activation | +7.73e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | your |
Token ID | 534 |
Feature activation | -4.45e-02 |
Pos logit contributions | |
scribe | +0.017 |
results | +0.017 |
adem | +0.017 |
inen | +0.017 |
rior | +0.016 |
Neg logit contributions | |
ellen | -0.019 |
Developer | -0.018 |
taboola | -0.018 |
rite | -0.018 |
aux | -0.017 |
Token | screw |
Token ID | 9580 |
Feature activation | -6.96e-02 |
Pos logit contributions | |
scribe | +0.014 |
results | +0.014 |
adem | +0.014 |
inen | +0.014 |
rior | +0.013 |
Neg logit contributions | |
ellen | -0.015 |
Developer | -0.015 |
rite | -0.014 |
taboola | -0.014 |
yip | -0.014 |
Token | - |
Token ID | 12 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
ellen | +0.018 |
Developer | +0.017 |
taboola | +0.017 |
rite | +0.017 |
yip | +0.016 |
Neg logit contributions | |
scribe | -0.014 |
results | -0.014 |
adem | -0.014 |
inen | -0.014 |
rior | -0.013 |
Token | up |
Token ID | 929 |
Feature activation | -5.75e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.004 |
Developer | -0.004 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | +2.05e-02 |
Pos logit contributions | |
ellen | +0.014 |
Developer | +0.014 |
taboola | +0.013 |
rite | +0.013 |
yip | +0.013 |
Neg logit contributions | |
scribe | -0.013 |
results | -0.012 |
adem | -0.012 |
inen | -0.012 |
rior | -0.012 |
Token | what |
Token ID | 644 |
Feature activation | +3.82e-02 |
Pos logit contributions | |
scribe | +0.005 |
results | +0.005 |
adem | +0.005 |
inen | +0.005 |
rior | +0.004 |
Neg logit contributions | |
ellen | -0.005 |
Developer | -0.005 |
rite | -0.005 |
taboola | -0.005 |
yip | -0.004 |
Token | caused |
Token ID | 4073 |
Feature activation | -7.74e-01 |
Pos logit contributions | |
scribe | +0.009 |
results | +0.009 |
adem | +0.009 |
inen | +0.008 |
rior | +0.008 |
Neg logit contributions | |
ellen | -0.009 |
Developer | -0.009 |
rite | -0.009 |
taboola | -0.008 |
yip | -0.008 |
Token | it |
Token ID | 340 |
Feature activation | -7.33e-02 |
Pos logit contributions | |
ellen | +0.193 |
Developer | +0.185 |
rite | +0.181 |
taboola | +0.181 |
yip | +0.174 |
Neg logit contributions | |
scribe | -0.169 |
results | -0.166 |
adem | -0.164 |
inen | -0.162 |
rior | -0.158 |
Token | , |
Token ID | 11 |
Feature activation | +1.29e-02 |
Pos logit contributions | |
ellen | +0.018 |
Developer | +0.017 |
rite | +0.017 |
taboola | +0.017 |
aux | +0.016 |
Neg logit contributions | |
scribe | -0.016 |
results | -0.016 |
adem | -0.016 |
inen | -0.015 |
rior | -0.015 |
Token | what |
Token ID | 644 |
Feature activation | +4.39e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.003 |
adem | +0.003 |
inen | +0.003 |
rior | +0.003 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
rite | -0.003 |
taboola | -0.003 |
yip | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | +7.16e-02 |
Pos logit contributions | |
scribe | +0.010 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.009 |
Neg logit contributions | |
ellen | -0.011 |
Developer | -0.010 |
rite | -0.010 |
taboola | -0.010 |
yip | -0.010 |
Token | done |
Token ID | 1760 |
Feature activation | +1.48e-01 |
Pos logit contributions | |
scribe | +0.016 |
results | +0.016 |
adem | +0.015 |
inen | +0.015 |
rior | +0.015 |
Neg logit contributions | |
ellen | -0.018 |
Developer | -0.017 |
rite | -0.017 |
taboola | -0.016 |
yip | -0.016 |
Token | hope |
Token ID | 2911 |
Feature activation | +2.73e-02 |
Pos logit contributions | |
scribe | +0.058 |
results | +0.057 |
adem | +0.056 |
inen | +0.056 |
rior | +0.055 |
Neg logit contributions | |
ellen | -0.049 |
Developer | -0.046 |
taboola | -0.045 |
rite | -0.045 |
yip | -0.043 |
Token | that |
Token ID | 326 |
Feature activation | -3.39e-03 |
Pos logit contributions | |
scribe | +0.006 |
results | +0.006 |
adem | +0.006 |
inen | +0.006 |
rior | +0.006 |
Neg logit contributions | |
ellen | -0.007 |
Developer | -0.006 |
taboola | -0.006 |
rite | -0.006 |
yip | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
rite | +0.001 |
taboola | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | com |
Token ID | 401 |
Feature activation | -7.94e-02 |
Pos logit contributions | |
scribe | +0.003 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.003 |
Developer | -0.003 |
taboola | -0.003 |
rite | -0.003 |
yip | -0.002 |
Token | er |
Token ID | 263 |
Feature activation | -2.48e-01 |
Pos logit contributions | |
ellen | +0.019 |
Developer | +0.018 |
taboola | +0.018 |
rite | +0.018 |
yip | +0.017 |
Neg logit contributions | |
scribe | -0.018 |
results | -0.018 |
adem | -0.018 |
inen | -0.017 |
rior | -0.017 |
Token | cial |
Token ID | 2413 |
Feature activation | -7.52e-01 |
Pos logit contributions | |
ellen | +0.058 |
Developer | +0.055 |
rite | +0.054 |
taboola | +0.054 |
yip | +0.052 |
Neg logit contributions | |
scribe | -0.058 |
results | -0.057 |
adem | -0.057 |
inen | -0.056 |
rior | -0.055 |
Token | version |
Token ID | 2196 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
ellen | +0.177 |
Developer | +0.168 |
taboola | +0.165 |
rite | +0.165 |
yip | +0.159 |
Neg logit contributions | |
scribe | -0.175 |
results | -0.171 |
adem | -0.170 |
inen | -0.168 |
rior | -0.164 |
Token | of |
Token ID | 286 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
scribe | +0.048 |
results | +0.048 |
adem | +0.047 |
inen | +0.047 |
rior | +0.045 |
Neg logit contributions | |
ellen | -0.049 |
Developer | -0.046 |
rite | -0.045 |
taboola | -0.045 |
yip | -0.044 |
Token | the |
Token ID | 262 |
Feature activation | -6.19e-03 |
Pos logit contributions | |
scribe | +0.002 |
results | +0.002 |
adem | +0.002 |
inen | +0.002 |
rior | +0.002 |
Neg logit contributions | |
ellen | -0.002 |
Developer | -0.002 |
rite | -0.002 |
taboola | -0.002 |
yip | -0.002 |
Token | Rift |
Token ID | 21222 |
Feature activation | +4.77e-02 |
Pos logit contributions | |
ellen | +0.001 |
Developer | +0.001 |
taboola | +0.001 |
rite | +0.001 |
yip | +0.001 |
Neg logit contributions | |
scribe | -0.001 |
results | -0.001 |
adem | -0.001 |
inen | -0.001 |
rior | -0.001 |
Token | would |
Token ID | 561 |
Feature activation | +9.69e-02 |
Pos logit contributions | |
scribe | +0.011 |
results | +0.010 |
adem | +0.010 |
inen | +0.010 |
rior | +0.010 |
Neg logit contributions | |
ellen | -0.012 |
Developer | -0.011 |
taboola | -0.011 |
rite | -0.011 |
yip | -0.010 |