Token | other |
Token ID | 584 |
Feature activation | -3.80e-02 |
Pos logit contributions | |
fid | +0.067 |
acci | +0.064 |
ank | +0.059 |
obey | +0.056 |
ihil | +0.055 |
Neg logit contributions | |
ARC | -0.067 |
ked | -0.063 |
ILA | -0.060 |
OVA | -0.060 |
pool | -0.057 |
Token | state |
Token ID | 1181 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.029 |
ked | -0.028 |
ILA | -0.026 |
OVA | -0.026 |
pool | -0.025 |
Token | housing |
Token ID | 5627 |
Feature activation | -8.23e-02 |
Pos logit contributions | |
ARC | +0.156 |
ked | +0.148 |
ILA | +0.142 |
OVA | +0.141 |
pool | +0.135 |
Neg logit contributions | |
fid | -0.127 |
acci | -0.120 |
ank | -0.109 |
obey | -0.104 |
ihil | -0.102 |
Token | / |
Token ID | 14 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
fid | +0.067 |
acci | +0.063 |
ank | +0.059 |
obey | +0.057 |
obe | +0.056 |
Neg logit contributions | |
ARC | -0.056 |
ked | -0.052 |
ILA | -0.049 |
OVA | -0.049 |
pool | -0.047 |
Token | Ma |
Token ID | 21467 |
Feature activation | -5.32e-02 |
Pos logit contributions | |
fid | +0.015 |
acci | +0.014 |
ank | +0.013 |
obey | +0.013 |
ihil | +0.012 |
Neg logit contributions | |
ARC | -0.011 |
ked | -0.010 |
ILA | -0.010 |
OVA | -0.010 |
kers | -0.009 |
Token | ori |
Token ID | 10145 |
Feature activation | +5.97e-01 |
Pos logit contributions | |
fid | +0.068 |
acci | +0.066 |
ank | +0.063 |
obey | +0.062 |
ihil | +0.061 |
Neg logit contributions | |
ARC | -0.011 |
ked | -0.009 |
ILA | -0.006 |
OVA | -0.006 |
pool | -0.005 |
Token | affairs |
Token ID | 9674 |
Feature activation | +4.66e-02 |
Pos logit contributions | |
ARC | +0.450 |
ked | +0.426 |
ILA | +0.404 |
OVA | +0.402 |
pool | +0.386 |
Neg logit contributions | |
fid | -0.435 |
acci | -0.414 |
ank | -0.380 |
obey | -0.364 |
ihil | -0.357 |
Token | houses |
Token ID | 7777 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.032 |
ILA | +0.031 |
OVA | +0.031 |
pool | +0.029 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.033 |
ank | -0.031 |
obey | -0.029 |
obe | -0.029 |
Token | in |
Token ID | 287 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
fid | +0.181 |
acci | +0.173 |
ank | +0.161 |
obey | +0.155 |
ihil | +0.152 |
Neg logit contributions | |
ARC | -0.159 |
ked | -0.149 |
ILA | -0.142 |
OVA | -0.140 |
pool | -0.133 |
Token | the |
Token ID | 262 |
Feature activation | -9.28e-03 |
Pos logit contributions | |
ARC | +0.013 |
ked | +0.012 |
ILA | +0.011 |
OVA | +0.011 |
pool | +0.011 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.013 |
ank | -0.012 |
obey | -0.012 |
ihil | -0.012 |
Token | street |
Token ID | 4675 |
Feature activation | +4.21e-02 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.006 |
ked | -0.006 |
ILA | -0.006 |
OVA | -0.006 |
pool | -0.005 |
Token | av |
Token ID | 615 |
Feature activation | +1.99e-01 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.021 |
pool | +0.020 |
Neg logit contributions | |
fid | -0.024 |
acci | -0.023 |
ank | -0.021 |
obey | -0.020 |
ihil | -0.020 |
Token | o |
Token ID | 78 |
Feature activation | +1.52e-01 |
Pos logit contributions | |
ARC | +0.108 |
ked | +0.100 |
ILA | +0.093 |
OVA | +0.092 |
Region | +0.087 |
Neg logit contributions | |
fid | -0.186 |
acci | -0.180 |
ank | -0.169 |
obey | -0.163 |
ihil | -0.162 |
Token | super |
Token ID | 2208 |
Feature activation | +1.14e-01 |
Pos logit contributions | |
ARC | +0.111 |
ked | +0.105 |
ILA | +0.099 |
OVA | +0.099 |
pool | +0.095 |
Neg logit contributions | |
fid | -0.113 |
acci | -0.108 |
ank | -0.100 |
obey | -0.096 |
ihil | -0.094 |
Token | t |
Token ID | 256 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
ARC | +0.076 |
ked | +0.071 |
ILA | +0.068 |
OVA | +0.067 |
Region | +0.064 |
Neg logit contributions | |
fid | -0.092 |
acci | -0.088 |
ank | -0.082 |
obey | -0.078 |
ihil | -0.078 |
Token | us |
Token ID | 385 |
Feature activation | -1.07e-01 |
Pos logit contributions | |
ARC | +0.013 |
ked | +0.012 |
ILA | +0.012 |
OVA | +0.011 |
Region | +0.011 |
Neg logit contributions | |
fid | -0.015 |
acci | -0.014 |
ank | -0.013 |
obey | -0.013 |
ihil | -0.013 |
Token | kers |
Token ID | 15949 |
Feature activation | +5.58e-01 |
Pos logit contributions | |
fid | +0.108 |
acci | +0.105 |
ank | +0.100 |
obey | +0.096 |
ihil | +0.095 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.042 |
OVA | -0.042 |
ILA | -0.041 |
Region | -0.039 |
Token | enjoy |
Token ID | 2883 |
Feature activation | +7.93e-02 |
Pos logit contributions | |
ARC | +0.407 |
ked | +0.385 |
ILA | +0.362 |
OVA | +0.361 |
pool | +0.347 |
Neg logit contributions | |
fid | -0.418 |
acci | -0.401 |
ank | -0.369 |
obey | -0.352 |
ihil | -0.349 |
Token | a |
Token ID | 257 |
Feature activation | +4.74e-02 |
Pos logit contributions | |
ARC | +0.057 |
ked | +0.053 |
ILA | +0.050 |
OVA | +0.050 |
pool | +0.048 |
Neg logit contributions | |
fid | -0.061 |
acci | -0.058 |
ank | -0.054 |
obey | -0.051 |
ihil | -0.051 |
Token | Presidential |
Token ID | 17471 |
Feature activation | -2.04e-01 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.032 |
ILA | +0.030 |
OVA | +0.030 |
pool | +0.029 |
Neg logit contributions | |
fid | -0.036 |
acci | -0.035 |
ank | -0.032 |
obey | -0.031 |
ihil | -0.030 |
Token | Security |
Token ID | 4765 |
Feature activation | +1.11e-01 |
Pos logit contributions | |
fid | +0.160 |
acci | +0.153 |
ank | +0.142 |
obey | +0.136 |
obe | +0.133 |
Neg logit contributions | |
ARC | -0.143 |
ked | -0.134 |
ILA | -0.126 |
OVA | -0.126 |
pool | -0.121 |
Token | Dec |
Token ID | 4280 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
ARC | +0.079 |
ked | +0.075 |
ILA | +0.070 |
OVA | +0.070 |
pool | +0.067 |
Neg logit contributions | |
fid | -0.085 |
acci | -0.081 |
ank | -0.075 |
obey | -0.072 |
ihil | -0.071 |
Token | basement |
Token ID | 17012 |
Feature activation | +1.93e-01 |
Pos logit contributions | |
fid | +0.029 |
acci | +0.027 |
ank | +0.025 |
obey | +0.024 |
ihil | +0.024 |
Neg logit contributions | |
ARC | -0.028 |
ked | -0.027 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.024 |
Token | of |
Token ID | 286 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
ARC | +0.138 |
ked | +0.130 |
ILA | +0.124 |
OVA | +0.123 |
pool | +0.117 |
Neg logit contributions | |
fid | -0.148 |
acci | -0.140 |
ank | -0.131 |
obey | -0.125 |
ihil | -0.123 |
Token | concrete |
Token ID | 10017 |
Feature activation | -9.03e-02 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.006 |
ank | +0.006 |
obey | +0.005 |
ihil | +0.005 |
Neg logit contributions | |
ARC | -0.009 |
ked | -0.009 |
ILA | -0.008 |
OVA | -0.008 |
pool | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
fid | +0.070 |
acci | +0.067 |
ank | +0.062 |
obey | +0.060 |
ihil | +0.059 |
Neg logit contributions | |
ARC | -0.063 |
ked | -0.060 |
ILA | -0.056 |
OVA | -0.056 |
Region | -0.053 |
Token | Ma |
Token ID | 6669 |
Feature activation | +8.33e-02 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
pool | +0.006 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.008 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | ori |
Token ID | 10145 |
Feature activation | +5.54e-01 |
Pos logit contributions | |
ARC | +0.061 |
ked | +0.058 |
ILA | +0.055 |
OVA | +0.055 |
pool | +0.053 |
Neg logit contributions | |
fid | -0.062 |
acci | -0.059 |
ank | -0.054 |
obey | -0.052 |
ihil | -0.051 |
Token | affairs |
Token ID | 9674 |
Feature activation | +3.46e-02 |
Pos logit contributions | |
ARC | +0.394 |
ked | +0.371 |
ILA | +0.351 |
OVA | +0.349 |
pool | +0.334 |
Neg logit contributions | |
fid | -0.427 |
acci | -0.407 |
ank | -0.378 |
obey | -0.363 |
ihil | -0.356 |
Token | and |
Token ID | 290 |
Feature activation | +6.99e-04 |
Pos logit contributions | |
ARC | +0.024 |
ked | +0.023 |
ILA | +0.022 |
OVA | +0.022 |
pool | +0.021 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.026 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.022 |
Token | state |
Token ID | 1181 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
ARC | +0.001 |
ked | +0.000 |
ILA | +0.000 |
OVA | +0.000 |
pool | +0.000 |
Neg logit contributions | |
fid | -0.001 |
acci | -0.001 |
ank | -0.000 |
obey | -0.000 |
ihil | -0.000 |
Token | housing |
Token ID | 5627 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
ARC | +0.139 |
ked | +0.131 |
ILA | +0.124 |
OVA | +0.123 |
pool | +0.118 |
Neg logit contributions | |
fid | -0.154 |
acci | -0.147 |
ank | -0.135 |
obey | -0.131 |
obe | -0.128 |
Token | did |
Token ID | 750 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
fid | +0.079 |
acci | +0.075 |
ank | +0.070 |
obey | +0.067 |
ihil | +0.066 |
Neg logit contributions | |
ARC | -0.073 |
ked | -0.069 |
ILA | -0.065 |
OVA | -0.065 |
pool | -0.062 |
Token | The |
Token ID | 464 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.021 |
kers | +0.020 |
Neg logit contributions | |
fid | -0.029 |
acci | -0.027 |
ank | -0.025 |
obey | -0.024 |
ihil | -0.024 |
Token | International |
Token ID | 4037 |
Feature activation | +1.94e-01 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.008 |
ILA | +0.007 |
OVA | +0.007 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.009 |
acci | -0.009 |
ank | -0.008 |
obey | -0.008 |
ihil | -0.008 |
Token | Brotherhood |
Token ID | 17987 |
Feature activation | -2.61e-01 |
Pos logit contributions | |
ARC | +0.152 |
ked | +0.143 |
ILA | +0.137 |
OVA | +0.137 |
Region | +0.131 |
Neg logit contributions | |
fid | -0.134 |
acci | -0.128 |
ank | -0.117 |
obey | -0.111 |
ihil | -0.110 |
Token | of |
Token ID | 286 |
Feature activation | +7.17e-02 |
Pos logit contributions | |
fid | +0.206 |
acci | +0.198 |
ank | +0.184 |
obey | +0.176 |
ihil | +0.174 |
Neg logit contributions | |
ARC | -0.179 |
ked | -0.168 |
OVA | -0.158 |
ILA | -0.158 |
pool | -0.151 |
Token | Electrical |
Token ID | 40224 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
ARC | +0.049 |
ked | +0.045 |
OVA | +0.044 |
ILA | +0.043 |
Region | +0.041 |
Neg logit contributions | |
fid | -0.056 |
acci | -0.055 |
ank | -0.050 |
ihil | -0.049 |
obey | -0.048 |
Token | Workers |
Token ID | 16847 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.028 |
OVA | +0.025 |
ILA | +0.023 |
Region | +0.021 |
Neg logit contributions | |
fid | -0.161 |
acci | -0.158 |
ank | -0.151 |
obey | -0.147 |
ihil | -0.146 |
Token | represents |
Token ID | 6870 |
Feature activation | -8.79e-02 |
Pos logit contributions | |
ARC | +0.393 |
ked | +0.371 |
ILA | +0.350 |
OVA | +0.349 |
pool | +0.334 |
Neg logit contributions | |
fid | -0.420 |
acci | -0.401 |
ank | -0.372 |
obey | -0.356 |
ihil | -0.351 |
Token | nearly |
Token ID | 3016 |
Feature activation | +1.32e-01 |
Pos logit contributions | |
fid | +0.068 |
acci | +0.065 |
ank | +0.060 |
obey | +0.058 |
ihil | +0.057 |
Neg logit contributions | |
ARC | -0.062 |
ked | -0.058 |
ILA | -0.055 |
OVA | -0.055 |
pool | -0.053 |
Token | 3 |
Token ID | 513 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
ARC | +0.097 |
ked | +0.091 |
ILA | +0.087 |
OVA | +0.086 |
pool | +0.083 |
Neg logit contributions | |
fid | -0.098 |
acci | -0.093 |
ank | -0.086 |
obey | -0.083 |
ihil | -0.081 |
Token | , |
Token ID | 11 |
Feature activation | +7.32e-02 |
Pos logit contributions | |
fid | +0.017 |
acci | +0.016 |
ank | +0.015 |
obey | +0.014 |
ihil | +0.014 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.014 |
ILA | -0.013 |
OVA | -0.013 |
Region | -0.012 |
Token | 000 |
Token ID | 830 |
Feature activation | -3.21e-02 |
Pos logit contributions | |
ARC | +0.056 |
ked | +0.053 |
ILA | +0.051 |
OVA | +0.050 |
Region | +0.048 |
Neg logit contributions | |
fid | -0.052 |
acci | -0.050 |
ank | -0.045 |
obey | -0.043 |
ihil | -0.043 |
Token | Mer |
Token ID | 4638 |
Feature activation | -1.95e-01 |
Pos logit contributions | |
fid | +0.042 |
acci | +0.040 |
ank | +0.037 |
obey | +0.035 |
ihil | +0.035 |
Neg logit contributions | |
ARC | -0.039 |
ked | -0.037 |
ILA | -0.035 |
OVA | -0.035 |
pool | -0.033 |
Token | r |
Token ID | 81 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
fid | +0.146 |
acci | +0.140 |
ank | +0.129 |
obey | +0.124 |
ihil | +0.122 |
Neg logit contributions | |
ARC | -0.142 |
ked | -0.134 |
ILA | -0.126 |
OVA | -0.126 |
pool | -0.121 |
Token | ion |
Token ID | 295 |
Feature activation | -7.42e-02 |
Pos logit contributions | |
fid | +0.016 |
acci | +0.015 |
ank | +0.014 |
obey | +0.013 |
ihil | +0.013 |
Neg logit contributions | |
ARC | -0.024 |
ked | -0.023 |
ILA | -0.021 |
OVA | -0.021 |
pool | -0.021 |
Token | Stock |
Token ID | 10500 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
fid | +0.055 |
acci | +0.053 |
ank | +0.049 |
obey | +0.046 |
ihil | +0.046 |
Neg logit contributions | |
ARC | -0.055 |
ked | -0.052 |
ILA | -0.049 |
OVA | -0.049 |
pool | -0.047 |
Token | bro |
Token ID | 7957 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
ARC | +0.087 |
ked | +0.082 |
ILA | +0.077 |
OVA | +0.077 |
pool | +0.073 |
Neg logit contributions | |
fid | -0.095 |
acci | -0.091 |
ank | -0.084 |
obey | -0.080 |
ihil | -0.080 |
Token | kers |
Token ID | 15949 |
Feature activation | +5.46e-01 |
Pos logit contributions | |
ARC | +0.028 |
ked | +0.023 |
ILA | +0.017 |
OVA | +0.017 |
pool | +0.013 |
Neg logit contributions | |
fid | -0.178 |
acci | -0.174 |
ank | -0.166 |
obey | -0.162 |
ihil | -0.161 |
Token | chief |
Token ID | 4039 |
Feature activation | -8.66e-02 |
Pos logit contributions | |
ARC | +0.426 |
ked | +0.404 |
ILA | +0.383 |
OVA | +0.381 |
pool | +0.367 |
Neg logit contributions | |
fid | -0.381 |
acci | -0.364 |
ank | -0.333 |
obey | -0.319 |
ihil | -0.313 |
Token | economist |
Token ID | 17646 |
Feature activation | +1.05e-01 |
Pos logit contributions | |
fid | +0.066 |
acci | +0.063 |
ank | +0.059 |
obey | +0.056 |
ihil | +0.055 |
Neg logit contributions | |
ARC | -0.062 |
ked | -0.058 |
ILA | -0.055 |
OVA | -0.055 |
pool | -0.052 |
Token | Alan |
Token ID | 12246 |
Feature activation | +4.07e-02 |
Pos logit contributions | |
ARC | +0.073 |
ked | +0.069 |
ILA | +0.065 |
OVA | +0.065 |
pool | +0.061 |
Neg logit contributions | |
fid | -0.083 |
acci | -0.079 |
ank | -0.073 |
obey | -0.070 |
ihil | -0.069 |
Token | Mc |
Token ID | 1982 |
Feature activation | -4.62e-02 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.028 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.030 |
acci | -0.029 |
ank | -0.027 |
obey | -0.025 |
ihil | -0.025 |
Token | Qu |
Token ID | 4507 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
fid | +0.036 |
acci | +0.034 |
ank | +0.032 |
obey | +0.030 |
ihil | +0.030 |
Neg logit contributions | |
ARC | -0.032 |
ked | -0.031 |
ILA | -0.029 |
OVA | -0.029 |
kers | -0.027 |
Token | _ |
Token ID | 62 |
Feature activation | +7.60e-02 |
Pos logit contributions | |
fid | +0.075 |
acci | +0.072 |
ank | +0.067 |
obey | +0.065 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.044 |
OVA | -0.044 |
pool | -0.042 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
ARC | +0.071 |
ked | +0.068 |
ILA | +0.065 |
OVA | +0.065 |
pool | +0.063 |
Neg logit contributions | |
fid | -0.041 |
acci | -0.039 |
ank | -0.035 |
obey | -0.032 |
ihil | -0.032 |
Token | 64 |
Token ID | 2414 |
Feature activation | -7.38e-02 |
Pos logit contributions | |
fid | +0.126 |
acci | +0.120 |
ank | +0.110 |
obey | +0.105 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.144 |
ked | -0.137 |
ILA | -0.130 |
OVA | -0.129 |
pool | -0.125 |
Token | E |
Token ID | 36 |
Feature activation | -5.84e-02 |
Pos logit contributions | |
fid | +0.050 |
acci | +0.047 |
ank | +0.043 |
obey | +0.041 |
ihil | +0.040 |
Neg logit contributions | |
ARC | -0.060 |
ked | -0.057 |
ILA | -0.054 |
OVA | -0.054 |
pool | -0.052 |
Token | , |
Token ID | 11 |
Feature activation | +6.46e-03 |
Pos logit contributions | |
fid | +0.047 |
acci | +0.045 |
ank | +0.042 |
obey | +0.040 |
ihil | +0.040 |
Neg logit contributions | |
ARC | -0.039 |
ked | -0.037 |
ILA | -0.035 |
OVA | -0.034 |
pool | -0.033 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
ARC | +0.002 |
ked | +0.001 |
ILA | +0.001 |
OVA | +0.001 |
kers | +0.001 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.008 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | 02 |
Token ID | 2999 |
Feature activation | -8.71e-02 |
Pos logit contributions | |
ARC | +0.485 |
ked | +0.464 |
ILA | +0.443 |
OVA | +0.440 |
kers | +0.427 |
Neg logit contributions | |
fid | -0.317 |
acci | -0.299 |
ank | -0.267 |
obey | -0.253 |
ihil | -0.249 |
Token | _ |
Token ID | 62 |
Feature activation | +6.71e-02 |
Pos logit contributions | |
fid | +0.076 |
acci | +0.074 |
ank | +0.068 |
obey | +0.066 |
ihil | +0.065 |
Neg logit contributions | |
ARC | -0.052 |
ked | -0.048 |
ILA | -0.045 |
OVA | -0.045 |
pool | -0.043 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
ARC | +0.063 |
ked | +0.060 |
ILA | +0.058 |
OVA | +0.057 |
pool | +0.056 |
Neg logit contributions | |
fid | -0.036 |
acci | -0.034 |
ank | -0.030 |
obey | -0.028 |
ihil | -0.028 |
Token | 65 |
Token ID | 2996 |
Feature activation | +1.74e-04 |
Pos logit contributions | |
fid | +0.144 |
acci | +0.138 |
ank | +0.128 |
obey | +0.123 |
ihil | +0.121 |
Neg logit contributions | |
ARC | -0.132 |
ked | -0.124 |
ILA | -0.117 |
OVA | -0.116 |
pool | -0.112 |
Token | E |
Token ID | 36 |
Feature activation | -6.76e-02 |
Pos logit contributions | |
ARC | +0.000 |
ked | +0.000 |
ILA | +0.000 |
OVA | +0.000 |
pool | +0.000 |
Neg logit contributions | |
fid | -0.000 |
acci | -0.000 |
ank | -0.000 |
obey | -0.000 |
ihil | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +7.83e-03 |
Pos logit contributions | |
ARC | +0.062 |
ked | +0.058 |
ILA | +0.055 |
OVA | +0.054 |
pool | +0.052 |
Neg logit contributions | |
fid | -0.076 |
acci | -0.073 |
ank | -0.068 |
obey | -0.066 |
ihil | -0.065 |
Token |
|
Token ID | 198 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ARC | +0.005 |
ked | +0.005 |
ILA | +0.005 |
OVA | +0.005 |
pool | +0.004 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.006 |
ank | -0.006 |
obey | -0.005 |
ihil | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +8.91e-03 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.008 |
ILA | +0.007 |
OVA | +0.007 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.010 |
acci | -0.010 |
ank | -0.009 |
obey | -0.009 |
ihil | -0.009 |
Token | Miami |
Token ID | 41191 |
Feature activation | +9.65e-02 |
Pos logit contributions | |
ARC | +0.006 |
ked | +0.006 |
ILA | +0.005 |
OVA | +0.005 |
pool | +0.005 |
Neg logit contributions | |
fid | -0.007 |
acci | -0.007 |
ank | -0.006 |
obey | -0.006 |
ihil | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
ARC | +0.061 |
ked | +0.057 |
ILA | +0.054 |
OVA | +0.053 |
pool | +0.051 |
Neg logit contributions | |
fid | -0.081 |
acci | -0.078 |
ank | -0.073 |
obey | -0.070 |
ihil | -0.069 |
Token | ked |
Token ID | 9091 |
Feature activation | +5.44e-01 |
Pos logit contributions | |
ARC | +0.012 |
ked | +0.011 |
ILA | +0.011 |
OVA | +0.011 |
Region | +0.010 |
Neg logit contributions | |
fid | -0.018 |
acci | -0.017 |
ank | -0.016 |
obey | -0.015 |
ihil | -0.015 |
Token | Vol |
Token ID | 4709 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
ARC | +0.381 |
ked | +0.358 |
ILA | +0.338 |
OVA | +0.337 |
pool | +0.322 |
Neg logit contributions | |
fid | -0.423 |
acci | -0.404 |
ank | -0.375 |
obey | -0.360 |
ihil | -0.355 |
Token | quez |
Token ID | 22281 |
Feature activation | +6.83e-02 |
Pos logit contributions | |
ARC | +0.037 |
ked | +0.034 |
ILA | +0.033 |
OVA | +0.032 |
Region | +0.031 |
Neg logit contributions | |
fid | -0.039 |
acci | -0.038 |
ank | -0.034 |
obey | -0.033 |
ihil | -0.033 |
Token | to |
Token ID | 284 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
ARC | +0.049 |
ked | +0.046 |
ILA | +0.044 |
OVA | +0.044 |
Region | +0.042 |
Neg logit contributions | |
fid | -0.052 |
acci | -0.049 |
ank | -0.046 |
obey | -0.044 |
ihil | -0.043 |
Token | a |
Token ID | 257 |
Feature activation | +1.93e-03 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.017 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.018 |
ked | -0.017 |
ILA | -0.016 |
OVA | -0.016 |
pool | -0.016 |
Token | two |
Token ID | 734 |
Feature activation | +6.02e-02 |
Pos logit contributions | |
ARC | +0.001 |
ked | +0.001 |
ILA | +0.001 |
OVA | +0.001 |
pool | +0.001 |
Neg logit contributions | |
fid | -0.002 |
acci | -0.001 |
ank | -0.001 |
obey | -0.001 |
ihil | -0.001 |
Token | _ |
Token ID | 62 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
fid | +0.074 |
acci | +0.072 |
ank | +0.066 |
obey | +0.064 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.047 |
ILA | -0.044 |
OVA | -0.044 |
pool | -0.041 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ARC | +0.078 |
ked | +0.074 |
ILA | +0.071 |
OVA | +0.071 |
pool | +0.069 |
Neg logit contributions | |
fid | -0.045 |
acci | -0.042 |
ank | -0.038 |
obey | -0.035 |
ihil | -0.035 |
Token | 63 |
Token ID | 5066 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
fid | +0.142 |
acci | +0.136 |
ank | +0.125 |
obey | +0.120 |
ihil | +0.119 |
Neg logit contributions | |
ARC | -0.130 |
ked | -0.124 |
ILA | -0.117 |
OVA | -0.116 |
pool | -0.111 |
Token | E |
Token ID | 36 |
Feature activation | -6.22e-02 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.025 |
acci | -0.024 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.021 |
Token | , |
Token ID | 11 |
Feature activation | +7.99e-03 |
Pos logit contributions | |
fid | +0.050 |
acci | +0.048 |
ank | +0.045 |
obey | +0.043 |
ihil | +0.042 |
Neg logit contributions | |
ARC | -0.042 |
ked | -0.039 |
ILA | -0.037 |
OVA | -0.037 |
pool | -0.035 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
ARC | +0.002 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.002 |
kers | +0.001 |
Neg logit contributions | |
fid | -0.010 |
acci | -0.009 |
ank | -0.009 |
obey | -0.009 |
ihil | -0.009 |
Token | 02 |
Token ID | 2999 |
Feature activation | -8.55e-02 |
Pos logit contributions | |
ARC | +0.470 |
ked | +0.448 |
ILA | +0.428 |
OVA | +0.426 |
pool | +0.413 |
Neg logit contributions | |
fid | -0.314 |
acci | -0.297 |
ank | -0.267 |
obey | -0.253 |
ihil | -0.248 |
Token | _ |
Token ID | 62 |
Feature activation | +7.60e-02 |
Pos logit contributions | |
fid | +0.075 |
acci | +0.072 |
ank | +0.067 |
obey | +0.065 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.044 |
OVA | -0.044 |
pool | -0.042 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
ARC | +0.071 |
ked | +0.068 |
ILA | +0.065 |
OVA | +0.065 |
pool | +0.063 |
Neg logit contributions | |
fid | -0.041 |
acci | -0.039 |
ank | -0.035 |
obey | -0.032 |
ihil | -0.032 |
Token | 64 |
Token ID | 2414 |
Feature activation | -7.38e-02 |
Pos logit contributions | |
fid | +0.126 |
acci | +0.120 |
ank | +0.110 |
obey | +0.105 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.144 |
ked | -0.137 |
ILA | -0.130 |
OVA | -0.129 |
pool | -0.125 |
Token | E |
Token ID | 36 |
Feature activation | -5.84e-02 |
Pos logit contributions | |
fid | +0.050 |
acci | +0.047 |
ank | +0.043 |
obey | +0.041 |
ihil | +0.040 |
Neg logit contributions | |
ARC | -0.060 |
ked | -0.057 |
ILA | -0.054 |
OVA | -0.054 |
pool | -0.052 |
Token | The |
Token ID | 383 |
Feature activation | -2.90e-02 |
Pos logit contributions | |
ARC | +0.014 |
ked | +0.013 |
ILA | +0.012 |
OVA | +0.012 |
pool | +0.012 |
Neg logit contributions | |
fid | -0.016 |
acci | -0.015 |
ank | -0.014 |
obey | -0.013 |
ihil | -0.013 |
Token | MLB |
Token ID | 18532 |
Feature activation | +3.18e-02 |
Pos logit contributions | |
fid | +0.022 |
acci | +0.021 |
ank | +0.020 |
obey | +0.019 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.020 |
ked | -0.019 |
ILA | -0.018 |
OVA | -0.018 |
pool | -0.017 |
Token | Network |
Token ID | 7311 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
ARC | +0.022 |
ked | +0.020 |
ILA | +0.019 |
OVA | +0.019 |
pool | +0.018 |
Neg logit contributions | |
fid | -0.025 |
acci | -0.024 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.021 |
Token | squ |
Token ID | 2809 |
Feature activation | -4.63e-03 |
Pos logit contributions | |
fid | +0.099 |
acci | +0.094 |
ank | +0.088 |
obey | +0.084 |
ihil | +0.082 |
Neg logit contributions | |
ARC | -0.090 |
ked | -0.085 |
ILA | -0.080 |
OVA | -0.079 |
Region | -0.076 |
Token | aw |
Token ID | 707 |
Feature activation | +7.95e-03 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.003 |
ank | +0.003 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.003 |
ked | -0.003 |
ILA | -0.003 |
OVA | -0.003 |
pool | -0.003 |
Token | ked |
Token ID | 9091 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
ARC | +0.001 |
ILA | +0.000 |
OVA | +0.000 |
ked | +0.000 |
Region | -0.000 |
Neg logit contributions | |
fid | -0.011 |
acci | -0.011 |
ank | -0.010 |
obey | -0.010 |
ihil | -0.010 |
Token | from |
Token ID | 422 |
Feature activation | -9.29e-02 |
Pos logit contributions | |
ARC | +0.363 |
ked | +0.340 |
ILA | +0.321 |
OVA | +0.319 |
pool | +0.305 |
Neg logit contributions | |
fid | -0.420 |
acci | -0.403 |
ank | -0.374 |
obey | -0.359 |
ihil | -0.354 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
fid | +0.071 |
acci | +0.067 |
ank | +0.063 |
obey | +0.060 |
ihil | +0.059 |
Neg logit contributions | |
ARC | -0.067 |
ked | -0.062 |
ILA | -0.060 |
OVA | -0.059 |
pool | -0.057 |
Token | television |
Token ID | 5581 |
Feature activation | -5.76e-02 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.011 |
ank | +0.010 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.010 |
ked | -0.010 |
ILA | -0.009 |
OVA | -0.009 |
pool | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | +1.32e-03 |
Pos logit contributions | |
fid | +0.045 |
acci | +0.043 |
ank | +0.040 |
obey | +0.039 |
ihil | +0.038 |
Neg logit contributions | |
ARC | -0.040 |
ked | -0.037 |
ILA | -0.036 |
OVA | -0.035 |
pool | -0.034 |
Token | news |
Token ID | 1705 |
Feature activation | +6.38e-02 |
Pos logit contributions | |
ARC | +0.001 |
ked | +0.001 |
ILA | +0.001 |
OVA | +0.001 |
pool | +0.001 |
Neg logit contributions | |
fid | -0.001 |
acci | -0.001 |
ank | -0.001 |
obey | -0.001 |
ihil | -0.001 |
Token | _ |
Token ID | 62 |
Feature activation | +9.19e-02 |
Pos logit contributions | |
fid | +0.078 |
acci | +0.076 |
ank | +0.070 |
obey | +0.068 |
ihil | +0.067 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.050 |
ILA | -0.047 |
OVA | -0.046 |
pool | -0.044 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
ARC | +0.086 |
ked | +0.082 |
ILA | +0.079 |
OVA | +0.078 |
pool | +0.076 |
Neg logit contributions | |
fid | -0.050 |
acci | -0.047 |
ank | -0.042 |
obey | -0.039 |
ihil | -0.038 |
Token | 62 |
Token ID | 5237 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
fid | +0.130 |
acci | +0.124 |
ank | +0.114 |
obey | +0.109 |
ihil | +0.108 |
Neg logit contributions | |
ARC | -0.129 |
ked | -0.122 |
ILA | -0.115 |
OVA | -0.115 |
pool | -0.110 |
Token | E |
Token ID | 36 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.009 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.008 |
Neg logit contributions | |
fid | -0.007 |
acci | -0.007 |
ank | -0.006 |
obey | -0.006 |
ihil | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
fid | +0.055 |
acci | +0.052 |
ank | +0.049 |
obey | +0.047 |
ihil | +0.046 |
Neg logit contributions | |
ARC | -0.046 |
ked | -0.043 |
ILA | -0.041 |
OVA | -0.040 |
pool | -0.039 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.27e-01 |
Pos logit contributions | |
ARC | +0.005 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
kers | +0.003 |
Neg logit contributions | |
fid | -0.021 |
acci | -0.021 |
ank | -0.020 |
obey | -0.019 |
ihil | -0.019 |
Token | 02 |
Token ID | 2999 |
Feature activation | -8.46e-02 |
Pos logit contributions | |
ARC | +0.466 |
ked | +0.445 |
ILA | +0.425 |
OVA | +0.423 |
pool | +0.410 |
Neg logit contributions | |
fid | -0.312 |
acci | -0.295 |
ank | -0.266 |
obey | -0.251 |
ihil | -0.246 |
Token | _ |
Token ID | 62 |
Feature activation | +8.30e-02 |
Pos logit contributions | |
fid | +0.074 |
acci | +0.072 |
ank | +0.066 |
obey | +0.064 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.047 |
ILA | -0.044 |
OVA | -0.044 |
pool | -0.041 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
ARC | +0.078 |
ked | +0.074 |
ILA | +0.071 |
OVA | +0.071 |
pool | +0.069 |
Neg logit contributions | |
fid | -0.045 |
acci | -0.042 |
ank | -0.038 |
obey | -0.035 |
ihil | -0.035 |
Token | 63 |
Token ID | 5066 |
Feature activation | +3.75e-02 |
Pos logit contributions | |
fid | +0.142 |
acci | +0.136 |
ank | +0.125 |
obey | +0.120 |
ihil | +0.119 |
Neg logit contributions | |
ARC | -0.130 |
ked | -0.124 |
ILA | -0.117 |
OVA | -0.116 |
pool | -0.111 |
Token | E |
Token ID | 36 |
Feature activation | -6.22e-02 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.025 |
acci | -0.024 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.021 |
Token | , |
Token ID | 11 |
Feature activation | -5.25e-03 |
Pos logit contributions | |
ARC | +0.137 |
ked | +0.129 |
ILA | +0.122 |
OVA | +0.121 |
Region | +0.115 |
Neg logit contributions | |
fid | -0.156 |
acci | -0.149 |
ank | -0.138 |
obey | -0.133 |
obe | -0.131 |
Token | Canada |
Token ID | 3340 |
Feature activation | -1.85e-01 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.004 |
ank | +0.003 |
obey | +0.003 |
obe | +0.003 |
Neg logit contributions | |
ARC | -0.004 |
ked | -0.004 |
ILA | -0.004 |
OVA | -0.004 |
pool | -0.003 |
Token | has |
Token ID | 468 |
Feature activation | +4.71e-02 |
Pos logit contributions | |
fid | +0.148 |
acci | +0.142 |
ank | +0.132 |
obey | +0.126 |
obe | +0.125 |
Neg logit contributions | |
ARC | -0.125 |
ked | -0.116 |
ILA | -0.111 |
OVA | -0.110 |
pool | -0.105 |
Token | sh |
Token ID | 427 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ARC | +0.035 |
ked | +0.032 |
ILA | +0.031 |
OVA | +0.031 |
pool | +0.030 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.034 |
ank | -0.031 |
obey | -0.030 |
ihil | -0.029 |
Token | ir |
Token ID | 343 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.006 |
ILA | +0.006 |
OVA | +0.006 |
Region | +0.006 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.008 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | ked |
Token ID | 9091 |
Feature activation | +5.26e-01 |
Pos logit contributions | |
fid | +0.219 |
acci | +0.215 |
ank | +0.206 |
obey | +0.202 |
ihil | +0.200 |
Neg logit contributions | |
ARC | -0.010 |
ked | -0.000 |
ILA | +0.002 |
OVA | +0.002 |
Region | +0.007 |
Token | several |
Token ID | 1811 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ARC | +0.393 |
ked | +0.370 |
ILA | +0.351 |
OVA | +0.350 |
pool | +0.335 |
Neg logit contributions | |
fid | -0.387 |
acci | -0.368 |
ank | -0.340 |
obey | -0.326 |
ihil | -0.320 |
Token | of |
Token ID | 286 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
fid | +0.013 |
acci | +0.012 |
ank | +0.011 |
obey | +0.011 |
ihil | +0.010 |
Neg logit contributions | |
ARC | -0.011 |
ked | -0.011 |
ILA | -0.010 |
OVA | -0.010 |
pool | -0.010 |
Token | those |
Token ID | 883 |
Feature activation | -3.78e-03 |
Pos logit contributions | |
fid | +0.014 |
acci | +0.013 |
ank | +0.012 |
obey | +0.012 |
ihil | +0.012 |
Neg logit contributions | |
ARC | -0.015 |
ked | -0.014 |
ILA | -0.013 |
OVA | -0.013 |
pool | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | +3.25e-02 |
Pos logit contributions | |
fid | +0.003 |
acci | +0.003 |
ank | +0.002 |
obey | +0.002 |
ihil | +0.002 |
Neg logit contributions | |
ARC | -0.003 |
ked | -0.003 |
ILA | -0.002 |
OVA | -0.002 |
pool | -0.002 |
Token | It |
Token ID | 632 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.021 |
ILA | +0.020 |
OVA | +0.020 |
pool | +0.019 |
Neg logit contributions | |
fid | -0.025 |
acci | -0.024 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.021 |
Token | a |
Token ID | 257 |
Feature activation | +5.18e-02 |
Pos logit contributions | |
ARC | +0.053 |
ked | +0.050 |
ILA | +0.047 |
OVA | +0.047 |
Region | +0.045 |
Neg logit contributions | |
fid | -0.057 |
acci | -0.054 |
ank | -0.050 |
obey | -0.048 |
obe | -0.048 |
Token | Zel |
Token ID | 40071 |
Feature activation | +3.15e-01 |
Pos logit contributions | |
ARC | +0.038 |
ked | +0.036 |
ILA | +0.034 |
OVA | +0.034 |
pool | +0.032 |
Neg logit contributions | |
fid | -0.039 |
acci | -0.037 |
ank | -0.034 |
obey | -0.033 |
ihil | -0.032 |
Token | ig |
Token ID | 328 |
Feature activation | +3.57e-02 |
Pos logit contributions | |
ARC | +0.228 |
ked | +0.216 |
ILA | +0.203 |
OVA | +0.203 |
pool | +0.195 |
Neg logit contributions | |
fid | -0.238 |
acci | -0.227 |
ank | -0.210 |
obey | -0.201 |
ihil | -0.198 |
Token | who |
Token ID | 508 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
ARC | +0.025 |
ked | +0.023 |
ILA | +0.022 |
OVA | +0.022 |
pool | +0.021 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.027 |
ank | -0.025 |
obey | -0.024 |
ihil | -0.024 |
Token | trek |
Token ID | 30784 |
Feature activation | -3.46e-02 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.008 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.009 |
acci | -0.009 |
ank | -0.008 |
obey | -0.008 |
ihil | -0.008 |
Token | ked |
Token ID | 9091 |
Feature activation | +5.22e-01 |
Pos logit contributions | |
fid | +0.048 |
acci | +0.047 |
ank | +0.045 |
obey | +0.044 |
ihil | +0.044 |
Neg logit contributions | |
ARC | -0.003 |
ILA | -0.000 |
ked | -0.000 |
OVA | +0.000 |
Region | +0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.85e-03 |
Pos logit contributions | |
ARC | +0.376 |
ked | +0.357 |
ILA | +0.334 |
OVA | +0.333 |
pool | +0.321 |
Neg logit contributions | |
fid | -0.394 |
acci | -0.379 |
ank | -0.348 |
obey | -0.334 |
ihil | -0.330 |
Token | the |
Token ID | 262 |
Feature activation | +6.13e-02 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | North |
Token ID | 2258 |
Feature activation | -4.44e-02 |
Pos logit contributions | |
ARC | +0.045 |
ked | +0.043 |
ILA | +0.040 |
OVA | +0.040 |
pool | +0.039 |
Neg logit contributions | |
fid | -0.045 |
acci | -0.043 |
ank | -0.040 |
obey | -0.038 |
ihil | -0.038 |
Token | Pole |
Token ID | 29385 |
Feature activation | -2.38e-02 |
Pos logit contributions | |
fid | +0.031 |
acci | +0.029 |
ank | +0.027 |
obey | +0.026 |
ihil | +0.025 |
Neg logit contributions | |
ARC | -0.035 |
ked | -0.033 |
ILA | -0.032 |
OVA | -0.031 |
pool | -0.030 |
Token | but |
Token ID | 475 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
fid | +0.018 |
acci | +0.017 |
ank | +0.016 |
obey | +0.016 |
ihil | +0.015 |
Neg logit contributions | |
ARC | -0.017 |
ked | -0.016 |
ILA | -0.015 |
OVA | -0.015 |
pool | -0.014 |
Token | _ |
Token ID | 62 |
Feature activation | +9.76e-02 |
Pos logit contributions | |
fid | +0.086 |
acci | +0.084 |
ank | +0.077 |
obey | +0.075 |
ihil | +0.074 |
Neg logit contributions | |
ARC | -0.059 |
ked | -0.055 |
ILA | -0.051 |
OVA | -0.051 |
pool | -0.048 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
ARC | +0.091 |
ked | +0.087 |
ILA | +0.084 |
OVA | +0.083 |
pool | +0.081 |
Neg logit contributions | |
fid | -0.053 |
acci | -0.050 |
ank | -0.044 |
obey | -0.042 |
ihil | -0.041 |
Token | 61 |
Token ID | 5333 |
Feature activation | -4.06e-02 |
Pos logit contributions | |
fid | +0.126 |
acci | +0.119 |
ank | +0.109 |
obey | +0.104 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.139 |
ked | -0.132 |
ILA | -0.125 |
OVA | -0.124 |
pool | -0.120 |
Token | E |
Token ID | 36 |
Feature activation | -7.21e-02 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.031 |
ILA | -0.030 |
OVA | -0.030 |
pool | -0.028 |
Token | , |
Token ID | 11 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
fid | +0.057 |
acci | +0.055 |
ank | +0.051 |
obey | +0.049 |
ihil | +0.048 |
Neg logit contributions | |
ARC | -0.049 |
ked | -0.046 |
ILA | -0.043 |
OVA | -0.043 |
pool | -0.041 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
ARC | +0.005 |
ked | +0.004 |
ILA | +0.003 |
OVA | +0.003 |
kers | +0.003 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.018 |
obey | -0.017 |
ihil | -0.017 |
Token | 02 |
Token ID | 2999 |
Feature activation | -8.97e-02 |
Pos logit contributions | |
ARC | +0.460 |
ked | +0.440 |
ILA | +0.420 |
OVA | +0.418 |
pool | +0.405 |
Neg logit contributions | |
fid | -0.309 |
acci | -0.292 |
ank | -0.263 |
obey | -0.249 |
ihil | -0.244 |
Token | _ |
Token ID | 62 |
Feature activation | +9.19e-02 |
Pos logit contributions | |
fid | +0.078 |
acci | +0.076 |
ank | +0.070 |
obey | +0.068 |
ihil | +0.067 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.050 |
ILA | -0.047 |
OVA | -0.046 |
pool | -0.044 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.76e-01 |
Pos logit contributions | |
ARC | +0.086 |
ked | +0.082 |
ILA | +0.079 |
OVA | +0.078 |
pool | +0.076 |
Neg logit contributions | |
fid | -0.050 |
acci | -0.047 |
ank | -0.042 |
obey | -0.039 |
ihil | -0.038 |
Token | 62 |
Token ID | 5237 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
fid | +0.130 |
acci | +0.124 |
ank | +0.114 |
obey | +0.109 |
ihil | +0.108 |
Neg logit contributions | |
ARC | -0.129 |
ked | -0.122 |
ILA | -0.115 |
OVA | -0.115 |
pool | -0.110 |
Token | E |
Token ID | 36 |
Feature activation | -6.81e-02 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.009 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.008 |
Neg logit contributions | |
fid | -0.007 |
acci | -0.007 |
ank | -0.006 |
obey | -0.006 |
ihil | -0.006 |
Token | _ |
Token ID | 62 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
fid | +0.070 |
acci | +0.067 |
ank | +0.062 |
obey | +0.060 |
ihil | +0.060 |
Neg logit contributions | |
ARC | -0.047 |
ked | -0.044 |
ILA | -0.041 |
OVA | -0.041 |
pool | -0.039 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ARC | +0.102 |
ked | +0.097 |
ILA | +0.093 |
OVA | +0.093 |
pool | +0.090 |
Neg logit contributions | |
fid | -0.059 |
acci | -0.056 |
ank | -0.050 |
obey | -0.047 |
ihil | -0.046 |
Token | 60 |
Token ID | 1899 |
Feature activation | -3.41e-02 |
Pos logit contributions | |
fid | +0.129 |
acci | +0.123 |
ank | +0.113 |
obey | +0.108 |
ihil | +0.106 |
Neg logit contributions | |
ARC | -0.136 |
ked | -0.129 |
ILA | -0.122 |
OVA | -0.122 |
pool | -0.117 |
Token | E |
Token ID | 36 |
Feature activation | -7.95e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.020 |
obey | +0.019 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.027 |
ked | -0.026 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.024 |
Token | , |
Token ID | 11 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
fid | +0.062 |
acci | +0.060 |
ank | +0.055 |
obey | +0.053 |
ihil | +0.052 |
Neg logit contributions | |
ARC | -0.055 |
ked | -0.052 |
ILA | -0.049 |
OVA | -0.049 |
pool | -0.047 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.17e-01 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
kers | +0.006 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.028 |
ank | -0.026 |
obey | -0.025 |
ihil | -0.025 |
Token | 02 |
Token ID | 2999 |
Feature activation | -9.88e-02 |
Pos logit contributions | |
ARC | +0.457 |
ked | +0.437 |
ILA | +0.417 |
OVA | +0.415 |
pool | +0.402 |
Neg logit contributions | |
fid | -0.306 |
acci | -0.289 |
ank | -0.260 |
obey | -0.246 |
ihil | -0.242 |
Token | _ |
Token ID | 62 |
Feature activation | +9.76e-02 |
Pos logit contributions | |
fid | +0.086 |
acci | +0.084 |
ank | +0.077 |
obey | +0.075 |
ihil | +0.074 |
Neg logit contributions | |
ARC | -0.059 |
ked | -0.055 |
ILA | -0.051 |
OVA | -0.051 |
pool | -0.048 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.80e-01 |
Pos logit contributions | |
ARC | +0.091 |
ked | +0.087 |
ILA | +0.084 |
OVA | +0.083 |
pool | +0.081 |
Neg logit contributions | |
fid | -0.053 |
acci | -0.050 |
ank | -0.044 |
obey | -0.042 |
ihil | -0.041 |
Token | 61 |
Token ID | 5333 |
Feature activation | -4.06e-02 |
Pos logit contributions | |
fid | +0.126 |
acci | +0.119 |
ank | +0.109 |
obey | +0.104 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.139 |
ked | -0.132 |
ILA | -0.125 |
OVA | -0.124 |
pool | -0.120 |
Token | E |
Token ID | 36 |
Feature activation | -7.21e-02 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.031 |
ILA | -0.030 |
OVA | -0.030 |
pool | -0.028 |
Token | cases |
Token ID | 2663 |
Feature activation | +4.60e-02 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
pool | +0.004 |
Neg logit contributions | |
fid | -0.005 |
acci | -0.005 |
ank | -0.004 |
obey | -0.004 |
ihil | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
ARC | +0.033 |
ked | +0.031 |
ILA | +0.030 |
OVA | +0.030 |
pool | +0.028 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.033 |
ank | -0.031 |
obey | -0.029 |
ihil | -0.029 |
Token |
|
Token ID | 198 |
Feature activation | +3.33e-02 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.017 |
obey | -0.016 |
ihil | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +3.87e-02 |
Pos logit contributions | |
ARC | +0.022 |
ked | +0.021 |
ILA | +0.020 |
OVA | +0.019 |
pool | +0.019 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.026 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.023 |
Token | Book |
Token ID | 10482 |
Feature activation | +5.73e-02 |
Pos logit contributions | |
ARC | +0.026 |
ked | +0.025 |
ILA | +0.023 |
OVA | +0.023 |
kers | +0.022 |
Neg logit contributions | |
fid | -0.031 |
acci | -0.030 |
ank | -0.027 |
obey | -0.026 |
ihil | -0.026 |
Token | mark |
Token ID | 4102 |
Feature activation | +5.08e-01 |
Pos logit contributions | |
ARC | +0.018 |
ked | +0.015 |
ILA | +0.014 |
OVA | +0.013 |
pool | +0.011 |
Neg logit contributions | |
fid | -0.067 |
acci | -0.065 |
ank | -0.061 |
obey | -0.060 |
eeper | -0.059 |
Token | with |
Token ID | 351 |
Feature activation | +5.51e-02 |
Pos logit contributions | |
ARC | +0.331 |
ked | +0.309 |
ILA | +0.291 |
OVA | +0.288 |
pool | +0.275 |
Neg logit contributions | |
fid | -0.422 |
acci | -0.404 |
ank | -0.377 |
obey | -0.362 |
ihil | -0.359 |
Token | : |
Token ID | 25 |
Feature activation | -2.91e-02 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.035 |
OVA | +0.035 |
pool | +0.033 |
Neg logit contributions | |
fid | -0.042 |
acci | -0.041 |
ank | -0.038 |
obey | -0.036 |
ihil | -0.035 |
Token | Delicious |
Token ID | 39528 |
Feature activation | +2.25e-01 |
Pos logit contributions | |
fid | +0.025 |
acci | +0.024 |
ank | +0.023 |
obey | +0.022 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.018 |
ked | -0.017 |
ILA | -0.015 |
OVA | -0.015 |
pool | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
ARC | +0.149 |
ked | +0.139 |
ILA | +0.131 |
OVA | +0.130 |
pool | +0.125 |
Neg logit contributions | |
fid | -0.184 |
acci | -0.177 |
ank | -0.165 |
obey | -0.158 |
ihil | -0.156 |
Token |
|
Token ID | 198 |
Feature activation | +8.50e-02 |
Pos logit contributions | |
ARC | +0.060 |
ked | +0.056 |
ILA | +0.053 |
OVA | +0.052 |
pool | +0.050 |
Neg logit contributions | |
fid | -0.074 |
acci | -0.071 |
ank | -0.066 |
obey | -0.063 |
ihil | -0.063 |
Token | after |
Token ID | 706 |
Feature activation | -6.99e-03 |
Pos logit contributions | |
fid | +0.201 |
acci | +0.191 |
ank | +0.178 |
obey | +0.171 |
obe | +0.168 |
Neg logit contributions | |
ARC | -0.175 |
ked | -0.163 |
ILA | -0.157 |
OVA | -0.156 |
Region | -0.148 |
Token | all |
Token ID | 477 |
Feature activation | -6.49e-02 |
Pos logit contributions | |
fid | +0.006 |
acci | +0.005 |
ank | +0.005 |
obey | +0.005 |
obe | +0.005 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.005 |
ILA | -0.004 |
OVA | -0.004 |
Region | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
fid | +0.051 |
acci | +0.049 |
ank | +0.046 |
obey | +0.044 |
obe | +0.043 |
Neg logit contributions | |
ARC | -0.045 |
ked | -0.042 |
OVA | -0.040 |
ILA | -0.040 |
Region | -0.038 |
Token | " |
Token ID | 366 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
fid | +0.009 |
acci | +0.008 |
ank | +0.008 |
obey | +0.007 |
ihil | +0.007 |
Neg logit contributions | |
ARC | -0.007 |
ked | -0.007 |
ILA | -0.006 |
OVA | -0.006 |
pool | -0.006 |
Token | Dar |
Token ID | 32708 |
Feature activation | -3.93e-02 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.008 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.007 |
Neg logit contributions | |
ARC | -0.006 |
ked | -0.006 |
ILA | -0.006 |
OVA | -0.006 |
kers | -0.005 |
Token | ren |
Token ID | 918 |
Feature activation | +5.07e-01 |
Pos logit contributions | |
fid | +0.047 |
acci | +0.045 |
ank | +0.043 |
obey | +0.042 |
ihil | +0.042 |
Neg logit contributions | |
ARC | -0.012 |
ked | -0.010 |
ILA | -0.009 |
OVA | -0.008 |
Region | -0.007 |
Token | must |
Token ID | 1276 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ARC | +0.359 |
ked | +0.338 |
ILA | +0.319 |
OVA | +0.318 |
pool | +0.304 |
Neg logit contributions | |
fid | -0.391 |
acci | -0.374 |
ank | -0.346 |
obey | -0.332 |
ihil | -0.327 |
Token | be |
Token ID | 307 |
Feature activation | +9.72e-02 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.010 |
ank | +0.009 |
obey | +0.009 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.009 |
ked | -0.008 |
ILA | -0.008 |
OVA | -0.008 |
pool | -0.007 |
Token | in |
Token ID | 287 |
Feature activation | +4.42e-02 |
Pos logit contributions | |
ARC | +0.067 |
ked | +0.063 |
ILA | +0.060 |
OVA | +0.060 |
pool | +0.057 |
Neg logit contributions | |
fid | -0.077 |
acci | -0.073 |
ank | -0.068 |
obey | -0.065 |
ihil | -0.064 |
Token | Fab |
Token ID | 14236 |
Feature activation | +9.11e-02 |
Pos logit contributions | |
ARC | +0.031 |
ked | +0.029 |
ILA | +0.028 |
OVA | +0.028 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.034 |
acci | -0.033 |
ank | -0.030 |
obey | -0.029 |
ihil | -0.029 |
Token | io |
Token ID | 952 |
Feature activation | +2.49e-01 |
Pos logit contributions | |
ARC | +0.052 |
ked | +0.048 |
ILA | +0.045 |
OVA | +0.045 |
pool | +0.042 |
Neg logit contributions | |
fid | -0.083 |
acci | -0.080 |
ank | -0.075 |
obey | -0.072 |
ihil | -0.071 |
Token | _ |
Token ID | 62 |
Feature activation | +1.22e-01 |
Pos logit contributions | |
fid | +0.079 |
acci | +0.076 |
ank | +0.071 |
obey | +0.069 |
ihil | +0.068 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.049 |
ILA | -0.046 |
OVA | -0.046 |
pool | -0.043 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
ARC | +0.113 |
ked | +0.108 |
ILA | +0.103 |
OVA | +0.103 |
pool | +0.100 |
Neg logit contributions | |
fid | -0.067 |
acci | -0.064 |
ank | -0.057 |
obey | -0.053 |
ihil | -0.052 |
Token | 59 |
Token ID | 3270 |
Feature activation | -3.06e-02 |
Pos logit contributions | |
fid | +0.135 |
acci | +0.129 |
ank | +0.119 |
obey | +0.114 |
ihil | +0.113 |
Neg logit contributions | |
ARC | -0.134 |
ked | -0.127 |
ILA | -0.120 |
OVA | -0.119 |
pool | -0.114 |
Token | E |
Token ID | 36 |
Feature activation | -7.60e-02 |
Pos logit contributions | |
fid | +0.022 |
acci | +0.021 |
ank | +0.019 |
obey | +0.018 |
ihil | +0.018 |
Neg logit contributions | |
ARC | -0.023 |
ked | -0.022 |
ILA | -0.021 |
OVA | -0.021 |
pool | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | +3.52e-02 |
Pos logit contributions | |
fid | +0.059 |
acci | +0.057 |
ank | +0.053 |
obey | +0.051 |
ihil | +0.050 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.050 |
ILA | -0.047 |
OVA | -0.047 |
pool | -0.045 |
Token | DP |
Token ID | 6322 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
ARC | +0.013 |
ked | +0.012 |
ILA | +0.010 |
OVA | +0.010 |
kers | +0.009 |
Neg logit contributions | |
fid | -0.039 |
acci | -0.037 |
ank | -0.036 |
obey | -0.034 |
ihil | -0.034 |
Token | 02 |
Token ID | 2999 |
Feature activation | -7.93e-02 |
Pos logit contributions | |
ARC | +0.445 |
ked | +0.425 |
ILA | +0.406 |
OVA | +0.404 |
pool | +0.391 |
Neg logit contributions | |
fid | -0.299 |
acci | -0.282 |
ank | -0.254 |
obey | -0.240 |
ihil | -0.236 |
Token | _ |
Token ID | 62 |
Feature activation | +1.09e-01 |
Pos logit contributions | |
fid | +0.070 |
acci | +0.067 |
ank | +0.062 |
obey | +0.060 |
ihil | +0.060 |
Neg logit contributions | |
ARC | -0.047 |
ked | -0.044 |
ILA | -0.041 |
OVA | -0.041 |
pool | -0.039 |
Token | 00 |
Token ID | 405 |
Feature activation | -1.79e-01 |
Pos logit contributions | |
ARC | +0.102 |
ked | +0.097 |
ILA | +0.093 |
OVA | +0.093 |
pool | +0.090 |
Neg logit contributions | |
fid | -0.059 |
acci | -0.056 |
ank | -0.050 |
obey | -0.047 |
ihil | -0.046 |
Token | 60 |
Token ID | 1899 |
Feature activation | -3.41e-02 |
Pos logit contributions | |
fid | +0.129 |
acci | +0.123 |
ank | +0.113 |
obey | +0.108 |
ihil | +0.106 |
Neg logit contributions | |
ARC | -0.136 |
ked | -0.129 |
ILA | -0.122 |
OVA | -0.122 |
pool | -0.117 |
Token | E |
Token ID | 36 |
Feature activation | -7.95e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.020 |
obey | +0.019 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.027 |
ked | -0.026 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.024 |
Token | have |
Token ID | 423 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
ARC | +0.063 |
ked | +0.059 |
ILA | +0.056 |
OVA | +0.055 |
pool | +0.053 |
Neg logit contributions | |
fid | -0.069 |
acci | -0.066 |
ank | -0.061 |
obey | -0.059 |
ihil | -0.058 |
Token | also |
Token ID | 635 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | improved |
Token ID | 6596 |
Feature activation | +4.84e-02 |
Pos logit contributions | |
fid | +0.092 |
acci | +0.087 |
ank | +0.081 |
obey | +0.077 |
ihil | +0.076 |
Neg logit contributions | |
ARC | -0.093 |
ked | -0.087 |
ILA | -0.083 |
OVA | -0.083 |
pool | -0.079 |
Token | the |
Token ID | 262 |
Feature activation | -8.20e-03 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.031 |
OVA | +0.030 |
ILA | +0.030 |
kers | +0.028 |
Neg logit contributions | |
fid | -0.038 |
acci | -0.036 |
ank | -0.034 |
obey | -0.033 |
obe | -0.032 |
Token | Sail |
Token ID | 27783 |
Feature activation | -5.55e-02 |
Pos logit contributions | |
fid | +0.006 |
acci | +0.006 |
ank | +0.006 |
obey | +0.005 |
obe | +0.005 |
Neg logit contributions | |
ARC | -0.006 |
ked | -0.005 |
ILA | -0.005 |
OVA | -0.005 |
pool | -0.005 |
Token | fish |
Token ID | 11084 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
fid | +0.066 |
acci | +0.064 |
ank | +0.061 |
obey | +0.059 |
ihil | +0.059 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.014 |
ILA | -0.012 |
OVA | -0.012 |
pool | -0.010 |
Token | browser |
Token ID | 6444 |
Feature activation | +3.67e-02 |
Pos logit contributions | |
ARC | +0.262 |
ked | +0.239 |
ILA | +0.222 |
OVA | +0.220 |
Region | +0.206 |
Neg logit contributions | |
fid | -0.482 |
acci | -0.464 |
ank | -0.437 |
obey | -0.424 |
obe | -0.417 |
Token | and |
Token ID | 290 |
Feature activation | +3.54e-02 |
Pos logit contributions | |
ARC | +0.025 |
ked | +0.024 |
ILA | +0.023 |
OVA | +0.022 |
kers | +0.021 |
Neg logit contributions | |
fid | -0.029 |
acci | -0.028 |
ank | -0.026 |
obey | -0.025 |
obe | -0.024 |
Token | [ |
Token ID | 685 |
Feature activation | +6.86e-03 |
Pos logit contributions | |
ARC | +0.026 |
ked | +0.024 |
ILA | +0.023 |
OVA | +0.023 |
pool | +0.022 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.025 |
ank | -0.024 |
obey | -0.023 |
obe | -0.022 |
Token | the |
Token ID | 1169 |
Feature activation | +6.68e-02 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
kers | +0.004 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.005 |
ank | -0.005 |
obey | -0.005 |
ihil | -0.005 |
Token | phone |
Token ID | 3072 |
Feature activation | +9.09e-02 |
Pos logit contributions | |
ARC | +0.045 |
ked | +0.042 |
ILA | +0.040 |
OVA | +0.040 |
Region | +0.038 |
Neg logit contributions | |
fid | -0.054 |
acci | -0.051 |
ank | -0.048 |
obey | -0.046 |
ihil | -0.045 |
Token | sank |
Token ID | 30895 |
Feature activation | +4.98e-02 |
Pos logit contributions | |
fid | +0.055 |
acci | +0.052 |
ank | +0.049 |
obey | +0.047 |
ihil | +0.046 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.047 |
ILA | -0.044 |
OVA | -0.044 |
pool | -0.042 |
Token | quickly |
Token ID | 2952 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
ARC | +0.035 |
ked | +0.033 |
ILA | +0.031 |
OVA | +0.031 |
Region | +0.029 |
Neg logit contributions | |
fid | -0.039 |
acci | -0.037 |
ank | -0.034 |
obey | -0.033 |
ihil | -0.032 |
Token | into |
Token ID | 656 |
Feature activation | +4.44e-02 |
Pos logit contributions | |
ARC | +0.142 |
ked | +0.133 |
ILA | +0.126 |
OVA | +0.125 |
pool | +0.120 |
Neg logit contributions | |
fid | -0.162 |
acci | -0.155 |
ank | -0.144 |
obey | -0.138 |
ihil | -0.137 |
Token | a |
Token ID | 257 |
Feature activation | -2.90e-02 |
Pos logit contributions | |
ARC | +0.031 |
ked | +0.029 |
ILA | +0.028 |
OVA | +0.028 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.033 |
ank | -0.031 |
obey | -0.029 |
ihil | -0.029 |
Token | mud |
Token ID | 17492 |
Feature activation | -7.80e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.021 |
obey | +0.020 |
ihil | +0.020 |
Neg logit contributions | |
ARC | -0.020 |
ked | -0.018 |
ILA | -0.018 |
OVA | -0.017 |
kers | -0.017 |
Token | pool |
Token ID | 7742 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
fid | +0.066 |
acci | +0.062 |
ank | +0.059 |
obey | +0.057 |
ihil | +0.056 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.046 |
ILA | -0.044 |
OVA | -0.043 |
Region | -0.041 |
Token | that |
Token ID | 326 |
Feature activation | -3.57e-02 |
Pos logit contributions | |
ARC | +0.344 |
ked | +0.321 |
ILA | +0.305 |
OVA | +0.302 |
kers | +0.287 |
Neg logit contributions | |
fid | -0.400 |
acci | -0.381 |
ank | -0.356 |
obey | -0.341 |
ihil | -0.336 |
Token | froze |
Token ID | 37785 |
Feature activation | -7.11e-02 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.026 |
ked | -0.024 |
ILA | -0.023 |
OVA | -0.023 |
Region | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | -2.64e-02 |
Pos logit contributions | |
fid | +0.055 |
acci | +0.052 |
ank | +0.048 |
obey | +0.046 |
ihil | +0.046 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.045 |
OVA | -0.045 |
pool | -0.043 |
Token | preserved |
Token ID | 17232 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
fid | +0.020 |
acci | +0.019 |
ank | +0.018 |
obey | +0.017 |
ihil | +0.017 |
Neg logit contributions | |
ARC | -0.019 |
ked | -0.018 |
ILA | -0.017 |
OVA | -0.017 |
Region | -0.016 |
Token | her |
Token ID | 607 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ARC | +0.086 |
ked | +0.081 |
ILA | +0.077 |
OVA | +0.076 |
pool | +0.073 |
Neg logit contributions | |
fid | -0.090 |
acci | -0.086 |
ank | -0.080 |
obey | -0.077 |
ihil | -0.076 |
Token | like |
Token ID | 588 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.017 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.017 |
ked | -0.016 |
ILA | -0.015 |
OVA | -0.015 |
pool | -0.015 |
Token | Jake |
Token ID | 14757 |
Feature activation | +2.39e-01 |
Pos logit contributions | |
ARC | +0.025 |
ked | +0.023 |
ILA | +0.022 |
OVA | +0.022 |
Region | +0.021 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.025 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.022 |
Token | Lloyd |
Token ID | 22361 |
Feature activation | +1.08e-01 |
Pos logit contributions | |
ARC | +0.228 |
ked | +0.218 |
ILA | +0.209 |
OVA | +0.208 |
pool | +0.202 |
Neg logit contributions | |
fid | -0.126 |
acci | -0.117 |
ank | -0.104 |
obey | -0.098 |
ihil | -0.096 |
Token | and |
Token ID | 290 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
ARC | +0.073 |
ked | +0.069 |
ILA | +0.065 |
OVA | +0.065 |
Region | +0.062 |
Neg logit contributions | |
fid | -0.087 |
acci | -0.083 |
ank | -0.077 |
obey | -0.074 |
ihil | -0.073 |
Token | Hayden |
Token ID | 35805 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
ARC | +0.018 |
ked | +0.016 |
ILA | +0.016 |
OVA | +0.015 |
Region | +0.015 |
Neg logit contributions | |
fid | -0.020 |
acci | -0.019 |
ank | -0.018 |
obey | -0.017 |
ihil | -0.017 |
Token | Christensen |
Token ID | 49195 |
Feature activation | +4.99e-01 |
Pos logit contributions | |
ARC | +0.048 |
ked | +0.044 |
OVA | +0.040 |
ILA | +0.040 |
kers | +0.036 |
Neg logit contributions | |
fid | -0.123 |
acci | -0.120 |
ank | -0.112 |
obey | -0.110 |
ihil | -0.109 |
Token | , |
Token ID | 11 |
Feature activation | -1.21e-03 |
Pos logit contributions | |
ARC | +0.334 |
ked | +0.313 |
ILA | +0.294 |
OVA | +0.293 |
pool | +0.279 |
Neg logit contributions | |
fid | -0.405 |
acci | -0.389 |
ank | -0.361 |
obey | -0.347 |
ihil | -0.343 |
Token | it |
Token ID | 340 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | kind |
Token ID | 1611 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ARC | +0.010 |
ked | +0.009 |
ILA | +0.009 |
OVA | +0.009 |
pool | +0.008 |
Neg logit contributions | |
fid | -0.010 |
acci | -0.010 |
ank | -0.009 |
obey | -0.009 |
ihil | -0.009 |
Token | of |
Token ID | 286 |
Feature activation | +9.70e-03 |
Pos logit contributions | |
fid | +0.181 |
acci | +0.174 |
ank | +0.161 |
obey | +0.155 |
ihil | +0.153 |
Neg logit contributions | |
ARC | -0.159 |
ked | -0.149 |
ILA | -0.141 |
OVA | -0.140 |
pool | -0.133 |
Token | destroys |
Token ID | 27838 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
pool | +0.006 |
Neg logit contributions | |
fid | -0.007 |
acci | -0.007 |
ank | -0.006 |
obey | -0.006 |
ihil | -0.006 |
Token | � |
Token ID | 447 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.036 |
ILA | +0.034 |
OVA | +0.034 |
pool | +0.033 |
Neg logit contributions | |
fid | -0.042 |
acci | -0.040 |
ank | -0.037 |
obey | -0.036 |
ihil | -0.035 |
Token | � |
Token ID | 247 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.008 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.011 |
acci | -0.011 |
ank | -0.010 |
obey | -0.010 |
ihil | -0.010 |
Token | m |
Token ID | 76 |
Feature activation | +7.99e-02 |
Pos logit contributions | |
ARC | +0.016 |
ked | +0.015 |
ILA | +0.014 |
OVA | +0.014 |
pool | +0.013 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.017 |
obey | -0.017 |
ihil | -0.016 |
Token | a |
Token ID | 257 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
ARC | +0.056 |
ked | +0.052 |
ILA | +0.049 |
OVA | +0.049 |
pool | +0.047 |
Neg logit contributions | |
fid | -0.062 |
acci | -0.060 |
ank | -0.056 |
obey | -0.053 |
ihil | -0.053 |
Token | Hust |
Token ID | 42941 |
Feature activation | -1.87e-01 |
Pos logit contributions | |
ARC | +0.003 |
ked | +0.003 |
ILA | +0.003 |
OVA | +0.003 |
pool | +0.003 |
Neg logit contributions | |
fid | -0.003 |
acci | -0.003 |
ank | -0.003 |
obey | -0.003 |
ihil | -0.003 |
Token | la |
Token ID | 5031 |
Feature activation | -6.46e-01 |
Pos logit contributions | |
fid | +0.088 |
acci | +0.083 |
ank | +0.072 |
obey | +0.067 |
ihil | +0.065 |
Neg logit contributions | |
ARC | -0.188 |
ked | -0.180 |
ILA | -0.173 |
OVA | -0.173 |
pool | -0.168 |
Token | . |
Token ID | 13 |
Feature activation | -1.74e-02 |
Pos logit contributions | |
fid | +0.456 |
acci | +0.434 |
ank | +0.400 |
obey | +0.381 |
ihil | +0.375 |
Neg logit contributions | |
ARC | -0.501 |
ked | -0.473 |
ILA | -0.450 |
OVA | -0.447 |
pool | -0.429 |
Token | � |
Token ID | 447 |
Feature activation | -7.23e-02 |
Pos logit contributions | |
fid | +0.013 |
acci | +0.012 |
ank | +0.011 |
obey | +0.011 |
ihil | +0.011 |
Neg logit contributions | |
ARC | -0.013 |
ked | -0.012 |
ILA | -0.011 |
OVA | -0.011 |
pool | -0.011 |
Token | � |
Token ID | 251 |
Feature activation | -4.52e-02 |
Pos logit contributions | |
fid | +0.055 |
acci | +0.053 |
ank | +0.049 |
obey | +0.047 |
ihil | +0.046 |
Neg logit contributions | |
ARC | -0.052 |
ked | -0.049 |
ILA | -0.046 |
OVA | -0.046 |
pool | -0.044 |
Token |
|
Token ID | 198 |
Feature activation | +1.46e-02 |
Pos logit contributions | |
fid | +0.036 |
acci | +0.035 |
ank | +0.032 |
obey | +0.031 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.030 |
ked | -0.028 |
ILA | -0.027 |
OVA | -0.027 |
pool | -0.025 |
Token |
|
Token ID | 198 |
Feature activation | +2.64e-02 |
Pos logit contributions | |
ARC | +0.010 |
ked | +0.009 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.008 |
Neg logit contributions | |
fid | -0.012 |
acci | -0.011 |
ank | -0.011 |
obey | -0.010 |
ihil | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +5.89e-02 |
Pos logit contributions | |
ARC | +0.043 |
ked | +0.040 |
ILA | +0.038 |
OVA | +0.038 |
pool | +0.036 |
Neg logit contributions | |
fid | -0.054 |
acci | -0.051 |
ank | -0.048 |
obey | -0.046 |
ihil | -0.045 |
Token | Media |
Token ID | 13152 |
Feature activation | -1.38e-02 |
Pos logit contributions | |
ARC | +0.041 |
ked | +0.039 |
ILA | +0.036 |
OVA | +0.036 |
kers | +0.035 |
Neg logit contributions | |
fid | -0.046 |
acci | -0.044 |
ank | -0.041 |
obey | -0.039 |
ihil | -0.039 |
Token | : |
Token ID | 25 |
Feature activation | -9.57e-02 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.011 |
ank | +0.010 |
obey | +0.010 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.009 |
ked | -0.009 |
ILA | -0.008 |
OVA | -0.008 |
kers | -0.008 |
Token | CD |
Token ID | 6458 |
Feature activation | -8.13e-02 |
Pos logit contributions | |
fid | +0.070 |
acci | +0.067 |
ank | +0.062 |
obey | +0.059 |
ihil | +0.058 |
Neg logit contributions | |
ARC | -0.071 |
ked | -0.067 |
ILA | -0.064 |
OVA | -0.063 |
pool | -0.061 |
Token | - |
Token ID | 12 |
Feature activation | +9.13e-02 |
Pos logit contributions | |
fid | +0.074 |
acci | +0.071 |
ank | +0.067 |
obey | +0.064 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.046 |
ked | -0.043 |
ILA | -0.040 |
OVA | -0.040 |
kers | -0.038 |
Token | ROM |
Token ID | 33676 |
Feature activation | -5.59e-01 |
Pos logit contributions | |
ARC | +0.114 |
ked | +0.112 |
ILA | +0.107 |
OVA | +0.107 |
kers | +0.105 |
Neg logit contributions | |
fid | -0.020 |
acci | -0.017 |
ank | -0.012 |
obey | -0.009 |
ihil | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +4.15e-02 |
Pos logit contributions | |
fid | +0.444 |
acci | +0.424 |
ank | +0.394 |
obey | +0.379 |
ihil | +0.373 |
Neg logit contributions | |
ARC | -0.382 |
ked | -0.361 |
ILA | -0.339 |
OVA | -0.336 |
kers | -0.322 |
Token |
|
Token ID | 198 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
ARC | +0.027 |
ked | +0.026 |
ILA | +0.024 |
OVA | +0.024 |
pool | +0.023 |
Neg logit contributions | |
fid | -0.034 |
acci | -0.033 |
ank | -0.030 |
obey | -0.029 |
ihil | -0.029 |
Token | Rating |
Token ID | 29321 |
Feature activation | +8.15e-02 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
kers | +0.026 |
Neg logit contributions | |
fid | -0.034 |
acci | -0.033 |
ank | -0.030 |
obey | -0.029 |
ihil | -0.029 |
Token | : |
Token ID | 25 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ARC | +0.059 |
ked | +0.056 |
ILA | +0.053 |
OVA | +0.052 |
kers | +0.050 |
Neg logit contributions | |
fid | -0.062 |
acci | -0.059 |
ank | -0.054 |
obey | -0.052 |
ihil | -0.051 |
Token | E |
Token ID | 412 |
Feature activation | +4.54e-02 |
Pos logit contributions | |
fid | +0.081 |
acci | +0.077 |
ank | +0.071 |
obey | +0.068 |
ihil | +0.067 |
Neg logit contributions | |
ARC | -0.076 |
ked | -0.072 |
ILA | -0.068 |
OVA | -0.067 |
pool | -0.065 |
Token | de |
Token ID | 390 |
Feature activation | -2.60e-01 |
Pos logit contributions | |
fid | +0.082 |
acci | +0.079 |
ank | +0.073 |
obey | +0.070 |
ihil | +0.069 |
Neg logit contributions | |
ARC | -0.073 |
ked | -0.068 |
ILA | -0.065 |
OVA | -0.064 |
pool | -0.062 |
Token | jar |
Token ID | 9491 |
Feature activation | -1.46e-01 |
Pos logit contributions | |
fid | +0.187 |
acci | +0.179 |
ank | +0.165 |
obey | +0.157 |
ihil | +0.155 |
Neg logit contributions | |
ARC | -0.198 |
ked | -0.187 |
ILA | -0.177 |
OVA | -0.176 |
pool | -0.169 |
Token | ía |
Token ID | 29690 |
Feature activation | +2.54e-02 |
Pos logit contributions | |
fid | +0.113 |
acci | +0.109 |
ank | +0.101 |
obey | +0.097 |
ihil | +0.095 |
Neg logit contributions | |
ARC | -0.102 |
ked | -0.096 |
ILA | -0.090 |
OVA | -0.090 |
pool | -0.086 |
Token | que |
Token ID | 8358 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.021 |
acci | -0.020 |
ank | -0.018 |
obey | -0.018 |
ihil | -0.018 |
Token | mi |
Token ID | 21504 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.008 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.007 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.007 |
Token | hij |
Token ID | 16836 |
Feature activation | -5.32e-01 |
Pos logit contributions | |
fid | +0.080 |
acci | +0.077 |
ank | +0.071 |
obey | +0.068 |
ihil | +0.067 |
Neg logit contributions | |
ARC | -0.076 |
ked | -0.072 |
ILA | -0.068 |
OVA | -0.068 |
pool | -0.065 |
Token | a |
Token ID | 64 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
fid | +0.447 |
acci | +0.432 |
ank | +0.401 |
obey | +0.387 |
ihil | +0.382 |
Neg logit contributions | |
ARC | -0.339 |
ked | -0.317 |
ILA | -0.297 |
OVA | -0.296 |
pool | -0.282 |
Token | jug |
Token ID | 45808 |
Feature activation | -1.43e-01 |
Pos logit contributions | |
fid | +0.084 |
acci | +0.081 |
ank | +0.075 |
obey | +0.072 |
ihil | +0.071 |
Neg logit contributions | |
ARC | -0.072 |
ked | -0.068 |
ILA | -0.064 |
OVA | -0.064 |
pool | -0.061 |
Token | ara |
Token ID | 3301 |
Feature activation | -1.78e-01 |
Pos logit contributions | |
fid | +0.105 |
acci | +0.101 |
ank | +0.092 |
obey | +0.089 |
ihil | +0.087 |
Neg logit contributions | |
ARC | -0.107 |
ked | -0.100 |
ILA | -0.095 |
OVA | -0.095 |
pool | -0.091 |
Token | con |
Token ID | 369 |
Feature activation | -7.80e-02 |
Pos logit contributions | |
fid | +0.143 |
acci | +0.137 |
ank | +0.128 |
obey | +0.123 |
ihil | +0.121 |
Neg logit contributions | |
ARC | -0.120 |
ked | -0.112 |
ILA | -0.105 |
OVA | -0.105 |
pool | -0.100 |
Token | e |
Token ID | 304 |
Feature activation | -3.43e-02 |
Pos logit contributions | |
fid | +0.057 |
acci | +0.054 |
ank | +0.050 |
obey | +0.048 |
ihil | +0.047 |
Neg logit contributions | |
ARC | -0.059 |
ked | -0.055 |
ILA | -0.053 |
OVA | -0.052 |
pool | -0.050 |
Token | represent |
Token ID | 2380 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.010 |
ank | +0.009 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.013 |
OVA | -0.012 |
pool | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
fid | +0.085 |
acci | +0.081 |
ank | +0.075 |
obey | +0.072 |
ihil | +0.071 |
Neg logit contributions | |
ARC | -0.077 |
ked | -0.072 |
ILA | -0.068 |
OVA | -0.068 |
pool | -0.065 |
Token | views |
Token ID | 5009 |
Feature activation | +4.55e-02 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.011 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.014 |
ank | -0.013 |
obey | -0.012 |
ihil | -0.012 |
Token | of |
Token ID | 286 |
Feature activation | +3.28e-03 |
Pos logit contributions | |
ARC | +0.031 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.037 |
acci | -0.035 |
ank | -0.033 |
obey | -0.031 |
ihil | -0.031 |
Token | Town |
Token ID | 8329 |
Feature activation | -3.92e-02 |
Pos logit contributions | |
ARC | +0.003 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.002 |
pool | +0.002 |
Neg logit contributions | |
fid | -0.002 |
acci | -0.002 |
ank | -0.002 |
obey | -0.002 |
ihil | -0.002 |
Token | hall |
Token ID | 18323 |
Feature activation | -5.24e-01 |
Pos logit contributions | |
fid | +0.014 |
acci | +0.013 |
ank | +0.011 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.044 |
ked | -0.042 |
ILA | -0.041 |
OVA | -0.041 |
pool | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -1.00e-03 |
Pos logit contributions | |
fid | +0.440 |
acci | +0.424 |
ank | +0.395 |
obey | +0.379 |
ihil | +0.376 |
Neg logit contributions | |
ARC | -0.335 |
ked | -0.314 |
ILA | -0.294 |
OVA | -0.293 |
pool | -0.279 |
Token | com |
Token ID | 785 |
Feature activation | -2.00e-01 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
OVA | -0.001 |
ILA | -0.001 |
pool | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
fid | +0.170 |
acci | +0.165 |
ank | +0.154 |
obey | +0.148 |
ihil | +0.147 |
Neg logit contributions | |
ARC | -0.124 |
ked | -0.115 |
ILA | -0.108 |
OVA | -0.108 |
pool | -0.103 |
Token |
|
Token ID | 198 |
Feature activation | -4.64e-03 |
Pos logit contributions | |
fid | +0.009 |
acci | +0.009 |
ank | +0.008 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.007 |
ked | -0.006 |
ILA | -0.006 |
OVA | -0.006 |
pool | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.004 |
ank | +0.003 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.003 |
ked | -0.003 |
ILA | -0.003 |
OVA | -0.003 |
pool | -0.003 |
Token | s |
Token ID | 82 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
ARC | +0.015 |
ked | +0.014 |
ILA | +0.014 |
OVA | +0.013 |
pool | +0.013 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | theme |
Token ID | 7505 |
Feature activation | +3.27e-02 |
Pos logit contributions | |
fid | +0.028 |
acci | +0.027 |
ank | +0.025 |
obey | +0.024 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.026 |
ked | -0.024 |
ILA | -0.023 |
OVA | -0.023 |
pool | -0.022 |
Token | for |
Token ID | 329 |
Feature activation | +2.59e-02 |
Pos logit contributions | |
ARC | +0.024 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.021 |
Region | +0.020 |
Neg logit contributions | |
fid | -0.025 |
acci | -0.024 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.020 |
Token | The |
Token ID | 383 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
ARC | +0.018 |
ked | +0.017 |
ILA | +0.016 |
OVA | +0.016 |
pool | +0.015 |
Neg logit contributions | |
fid | -0.020 |
acci | -0.019 |
ank | -0.018 |
obey | -0.017 |
ihil | -0.017 |
Token | Hust |
Token ID | 42941 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
fid | +0.039 |
acci | +0.037 |
ank | +0.034 |
obey | +0.033 |
ihil | +0.032 |
Neg logit contributions | |
ARC | -0.037 |
ked | -0.035 |
ILA | -0.033 |
OVA | -0.033 |
pool | -0.031 |
Token | le |
Token ID | 293 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
fid | +0.090 |
acci | +0.084 |
ank | +0.073 |
obey | +0.068 |
ihil | +0.066 |
Neg logit contributions | |
ARC | -0.197 |
ked | -0.188 |
ILA | -0.181 |
OVA | -0.181 |
pool | -0.175 |
Token | is |
Token ID | 318 |
Feature activation | -7.11e-02 |
Pos logit contributions | |
fid | +0.391 |
acci | +0.374 |
ank | +0.346 |
obey | +0.331 |
ihil | +0.326 |
Neg logit contributions | |
ARC | -0.375 |
ked | -0.353 |
ILA | -0.335 |
OVA | -0.333 |
Region | -0.318 |
Token | people |
Token ID | 661 |
Feature activation | -2.02e-02 |
Pos logit contributions | |
fid | +0.054 |
acci | +0.052 |
ank | +0.048 |
obey | +0.046 |
ihil | +0.045 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.045 |
OVA | -0.045 |
pool | -0.043 |
Token | who |
Token ID | 508 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
fid | +0.016 |
acci | +0.015 |
ank | +0.014 |
obey | +0.013 |
ihil | +0.013 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.012 |
OVA | -0.012 |
Region | -0.012 |
Token | game |
Token ID | 983 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
fid | +0.076 |
acci | +0.073 |
ank | +0.067 |
obey | +0.064 |
ihil | +0.063 |
Neg logit contributions | |
ARC | -0.074 |
ked | -0.070 |
ILA | -0.066 |
OVA | -0.066 |
pool | -0.063 |
Token | the |
Token ID | 262 |
Feature activation | -5.55e-02 |
Pos logit contributions | |
fid | +0.082 |
acci | +0.079 |
ank | +0.073 |
obey | +0.070 |
ihil | +0.069 |
Neg logit contributions | |
ARC | -0.072 |
ked | -0.068 |
ILA | -0.064 |
OVA | -0.063 |
pool | -0.061 |
Token | R |
Token ID | 371 |
Feature activation | +1.60e-01 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.017 |
ank | -0.015 |
obey | -0.015 |
ihil | -0.015 |
Token | itter |
Token ID | 1967 |
Feature activation | +1.33e-01 |
Pos logit contributions | |
ARC | +0.115 |
ked | +0.108 |
ILA | +0.102 |
OVA | +0.101 |
pool | +0.097 |
Neg logit contributions | |
fid | -0.122 |
acci | -0.117 |
ank | -0.108 |
obey | -0.104 |
ihil | -0.102 |
Token | 1989 |
Token ID | 11104 |
Feature activation | +9.51e-02 |
Pos logit contributions | |
ARC | +0.084 |
ked | +0.079 |
ILA | +0.074 |
OVA | +0.073 |
pool | +0.070 |
Neg logit contributions | |
fid | -0.112 |
acci | -0.108 |
ank | -0.101 |
obey | -0.097 |
ihil | -0.096 |
Token | Richard |
Token ID | 6219 |
Feature activation | +3.05e-02 |
Pos logit contributions | |
ARC | +0.065 |
ked | +0.061 |
ILA | +0.057 |
OVA | +0.057 |
pool | +0.054 |
Neg logit contributions | |
fid | -0.076 |
acci | -0.073 |
ank | -0.068 |
obey | -0.065 |
ihil | -0.064 |
Token | Mull |
Token ID | 19574 |
Feature activation | -2.85e-01 |
Pos logit contributions | |
ARC | +0.022 |
ked | +0.021 |
ILA | +0.020 |
OVA | +0.019 |
pool | +0.019 |
Neg logit contributions | |
fid | -0.023 |
acci | -0.022 |
ank | -0.020 |
obey | -0.020 |
ihil | -0.019 |
Token | igan |
Token ID | 5516 |
Feature activation | -5.18e-01 |
Pos logit contributions | |
fid | +0.174 |
acci | +0.166 |
ank | +0.149 |
obey | +0.141 |
ihil | +0.139 |
Neg logit contributions | |
ARC | -0.248 |
ked | -0.235 |
ILA | -0.226 |
OVA | -0.225 |
Region | -0.217 |
Token |
|
Token ID | 198 |
Feature activation | +4.90e-02 |
Pos logit contributions | |
fid | +0.424 |
acci | +0.407 |
ank | +0.379 |
obey | +0.364 |
ihil | +0.360 |
Neg logit contributions | |
ARC | -0.342 |
ked | -0.320 |
ILA | -0.302 |
OVA | -0.299 |
pool | -0.285 |
Token |
|
Token ID | 198 |
Feature activation | +5.19e-02 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.030 |
ILA | +0.028 |
OVA | +0.028 |
pool | +0.027 |
Neg logit contributions | |
fid | -0.040 |
acci | -0.039 |
ank | -0.036 |
obey | -0.035 |
ihil | -0.034 |
Token | 1989 |
Token ID | 25475 |
Feature activation | -7.61e-02 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.035 |
OVA | +0.035 |
pool | +0.034 |
Neg logit contributions | |
fid | -0.037 |
acci | -0.036 |
ank | -0.033 |
obey | -0.031 |
ihil | -0.031 |
Token | Ted |
Token ID | 11396 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fid | +0.060 |
acci | +0.058 |
ank | +0.054 |
obey | +0.051 |
ihil | +0.051 |
Neg logit contributions | |
ARC | -0.052 |
ked | -0.049 |
ILA | -0.046 |
OVA | -0.046 |
pool | -0.044 |
Token | D |
Token ID | 360 |
Feature activation | +9.84e-02 |
Pos logit contributions | |
ARC | +0.069 |
ked | +0.065 |
ILA | +0.061 |
OVA | +0.061 |
pool | +0.058 |
Neg logit contributions | |
fid | -0.080 |
acci | -0.077 |
ank | -0.071 |
obey | -0.068 |
ihil | -0.068 |
Token | 46 |
Token ID | 3510 |
Feature activation | -6.62e-02 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.003 |
ank | +0.003 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.004 |
ked | -0.004 |
ILA | -0.003 |
OVA | -0.003 |
pool | -0.003 |
Token | "] |
Token ID | 8973 |
Feature activation | -4.39e-02 |
Pos logit contributions | |
fid | +0.047 |
acci | +0.044 |
ank | +0.041 |
obey | +0.039 |
ihil | +0.038 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.049 |
ILA | -0.046 |
OVA | -0.046 |
pool | -0.044 |
Token | [ |
Token ID | 685 |
Feature activation | +2.44e-02 |
Pos logit contributions | |
fid | +0.031 |
acci | +0.030 |
ank | +0.027 |
obey | +0.026 |
ihil | +0.026 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.032 |
ILA | -0.030 |
OVA | -0.030 |
kers | -0.029 |
Token | White |
Token ID | 12256 |
Feature activation | -1.58e-01 |
Pos logit contributions | |
ARC | +0.019 |
ked | +0.018 |
ILA | +0.017 |
OVA | +0.017 |
pool | +0.017 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | E |
Token ID | 36 |
Feature activation | -1.42e-01 |
Pos logit contributions | |
fid | +0.109 |
acci | +0.106 |
ank | +0.097 |
obey | +0.093 |
eeper | +0.092 |
Neg logit contributions | |
ARC | -0.124 |
ked | -0.116 |
OVA | -0.111 |
ILA | -0.110 |
Region | -0.106 |
Token | lo |
Token ID | 5439 |
Feature activation | -5.17e-01 |
Pos logit contributions | |
fid | +0.045 |
acci | +0.042 |
ank | +0.032 |
obey | +0.029 |
ihil | +0.029 |
Neg logit contributions | |
ARC | -0.164 |
ked | -0.157 |
ILA | -0.153 |
OVA | -0.151 |
pool | -0.149 |
Token | " |
Token ID | 366 |
Feature activation | +8.38e-03 |
Pos logit contributions | |
fid | +0.355 |
acci | +0.338 |
ank | +0.309 |
obey | +0.294 |
ihil | +0.290 |
Neg logit contributions | |
ARC | -0.410 |
ked | -0.388 |
ILA | -0.369 |
OVA | -0.367 |
pool | -0.354 |
Token | 25 |
Token ID | 1495 |
Feature activation | -4.68e-02 |
Pos logit contributions | |
ARC | +0.006 |
ked | +0.006 |
ILA | +0.006 |
OVA | +0.005 |
kers | +0.005 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.006 |
ank | -0.005 |
obey | -0.005 |
ihil | -0.005 |
Token | 56 |
Token ID | 3980 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
fid | +0.035 |
acci | +0.034 |
ank | +0.031 |
obey | +0.030 |
ihil | +0.029 |
Neg logit contributions | |
ARC | -0.034 |
ked | -0.032 |
ILA | -0.030 |
OVA | -0.030 |
Region | -0.029 |
Token | "] |
Token ID | 8973 |
Feature activation | -3.86e-02 |
Pos logit contributions | |
fid | +0.009 |
acci | +0.008 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.007 |
Neg logit contributions | |
ARC | -0.010 |
ked | -0.009 |
ILA | -0.009 |
OVA | -0.009 |
pool | -0.008 |
Token | [ |
Token ID | 685 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
fid | +0.028 |
acci | +0.027 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.029 |
ked | -0.028 |
ILA | -0.026 |
OVA | -0.026 |
pool | -0.025 |
Token | ka |
Token ID | 38387 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
fid | +0.078 |
acci | +0.074 |
ank | +0.069 |
obey | +0.066 |
ihil | +0.065 |
Neg logit contributions | |
ARC | -0.073 |
ked | -0.068 |
ILA | -0.064 |
OVA | -0.064 |
pool | -0.062 |
Token | mo |
Token ID | 6941 |
Feature activation | -4.30e-01 |
Pos logit contributions | |
fid | +0.102 |
acci | +0.097 |
ank | +0.090 |
obey | +0.086 |
ihil | +0.085 |
Neg logit contributions | |
ARC | -0.093 |
ked | -0.087 |
ILA | -0.082 |
OVA | -0.082 |
pool | -0.079 |
Token | � |
Token ID | 134 |
Feature activation | -6.22e-02 |
Pos logit contributions | |
fid | +0.341 |
acci | +0.326 |
ank | +0.304 |
obey | +0.291 |
ihil | +0.287 |
Neg logit contributions | |
ARC | -0.296 |
ked | -0.276 |
OVA | -0.261 |
ILA | -0.261 |
Region | -0.249 |
Token | � |
Token ID | 119 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
fid | +0.039 |
acci | +0.037 |
ank | +0.034 |
obey | +0.032 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.050 |
ILA | -0.048 |
OVA | -0.048 |
pool | -0.046 |
Token | ole |
Token ID | 2305 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
fid | +0.103 |
acci | +0.099 |
ank | +0.091 |
obey | +0.088 |
ihil | +0.087 |
Neg logit contributions | |
ARC | -0.093 |
ked | -0.087 |
ILA | -0.083 |
OVA | -0.082 |
pool | -0.079 |
Token | lo |
Token ID | 5439 |
Feature activation | -5.14e-01 |
Pos logit contributions | |
fid | +0.097 |
acci | +0.092 |
ank | +0.086 |
obey | +0.082 |
ihil | +0.081 |
Neg logit contributions | |
ARC | -0.090 |
ked | -0.084 |
ILA | -0.080 |
OVA | -0.079 |
pool | -0.076 |
Token | o |
Token ID | 267 |
Feature activation | +4.40e-02 |
Pos logit contributions | |
fid | +0.386 |
acci | +0.367 |
ank | +0.341 |
obey | +0.326 |
ihil | +0.321 |
Neg logit contributions | |
ARC | -0.376 |
ked | -0.352 |
ILA | -0.334 |
OVA | -0.332 |
pool | -0.319 |
Token | Kal |
Token ID | 12612 |
Feature activation | -1.49e-01 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.030 |
ILA | +0.028 |
OVA | +0.028 |
pool | +0.027 |
Neg logit contributions | |
fid | -0.033 |
acci | -0.032 |
ank | -0.029 |
obey | -0.028 |
ihil | -0.028 |
Token | ap |
Token ID | 499 |
Feature activation | +1.39e-01 |
Pos logit contributions | |
fid | +0.115 |
acci | +0.110 |
ank | +0.102 |
obey | +0.097 |
ihil | +0.097 |
Neg logit contributions | |
ARC | -0.107 |
ked | -0.100 |
ILA | -0.094 |
OVA | -0.094 |
Region | -0.090 |
Token | ana |
Token ID | 2271 |
Feature activation | -1.26e-01 |
Pos logit contributions | |
ARC | +0.105 |
ked | +0.099 |
ILA | +0.094 |
OVA | +0.093 |
pool | +0.090 |
Neg logit contributions | |
fid | -0.101 |
acci | -0.096 |
ank | -0.089 |
obey | -0.085 |
ihil | -0.084 |
Token | me |
Token ID | 502 |
Feature activation | +2.86e-02 |
Pos logit contributions | |
fid | +0.097 |
acci | +0.092 |
ank | +0.086 |
obey | +0.082 |
ihil | +0.081 |
Neg logit contributions | |
ARC | -0.089 |
ked | -0.084 |
ILA | -0.079 |
OVA | -0.079 |
pool | -0.076 |
Token |
|
Token ID | 198 |
Feature activation | +7.03e-02 |
Pos logit contributions | |
ARC | +0.096 |
ked | +0.090 |
ILA | +0.085 |
OVA | +0.084 |
pool | +0.080 |
Neg logit contributions | |
fid | -0.120 |
acci | -0.116 |
ank | -0.108 |
obey | -0.103 |
ihil | -0.102 |
Token |
|
Token ID | 198 |
Feature activation | +6.54e-02 |
Pos logit contributions | |
ARC | +0.046 |
ked | +0.043 |
ILA | +0.041 |
OVA | +0.040 |
pool | +0.038 |
Neg logit contributions | |
fid | -0.058 |
acci | -0.056 |
ank | -0.052 |
obey | -0.050 |
ihil | -0.049 |
Token | 1990 |
Token ID | 19891 |
Feature activation | +1.63e-02 |
Pos logit contributions | |
ARC | +0.047 |
ked | +0.045 |
ILA | +0.042 |
OVA | +0.042 |
kers | +0.040 |
Neg logit contributions | |
fid | -0.049 |
acci | -0.047 |
ank | -0.044 |
obey | -0.042 |
ihil | -0.041 |
Token | Richard |
Token ID | 6219 |
Feature activation | +2.96e-03 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.010 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.013 |
ank | -0.012 |
obey | -0.011 |
ihil | -0.011 |
Token | Mull |
Token ID | 19574 |
Feature activation | -3.03e-01 |
Pos logit contributions | |
ARC | +0.003 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.002 |
pool | +0.002 |
Neg logit contributions | |
fid | -0.002 |
acci | -0.002 |
ank | -0.002 |
obey | -0.001 |
ihil | -0.001 |
Token | igan |
Token ID | 5516 |
Feature activation | -5.12e-01 |
Pos logit contributions | |
fid | +0.095 |
acci | +0.084 |
ank | +0.070 |
obey | +0.060 |
ihil | +0.055 |
Neg logit contributions | |
ARC | -0.352 |
ked | -0.343 |
ILA | -0.329 |
OVA | -0.329 |
pool | -0.324 |
Token |
|
Token ID | 198 |
Feature activation | +4.28e-02 |
Pos logit contributions | |
fid | +0.431 |
acci | +0.414 |
ank | +0.386 |
obey | +0.371 |
ihil | +0.367 |
Neg logit contributions | |
ARC | -0.327 |
ked | -0.306 |
ILA | -0.287 |
OVA | -0.284 |
pool | -0.270 |
Token |
|
Token ID | 198 |
Feature activation | +4.51e-02 |
Pos logit contributions | |
ARC | +0.028 |
ked | +0.026 |
ILA | +0.025 |
OVA | +0.025 |
pool | +0.023 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.034 |
ank | -0.031 |
obey | -0.030 |
ihil | -0.030 |
Token | 1990 |
Token ID | 19891 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.031 |
ILA | +0.029 |
OVA | +0.029 |
kers | +0.027 |
Neg logit contributions | |
fid | -0.034 |
acci | -0.033 |
ank | -0.030 |
obey | -0.029 |
ihil | -0.029 |
Token | Craig |
Token ID | 13854 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.008 |
ILA | +0.007 |
OVA | +0.007 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.010 |
acci | -0.010 |
ank | -0.009 |
obey | -0.009 |
ihil | -0.009 |
Token | T |
Token ID | 309 |
Feature activation | +8.44e-02 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.007 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.007 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.007 |
Token | Earlier |
Token ID | 20635 |
Feature activation | -1.01e-01 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.017 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.015 |
ILA | -0.014 |
OVA | -0.014 |
pool | -0.013 |
Token | this |
Token ID | 428 |
Feature activation | +4.96e-02 |
Pos logit contributions | |
fid | +0.081 |
acci | +0.077 |
ank | +0.072 |
obey | +0.069 |
ihil | +0.068 |
Neg logit contributions | |
ARC | -0.068 |
ked | -0.063 |
ILA | -0.061 |
OVA | -0.061 |
Region | -0.057 |
Token | month |
Token ID | 1227 |
Feature activation | +2.79e-02 |
Pos logit contributions | |
ARC | +0.031 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.025 |
Neg logit contributions | |
fid | -0.042 |
acci | -0.041 |
ank | -0.038 |
obey | -0.037 |
ihil | -0.036 |
Token | , |
Token ID | 11 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
ARC | +0.019 |
ked | +0.018 |
ILA | +0.017 |
OVA | +0.017 |
Region | +0.016 |
Neg logit contributions | |
fid | -0.022 |
acci | -0.021 |
ank | -0.020 |
obey | -0.019 |
ihil | -0.019 |
Token | O |
Token ID | 440 |
Feature activation | -9.87e-03 |
Pos logit contributions | |
fid | +0.018 |
acci | +0.017 |
ank | +0.016 |
obey | +0.015 |
ihil | +0.015 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.015 |
ILA | -0.015 |
OVA | -0.015 |
Region | -0.014 |
Token | la |
Token ID | 5031 |
Feature activation | -5.08e-01 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.007 |
ked | -0.007 |
ILA | -0.006 |
OVA | -0.006 |
Region | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -3.67e-02 |
Pos logit contributions | |
fid | +0.390 |
acci | +0.372 |
ank | +0.346 |
obey | +0.330 |
ihil | +0.328 |
Neg logit contributions | |
ARC | -0.359 |
ked | -0.338 |
ILA | -0.321 |
OVA | -0.320 |
Region | -0.305 |
Token | a |
Token ID | 257 |
Feature activation | -2.21e-02 |
Pos logit contributions | |
fid | +0.028 |
acci | +0.027 |
ank | +0.025 |
obey | +0.024 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.026 |
ked | -0.025 |
ILA | -0.023 |
OVA | -0.023 |
pool | -0.022 |
Token | local |
Token ID | 1957 |
Feature activation | -8.99e-02 |
Pos logit contributions | |
fid | +0.017 |
acci | +0.016 |
ank | +0.015 |
obey | +0.014 |
ihil | +0.014 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.015 |
ILA | -0.014 |
OVA | -0.014 |
Region | -0.013 |
Token | taxi |
Token ID | 17536 |
Feature activation | -1.13e-04 |
Pos logit contributions | |
fid | +0.073 |
acci | +0.069 |
ank | +0.065 |
obey | +0.062 |
ihil | +0.061 |
Neg logit contributions | |
ARC | -0.060 |
ked | -0.057 |
ILA | -0.054 |
OVA | -0.053 |
Region | -0.051 |
Token | aggreg |
Token ID | 13262 |
Feature activation | -1.32e-01 |
Pos logit contributions | |
fid | +0.000 |
acci | +0.000 |
ank | +0.000 |
obey | +0.000 |
obe | +0.000 |
Neg logit contributions | |
ARC | -0.000 |
ked | -0.000 |
ILA | -0.000 |
OVA | -0.000 |
Region | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +6.69e-02 |
Pos logit contributions | |
ARC | +0.098 |
ked | +0.092 |
ILA | +0.086 |
OVA | +0.085 |
pool | +0.081 |
Neg logit contributions | |
fid | -0.124 |
acci | -0.119 |
ank | -0.111 |
obey | -0.106 |
ihil | -0.105 |
Token |
|
Token ID | 198 |
Feature activation | +5.71e-02 |
Pos logit contributions | |
ARC | +0.044 |
ked | +0.041 |
ILA | +0.039 |
OVA | +0.038 |
pool | +0.037 |
Neg logit contributions | |
fid | -0.055 |
acci | -0.053 |
ank | -0.049 |
obey | -0.047 |
ihil | -0.047 |
Token | 1991 |
Token ID | 24529 |
Feature activation | -3.81e-03 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.035 |
OVA | +0.035 |
kers | +0.033 |
Neg logit contributions | |
fid | -0.045 |
acci | -0.043 |
ank | -0.040 |
obey | -0.038 |
ihil | -0.038 |
Token | Richard |
Token ID | 6219 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
fid | +0.003 |
acci | +0.003 |
ank | +0.003 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.003 |
ked | -0.002 |
ILA | -0.002 |
OVA | -0.002 |
pool | -0.002 |
Token | Mull |
Token ID | 19574 |
Feature activation | -2.92e-01 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.016 |
OVA | +0.016 |
pool | +0.015 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.005 |
ank | -0.004 |
obey | -0.004 |
ihil | -0.004 |
Token | igan |
Token ID | 5516 |
Feature activation | -5.07e-01 |
Pos logit contributions | |
fid | +0.088 |
acci | +0.078 |
ank | +0.064 |
obey | +0.055 |
ihil | +0.051 |
Neg logit contributions | |
ARC | -0.344 |
ked | -0.333 |
ILA | -0.321 |
OVA | -0.320 |
pool | -0.314 |
Token |
|
Token ID | 198 |
Feature activation | +3.86e-02 |
Pos logit contributions | |
fid | +0.429 |
acci | +0.412 |
ank | +0.384 |
obey | +0.370 |
ihil | +0.366 |
Neg logit contributions | |
ARC | -0.321 |
ked | -0.299 |
ILA | -0.282 |
OVA | -0.278 |
pool | -0.264 |
Token |
|
Token ID | 198 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
ARC | +0.025 |
ked | +0.024 |
ILA | +0.022 |
OVA | +0.022 |
pool | +0.021 |
Neg logit contributions | |
fid | -0.032 |
acci | -0.030 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.027 |
Token | 1991 |
Token ID | 24529 |
Feature activation | +9.38e-04 |
Pos logit contributions | |
ARC | +0.024 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.021 |
kers | +0.020 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.026 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.023 |
Token | Craig |
Token ID | 13854 |
Feature activation | +3.20e-03 |
Pos logit contributions | |
ARC | +0.001 |
ked | +0.001 |
ILA | +0.001 |
OVA | +0.001 |
pool | +0.001 |
Neg logit contributions | |
fid | -0.001 |
acci | -0.001 |
ank | -0.001 |
obey | -0.001 |
ihil | -0.001 |
Token | T |
Token ID | 309 |
Feature activation | +9.25e-02 |
Pos logit contributions | |
ARC | +0.002 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.001 |
pool | +0.001 |
Neg logit contributions | |
fid | -0.003 |
acci | -0.003 |
ank | -0.003 |
obey | -0.003 |
ihil | -0.003 |
Token | to |
Token ID | 284 |
Feature activation | -5.42e-02 |
Pos logit contributions | |
ARC | +0.035 |
ked | +0.033 |
ILA | +0.032 |
OVA | +0.032 |
pool | +0.030 |
Neg logit contributions | |
fid | -0.032 |
acci | -0.031 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.026 |
Token | Goodell |
Token ID | 41648 |
Feature activation | -2.95e-02 |
Pos logit contributions | |
fid | +0.042 |
acci | +0.040 |
ank | +0.037 |
obey | +0.036 |
ihil | +0.035 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.034 |
pool | -0.032 |
Token | Comments |
Token ID | 19502 |
Feature activation | +4.36e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.020 |
obey | +0.019 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.021 |
ked | -0.020 |
ILA | -0.019 |
OVA | -0.019 |
Region | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | -2.84e-02 |
Pos logit contributions | |
ARC | +0.029 |
ked | +0.027 |
ILA | +0.026 |
OVA | +0.026 |
pool | +0.024 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.034 |
ank | -0.032 |
obey | -0.030 |
ihil | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.023 |
ank | +0.021 |
obey | +0.020 |
ihil | +0.020 |
Neg logit contributions | |
ARC | -0.019 |
ked | -0.017 |
ILA | -0.016 |
OVA | -0.016 |
pool | -0.015 |
Token | NFL |
Token ID | 32078 |
Feature activation | -5.06e-01 |
Pos logit contributions | |
fid | +0.026 |
acci | +0.025 |
ank | +0.023 |
obey | +0.022 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.023 |
ked | -0.021 |
ILA | -0.020 |
OVA | -0.020 |
kers | -0.019 |
Token | Players |
Token ID | 13094 |
Feature activation | -5.44e-02 |
Pos logit contributions | |
fid | +0.387 |
acci | +0.368 |
ank | +0.341 |
obey | +0.327 |
ihil | +0.321 |
Neg logit contributions | |
ARC | -0.362 |
ked | -0.340 |
OVA | -0.321 |
ILA | -0.321 |
pool | -0.306 |
Token | v |
Token ID | 410 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
fid | +0.042 |
acci | +0.040 |
ank | +0.037 |
obey | +0.036 |
ihil | +0.035 |
Neg logit contributions | |
ARC | -0.039 |
ked | -0.036 |
OVA | -0.034 |
ILA | -0.034 |
pool | -0.033 |
Token | . |
Token ID | 13 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.017 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.015 |
ked | -0.014 |
ILA | -0.013 |
OVA | -0.013 |
pool | -0.013 |
Token | NFL |
Token ID | 5134 |
Feature activation | -1.18e-01 |
Pos logit contributions | |
fid | +0.037 |
acci | +0.036 |
ank | +0.033 |
obey | +0.031 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.034 |
pool | -0.033 |
Token | Key |
Token ID | 7383 |
Feature activation | -8.58e-02 |
Pos logit contributions | |
fid | +0.095 |
acci | +0.092 |
ank | +0.085 |
obey | +0.082 |
ihil | +0.081 |
Neg logit contributions | |
ARC | -0.079 |
ked | -0.074 |
ILA | -0.070 |
OVA | -0.070 |
pool | -0.067 |
Token | about |
Token ID | 546 |
Feature activation | -4.15e-02 |
Pos logit contributions | |
ARC | +0.037 |
ked | +0.034 |
OVA | +0.032 |
ILA | +0.032 |
Region | +0.031 |
Neg logit contributions | |
fid | -0.041 |
acci | -0.039 |
ank | -0.036 |
obey | -0.035 |
ihil | -0.034 |
Token | this |
Token ID | 428 |
Feature activation | +4.07e-02 |
Pos logit contributions | |
fid | +0.033 |
acci | +0.031 |
ank | +0.029 |
obey | +0.028 |
obe | +0.027 |
Neg logit contributions | |
ARC | -0.029 |
ked | -0.027 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.024 |
Token | fish |
Token ID | 5916 |
Feature activation | +2.99e-01 |
Pos logit contributions | |
ARC | +0.028 |
ked | +0.027 |
ILA | +0.025 |
OVA | +0.025 |
pool | +0.024 |
Neg logit contributions | |
fid | -0.032 |
acci | -0.031 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.027 |
Token | - |
Token ID | 12 |
Feature activation | +4.37e-02 |
Pos logit contributions | |
ARC | +0.205 |
ked | +0.191 |
ILA | +0.181 |
OVA | +0.180 |
Region | +0.171 |
Neg logit contributions | |
fid | -0.239 |
acci | -0.229 |
ank | -0.213 |
obey | -0.204 |
ihil | -0.201 |
Token | tra |
Token ID | 9535 |
Feature activation | -2.17e-01 |
Pos logit contributions | |
ARC | +0.029 |
ked | +0.027 |
ILA | +0.026 |
OVA | +0.026 |
Region | +0.024 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.034 |
ank | -0.032 |
obey | -0.030 |
ihil | -0.030 |
Token | umat |
Token ID | 27798 |
Feature activation | -5.06e-01 |
Pos logit contributions | |
fid | +0.190 |
acci | +0.183 |
ank | +0.171 |
obey | +0.164 |
ihil | +0.163 |
Neg logit contributions | |
ARC | -0.131 |
ked | -0.120 |
ILA | -0.114 |
OVA | -0.114 |
Region | -0.108 |
Token | izing |
Token ID | 2890 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
fid | +0.293 |
acci | +0.277 |
ank | +0.249 |
obey | +0.235 |
ihil | +0.231 |
Neg logit contributions | |
ARC | -0.455 |
ked | -0.433 |
ILA | -0.415 |
OVA | -0.413 |
pool | -0.399 |
Token | f |
Token ID | 277 |
Feature activation | -5.22e-02 |
Pos logit contributions | |
fid | +0.122 |
acci | +0.117 |
ank | +0.110 |
obey | +0.105 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.103 |
ked | -0.095 |
ILA | -0.091 |
OVA | -0.090 |
pool | -0.086 |
Token | auc |
Token ID | 14272 |
Feature activation | +9.70e-02 |
Pos logit contributions | |
fid | +0.048 |
acci | +0.046 |
ank | +0.043 |
obey | +0.042 |
ihil | +0.041 |
Neg logit contributions | |
ARC | -0.029 |
ked | -0.027 |
ILA | -0.025 |
OVA | -0.025 |
Region | -0.024 |
Token | et |
Token ID | 316 |
Feature activation | -2.56e-01 |
Pos logit contributions | |
ARC | +0.086 |
ked | +0.083 |
ILA | +0.079 |
OVA | +0.078 |
pool | +0.076 |
Neg logit contributions | |
fid | -0.057 |
acci | -0.054 |
ank | -0.049 |
obey | -0.046 |
ihil | -0.045 |
Token | . |
Token ID | 13 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
fid | +0.205 |
acci | +0.195 |
ank | +0.183 |
obey | +0.176 |
ihil | +0.172 |
Neg logit contributions | |
ARC | -0.176 |
ked | -0.164 |
ILA | -0.156 |
OVA | -0.155 |
Region | -0.147 |
Token | fy |
Token ID | 24928 |
Feature activation | +8.58e-02 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.035 |
OVA | +0.034 |
pool | +0.033 |
Neg logit contributions | |
fid | -0.048 |
acci | -0.046 |
ank | -0.043 |
obey | -0.041 |
ihil | -0.041 |
Token | ( |
Token ID | 357 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
ARC | +0.060 |
ked | +0.057 |
ILA | +0.054 |
OVA | +0.053 |
pool | +0.051 |
Neg logit contributions | |
fid | -0.066 |
acci | -0.064 |
ank | -0.059 |
obey | -0.057 |
ihil | -0.056 |
Token | pre |
Token ID | 3866 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
fid | +0.103 |
acci | +0.099 |
ank | +0.091 |
obey | +0.087 |
ihil | +0.086 |
Neg logit contributions | |
ARC | -0.098 |
ked | -0.092 |
ILA | -0.087 |
OVA | -0.087 |
kers | -0.083 |
Token | viously |
Token ID | 8647 |
Feature activation | +1.69e-02 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.010 |
ank | +0.010 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
Region | -0.007 |
Token | Sci |
Token ID | 10286 |
Feature activation | +1.19e-01 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.010 |
ILA | +0.010 |
OVA | +0.010 |
Region | +0.009 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.013 |
ank | -0.012 |
obey | -0.012 |
ihil | -0.012 |
Token | Fi |
Token ID | 10547 |
Feature activation | -5.04e-01 |
Pos logit contributions | |
ARC | +0.103 |
ked | +0.098 |
OVA | +0.093 |
ILA | +0.093 |
pool | +0.090 |
Neg logit contributions | |
fid | -0.073 |
acci | -0.068 |
ank | -0.062 |
obey | -0.059 |
ihil | -0.058 |
Token | ) |
Token ID | 8 |
Feature activation | -4.47e-02 |
Pos logit contributions | |
fid | +0.390 |
acci | +0.373 |
ank | +0.346 |
obey | +0.332 |
ihil | +0.328 |
Neg logit contributions | |
ARC | -0.355 |
ked | -0.334 |
ILA | -0.316 |
OVA | -0.313 |
pool | -0.300 |
Token | re |
Token ID | 302 |
Feature activation | -8.72e-03 |
Pos logit contributions | |
fid | +0.034 |
acci | +0.033 |
ank | +0.031 |
obey | +0.029 |
ihil | +0.029 |
Neg logit contributions | |
ARC | -0.032 |
ked | -0.030 |
ILA | -0.028 |
OVA | -0.028 |
pool | -0.027 |
Token | brand |
Token ID | 17938 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.005 |
ILA | -0.005 |
OVA | -0.005 |
Region | -0.004 |
Token | in |
Token ID | 287 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ARC | +0.104 |
ked | +0.098 |
ILA | +0.093 |
OVA | +0.093 |
pool | +0.089 |
Neg logit contributions | |
fid | -0.105 |
acci | -0.100 |
ank | -0.093 |
obey | -0.088 |
ihil | -0.087 |
Token | 2009 |
Token ID | 3717 |
Feature activation | -7.61e-02 |
Pos logit contributions | |
fid | +0.016 |
acci | +0.015 |
ank | +0.014 |
obey | +0.014 |
ihil | +0.013 |
Neg logit contributions | |
ARC | -0.012 |
ked | -0.011 |
ILA | -0.011 |
OVA | -0.011 |
pool | -0.010 |
Token | DEN |
Token ID | 37692 |
Feature activation | +2.97e-01 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.011 |
ked | -0.010 |
ILA | -0.010 |
OVA | -0.010 |
pool | -0.009 |
Token | R |
Token ID | 49 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
ARC | +0.183 |
ked | +0.171 |
ILA | +0.160 |
OVA | +0.159 |
pool | +0.151 |
Neg logit contributions | |
fid | -0.255 |
acci | -0.246 |
ank | -0.229 |
obey | -0.221 |
ihil | -0.219 |
Token | Secretary |
Token ID | 4986 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
fid | +0.012 |
acci | +0.011 |
ank | +0.010 |
obey | +0.010 |
ihil | +0.010 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
OVA | -0.012 |
ILA | -0.012 |
kers | -0.012 |
Token | Sk |
Token ID | 3661 |
Feature activation | -1.50e-01 |
Pos logit contributions | |
fid | +0.134 |
acci | +0.128 |
ank | +0.119 |
obey | +0.114 |
ihil | +0.113 |
Neg logit contributions | |
ARC | -0.117 |
ked | -0.110 |
OVA | -0.104 |
ILA | -0.103 |
Region | -0.098 |
Token | var |
Token ID | 7785 |
Feature activation | -1.16e-01 |
Pos logit contributions | |
fid | +0.110 |
acci | +0.105 |
ank | +0.097 |
obey | +0.093 |
ihil | +0.091 |
Neg logit contributions | |
ARC | -0.111 |
ked | -0.106 |
ILA | -0.099 |
OVA | -0.099 |
pool | -0.095 |
Token | la |
Token ID | 5031 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
fid | +0.088 |
acci | +0.085 |
ank | +0.078 |
obey | +0.075 |
ihil | +0.074 |
Neg logit contributions | |
ARC | -0.083 |
ked | -0.078 |
ILA | -0.074 |
OVA | -0.074 |
Region | -0.070 |
Token | made |
Token ID | 925 |
Feature activation | +6.46e-02 |
Pos logit contributions | |
fid | +0.381 |
acci | +0.363 |
ank | +0.335 |
obey | +0.320 |
ihil | +0.317 |
Neg logit contributions | |
ARC | -0.364 |
ked | -0.342 |
OVA | -0.325 |
ILA | -0.324 |
Region | -0.309 |
Token | it |
Token ID | 340 |
Feature activation | -3.80e-02 |
Pos logit contributions | |
ARC | +0.046 |
ked | +0.043 |
ILA | +0.041 |
OVA | +0.040 |
pool | +0.039 |
Neg logit contributions | |
fid | -0.050 |
acci | -0.048 |
ank | -0.044 |
obey | -0.042 |
ihil | -0.042 |
Token | clear |
Token ID | 1598 |
Feature activation | -5.05e-02 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.025 |
ank | +0.023 |
obey | +0.022 |
ihil | +0.022 |
Neg logit contributions | |
ARC | -0.030 |
ked | -0.028 |
ILA | -0.027 |
OVA | -0.027 |
pool | -0.025 |
Token | that |
Token ID | 326 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
fid | +0.037 |
acci | +0.035 |
ank | +0.032 |
obey | +0.031 |
ihil | +0.030 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.034 |
kers | -0.032 |
Token | Good |
Token ID | 4599 |
Feature activation | +1.92e-01 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.009 |
ank | +0.009 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.009 |
ked | -0.009 |
ILA | -0.008 |
OVA | -0.008 |
pool | -0.008 |
Token | b |
Token ID | 275 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
ARC | +0.067 |
ked | +0.063 |
ILA | +0.060 |
OVA | +0.059 |
pool | +0.057 |
Neg logit contributions | |
fid | -0.073 |
acci | -0.070 |
ank | -0.065 |
obey | -0.062 |
ihil | -0.061 |
Token | ikers |
Token ID | 24913 |
Feature activation | +2.45e-01 |
Pos logit contributions | |
ARC | +0.012 |
ked | +0.011 |
ILA | +0.011 |
OVA | +0.011 |
Region | +0.010 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.017 |
obey | -0.017 |
ihil | -0.016 |
Token | dislike |
Token ID | 23109 |
Feature activation | +2.04e-01 |
Pos logit contributions | |
ARC | +0.172 |
ked | +0.161 |
ILA | +0.153 |
OVA | +0.152 |
pool | +0.145 |
Neg logit contributions | |
fid | -0.190 |
acci | -0.182 |
ank | -0.169 |
obey | -0.162 |
ihil | -0.159 |
Token | the |
Token ID | 262 |
Feature activation | +2.59e-02 |
Pos logit contributions | |
ARC | +0.145 |
ked | +0.137 |
ILA | +0.128 |
OVA | +0.128 |
pool | +0.123 |
Neg logit contributions | |
fid | -0.157 |
acci | -0.151 |
ank | -0.139 |
obey | -0.133 |
ihil | -0.132 |
Token | st |
Token ID | 336 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
ARC | +0.019 |
ked | +0.018 |
ILA | +0.017 |
OVA | +0.017 |
pool | +0.016 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.019 |
ank | -0.017 |
obey | -0.016 |
ihil | -0.016 |
Token | eeper |
Token ID | 41278 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
ARC | +0.146 |
ked | +0.142 |
ILA | +0.136 |
OVA | +0.136 |
pool | +0.134 |
Neg logit contributions | |
fid | -0.021 |
acci | -0.017 |
ank | -0.012 |
obey | -0.008 |
ihil | -0.007 |
Token | paths |
Token ID | 13532 |
Feature activation | -1.67e-01 |
Pos logit contributions | |
fid | +0.348 |
acci | +0.332 |
ank | +0.304 |
obey | +0.290 |
ihil | +0.286 |
Neg logit contributions | |
ARC | -0.396 |
ked | -0.375 |
ILA | -0.356 |
OVA | -0.354 |
pool | -0.341 |
Token | up |
Token ID | 510 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
fid | +0.132 |
acci | +0.126 |
ank | +0.117 |
obey | +0.112 |
ihil | +0.111 |
Neg logit contributions | |
ARC | -0.115 |
ked | -0.109 |
ILA | -0.102 |
OVA | -0.102 |
pool | -0.097 |
Token | to |
Token ID | 284 |
Feature activation | -5.06e-02 |
Pos logit contributions | |
fid | +0.014 |
acci | +0.014 |
ank | +0.013 |
obey | +0.012 |
ihil | +0.012 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.012 |
OVA | -0.012 |
pool | -0.012 |
Token | Lynd |
Token ID | 33561 |
Feature activation | -6.72e-02 |
Pos logit contributions | |
fid | +0.038 |
acci | +0.037 |
ank | +0.034 |
obey | +0.032 |
ihil | +0.032 |
Neg logit contributions | |
ARC | -0.037 |
ked | -0.035 |
ILA | -0.033 |
OVA | -0.033 |
pool | -0.031 |
Token | ale |
Token ID | 1000 |
Feature activation | -1.28e-01 |
Pos logit contributions | |
fid | +0.047 |
acci | +0.045 |
ank | +0.042 |
obey | +0.040 |
ihil | +0.039 |
Neg logit contributions | |
ARC | -0.052 |
ked | -0.050 |
ILA | -0.047 |
OVA | -0.047 |
pool | -0.045 |
Token | v |
Token ID | 410 |
Feature activation | -4.68e-02 |
Pos logit contributions | |
fid | +0.015 |
acci | +0.014 |
ank | +0.013 |
obey | +0.013 |
ihil | +0.012 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.012 |
OVA | -0.012 |
pool | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -4.59e-02 |
Pos logit contributions | |
fid | +0.039 |
acci | +0.037 |
ank | +0.035 |
obey | +0.033 |
ihil | +0.033 |
Neg logit contributions | |
ARC | -0.031 |
ked | -0.029 |
ILA | -0.027 |
OVA | -0.027 |
pool | -0.026 |
Token | NFL |
Token ID | 5134 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
fid | +0.033 |
acci | +0.032 |
ank | +0.029 |
obey | +0.028 |
ihil | +0.027 |
Neg logit contributions | |
ARC | -0.035 |
ked | -0.033 |
ILA | -0.031 |
OVA | -0.031 |
pool | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | -5.47e-02 |
Pos logit contributions | |
fid | +0.082 |
acci | +0.079 |
ank | +0.073 |
obey | +0.069 |
ihil | +0.068 |
Neg logit contributions | |
ARC | -0.081 |
ked | -0.077 |
ILA | -0.073 |
OVA | -0.072 |
pool | -0.069 |
Token |
|
Token ID | 198 |
Feature activation | -5.67e-02 |
Pos logit contributions | |
fid | +0.045 |
acci | +0.043 |
ank | +0.040 |
obey | +0.039 |
ihil | +0.038 |
Neg logit contributions | |
ARC | -0.036 |
ked | -0.033 |
ILA | -0.031 |
OVA | -0.031 |
pool | -0.030 |
Token | NFL |
Token ID | 32078 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
fid | +0.043 |
acci | +0.041 |
ank | +0.038 |
obey | +0.036 |
ihil | +0.036 |
Neg logit contributions | |
ARC | -0.041 |
ked | -0.038 |
ILA | -0.036 |
OVA | -0.036 |
kers | -0.035 |
Token | PA |
Token ID | 4537 |
Feature activation | -8.39e-02 |
Pos logit contributions | |
fid | +0.395 |
acci | +0.377 |
ank | +0.350 |
obey | +0.335 |
ihil | +0.330 |
Neg logit contributions | |
ARC | -0.350 |
ked | -0.329 |
OVA | -0.310 |
ILA | -0.310 |
Region | -0.295 |
Token | ( |
Token ID | 357 |
Feature activation | -9.98e-02 |
Pos logit contributions | |
fid | +0.063 |
acci | +0.060 |
ank | +0.056 |
obey | +0.054 |
ihil | +0.053 |
Neg logit contributions | |
ARC | -0.061 |
ked | -0.057 |
OVA | -0.054 |
ILA | -0.054 |
pool | -0.052 |
Token | on |
Token ID | 261 |
Feature activation | -2.42e-01 |
Pos logit contributions | |
fid | +0.072 |
acci | +0.069 |
ank | +0.064 |
obey | +0.061 |
ihil | +0.060 |
Neg logit contributions | |
ARC | -0.075 |
ked | -0.071 |
ILA | -0.067 |
OVA | -0.067 |
pool | -0.064 |
Token | behalf |
Token ID | 8378 |
Feature activation | -1.83e-01 |
Pos logit contributions | |
fid | +0.155 |
acci | +0.146 |
ank | +0.134 |
obey | +0.127 |
ihil | +0.124 |
Neg logit contributions | |
ARC | -0.204 |
ked | -0.192 |
OVA | -0.184 |
ILA | -0.184 |
Region | -0.177 |
Token | of |
Token ID | 286 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
fid | +0.145 |
acci | +0.139 |
ank | +0.129 |
obey | +0.124 |
ihil | +0.122 |
Neg logit contributions | |
ARC | -0.126 |
ked | -0.118 |
ILA | -0.111 |
OVA | -0.111 |
pool | -0.106 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.010 |
ank | +0.009 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.008 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.007 |
Token | WH |
Token ID | 12418 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fid | +0.034 |
acci | +0.032 |
ank | +0.030 |
obey | +0.029 |
ihil | +0.029 |
Neg logit contributions | |
ARC | -0.028 |
ked | -0.026 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.024 |
Token | EN |
Token ID | 1677 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ARC | +0.061 |
ked | +0.058 |
OVA | +0.053 |
ILA | +0.053 |
pool | +0.051 |
Neg logit contributions | |
fid | -0.088 |
acci | -0.084 |
ank | -0.079 |
obey | -0.076 |
ihil | -0.075 |
Token | Catherine |
Token ID | 22578 |
Feature activation | +1.35e-01 |
Pos logit contributions | |
ARC | +0.097 |
ked | +0.091 |
ILA | +0.086 |
OVA | +0.086 |
pool | +0.082 |
Neg logit contributions | |
fid | -0.103 |
acci | -0.098 |
ank | -0.091 |
obey | -0.088 |
ihil | -0.086 |
Token | Mull |
Token ID | 19574 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
ARC | +0.098 |
ked | +0.093 |
ILA | +0.087 |
OVA | +0.087 |
pool | +0.083 |
Neg logit contributions | |
fid | -0.101 |
acci | -0.097 |
ank | -0.090 |
obey | -0.086 |
ihil | -0.085 |
Token | igan |
Token ID | 5516 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
fid | +0.137 |
acci | +0.130 |
ank | +0.118 |
obey | +0.112 |
ihil | +0.110 |
Neg logit contributions | |
ARC | -0.175 |
ked | -0.166 |
ILA | -0.159 |
OVA | -0.158 |
Region | -0.152 |
Token | , |
Token ID | 11 |
Feature activation | +2.33e-02 |
Pos logit contributions | |
fid | +0.393 |
acci | +0.376 |
ank | +0.348 |
obey | +0.333 |
ihil | +0.329 |
Neg logit contributions | |
ARC | -0.349 |
ked | -0.329 |
ILA | -0.311 |
OVA | -0.308 |
Region | -0.295 |
Token | a |
Token ID | 257 |
Feature activation | -1.77e-02 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.018 |
acci | -0.017 |
ank | -0.016 |
obey | -0.015 |
ihil | -0.015 |
Token | part |
Token ID | 636 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
fid | +0.013 |
acci | +0.013 |
ank | +0.012 |
obey | +0.011 |
ihil | +0.011 |
Neg logit contributions | |
ARC | -0.013 |
ked | -0.012 |
ILA | -0.011 |
OVA | -0.011 |
pool | -0.011 |
Token | - |
Token ID | 12 |
Feature activation | +5.69e-02 |
Pos logit contributions | |
ARC | +0.016 |
ked | +0.014 |
ILA | +0.013 |
OVA | +0.013 |
Region | +0.012 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.027 |
ank | -0.025 |
obey | -0.025 |
ihil | -0.024 |
Token | time |
Token ID | 2435 |
Feature activation | -2.41e-01 |
Pos logit contributions | |
ARC | +0.051 |
ked | +0.049 |
ILA | +0.046 |
OVA | +0.046 |
pool | +0.045 |
Neg logit contributions | |
fid | -0.033 |
acci | -0.031 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.026 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
fid | +0.036 |
acci | +0.035 |
ank | +0.032 |
obey | +0.031 |
ihil | +0.030 |
Neg logit contributions | |
ARC | -0.034 |
ked | -0.032 |
ILA | -0.030 |
OVA | -0.030 |
pool | -0.029 |
Token | his |
Token ID | 465 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.011 |
ank | +0.010 |
obey | +0.010 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.010 |
ked | -0.009 |
ILA | -0.009 |
OVA | -0.009 |
pool | -0.008 |
Token | recent |
Token ID | 2274 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
ARC | +0.073 |
ked | +0.069 |
ILA | +0.065 |
OVA | +0.065 |
Region | +0.062 |
Neg logit contributions | |
fid | -0.079 |
acci | -0.075 |
ank | -0.069 |
obey | -0.066 |
ihil | -0.065 |
Token | town |
Token ID | 3240 |
Feature activation | +3.71e-02 |
Pos logit contributions | |
ARC | +0.024 |
ked | +0.023 |
ILA | +0.022 |
OVA | +0.022 |
Region | +0.021 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.025 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.022 |
Token | - |
Token ID | 12 |
Feature activation | +1.96e-02 |
Pos logit contributions | |
ARC | +0.027 |
ked | +0.026 |
ILA | +0.024 |
OVA | +0.024 |
kers | +0.023 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.026 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.023 |
Token | hall |
Token ID | 18323 |
Feature activation | -5.01e-01 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.021 |
kers | +0.021 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.005 |
ank | -0.004 |
obey | -0.004 |
ihil | -0.003 |
Token | response |
Token ID | 2882 |
Feature activation | +1.31e-01 |
Pos logit contributions | |
fid | +0.433 |
acci | +0.413 |
ank | +0.388 |
obey | +0.373 |
ihil | +0.369 |
Neg logit contributions | |
ARC | -0.309 |
ked | -0.289 |
OVA | -0.270 |
ILA | -0.270 |
Region | -0.254 |
Token | to |
Token ID | 284 |
Feature activation | -7.44e-02 |
Pos logit contributions | |
ARC | +0.096 |
ked | +0.090 |
ILA | +0.086 |
OVA | +0.086 |
pool | +0.082 |
Neg logit contributions | |
fid | -0.097 |
acci | -0.092 |
ank | -0.086 |
obey | -0.082 |
ihil | -0.081 |
Token | a |
Token ID | 257 |
Feature activation | -4.66e-02 |
Pos logit contributions | |
fid | +0.057 |
acci | +0.054 |
ank | +0.050 |
obey | +0.048 |
ihil | +0.047 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.050 |
OVA | -0.048 |
ILA | -0.048 |
pool | -0.045 |
Token | man |
Token ID | 582 |
Feature activation | -4.43e-02 |
Pos logit contributions | |
fid | +0.036 |
acci | +0.034 |
ank | +0.032 |
obey | +0.030 |
ihil | +0.030 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.031 |
ILA | -0.030 |
OVA | -0.030 |
pool | -0.028 |
Token | who |
Token ID | 508 |
Feature activation | -4.25e-02 |
Pos logit contributions | |
fid | +0.033 |
acci | +0.031 |
ank | +0.029 |
obey | +0.027 |
ihil | +0.027 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.031 |
ILA | -0.029 |
OVA | -0.029 |
Region | -0.028 |
Token | p |
Token ID | 79 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
pool | +0.006 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.006 |
ank | -0.005 |
obey | -0.005 |
ihil | -0.005 |
Token | ren |
Token ID | 918 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
ARC | +0.020 |
ked | +0.019 |
ILA | +0.018 |
OVA | +0.018 |
pool | +0.017 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.016 |
obey | -0.016 |
ihil | -0.015 |
Token | ant |
Token ID | 415 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
ARC | +0.160 |
ked | +0.151 |
ILA | +0.143 |
OVA | +0.142 |
pool | +0.137 |
Neg logit contributions | |
fid | -0.159 |
acci | -0.152 |
ank | -0.140 |
obey | -0.134 |
ihil | -0.132 |
Token | que |
Token ID | 8358 |
Feature activation | -1.09e-02 |
Pos logit contributions | |
fid | +0.099 |
acci | +0.095 |
ank | +0.088 |
obey | +0.084 |
ihil | +0.083 |
Neg logit contributions | |
ARC | -0.103 |
ked | -0.097 |
ILA | -0.092 |
OVA | -0.091 |
pool | -0.088 |
Token | tr |
Token ID | 491 |
Feature activation | +4.53e-02 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.007 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.008 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.007 |
Token | iste |
Token ID | 40833 |
Feature activation | -4.96e-01 |
Pos logit contributions | |
ARC | +0.026 |
ked | +0.024 |
ILA | +0.023 |
OVA | +0.022 |
pool | +0.021 |
Neg logit contributions | |
fid | -0.041 |
acci | -0.039 |
ank | -0.037 |
obey | -0.036 |
ihil | -0.035 |
Token | . |
Token ID | 13 |
Feature activation | -5.02e-02 |
Pos logit contributions | |
fid | +0.364 |
acci | +0.347 |
ank | +0.320 |
obey | +0.306 |
ihil | +0.301 |
Neg logit contributions | |
ARC | -0.371 |
ked | -0.351 |
ILA | -0.332 |
OVA | -0.331 |
pool | -0.317 |
Token | J |
Token ID | 41 |
Feature activation | -1.27e-01 |
Pos logit contributions | |
fid | +0.039 |
acci | +0.037 |
ank | +0.034 |
obey | +0.033 |
ihil | +0.032 |
Neg logit contributions | |
ARC | -0.036 |
ked | -0.034 |
ILA | -0.032 |
OVA | -0.032 |
pool | -0.030 |
Token | ' |
Token ID | 6 |
Feature activation | -1.22e-01 |
Pos logit contributions | |
fid | +0.094 |
acci | +0.090 |
ank | +0.083 |
obey | +0.080 |
ihil | +0.078 |
Neg logit contributions | |
ARC | -0.093 |
ked | -0.088 |
ILA | -0.083 |
OVA | -0.083 |
pool | -0.079 |
Token | ai |
Token ID | 1872 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
fid | +0.095 |
acci | +0.092 |
ank | +0.084 |
obey | +0.081 |
ihil | +0.080 |
Neg logit contributions | |
ARC | -0.086 |
ked | -0.081 |
ILA | -0.076 |
OVA | -0.075 |
Region | -0.072 |
Token | l |
Token ID | 300 |
Feature activation | -2.09e-02 |
Pos logit contributions | |
ARC | +0.013 |
ked | +0.012 |
ILA | +0.011 |
OVA | +0.011 |
pool | +0.011 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.012 |
ank | -0.011 |
obey | -0.011 |
ihil | -0.011 |
Token | ple |
Token ID | 1154 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
fid | +0.202 |
acci | +0.195 |
ank | +0.184 |
obey | +0.177 |
ihil | +0.176 |
Neg logit contributions | |
ARC | -0.111 |
ked | -0.102 |
OVA | -0.095 |
ILA | -0.095 |
pool | -0.088 |
Token | tes |
Token ID | 4879 |
Feature activation | -1.24e-01 |
Pos logit contributions | |
ARC | +0.105 |
ked | +0.098 |
ILA | +0.094 |
OVA | +0.094 |
Region | +0.090 |
Neg logit contributions | |
fid | -0.098 |
acci | -0.093 |
ank | -0.085 |
obey | -0.081 |
ihil | -0.080 |
Token | glucose |
Token ID | 15701 |
Feature activation | -8.84e-02 |
Pos logit contributions | |
fid | +0.094 |
acci | +0.089 |
ank | +0.083 |
obey | +0.079 |
ihil | +0.078 |
Neg logit contributions | |
ARC | -0.091 |
ked | -0.085 |
ILA | -0.081 |
OVA | -0.081 |
pool | -0.077 |
Token | and |
Token ID | 290 |
Feature activation | +5.30e-03 |
Pos logit contributions | |
fid | +0.069 |
acci | +0.066 |
ank | +0.061 |
obey | +0.059 |
ihil | +0.058 |
Neg logit contributions | |
ARC | -0.062 |
ked | -0.058 |
ILA | -0.055 |
OVA | -0.055 |
pool | -0.052 |
Token | glyc |
Token ID | 40232 |
Feature activation | +3.98e-02 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
pool | +0.003 |
Neg logit contributions | |
fid | -0.004 |
acci | -0.004 |
ank | -0.003 |
obey | -0.003 |
ihil | -0.003 |
Token | ogen |
Token ID | 6644 |
Feature activation | +3.22e-01 |
Pos logit contributions | |
ARC | +0.014 |
ked | +0.012 |
ILA | +0.011 |
OVA | +0.011 |
Region | +0.010 |
Neg logit contributions | |
fid | -0.045 |
acci | -0.044 |
ank | -0.041 |
obey | -0.040 |
ihil | -0.040 |
Token | rapidly |
Token ID | 8902 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
ARC | +0.229 |
ked | +0.216 |
ILA | +0.204 |
OVA | +0.203 |
pool | +0.194 |
Neg logit contributions | |
fid | -0.248 |
acci | -0.237 |
ank | -0.219 |
obey | -0.210 |
ihil | -0.207 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-03 |
Pos logit contributions | |
ARC | +0.102 |
ked | +0.096 |
ILA | +0.090 |
OVA | +0.090 |
pool | +0.086 |
Neg logit contributions | |
fid | -0.120 |
acci | -0.116 |
ank | -0.107 |
obey | -0.103 |
ihil | -0.102 |
Token | forcing |
Token ID | 10833 |
Feature activation | -4.21e-02 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -2.97e-02 |
Pos logit contributions | |
fid | +0.032 |
acci | +0.031 |
ank | +0.028 |
obey | +0.027 |
ihil | +0.027 |
Neg logit contributions | |
ARC | -0.030 |
ked | -0.028 |
ILA | -0.027 |
OVA | -0.027 |
pool | -0.026 |
Token | body |
Token ID | 1767 |
Feature activation | -2.83e-02 |
Pos logit contributions | |
fid | +0.024 |
acci | +0.023 |
ank | +0.021 |
obey | +0.020 |
ihil | +0.020 |
Neg logit contributions | |
ARC | -0.020 |
ked | -0.019 |
ILA | -0.018 |
OVA | -0.018 |
pool | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +5.79e-02 |
Pos logit contributions | |
fid | +0.045 |
acci | +0.043 |
ank | +0.040 |
obey | +0.038 |
ihil | +0.038 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.034 |
pool | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | +6.00e-02 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.036 |
ILA | +0.034 |
OVA | +0.034 |
Region | +0.032 |
Neg logit contributions | |
fid | -0.046 |
acci | -0.045 |
ank | -0.041 |
obey | -0.040 |
ihil | -0.039 |
Token | Reviewer |
Token ID | 35407 |
Feature activation | +3.01e-01 |
Pos logit contributions | |
ARC | +0.022 |
ked | +0.020 |
ILA | +0.018 |
OVA | +0.018 |
Region | +0.015 |
Neg logit contributions | |
fid | -0.065 |
acci | -0.064 |
ank | -0.060 |
ihil | -0.059 |
eeper | -0.058 |
Token | : |
Token ID | 25 |
Feature activation | +1.80e-02 |
Pos logit contributions | |
ARC | +0.210 |
ked | +0.198 |
ILA | +0.186 |
OVA | +0.185 |
pool | +0.178 |
Neg logit contributions | |
fid | -0.236 |
acci | -0.226 |
ank | -0.211 |
obey | -0.201 |
ihil | -0.198 |
Token | j |
Token ID | 474 |
Feature activation | -6.20e-02 |
Pos logit contributions | |
ARC | +0.013 |
ked | +0.012 |
ILA | +0.012 |
OVA | +0.012 |
pool | +0.011 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.013 |
ank | -0.012 |
obey | -0.012 |
ihil | -0.011 |
Token | wt |
Token ID | 46569 |
Feature activation | +3.55e-01 |
Pos logit contributions | |
fid | +0.048 |
acci | +0.046 |
ank | +0.042 |
obey | +0.041 |
ihil | +0.040 |
Neg logit contributions | |
ARC | -0.044 |
ked | -0.041 |
ILA | -0.039 |
OVA | -0.039 |
Region | -0.037 |
Token | 0001 |
Token ID | 18005 |
Feature activation | +5.19e-03 |
Pos logit contributions | |
ARC | +0.251 |
ked | +0.235 |
ILA | +0.223 |
OVA | +0.222 |
pool | +0.212 |
Neg logit contributions | |
fid | -0.275 |
acci | -0.263 |
ank | -0.244 |
obey | -0.233 |
ihil | -0.231 |
Token | - |
Token ID | 532 |
Feature activation | +6.43e-02 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.003 |
ILA | +0.003 |
OVA | +0.003 |
pool | +0.003 |
Neg logit contributions | |
fid | -0.004 |
acci | -0.004 |
ank | -0.004 |
obey | -0.003 |
ihil | -0.003 |
Token | favorite |
Token ID | 4004 |
Feature activation | -7.05e-03 |
Pos logit contributions | |
ARC | +0.043 |
ked | +0.040 |
ILA | +0.038 |
OVA | +0.038 |
pool | +0.036 |
Neg logit contributions | |
fid | -0.052 |
acci | -0.050 |
ank | -0.046 |
obey | -0.045 |
ihil | -0.044 |
Token | favorite |
Token ID | 4004 |
Feature activation | -3.30e-02 |
Pos logit contributions | |
fid | +0.006 |
acci | +0.006 |
ank | +0.005 |
obey | +0.005 |
ihil | +0.005 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.004 |
ILA | -0.004 |
OVA | -0.004 |
pool | -0.004 |
Token | favorite |
Token ID | 4004 |
Feature activation | -5.12e-02 |
Pos logit contributions | |
fid | +0.027 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.022 |
ked | -0.020 |
ILA | -0.019 |
OVA | -0.019 |
pool | -0.018 |
Token | some |
Token ID | 617 |
Feature activation | -6.06e-02 |
Pos logit contributions | |
fid | +0.090 |
acci | +0.085 |
ank | +0.079 |
obey | +0.076 |
obe | +0.075 |
Neg logit contributions | |
ARC | -0.081 |
ked | -0.077 |
ILA | -0.073 |
OVA | -0.072 |
Region | -0.069 |
Token | are |
Token ID | 389 |
Feature activation | -4.02e-02 |
Pos logit contributions | |
fid | +0.052 |
acci | +0.049 |
ank | +0.046 |
obey | +0.045 |
ihil | +0.044 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.033 |
Region | -0.032 |
Token | network |
Token ID | 3127 |
Feature activation | +1.64e-01 |
Pos logit contributions | |
fid | +0.032 |
acci | +0.030 |
ank | +0.028 |
obey | +0.027 |
ihil | +0.026 |
Neg logit contributions | |
ARC | -0.028 |
ked | -0.026 |
ILA | -0.025 |
OVA | -0.025 |
pool | -0.023 |
Token | bound |
Token ID | 5421 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
ARC | +0.112 |
ked | +0.105 |
ILA | +0.099 |
OVA | +0.099 |
pool | +0.094 |
Neg logit contributions | |
fid | -0.130 |
acci | -0.124 |
ank | -0.115 |
obey | -0.111 |
ihil | -0.109 |
Token | ( |
Token ID | 357 |
Feature activation | -1.08e-01 |
Pos logit contributions | |
ARC | +0.016 |
ked | +0.015 |
ILA | +0.014 |
OVA | +0.014 |
Region | +0.013 |
Neg logit contributions | |
fid | -0.018 |
acci | -0.017 |
ank | -0.016 |
obey | -0.015 |
ihil | -0.015 |
Token | pro |
Token ID | 1676 |
Feature activation | +3.03e-01 |
Pos logit contributions | |
fid | +0.085 |
acci | +0.082 |
ank | +0.076 |
obey | +0.073 |
ihil | +0.072 |
Neg logit contributions | |
ARC | -0.074 |
ked | -0.070 |
ILA | -0.066 |
OVA | -0.065 |
kers | -0.062 |
Token | x |
Token ID | 87 |
Feature activation | -8.51e-03 |
Pos logit contributions | |
ARC | +0.208 |
ked | +0.195 |
ILA | +0.184 |
OVA | +0.183 |
pool | +0.175 |
Neg logit contributions | |
fid | -0.240 |
acci | -0.230 |
ank | -0.213 |
obey | -0.205 |
ihil | -0.202 |
Token | ies |
Token ID | 444 |
Feature activation | +1.16e-01 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.007 |
ank | +0.007 |
obey | +0.007 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.005 |
ILA | -0.004 |
OVA | -0.004 |
pool | -0.004 |
Token | ) |
Token ID | 8 |
Feature activation | -4.70e-02 |
Pos logit contributions | |
ARC | +0.082 |
ked | +0.077 |
ILA | +0.073 |
OVA | +0.072 |
pool | +0.069 |
Neg logit contributions | |
fid | -0.090 |
acci | -0.086 |
ank | -0.080 |
obey | -0.077 |
ihil | -0.075 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
fid | +0.037 |
acci | +0.036 |
ank | +0.033 |
obey | +0.032 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.032 |
ked | -0.030 |
ILA | -0.029 |
OVA | -0.028 |
pool | -0.027 |
Token | storage |
Token ID | 6143 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.010 |
ank | +0.009 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.012 |
ked | -0.011 |
ILA | -0.011 |
OVA | -0.011 |
pool | -0.010 |
Token | ) |
Token ID | 8 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
fid | +0.093 |
acci | +0.089 |
ank | +0.082 |
obey | +0.079 |
ihil | +0.078 |
Neg logit contributions | |
ARC | -0.079 |
ked | -0.074 |
ILA | -0.071 |
OVA | -0.070 |
Region | -0.066 |
Token | is |
Token ID | 318 |
Feature activation | +5.99e-03 |
Pos logit contributions | |
ARC | +0.014 |
ked | +0.013 |
ILA | +0.013 |
OVA | +0.013 |
pool | +0.012 |
Neg logit contributions | |
fid | -0.015 |
acci | -0.015 |
ank | -0.013 |
obey | -0.013 |
ihil | -0.013 |
Token | Harvard |
Token ID | 11131 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
kers | +0.004 |
Neg logit contributions | |
fid | -0.005 |
acci | -0.004 |
ank | -0.004 |
obey | -0.004 |
obe | -0.004 |
Token | - |
Token ID | 12 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
fid | +0.092 |
acci | +0.089 |
ank | +0.083 |
obey | +0.080 |
ihil | +0.079 |
Neg logit contributions | |
ARC | -0.063 |
ked | -0.059 |
ILA | -0.055 |
OVA | -0.054 |
pool | -0.052 |
Token | West |
Token ID | 15045 |
Feature activation | -6.63e-02 |
Pos logit contributions | |
ARC | +0.089 |
ked | +0.085 |
ILA | +0.080 |
OVA | +0.079 |
kers | +0.076 |
Neg logit contributions | |
fid | -0.092 |
acci | -0.088 |
ank | -0.081 |
obey | -0.078 |
ihil | -0.077 |
Token | lake |
Token ID | 27180 |
Feature activation | +3.06e-01 |
Pos logit contributions | |
fid | +0.074 |
acci | +0.072 |
ank | +0.068 |
obey | +0.066 |
ihil | +0.065 |
Neg logit contributions | |
ARC | -0.024 |
ked | -0.022 |
ILA | -0.019 |
OVA | -0.019 |
pool | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
ARC | +0.217 |
ked | +0.205 |
ILA | +0.193 |
OVA | +0.192 |
pool | +0.184 |
Neg logit contributions | |
fid | -0.236 |
acci | -0.226 |
ank | -0.209 |
obey | -0.200 |
ihil | -0.197 |
Token | It |
Token ID | 632 |
Feature activation | +2.11e-02 |
Pos logit contributions | |
ARC | +0.018 |
ked | +0.017 |
ILA | +0.016 |
OVA | +0.016 |
pool | +0.016 |
Neg logit contributions | |
fid | -0.020 |
acci | -0.019 |
ank | -0.018 |
obey | -0.017 |
ihil | -0.017 |
Token | � |
Token ID | 447 |
Feature activation | -2.29e-02 |
Pos logit contributions | |
ARC | +0.015 |
ked | +0.014 |
ILA | +0.014 |
OVA | +0.014 |
pool | +0.013 |
Neg logit contributions | |
fid | -0.016 |
acci | -0.015 |
ank | -0.014 |
obey | -0.013 |
ihil | -0.013 |
Token | � |
Token ID | 247 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
fid | +0.020 |
acci | +0.019 |
ank | +0.018 |
obey | +0.017 |
ihil | +0.017 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.012 |
OVA | -0.012 |
pool | -0.011 |
Token | s |
Token ID | 82 |
Feature activation | -4.44e-02 |
Pos logit contributions | |
ARC | +0.017 |
ked | +0.016 |
ILA | +0.015 |
OVA | +0.015 |
Region | +0.014 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.014 |
ank | -0.012 |
obey | -0.012 |
ihil | -0.012 |
Token | Capitol |
Token ID | 13241 |
Feature activation | -6.83e-02 |
Pos logit contributions | |
fid | +0.037 |
acci | +0.036 |
ank | +0.033 |
obey | +0.031 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.033 |
ked | -0.031 |
OVA | -0.029 |
ILA | -0.029 |
pool | -0.028 |
Token | Tuesday |
Token ID | 3431 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
fid | +0.056 |
acci | +0.054 |
ank | +0.050 |
obey | +0.048 |
ihil | +0.048 |
Neg logit contributions | |
ARC | -0.045 |
ked | -0.042 |
ILA | -0.039 |
OVA | -0.039 |
kers | -0.037 |
Token | morning |
Token ID | 3329 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.011 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.010 |
Neg logit contributions | |
fid | -0.011 |
acci | -0.010 |
ank | -0.010 |
obey | -0.009 |
ihil | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
fid | +0.221 |
acci | +0.212 |
ank | +0.197 |
obey | +0.189 |
ihil | +0.187 |
Neg logit contributions | |
ARC | -0.183 |
ked | -0.172 |
ILA | -0.162 |
OVA | -0.161 |
pool | -0.154 |
Token | Hutch |
Token ID | 30492 |
Feature activation | -1.38e-03 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
pool | +0.006 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.007 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | ison |
Token ID | 1653 |
Feature activation | +3.50e-01 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
ARC | +0.251 |
ked | +0.236 |
ILA | +0.223 |
OVA | +0.222 |
pool | +0.212 |
Neg logit contributions | |
fid | -0.267 |
acci | -0.256 |
ank | -0.236 |
obey | -0.226 |
ihil | -0.223 |
Token | who |
Token ID | 508 |
Feature activation | +1.25e-03 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.008 |
ILA | +0.008 |
OVA | +0.008 |
Region | +0.007 |
Neg logit contributions | |
fid | -0.009 |
acci | -0.008 |
ank | -0.008 |
obey | -0.007 |
obe | -0.007 |
Token | serves |
Token ID | 9179 |
Feature activation | -1.04e-01 |
Pos logit contributions | |
ARC | +0.001 |
ked | +0.001 |
ILA | +0.001 |
OVA | +0.001 |
Region | +0.001 |
Neg logit contributions | |
fid | -0.001 |
acci | -0.001 |
ank | -0.001 |
obey | -0.001 |
ihil | -0.001 |
Token | as |
Token ID | 355 |
Feature activation | -2.22e-02 |
Pos logit contributions | |
fid | +0.086 |
acci | +0.082 |
ank | +0.076 |
obey | +0.073 |
ihil | +0.073 |
Neg logit contributions | |
ARC | -0.069 |
ked | -0.064 |
ILA | -0.060 |
OVA | -0.060 |
kers | -0.057 |
Token | the |
Token ID | 262 |
Feature activation | +3.53e-02 |
Pos logit contributions | |
fid | +0.016 |
acci | +0.015 |
ank | +0.014 |
obey | +0.013 |
ihil | +0.013 |
Neg logit contributions | |
ARC | -0.017 |
ked | -0.016 |
ILA | -0.015 |
OVA | -0.015 |
pool | -0.015 |
Token | � |
Token ID | 447 |
Feature activation | +7.10e-03 |
Pos logit contributions | |
ARC | +0.035 |
ked | +0.033 |
ILA | +0.032 |
OVA | +0.032 |
pool | +0.030 |
Neg logit contributions | |
fid | -0.033 |
acci | -0.031 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.027 |
Token | � |
Token ID | 247 |
Feature activation | +5.94e-02 |
Pos logit contributions | |
ARC | +0.004 |
ked | +0.004 |
ILA | +0.004 |
OVA | +0.004 |
pool | +0.003 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.006 |
ank | -0.006 |
obey | -0.005 |
ihil | -0.005 |
Token | s |
Token ID | 82 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ARC | +0.046 |
ked | +0.044 |
ILA | +0.042 |
OVA | +0.042 |
pool | +0.040 |
Neg logit contributions | |
fid | -0.041 |
acci | -0.039 |
ank | -0.036 |
obey | -0.035 |
ihil | -0.034 |
Token | about |
Token ID | 546 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.010 |
ank | +0.009 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.006 |
Token | being |
Token ID | 852 |
Feature activation | +1.07e-01 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.007 |
ILA | +0.007 |
OVA | +0.007 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.008 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | � |
Token ID | 564 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
ARC | +0.077 |
ked | +0.072 |
ILA | +0.068 |
OVA | +0.068 |
pool | +0.065 |
Neg logit contributions | |
fid | -0.081 |
acci | -0.078 |
ank | -0.072 |
obey | -0.069 |
ihil | -0.068 |
Token | � |
Token ID | 246 |
Feature activation | +4.82e-02 |
Pos logit contributions | |
ARC | +0.027 |
ked | +0.025 |
ILA | +0.024 |
OVA | +0.024 |
kers | +0.023 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.033 |
ank | -0.031 |
obey | -0.030 |
ihil | -0.029 |
Token | better |
Token ID | 27903 |
Feature activation | +8.83e-02 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.032 |
ILA | +0.030 |
OVA | +0.030 |
pool | +0.029 |
Neg logit contributions | |
fid | -0.037 |
acci | -0.036 |
ank | -0.033 |
obey | -0.032 |
ihil | -0.031 |
Token | � |
Token ID | 447 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
ARC | +0.065 |
ked | +0.061 |
ILA | +0.058 |
OVA | +0.058 |
pool | +0.056 |
Neg logit contributions | |
fid | -0.065 |
acci | -0.062 |
ank | -0.058 |
obey | -0.055 |
ihil | -0.054 |
Token | � |
Token ID | 247 |
Feature activation | +4.67e-02 |
Pos logit contributions | |
ARC | +0.009 |
ked | +0.009 |
ILA | +0.008 |
OVA | +0.008 |
pool | +0.008 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.013 |
ank | -0.012 |
obey | -0.012 |
ihil | -0.011 |
Token | than |
Token ID | 621 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
ARC | +0.031 |
ked | +0.029 |
ILA | +0.027 |
OVA | +0.027 |
pool | +0.026 |
Neg logit contributions | |
fid | -0.038 |
acci | -0.037 |
ank | -0.034 |
obey | -0.033 |
ihil | -0.032 |
Token | play |
Token ID | 711 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
ARC | +0.002 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.002 |
pool | +0.002 |
Neg logit contributions | |
fid | -0.002 |
acci | -0.002 |
ank | -0.002 |
obey | -0.002 |
ihil | -0.002 |
Token | Wii |
Token ID | 16591 |
Feature activation | -9.74e-03 |
Pos logit contributions | |
fid | +0.009 |
acci | +0.009 |
ank | +0.008 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
pool | -0.006 |
Token | Sports |
Token ID | 7092 |
Feature activation | +2.81e-01 |
Pos logit contributions | |
fid | +0.009 |
acci | +0.009 |
ank | +0.008 |
obey | +0.008 |
ihil | +0.008 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.005 |
ILA | -0.005 |
OVA | -0.005 |
pool | -0.004 |
Token | Club |
Token ID | 6289 |
Feature activation | -2.79e-02 |
Pos logit contributions | |
ARC | +0.169 |
ked | +0.158 |
ILA | +0.147 |
OVA | +0.146 |
pool | +0.139 |
Neg logit contributions | |
fid | -0.246 |
acci | -0.237 |
ank | -0.222 |
obey | -0.214 |
ihil | -0.211 |
Token | together |
Token ID | 1978 |
Feature activation | -3.30e-03 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.021 |
obey | +0.020 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.018 |
ked | -0.017 |
ILA | -0.016 |
OVA | -0.016 |
pool | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +3.47e-02 |
Pos logit contributions | |
fid | +0.003 |
acci | +0.003 |
ank | +0.002 |
obey | +0.002 |
ihil | +0.002 |
Neg logit contributions | |
ARC | -0.002 |
ked | -0.002 |
ILA | -0.002 |
OVA | -0.002 |
pool | -0.002 |
Token | Players |
Token ID | 13094 |
Feature activation | +2.37e-02 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.020 |
pool | +0.020 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.027 |
ank | -0.025 |
obey | -0.024 |
ihil | -0.024 |
Token | also |
Token ID | 635 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
ARC | +0.018 |
ked | +0.017 |
ILA | +0.016 |
OVA | +0.016 |
pool | +0.015 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | can |
Token ID | 460 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
fid | +0.068 |
acci | +0.065 |
ank | +0.060 |
obey | +0.058 |
ihil | +0.056 |
Neg logit contributions | |
ARC | -0.071 |
ked | -0.067 |
ILA | -0.064 |
OVA | -0.063 |
Region | -0.060 |
Token | join |
Token ID | 4654 |
Feature activation | -7.35e-02 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
Region | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
fid | +0.058 |
acci | +0.055 |
ank | +0.051 |
obey | +0.049 |
ihil | +0.048 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.046 |
OVA | -0.045 |
kers | -0.043 |
Token | - |
Token ID | 532 |
Feature activation | +5.25e-02 |
Pos logit contributions | |
fid | +0.053 |
acci | +0.051 |
ank | +0.047 |
obey | +0.045 |
ihil | +0.045 |
Neg logit contributions | |
ARC | -0.046 |
ked | -0.043 |
ILA | -0.040 |
OVA | -0.040 |
Region | -0.038 |
Token | and |
Token ID | 290 |
Feature activation | +6.43e-02 |
Pos logit contributions | |
ARC | +0.038 |
ked | +0.036 |
ILA | +0.034 |
OVA | +0.034 |
pool | +0.032 |
Neg logit contributions | |
fid | -0.040 |
acci | -0.038 |
ank | -0.035 |
obey | -0.034 |
ihil | -0.033 |
Token | admins |
Token ID | 44563 |
Feature activation | +7.67e-02 |
Pos logit contributions | |
ARC | +0.046 |
ked | +0.044 |
ILA | +0.041 |
OVA | +0.041 |
pool | +0.039 |
Neg logit contributions | |
fid | -0.049 |
acci | -0.047 |
ank | -0.043 |
obey | -0.042 |
ihil | -0.041 |
Token | always |
Token ID | 1464 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
ARC | +0.057 |
ked | +0.053 |
ILA | +0.051 |
OVA | +0.050 |
Region | +0.048 |
Neg logit contributions | |
fid | -0.057 |
acci | -0.054 |
ank | -0.050 |
obey | -0.048 |
ihil | -0.047 |
Token | grant |
Token ID | 7264 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
fid | +0.008 |
acci | +0.007 |
ank | +0.007 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.008 |
ked | -0.007 |
ILA | -0.007 |
OVA | -0.007 |
Region | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | +4.38e-02 |
Pos logit contributions | |
fid | +0.011 |
acci | +0.011 |
ank | +0.010 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.010 |
ked | -0.010 |
ILA | -0.009 |
OVA | -0.009 |
pool | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +6.56e-02 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.028 |
ILA | +0.027 |
OVA | +0.026 |
pool | +0.025 |
Neg logit contributions | |
fid | -0.035 |
acci | -0.033 |
ank | -0.031 |
obey | -0.030 |
ihil | -0.029 |
Token | It |
Token ID | 632 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
ARC | +0.045 |
ked | +0.042 |
ILA | +0.040 |
OVA | +0.040 |
pool | +0.038 |
Neg logit contributions | |
fid | -0.052 |
acci | -0.050 |
ank | -0.046 |
obey | -0.044 |
ihil | -0.044 |
Token | 's |
Token ID | 338 |
Feature activation | +1.10e-01 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.010 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.012 |
acci | -0.011 |
ank | -0.010 |
obey | -0.010 |
ihil | -0.010 |
Token | time |
Token ID | 640 |
Feature activation | -1.06e-01 |
Pos logit contributions | |
ARC | +0.080 |
ked | +0.076 |
ILA | +0.072 |
OVA | +0.071 |
pool | +0.068 |
Neg logit contributions | |
fid | -0.083 |
acci | -0.079 |
ank | -0.073 |
obey | -0.070 |
ihil | -0.069 |
Token | , |
Token ID | 11 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
fid | +0.077 |
acci | +0.073 |
ank | +0.068 |
obey | +0.065 |
ihil | +0.064 |
Neg logit contributions | |
ARC | -0.080 |
ked | -0.075 |
ILA | -0.072 |
OVA | -0.071 |
pool | -0.068 |
Token | s |
Token ID | 82 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.030 |
ILA | +0.028 |
OVA | +0.028 |
pool | +0.027 |
Neg logit contributions | |
fid | -0.028 |
acci | -0.027 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.023 |
Token | intended |
Token ID | 5292 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.017 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.017 |
ked | -0.016 |
ILA | -0.015 |
OVA | -0.015 |
pool | -0.015 |
Token | in |
Token ID | 287 |
Feature activation | +9.26e-02 |
Pos logit contributions | |
ARC | +0.093 |
ked | +0.087 |
ILA | +0.083 |
OVA | +0.082 |
pool | +0.078 |
Neg logit contributions | |
fid | -0.109 |
acci | -0.104 |
ank | -0.097 |
obey | -0.093 |
ihil | -0.092 |
Token | large |
Token ID | 1588 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
ARC | +0.067 |
ked | +0.063 |
ILA | +0.059 |
OVA | +0.059 |
pool | +0.057 |
Neg logit contributions | |
fid | -0.070 |
acci | -0.067 |
ank | -0.062 |
obey | -0.059 |
ihil | -0.059 |
Token | part |
Token ID | 636 |
Feature activation | +8.66e-02 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.010 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.014 |
acci | -0.014 |
ank | -0.013 |
obey | -0.012 |
ihil | -0.012 |
Token | for |
Token ID | 329 |
Feature activation | +8.84e-02 |
Pos logit contributions | |
ARC | +0.066 |
ked | +0.062 |
ILA | +0.059 |
OVA | +0.059 |
pool | +0.056 |
Neg logit contributions | |
fid | -0.062 |
acci | -0.060 |
ank | -0.055 |
obey | -0.052 |
ihil | -0.052 |
Token | the |
Token ID | 262 |
Feature activation | +4.60e-02 |
Pos logit contributions | |
ARC | +0.064 |
ked | +0.060 |
ILA | +0.057 |
OVA | +0.057 |
pool | +0.054 |
Neg logit contributions | |
fid | -0.067 |
acci | -0.064 |
ank | -0.059 |
obey | -0.057 |
ihil | -0.056 |
Token | consumer |
Token ID | 7172 |
Feature activation | -2.30e-01 |
Pos logit contributions | |
ARC | +0.034 |
ked | +0.032 |
ILA | +0.030 |
OVA | +0.030 |
pool | +0.029 |
Neg logit contributions | |
fid | -0.034 |
acci | -0.033 |
ank | -0.030 |
obey | -0.029 |
ihil | -0.029 |
Token | not |
Token ID | 407 |
Feature activation | +1.31e-02 |
Pos logit contributions | |
fid | +0.183 |
acci | +0.175 |
ank | +0.163 |
obey | +0.156 |
ihil | +0.154 |
Neg logit contributions | |
ARC | -0.158 |
ked | -0.148 |
ILA | -0.140 |
OVA | -0.139 |
pool | -0.133 |
Token | to |
Token ID | 284 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
ARC | +0.010 |
ked | +0.009 |
ILA | +0.009 |
OVA | +0.009 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.009 |
acci | -0.009 |
ank | -0.008 |
obey | -0.008 |
ihil | -0.008 |
Token | get |
Token ID | 651 |
Feature activation | +2.21e-02 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.030 |
ILA | +0.029 |
OVA | +0.028 |
pool | +0.027 |
Neg logit contributions | |
fid | -0.030 |
acci | -0.029 |
ank | -0.026 |
obey | -0.025 |
ihil | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | -2.28e-02 |
Pos logit contributions | |
ARC | +0.007 |
ked | +0.007 |
ILA | +0.006 |
OVA | +0.006 |
Region | +0.006 |
Neg logit contributions | |
fid | -0.008 |
acci | -0.008 |
ank | -0.007 |
obey | -0.007 |
ihil | -0.007 |
Token | Place |
Token ID | 8474 |
Feature activation | -9.21e-02 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.019 |
ank | +0.017 |
obey | +0.017 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.013 |
ILA | -0.013 |
OVA | -0.013 |
kers | -0.012 |
Token | f |
Token ID | 277 |
Feature activation | -2.74e-02 |
Pos logit contributions | |
fid | +0.072 |
acci | +0.068 |
ank | +0.064 |
obey | +0.061 |
ihil | +0.060 |
Neg logit contributions | |
ARC | -0.065 |
ked | -0.061 |
OVA | -0.058 |
ILA | -0.058 |
pool | -0.055 |
Token | rit |
Token ID | 799 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.016 |
obey | +0.015 |
ihil | +0.015 |
Neg logit contributions | |
ARC | -0.022 |
ked | -0.021 |
ILA | -0.020 |
OVA | -0.020 |
pool | -0.019 |
Token | ters |
Token ID | 1010 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
fid | +0.184 |
acci | +0.179 |
ank | +0.170 |
obey | +0.165 |
ihil | +0.164 |
Neg logit contributions | |
ARC | -0.053 |
ked | -0.046 |
ILA | -0.041 |
OVA | -0.041 |
Region | -0.036 |
Token | in |
Token ID | 287 |
Feature activation | -9.14e-03 |
Pos logit contributions | |
ARC | +0.160 |
ked | +0.149 |
ILA | +0.141 |
OVA | +0.141 |
Region | +0.133 |
Neg logit contributions | |
fid | -0.194 |
acci | -0.185 |
ank | -0.172 |
obey | -0.165 |
ihil | -0.163 |
Token | the |
Token ID | 262 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
fid | +0.007 |
acci | +0.007 |
ank | +0.006 |
obey | +0.006 |
ihil | +0.006 |
Neg logit contributions | |
ARC | -0.006 |
ked | -0.006 |
ILA | -0.006 |
OVA | -0.006 |
Region | -0.005 |
Token | skillet |
Token ID | 41306 |
Feature activation | +4.75e-02 |
Pos logit contributions | |
fid | +0.029 |
acci | +0.027 |
ank | +0.026 |
obey | +0.025 |
ihil | +0.024 |
Neg logit contributions | |
ARC | -0.024 |
ked | -0.022 |
ILA | -0.021 |
OVA | -0.021 |
pool | -0.020 |
Token | ( |
Token ID | 357 |
Feature activation | -9.96e-02 |
Pos logit contributions | |
ARC | +0.033 |
ked | +0.030 |
ILA | +0.029 |
OVA | +0.029 |
Region | +0.027 |
Neg logit contributions | |
fid | -0.038 |
acci | -0.036 |
ank | -0.034 |
obey | -0.032 |
ihil | -0.032 |
Token | don |
Token ID | 9099 |
Feature activation | +7.31e-03 |
Pos logit contributions | |
fid | +0.078 |
acci | +0.075 |
ank | +0.069 |
obey | +0.067 |
ihil | +0.066 |
Neg logit contributions | |
ARC | -0.069 |
ked | -0.064 |
ILA | -0.061 |
OVA | -0.060 |
kers | -0.058 |
Token | � |
Token ID | 447 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ARC | +0.005 |
ked | +0.005 |
ILA | +0.004 |
OVA | +0.004 |
Region | +0.004 |
Neg logit contributions | |
fid | -0.006 |
acci | -0.006 |
ank | -0.005 |
obey | -0.005 |
ihil | -0.005 |
Token | + |
Token ID | 10 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
fid | +0.042 |
acci | +0.040 |
ank | +0.036 |
obey | +0.035 |
ihil | +0.034 |
Neg logit contributions | |
ARC | -0.047 |
ked | -0.044 |
ILA | -0.042 |
OVA | -0.042 |
pool | -0.040 |
Token | " |
Token ID | 1 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
fid | +0.010 |
acci | +0.010 |
ank | +0.009 |
obey | +0.009 |
ihil | +0.009 |
Neg logit contributions | |
ARC | -0.011 |
ked | -0.011 |
ILA | -0.010 |
OVA | -0.010 |
pool | -0.010 |
Token | \ |
Token ID | 59 |
Feature activation | -1.35e-01 |
Pos logit contributions | |
fid | +0.144 |
acci | +0.137 |
ank | +0.127 |
obey | +0.121 |
ihil | +0.120 |
Neg logit contributions | |
ARC | -0.142 |
ked | -0.134 |
ILA | -0.127 |
OVA | -0.126 |
pool | -0.121 |
Token | S |
Token ID | 50 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
fid | +0.102 |
acci | +0.098 |
ank | +0.091 |
obey | +0.087 |
ihil | +0.086 |
Neg logit contributions | |
ARC | -0.096 |
ked | -0.091 |
ILA | -0.086 |
OVA | -0.085 |
pool | -0.082 |
Token | + |
Token ID | 10 |
Feature activation | -2.89e-02 |
Pos logit contributions | |
ARC | +0.012 |
ked | +0.011 |
ILA | +0.011 |
OVA | +0.011 |
pool | +0.010 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.013 |
ank | -0.012 |
obey | -0.011 |
ihil | -0.011 |
Token | "] |
Token ID | 8973 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
fid | +0.019 |
acci | +0.018 |
ank | +0.016 |
obey | +0.016 |
ihil | +0.015 |
Neg logit contributions | |
ARC | -0.024 |
ked | -0.023 |
ILA | -0.022 |
OVA | -0.021 |
pool | -0.021 |
Token | ' |
Token ID | 6 |
Feature activation | -1.60e-01 |
Pos logit contributions | |
fid | +0.081 |
acci | +0.077 |
ank | +0.071 |
obey | +0.067 |
ihil | +0.066 |
Neg logit contributions | |
ARC | -0.088 |
ked | -0.084 |
ILA | -0.079 |
OVA | -0.079 |
pool | -0.076 |
Token | ) |
Token ID | 1267 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
fid | +0.124 |
acci | +0.118 |
ank | +0.109 |
obey | +0.105 |
ihil | +0.103 |
Neg logit contributions | |
ARC | -0.113 |
ked | -0.106 |
ILA | -0.100 |
OVA | -0.100 |
pool | -0.096 |
Token | AS |
Token ID | 7054 |
Feature activation | +8.21e-02 |
Pos logit contributions | |
fid | +0.018 |
acci | +0.018 |
ank | +0.016 |
obey | +0.016 |
ihil | +0.016 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.015 |
ILA | -0.014 |
OVA | -0.014 |
pool | -0.013 |
Token | library |
Token ID | 5888 |
Feature activation | -1.14e-01 |
Pos logit contributions | |
ARC | +0.058 |
ked | +0.054 |
ILA | +0.051 |
OVA | +0.051 |
pool | +0.049 |
Neg logit contributions | |
fid | -0.064 |
acci | -0.061 |
ank | -0.056 |
obey | -0.054 |
ihil | -0.053 |
Token | , |
Token ID | 837 |
Feature activation | +3.89e-02 |
Pos logit contributions | |
fid | +0.094 |
acci | +0.090 |
ank | +0.084 |
obey | +0.080 |
ihil | +0.079 |
Neg logit contributions | |
ARC | -0.074 |
ked | -0.070 |
ILA | -0.065 |
OVA | -0.065 |
kers | -0.062 |
Token | x |
Token ID | 87 |
Feature activation | -7.78e-02 |
Pos logit contributions | |
fid | +0.061 |
acci | +0.059 |
ank | +0.054 |
obey | +0.052 |
ihil | +0.051 |
Neg logit contributions | |
ARC | -0.059 |
ked | -0.055 |
ILA | -0.053 |
OVA | -0.052 |
pool | -0.050 |
Token | . |
Token ID | 13 |
Feature activation | -9.56e-02 |
Pos logit contributions | |
fid | +0.064 |
acci | +0.062 |
ank | +0.057 |
obey | +0.055 |
ihil | +0.055 |
Neg logit contributions | |
ARC | -0.051 |
ked | -0.048 |
ILA | -0.045 |
OVA | -0.044 |
pool | -0.042 |
Token | 177 |
Token ID | 22413 |
Feature activation | +1.01e-01 |
Pos logit contributions | |
fid | +0.091 |
acci | +0.088 |
ank | +0.082 |
obey | +0.081 |
ihil | +0.080 |
Neg logit contributions | |
ARC | -0.050 |
ked | -0.046 |
ILA | -0.042 |
OVA | -0.042 |
kers | -0.039 |
Token | 119 |
Token ID | 15136 |
Feature activation | -1.59e-01 |
Pos logit contributions | |
ARC | +0.070 |
ked | +0.066 |
ILA | +0.062 |
OVA | +0.062 |
pool | +0.060 |
Neg logit contributions | |
fid | -0.079 |
acci | -0.076 |
ank | -0.070 |
obey | -0.067 |
ihil | -0.066 |
Token | 3 |
Token ID | 18 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
fid | +0.116 |
acci | +0.111 |
ank | +0.102 |
obey | +0.098 |
ihil | +0.097 |
Neg logit contributions | |
ARC | -0.118 |
ked | -0.112 |
ILA | -0.106 |
OVA | -0.105 |
pool | -0.101 |
Token | 184 |
Token ID | 22883 |
Feature activation | -1.25e-01 |
Pos logit contributions | |
fid | +0.152 |
acci | +0.147 |
ank | +0.135 |
obey | +0.131 |
ihil | +0.129 |
Neg logit contributions | |
ARC | -0.125 |
ked | -0.118 |
ILA | -0.111 |
OVA | -0.110 |
kers | -0.105 |
Token | x |
Token ID | 2124 |
Feature activation | +7.99e-02 |
Pos logit contributions | |
fid | +0.108 |
acci | +0.104 |
ank | +0.097 |
obey | +0.093 |
ihil | +0.092 |
Neg logit contributions | |
ARC | -0.077 |
ked | -0.071 |
ILA | -0.067 |
OVA | -0.067 |
pool | -0.063 |
Token | . |
Token ID | 13 |
Feature activation | -7.92e-02 |
Pos logit contributions | |
ARC | +0.052 |
ked | +0.049 |
ILA | +0.046 |
OVA | +0.045 |
pool | +0.043 |
Neg logit contributions | |
fid | -0.066 |
acci | -0.064 |
ank | -0.059 |
obey | -0.057 |
ihil | -0.056 |
Token | x |
Token ID | 87 |
Feature activation | -5.90e-02 |
Pos logit contributions | |
fid | +0.061 |
acci | +0.058 |
ank | +0.054 |
obey | +0.052 |
ihil | +0.051 |
Neg logit contributions | |
ARC | -0.056 |
ked | -0.053 |
ILA | -0.050 |
OVA | -0.050 |
pool | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | -8.31e-02 |
Pos logit contributions | |
fid | +0.049 |
acci | +0.047 |
ank | +0.044 |
obey | +0.042 |
ihil | +0.042 |
Neg logit contributions | |
ARC | -0.038 |
ked | -0.036 |
ILA | -0.034 |
OVA | -0.033 |
pool | -0.032 |
Token | x |
Token ID | 87 |
Feature activation | -2.38e-01 |
Pos logit contributions | |
fid | +0.063 |
acci | +0.060 |
ank | +0.056 |
obey | +0.053 |
ihil | +0.053 |
Neg logit contributions | |
ARC | -0.060 |
ked | -0.056 |
ILA | -0.053 |
OVA | -0.053 |
pool | -0.051 |
Token | Jav |
Token ID | 49247 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
ARC | +0.028 |
ked | +0.026 |
ILA | +0.025 |
OVA | +0.025 |
pool | +0.024 |
Neg logit contributions | |
fid | -0.029 |
acci | -0.027 |
ank | -0.026 |
obey | -0.024 |
ihil | -0.024 |
Token | akh |
Token ID | 11322 |
Feature activation | +2.50e-01 |
Pos logit contributions | |
ARC | +0.188 |
ked | +0.176 |
ILA | +0.167 |
OVA | +0.166 |
pool | +0.159 |
Neg logit contributions | |
fid | -0.201 |
acci | -0.193 |
ank | -0.178 |
obey | -0.171 |
ihil | -0.169 |
Token | k |
Token ID | 74 |
Feature activation | +2.19e-01 |
Pos logit contributions | |
ARC | +0.176 |
ked | +0.166 |
ILA | +0.157 |
OVA | +0.156 |
pool | +0.149 |
Neg logit contributions | |
fid | -0.193 |
acci | -0.185 |
ank | -0.171 |
obey | -0.164 |
ihil | -0.162 |
Token | to |
Token ID | 284 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
ARC | +0.152 |
ked | +0.142 |
OVA | +0.134 |
ILA | +0.133 |
pool | +0.127 |
Neg logit contributions | |
fid | -0.173 |
acci | -0.166 |
ank | -0.153 |
obey | -0.147 |
ihil | -0.146 |
Token | the |
Token ID | 262 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
ARC | +0.008 |
ked | +0.008 |
ILA | +0.007 |
OVA | +0.007 |
pool | +0.007 |
Neg logit contributions | |
fid | -0.009 |
acci | -0.008 |
ank | -0.008 |
obey | -0.007 |
ihil | -0.007 |
Token | Americas |
Token ID | 25733 |
Feature activation | -3.89e-02 |
Pos logit contributions | |
ARC | +0.011 |
ked | +0.011 |
ILA | +0.010 |
OVA | +0.010 |
pool | +0.010 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.012 |
ank | -0.011 |
obey | -0.011 |
ihil | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | +3.65e-02 |
Pos logit contributions | |
fid | +0.031 |
acci | +0.030 |
ank | +0.028 |
obey | +0.026 |
ihil | +0.026 |
Neg logit contributions | |
ARC | -0.027 |
ked | -0.025 |
ILA | -0.024 |
OVA | -0.024 |
pool | -0.022 |
Token | Europe |
Token ID | 2031 |
Feature activation | -1.66e-01 |
Pos logit contributions | |
ARC | +0.027 |
ked | +0.026 |
ILA | +0.024 |
OVA | +0.024 |
pool | +0.023 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.025 |
ank | -0.023 |
obey | -0.022 |
ihil | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | +3.29e-02 |
Pos logit contributions | |
fid | +0.134 |
acci | +0.128 |
ank | +0.119 |
obey | +0.115 |
ihil | +0.113 |
Neg logit contributions | |
ARC | -0.111 |
ked | -0.104 |
ILA | -0.098 |
OVA | -0.097 |
pool | -0.093 |
Token | Russia |
Token ID | 3284 |
Feature activation | +9.18e-02 |
Pos logit contributions | |
ARC | +0.024 |
ked | +0.023 |
ILA | +0.022 |
OVA | +0.022 |
pool | +0.021 |
Neg logit contributions | |
fid | -0.024 |
acci | -0.023 |
ank | -0.022 |
obey | -0.021 |
ihil | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
ARC | +0.062 |
ked | +0.058 |
ILA | +0.055 |
OVA | +0.054 |
pool | +0.052 |
Neg logit contributions | |
fid | -0.074 |
acci | -0.071 |
ank | -0.066 |
obey | -0.063 |
ihil | -0.062 |
Token | masterpiece |
Token ID | 30669 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
ARC | +0.030 |
ked | +0.028 |
ILA | +0.027 |
OVA | +0.026 |
pool | +0.025 |
Neg logit contributions | |
fid | -0.032 |
acci | -0.031 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.027 |
Token | . |
Token ID | 13 |
Feature activation | +6.96e-05 |
Pos logit contributions | |
ARC | +0.097 |
ked | +0.090 |
ILA | +0.085 |
OVA | +0.085 |
pool | +0.081 |
Neg logit contributions | |
fid | -0.114 |
acci | -0.109 |
ank | -0.102 |
obey | -0.098 |
ihil | -0.097 |
Token | That |
Token ID | 1320 |
Feature activation | -3.59e-02 |
Pos logit contributions | |
ARC | +0.000 |
ked | +0.000 |
ILA | +0.000 |
OVA | +0.000 |
pool | +0.000 |
Neg logit contributions | |
fid | -0.000 |
acci | -0.000 |
ank | -0.000 |
obey | -0.000 |
ihil | -0.000 |
Token | � |
Token ID | 447 |
Feature activation | +4.03e-03 |
Pos logit contributions | |
fid | +0.028 |
acci | +0.026 |
ank | +0.024 |
obey | +0.023 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.026 |
ked | -0.024 |
ILA | -0.023 |
OVA | -0.023 |
pool | -0.022 |
Token | � |
Token ID | 247 |
Feature activation | +1.95e-02 |
Pos logit contributions | |
ARC | +0.002 |
ked | +0.002 |
ILA | +0.002 |
OVA | +0.002 |
pool | +0.002 |
Neg logit contributions | |
fid | -0.003 |
acci | -0.003 |
ank | -0.003 |
obey | -0.003 |
ihil | -0.003 |
Token | s |
Token ID | 82 |
Feature activation | -4.61e-02 |
Pos logit contributions | |
ARC | +0.015 |
ked | +0.014 |
ILA | +0.014 |
OVA | +0.014 |
Region | +0.013 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.013 |
ank | -0.012 |
obey | -0.011 |
ihil | -0.011 |
Token | badass |
Token ID | 37289 |
Feature activation | -7.73e-02 |
Pos logit contributions | |
fid | +0.036 |
acci | +0.035 |
ank | +0.032 |
obey | +0.031 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.032 |
ked | -0.030 |
ILA | -0.028 |
OVA | -0.028 |
pool | -0.027 |
Token | . |
Token ID | 13 |
Feature activation | -4.43e-02 |
Pos logit contributions | |
fid | +0.062 |
acci | +0.060 |
ank | +0.055 |
obey | +0.053 |
ihil | +0.053 |
Neg logit contributions | |
ARC | -0.052 |
ked | -0.049 |
ILA | -0.046 |
OVA | -0.046 |
Region | -0.044 |
Token | But |
Token ID | 887 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
fid | +0.035 |
acci | +0.033 |
ank | +0.031 |
obey | +0.030 |
ihil | +0.029 |
Neg logit contributions | |
ARC | -0.031 |
ked | -0.029 |
ILA | -0.027 |
OVA | -0.027 |
pool | -0.026 |
Token | then |
Token ID | 788 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
fid | +0.086 |
acci | +0.082 |
ank | +0.076 |
obey | +0.073 |
ihil | +0.072 |
Neg logit contributions | |
ARC | -0.075 |
ked | -0.071 |
ILA | -0.067 |
OVA | -0.067 |
pool | -0.064 |
Token | , |
Token ID | 11 |
Feature activation | +2.83e-03 |
Pos logit contributions | |
ARC | +0.093 |
ked | +0.087 |
ILA | +0.082 |
OVA | +0.082 |
pool | +0.078 |
Neg logit contributions | |
fid | -0.111 |
acci | -0.105 |
ank | -0.099 |
obey | -0.095 |
ihil | -0.093 |
Token | constructed |
Token ID | 12006 |
Feature activation | +3.57e-02 |
Pos logit contributions | |
fid | +0.022 |
acci | +0.021 |
ank | +0.020 |
obey | +0.019 |
ihil | +0.018 |
Neg logit contributions | |
ARC | -0.020 |
ked | -0.018 |
ILA | -0.017 |
OVA | -0.017 |
pool | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
ARC | +0.023 |
ked | +0.022 |
ILA | +0.021 |
OVA | +0.020 |
pool | +0.020 |
Neg logit contributions | |
fid | -0.029 |
acci | -0.028 |
ank | -0.026 |
obey | -0.025 |
ihil | -0.025 |
Token | Dri |
Token ID | 5809 |
Feature activation | +8.67e-02 |
Pos logit contributions | |
ARC | +0.016 |
ked | +0.015 |
ILA | +0.014 |
OVA | +0.014 |
pool | +0.014 |
Neg logit contributions | |
fid | -0.019 |
acci | -0.018 |
ank | -0.017 |
obey | -0.016 |
ihil | -0.016 |
Token | ven |
Token ID | 574 |
Feature activation | +2.46e-01 |
Pos logit contributions | |
ARC | +0.038 |
ked | +0.034 |
ILA | +0.031 |
OVA | +0.031 |
pool | +0.029 |
Neg logit contributions | |
fid | -0.090 |
acci | -0.087 |
ank | -0.082 |
obey | -0.080 |
ihil | -0.079 |
Token | by |
Token ID | 416 |
Feature activation | -7.81e-02 |
Pos logit contributions | |
ARC | +0.187 |
ked | +0.176 |
ILA | +0.167 |
OVA | +0.166 |
pool | +0.160 |
Neg logit contributions | |
fid | -0.177 |
acci | -0.169 |
ank | -0.156 |
obey | -0.149 |
ihil | -0.147 |
Token | utility |
Token ID | 10361 |
Feature activation | -5.86e-02 |
Pos logit contributions | |
fid | +0.060 |
acci | +0.058 |
ank | +0.053 |
obey | +0.051 |
ihil | +0.050 |
Neg logit contributions | |
ARC | -0.055 |
ked | -0.052 |
ILA | -0.049 |
OVA | -0.049 |
pool | -0.047 |
Token | , |
Token ID | 11 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
fid | +0.046 |
acci | +0.044 |
ank | +0.041 |
obey | +0.040 |
obe | +0.039 |
Neg logit contributions | |
ARC | -0.040 |
ked | -0.038 |
ILA | -0.036 |
OVA | -0.036 |
kers | -0.034 |
Token | aesthetic |
Token ID | 19713 |
Feature activation | +7.03e-02 |
Pos logit contributions | |
ARC | +0.015 |
ked | +0.014 |
ILA | +0.014 |
OVA | +0.014 |
pool | +0.013 |
Neg logit contributions | |
fid | -0.017 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | concerns |
Token ID | 4786 |
Feature activation | -5.83e-03 |
Pos logit contributions | |
ARC | +0.047 |
ked | +0.044 |
ILA | +0.041 |
OVA | +0.041 |
pool | +0.039 |
Neg logit contributions | |
fid | -0.057 |
acci | -0.055 |
ank | -0.051 |
obey | -0.049 |
ihil | -0.048 |
Token | are |
Token ID | 389 |
Feature activation | -3.24e-04 |
Pos logit contributions | |
fid | +0.005 |
acci | +0.004 |
ank | +0.004 |
obey | +0.004 |
ihil | +0.004 |
Neg logit contributions | |
ARC | -0.004 |
ked | -0.004 |
ILA | -0.004 |
OVA | -0.004 |
Region | -0.003 |
Token | rarely |
Token ID | 8365 |
Feature activation | +2.47e-01 |
Pos logit contributions | |
fid | +0.000 |
acci | +0.000 |
ank | +0.000 |
obey | +0.000 |
ihil | +0.000 |
Neg logit contributions | |
ARC | -0.000 |
ked | -0.000 |
ILA | -0.000 |
OVA | -0.000 |
pool | -0.000 |
Token | through |
Token ID | 832 |
Feature activation | -8.75e-02 |
Pos logit contributions | |
ARC | +0.071 |
ked | +0.068 |
ILA | +0.064 |
OVA | +0.064 |
pool | +0.061 |
Neg logit contributions | |
fid | -0.070 |
acci | -0.067 |
ank | -0.062 |
obey | -0.059 |
ihil | -0.059 |
Token | 251 |
Token ID | 34489 |
Feature activation | -1.19e-01 |
Pos logit contributions | |
fid | +0.066 |
acci | +0.063 |
ank | +0.059 |
obey | +0.056 |
ihil | +0.055 |
Neg logit contributions | |
ARC | -0.063 |
ked | -0.059 |
ILA | -0.056 |
OVA | -0.056 |
pool | -0.054 |
Token | , |
Token ID | 11 |
Feature activation | -5.85e-03 |
Pos logit contributions | |
fid | +0.088 |
acci | +0.084 |
ank | +0.078 |
obey | +0.074 |
ihil | +0.073 |
Neg logit contributions | |
ARC | -0.088 |
ked | -0.083 |
ILA | -0.078 |
OVA | -0.078 |
pool | -0.075 |
Token | 000 |
Token ID | 830 |
Feature activation | -6.60e-02 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.004 |
ank | +0.004 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.005 |
ked | -0.004 |
ILA | -0.004 |
OVA | -0.004 |
pool | -0.004 |
Token | [ |
Token ID | 685 |
Feature activation | -2.80e-03 |
Pos logit contributions | |
fid | +0.039 |
acci | +0.037 |
ank | +0.033 |
obey | +0.031 |
ihil | +0.031 |
Neg logit contributions | |
ARC | -0.059 |
ked | -0.056 |
ILA | -0.053 |
OVA | -0.053 |
pool | -0.052 |
Token | le |
Token ID | 293 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
fid | +0.002 |
acci | +0.002 |
ank | +0.002 |
obey | +0.002 |
ihil | +0.002 |
Neg logit contributions | |
ARC | -0.002 |
ked | -0.002 |
ILA | -0.002 |
OVA | -0.002 |
pool | -0.002 |
Token | aked |
Token ID | 4335 |
Feature activation | +9.04e-02 |
Pos logit contributions | |
fid | +0.332 |
acci | +0.321 |
ank | +0.298 |
obey | +0.289 |
ihil | +0.288 |
Neg logit contributions | |
ARC | -0.186 |
ked | -0.170 |
ILA | -0.162 |
OVA | -0.160 |
Region | -0.150 |
Token | ] |
Token ID | 60 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
ARC | +0.057 |
ked | +0.054 |
ILA | +0.050 |
OVA | +0.050 |
pool | +0.048 |
Neg logit contributions | |
fid | -0.076 |
acci | -0.073 |
ank | -0.068 |
obey | -0.066 |
ihil | -0.065 |
Token | documents |
Token ID | 4963 |
Feature activation | +4.64e-02 |
Pos logit contributions | |
ARC | +0.014 |
ked | +0.013 |
ILA | +0.012 |
OVA | +0.012 |
pool | +0.011 |
Neg logit contributions | |
fid | -0.016 |
acci | -0.016 |
ank | -0.015 |
obey | -0.014 |
ihil | -0.014 |
Token | – |
Token ID | 784 |
Feature activation | +8.14e-02 |
Pos logit contributions | |
ARC | +0.032 |
ked | +0.031 |
ILA | +0.029 |
OVA | +0.029 |
pool | +0.027 |
Neg logit contributions | |
fid | -0.036 |
acci | -0.035 |
ank | -0.032 |
obey | -0.031 |
ihil | -0.030 |
Token | or |
Token ID | 393 |
Feature activation | +7.19e-02 |
Pos logit contributions | |
ARC | +0.059 |
ked | +0.055 |
ILA | +0.052 |
OVA | +0.052 |
pool | +0.050 |
Neg logit contributions | |
fid | -0.062 |
acci | -0.059 |
ank | -0.054 |
obey | -0.052 |
ihil | -0.051 |
Token | olve |
Token ID | 6442 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
ARC | +0.025 |
ked | +0.024 |
ILA | +0.023 |
OVA | +0.023 |
pool | +0.022 |
Neg logit contributions | |
fid | -0.013 |
acci | -0.012 |
ank | -0.011 |
obey | -0.010 |
ihil | -0.010 |
Token | in |
Token ID | 287 |
Feature activation | -2.12e-03 |
Pos logit contributions | |
fid | +0.308 |
acci | +0.295 |
ank | +0.275 |
obey | +0.264 |
ihil | +0.261 |
Neg logit contributions | |
ARC | -0.249 |
ked | -0.233 |
ILA | -0.219 |
OVA | -0.218 |
pool | -0.208 |
Token | a |
Token ID | 257 |
Feature activation | -1.92e-02 |
Pos logit contributions | |
fid | +0.002 |
acci | +0.002 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.002 |
ked | -0.001 |
OVA | -0.001 |
ILA | -0.001 |
pool | -0.001 |
Token | P |
Token ID | 350 |
Feature activation | +1.37e-01 |
Pos logit contributions | |
fid | +0.014 |
acci | +0.013 |
ank | +0.012 |
obey | +0.012 |
ihil | +0.012 |
Neg logit contributions | |
ARC | -0.014 |
ked | -0.014 |
OVA | -0.013 |
ILA | -0.013 |
pool | -0.012 |
Token | to |
Token ID | 1462 |
Feature activation | -9.48e-02 |
Pos logit contributions | |
ARC | +0.092 |
ked | +0.087 |
ILA | +0.082 |
OVA | +0.082 |
pool | +0.079 |
Neg logit contributions | |
fid | -0.109 |
acci | -0.106 |
ank | -0.097 |
ihil | -0.094 |
obey | -0.093 |
Token | le |
Token ID | 293 |
Feature activation | -4.73e-01 |
Pos logit contributions | |
fid | +0.041 |
acci | +0.038 |
ank | +0.033 |
obey | +0.030 |
ihil | +0.030 |
Neg logit contributions | |
ARC | -0.099 |
ked | -0.095 |
ILA | -0.091 |
OVA | -0.091 |
pool | -0.089 |
Token | ma |
Token ID | 2611 |
Feature activation | +3.21e-02 |
Pos logit contributions | |
fid | +0.394 |
acci | +0.379 |
ank | +0.350 |
obey | +0.340 |
ihil | +0.336 |
Neg logit contributions | |
ARC | -0.305 |
ked | -0.277 |
OVA | -0.268 |
ILA | -0.263 |
Region | -0.252 |
Token | ic |
Token ID | 291 |
Feature activation | +9.94e-02 |
Pos logit contributions | |
ARC | +0.020 |
ked | +0.019 |
ILA | +0.018 |
OVA | +0.018 |
pool | +0.017 |
Neg logit contributions | |
fid | -0.027 |
acci | -0.026 |
ank | -0.024 |
obey | -0.023 |
ihil | -0.023 |
Token | system |
Token ID | 1080 |
Feature activation | +6.20e-02 |
Pos logit contributions | |
ARC | +0.073 |
ked | +0.070 |
OVA | +0.065 |
ILA | +0.065 |
pool | +0.063 |
Neg logit contributions | |
fid | -0.073 |
acci | -0.070 |
ank | -0.065 |
obey | -0.061 |
ihil | -0.061 |
Token | . |
Token ID | 13 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
ARC | +0.042 |
ked | +0.040 |
ILA | +0.037 |
OVA | +0.037 |
pool | +0.035 |
Neg logit contributions | |
fid | -0.050 |
acci | -0.048 |
ank | -0.044 |
obey | -0.042 |
ihil | -0.042 |
Token | It |
Token ID | 632 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
ARC | +0.010 |
ked | +0.010 |
ILA | +0.009 |
OVA | +0.009 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.012 |
acci | -0.012 |
ank | -0.011 |
obey | -0.010 |
ihil | -0.010 |
Token | - |
Token ID | 12 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ARC | +0.043 |
ked | +0.040 |
ILA | +0.038 |
OVA | +0.038 |
pool | +0.036 |
Neg logit contributions | |
fid | -0.043 |
acci | -0.041 |
ank | -0.038 |
obey | -0.036 |
ihil | -0.036 |
Token | rice |
Token ID | 20970 |
Feature activation | +5.56e-02 |
Pos logit contributions | |
fid | +0.018 |
acci | +0.017 |
ank | +0.016 |
obey | +0.015 |
ihil | +0.015 |
Neg logit contributions | |
ARC | -0.016 |
ked | -0.015 |
ILA | -0.014 |
OVA | -0.014 |
pool | -0.013 |
Token | dish |
Token ID | 9433 |
Feature activation | +1.02e-01 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.035 |
OVA | +0.034 |
pool | +0.033 |
Neg logit contributions | |
fid | -0.043 |
acci | -0.041 |
ank | -0.038 |
obey | -0.037 |
ihil | -0.036 |
Token | with |
Token ID | 351 |
Feature activation | -3.72e-02 |
Pos logit contributions | |
ARC | +0.070 |
ked | +0.066 |
ILA | +0.062 |
OVA | +0.062 |
Region | +0.059 |
Neg logit contributions | |
fid | -0.081 |
acci | -0.077 |
ank | -0.072 |
obey | -0.069 |
ihil | -0.068 |
Token | esc |
Token ID | 3671 |
Feature activation | -1.03e-01 |
Pos logit contributions | |
fid | +0.028 |
acci | +0.027 |
ank | +0.025 |
obey | +0.024 |
ihil | +0.023 |
Neg logit contributions | |
ARC | -0.027 |
ked | -0.026 |
ILA | -0.024 |
OVA | -0.024 |
pool | -0.023 |
Token | olar |
Token ID | 6192 |
Feature activation | -4.65e-01 |
Pos logit contributions | |
fid | +0.079 |
acci | +0.076 |
ank | +0.069 |
obey | +0.067 |
ihil | +0.066 |
Neg logit contributions | |
ARC | -0.073 |
ked | -0.068 |
ILA | -0.065 |
OVA | -0.065 |
Region | -0.062 |
Token | and |
Token ID | 290 |
Feature activation | -5.63e-02 |
Pos logit contributions | |
fid | +0.365 |
acci | +0.350 |
ank | +0.325 |
obey | +0.310 |
ihil | +0.305 |
Neg logit contributions | |
ARC | -0.324 |
ked | -0.303 |
ILA | -0.287 |
OVA | -0.286 |
pool | -0.273 |
Token | Chinese |
Token ID | 3999 |
Feature activation | +1.38e-01 |
Pos logit contributions | |
fid | +0.042 |
acci | +0.040 |
ank | +0.037 |
obey | +0.036 |
ihil | +0.035 |
Neg logit contributions | |
ARC | -0.041 |
ked | -0.039 |
ILA | -0.037 |
OVA | -0.036 |
pool | -0.035 |
Token | sausage |
Token ID | 31889 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
ARC | +0.098 |
ked | +0.091 |
ILA | +0.087 |
OVA | +0.087 |
pool | +0.083 |
Neg logit contributions | |
fid | -0.107 |
acci | -0.103 |
ank | -0.095 |
obey | -0.091 |
obe | -0.089 |
Token | that |
Token ID | 326 |
Feature activation | -3.08e-02 |
Pos logit contributions | |
ARC | +0.094 |
ked | +0.088 |
ILA | +0.084 |
OVA | +0.084 |
pool | +0.079 |
Neg logit contributions | |
fid | -0.107 |
acci | -0.102 |
ank | -0.095 |
obey | -0.091 |
ihil | -0.089 |
Token | is |
Token ID | 318 |
Feature activation | -6.33e-02 |
Pos logit contributions | |
fid | +0.023 |
acci | +0.022 |
ank | +0.020 |
obey | +0.020 |
ihil | +0.019 |
Neg logit contributions | |
ARC | -0.022 |
ked | -0.021 |
ILA | -0.020 |
OVA | -0.020 |
pool | -0.019 |
Token | procedures |
Token ID | 9021 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
ARC | +0.200 |
ked | +0.189 |
ILA | +0.178 |
OVA | +0.177 |
pool | +0.170 |
Neg logit contributions | |
fid | -0.203 |
acci | -0.195 |
ank | -0.179 |
obey | -0.172 |
ihil | -0.170 |
Token | . |
Token ID | 13 |
Feature activation | +2.77e-02 |
Pos logit contributions | |
ARC | +0.010 |
ked | +0.010 |
ILA | +0.009 |
OVA | +0.009 |
pool | +0.009 |
Neg logit contributions | |
fid | -0.011 |
acci | -0.011 |
ank | -0.010 |
obey | -0.010 |
ihil | -0.009 |
Token | This |
Token ID | 770 |
Feature activation | +5.86e-02 |
Pos logit contributions | |
ARC | +0.019 |
ked | +0.018 |
ILA | +0.017 |
OVA | +0.017 |
pool | +0.016 |
Neg logit contributions | |
fid | -0.022 |
acci | -0.021 |
ank | -0.020 |
obey | -0.019 |
ihil | -0.019 |
Token | paper |
Token ID | 3348 |
Feature activation | +8.62e-02 |
Pos logit contributions | |
ARC | +0.035 |
ked | +0.032 |
ILA | +0.030 |
OVA | +0.030 |
pool | +0.028 |
Neg logit contributions | |
fid | -0.052 |
acci | -0.050 |
ank | -0.047 |
obey | -0.045 |
ihil | -0.045 |
Token | presents |
Token ID | 10969 |
Feature activation | -2.46e-01 |
Pos logit contributions | |
ARC | +0.069 |
ked | +0.066 |
ILA | +0.062 |
OVA | +0.062 |
pool | +0.060 |
Neg logit contributions | |
fid | -0.058 |
acci | -0.055 |
ank | -0.051 |
obey | -0.048 |
ihil | -0.048 |
Token | behavioral |
Token ID | 17211 |
Feature activation | -3.76e-01 |
Pos logit contributions | |
fid | +0.188 |
acci | +0.180 |
ank | +0.167 |
obey | +0.160 |
ihil | +0.158 |
Neg logit contributions | |
ARC | -0.176 |
ked | -0.166 |
ILA | -0.157 |
OVA | -0.156 |
pool | -0.149 |
Token | results |
Token ID | 2482 |
Feature activation | +4.04e-02 |
Pos logit contributions | |
fid | +0.295 |
acci | +0.282 |
ank | +0.262 |
obey | +0.251 |
ihil | +0.247 |
Neg logit contributions | |
ARC | -0.262 |
ked | -0.246 |
ILA | -0.233 |
OVA | -0.231 |
pool | -0.221 |
Token | using |
Token ID | 1262 |
Feature activation | -2.00e-03 |
Pos logit contributions | |
ARC | +0.029 |
ked | +0.027 |
ILA | +0.025 |
OVA | +0.025 |
pool | +0.024 |
Neg logit contributions | |
fid | -0.031 |
acci | -0.030 |
ank | -0.028 |
obey | -0.027 |
ihil | -0.026 |
Token | this |
Token ID | 428 |
Feature activation | +6.08e-02 |
Pos logit contributions | |
fid | +0.001 |
acci | +0.001 |
ank | +0.001 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.001 |
ked | -0.001 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | platform |
Token ID | 3859 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
ARC | +0.039 |
ked | +0.037 |
ILA | +0.034 |
OVA | +0.034 |
pool | +0.033 |
Neg logit contributions | |
fid | -0.051 |
acci | -0.049 |
ank | -0.046 |
obey | -0.044 |
ihil | -0.043 |
Token | . |
Token ID | 13 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
fid | +0.120 |
acci | +0.115 |
ank | +0.106 |
obey | +0.102 |
ihil | +0.101 |
Neg logit contributions | |
ARC | -0.105 |
ked | -0.099 |
ILA | -0.093 |
OVA | -0.092 |
pool | -0.088 |
Token | � |
Token ID | 447 |
Feature activation | -6.02e-03 |
Pos logit contributions | |
fid | +0.002 |
acci | +0.002 |
ank | +0.002 |
obey | +0.001 |
ihil | +0.001 |
Neg logit contributions | |
ARC | -0.002 |
ked | -0.002 |
ILA | -0.001 |
OVA | -0.001 |
pool | -0.001 |
Token | � |
Token ID | 247 |
Feature activation | -5.72e-03 |
Pos logit contributions | |
fid | +0.005 |
acci | +0.005 |
ank | +0.005 |
obey | +0.005 |
ihil | +0.004 |
Neg logit contributions | |
ARC | -0.004 |
ked | -0.003 |
OVA | -0.003 |
ILA | -0.003 |
kers | -0.003 |
Token | s |
Token ID | 82 |
Feature activation | -3.02e-02 |
Pos logit contributions | |
fid | +0.004 |
acci | +0.004 |
ank | +0.003 |
obey | +0.003 |
ihil | +0.003 |
Neg logit contributions | |
ARC | -0.004 |
ked | -0.004 |
ILA | -0.004 |
OVA | -0.004 |
pool | -0.004 |
Token | Drew |
Token ID | 18624 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
fid | +0.024 |
acci | +0.023 |
ank | +0.022 |
obey | +0.021 |
ihil | +0.020 |
Neg logit contributions | |
ARC | -0.020 |
ked | -0.019 |
ILA | -0.018 |
OVA | -0.018 |
pool | -0.017 |
Token | P |
Token ID | 350 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
ARC | +0.222 |
ked | +0.207 |
ILA | +0.195 |
OVA | +0.195 |
Region | +0.185 |
Neg logit contributions | |
fid | -0.267 |
acci | -0.256 |
ank | -0.238 |
obey | -0.230 |
ihil | -0.228 |
Token | omer |
Token ID | 12057 |
Feature activation | -4.18e-01 |
Pos logit contributions | |
ARC | +0.138 |
ked | +0.133 |
ILA | +0.129 |
OVA | +0.129 |
pool | +0.126 |
Neg logit contributions | |
fid | -0.043 |
acci | -0.039 |
ank | -0.031 |
obey | -0.028 |
ihil | -0.028 |
Token | anz |
Token ID | 35410 |
Feature activation | -6.50e-02 |
Pos logit contributions | |
fid | +0.283 |
acci | +0.269 |
ank | +0.246 |
obey | +0.234 |
ihil | +0.231 |
Neg logit contributions | |
ARC | -0.336 |
ked | -0.319 |
ILA | -0.303 |
OVA | -0.302 |
pool | -0.291 |
Token | and |
Token ID | 290 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
fid | +0.053 |
acci | +0.051 |
ank | +0.047 |
obey | +0.045 |
ihil | +0.045 |
Neg logit contributions | |
ARC | -0.043 |
ked | -0.040 |
ILA | -0.038 |
OVA | -0.038 |
pool | -0.036 |
Token | potentially |
Token ID | 6196 |
Feature activation | -1.69e-01 |
Pos logit contributions | |
fid | +0.012 |
acci | +0.012 |
ank | +0.011 |
obey | +0.010 |
ihil | +0.010 |
Neg logit contributions | |
ARC | -0.012 |
ked | -0.012 |
ILA | -0.011 |
OVA | -0.011 |
pool | -0.010 |
Token | Oakland |
Token ID | 12369 |
Feature activation | -9.03e-02 |
Pos logit contributions | |
fid | +0.128 |
acci | +0.122 |
ank | +0.114 |
obey | +0.109 |
ihil | +0.107 |
Neg logit contributions | |
ARC | -0.122 |
ked | -0.114 |
ILA | -0.109 |
OVA | -0.109 |
pool | -0.104 |
Token | � |
Token ID | 447 |
Feature activation | -5.36e-02 |
Pos logit contributions | |
fid | +0.067 |
acci | +0.064 |
ank | +0.060 |
obey | +0.057 |
ihil | +0.056 |
Neg logit contributions | |
ARC | -0.066 |
ked | -0.062 |
ILA | -0.059 |
OVA | -0.059 |
pool | -0.056 |