Token | some |
Token ID | 617 |
Feature activation | +9.75e-04 |
Pos logit contributions | |
rob | +0.014 |
ie | +0.014 |
co | +0.014 |
glob | +0.013 |
ty | +0.012 |
Neg logit contributions | |
� | -0.013 |
ifying | -0.011 |
Having | -0.011 |
Not | -0.011 |
wins | -0.011 |
Token | big |
Token ID | 1263 |
Feature activation | -1.68e-03 |
Pos logit contributions | |
co | +0.001 |
isk | +0.001 |
fl | +0.001 |
ie | +0.001 |
rob | +0.001 |
Neg logit contributions | |
ite | -0.001 |
� | -0.001 |
ifying | -0.001 |
ending | -0.001 |
Having | -0.001 |
Token | cats |
Token ID | 11875 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
� | +0.002 |
ite | +0.002 |
ago | +0.002 |
ifying | +0.002 |
Having | +0.002 |
Neg logit contributions | |
isk | -0.002 |
ie | -0.002 |
co | -0.002 |
ty | -0.002 |
mar | -0.002 |
Token | around |
Token ID | 1088 |
Feature activation | +3.11e-02 |
Pos logit contributions | |
pots | +0.011 |
ie | +0.011 |
rust | +0.010 |
fl | +0.010 |
ty | +0.010 |
Neg logit contributions | |
ite | -0.017 |
Having | -0.016 |
ending | -0.016 |
ver | -0.016 |
ifying | -0.016 |
Token | here |
Token ID | 994 |
Feature activation | +3.03e-02 |
Pos logit contributions | |
rust | +0.031 |
pots | +0.030 |
glob | +0.030 |
please | +0.029 |
ie | +0.029 |
Neg logit contributions | |
ite | -0.044 |
� | -0.044 |
ifying | -0.044 |
Having | -0.043 |
Doing | -0.042 |
Token | ," |
Token ID | 553 |
Feature activation | +7.92e-02 |
Pos logit contributions | |
ie | +0.032 |
pots | +0.031 |
isk | +0.030 |
fl | +0.030 |
rust | +0.030 |
Neg logit contributions | |
ite | -0.043 |
� | -0.042 |
ver | -0.042 |
ifying | -0.041 |
Having | -0.041 |
Token | warned |
Token ID | 7728 |
Feature activation | +4.91e-02 |
Pos logit contributions | |
pots | +0.138 |
guys | +0.128 |
ger | +0.125 |
ils | +0.124 |
co | +0.123 |
Neg logit contributions | |
� | -0.076 |
ite | -0.071 |
Doing | -0.069 |
From | -0.068 |
It | -0.068 |
Token | H |
Token ID | 367 |
Feature activation | +7.77e-04 |
Pos logit contributions | |
pots | +0.064 |
hunt | +0.058 |
cast | +0.056 |
ils | +0.053 |
pies | +0.052 |
Neg logit contributions | |
� | -0.065 |
ite | -0.063 |
ver | -0.059 |
It | -0.059 |
Its | -0.058 |
Token | oot |
Token ID | 1025 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
ty | +0.001 |
fl | +0.001 |
rust | +0.001 |
Neg logit contributions | |
ite | -0.001 |
Having | -0.001 |
ifying | -0.001 |
ending | -0.001 |
ver | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +2.87e-02 |
Pos logit contributions | |
ending | +0.026 |
ver | +0.026 |
ite | +0.026 |
Having | +0.025 |
� | +0.025 |
Neg logit contributions | |
pots | -0.013 |
guys | -0.012 |
rust | -0.011 |
hunt | -0.011 |
fl | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
ie | +0.050 |
pots | +0.050 |
guys | +0.048 |
ty | +0.046 |
ils | +0.046 |
Neg logit contributions | |
ite | -0.024 |
Having | -0.023 |
ver | -0.023 |
Doing | -0.023 |
ending | -0.022 |
Token | 's |
Token ID | 338 |
Feature activation | +2.28e-02 |
Pos logit contributions | |
ite | +0.013 |
Having | +0.013 |
ending | +0.013 |
ver | +0.012 |
ifying | +0.012 |
Neg logit contributions | |
pots | -0.018 |
ie | -0.018 |
rust | -0.017 |
fl | -0.017 |
ty | -0.017 |
Token | what |
Token ID | 644 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
pots | +0.037 |
fl | +0.035 |
ie | +0.035 |
rob | +0.034 |
cast | +0.034 |
Neg logit contributions | |
� | -0.021 |
ver | -0.020 |
Having | -0.020 |
ending | -0.019 |
ifying | -0.019 |
Token | friends |
Token ID | 2460 |
Feature activation | -5.33e-03 |
Pos logit contributions | |
guys | +0.005 |
pots | +0.005 |
ie | +0.005 |
b | +0.005 |
for | +0.005 |
Neg logit contributions | |
ifying | -0.007 |
igsaw | -0.007 |
ite | -0.006 |
Having | -0.006 |
Since | -0.006 |
Token | are |
Token ID | 389 |
Feature activation | +8.84e-03 |
Pos logit contributions | |
ite | +0.007 |
ending | +0.007 |
Having | +0.007 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
fl | -0.006 |
rust | -0.006 |
ty | -0.006 |
Token | for |
Token ID | 329 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
isk | +0.009 |
ie | +0.008 |
pots | +0.008 |
glob | +0.008 |
co | +0.008 |
Neg logit contributions | |
ending | -0.013 |
glad | -0.013 |
� | -0.013 |
ver | -0.013 |
ite | -0.012 |
Token | ," |
Token ID | 553 |
Feature activation | +7.79e-02 |
Pos logit contributions | |
rust | +0.026 |
fl | +0.025 |
ie | +0.025 |
pots | +0.025 |
cast | +0.024 |
Neg logit contributions | |
� | -0.028 |
ending | -0.027 |
ver | -0.027 |
ite | -0.026 |
Doing | -0.026 |
Token | replied |
Token ID | 8712 |
Feature activation | +3.55e-02 |
Pos logit contributions | |
pots | +0.128 |
guys | +0.115 |
ils | +0.109 |
urg | +0.109 |
ger | +0.109 |
Neg logit contributions | |
ite | -0.087 |
� | -0.087 |
Doing | -0.080 |
From | -0.078 |
Having | -0.076 |
Token | H |
Token ID | 367 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
pots | +0.044 |
hunt | +0.039 |
ie | +0.039 |
cast | +0.037 |
guys | +0.036 |
Neg logit contributions | |
� | -0.049 |
ite | -0.048 |
gol | -0.046 |
ver | -0.046 |
It | -0.046 |
Token | oot |
Token ID | 1025 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ie | +0.005 |
pots | +0.005 |
rust | +0.005 |
ty | +0.005 |
fl | +0.005 |
Neg logit contributions | |
ite | -0.005 |
Having | -0.005 |
ending | -0.005 |
ifying | -0.005 |
ver | -0.005 |
Token | with |
Token ID | 351 |
Feature activation | -2.91e-03 |
Pos logit contributions | |
ver | +0.016 |
ending | +0.016 |
ite | +0.016 |
� | +0.015 |
old | +0.015 |
Neg logit contributions | |
pots | -0.012 |
guys | -0.011 |
hunt | -0.011 |
ger | -0.010 |
rust | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +2.77e-03 |
Pos logit contributions | |
Having | +0.003 |
ifying | +0.003 |
ite | +0.003 |
� | +0.003 |
ending | +0.003 |
Neg logit contributions | |
ie | -0.004 |
pots | -0.004 |
fl | -0.004 |
ty | -0.004 |
co | -0.004 |
Token | looks |
Token ID | 3073 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
ite | +0.005 |
ending | +0.004 |
Having | +0.004 |
ver | +0.004 |
ifying | +0.004 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
rust | -0.006 |
please | -0.006 |
ty | -0.006 |
Token | fun |
Token ID | 1257 |
Feature activation | +9.28e-03 |
Pos logit contributions | |
ie | +0.015 |
isk | +0.015 |
fl | +0.015 |
glob | +0.014 |
pots | +0.014 |
Neg logit contributions | |
� | -0.014 |
ifying | -0.013 |
Having | -0.012 |
glad | -0.012 |
ite | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
isk | +0.012 |
pots | +0.011 |
rust | +0.011 |
god | +0.011 |
ie | +0.011 |
Neg logit contributions | |
ite | -0.012 |
� | -0.011 |
case | -0.011 |
ending | -0.011 |
ver | -0.010 |
Token | play |
Token ID | 711 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
pots | +0.013 |
fl | +0.012 |
god | +0.012 |
ie | +0.012 |
rust | +0.012 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.012 |
� | -0.012 |
've | -0.011 |
Whoever | -0.011 |
Token | in |
Token ID | 287 |
Feature activation | +1.59e-03 |
Pos logit contributions | |
pots | +0.015 |
ie | +0.015 |
fl | +0.015 |
isk | +0.015 |
please | +0.014 |
Neg logit contributions | |
� | -0.014 |
ite | -0.013 |
Jimmy | -0.013 |
case | -0.013 |
Whoever | -0.012 |
Token | ," |
Token ID | 553 |
Feature activation | +7.71e-02 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
hunt | +0.002 |
ty | +0.002 |
them | +0.002 |
Neg logit contributions | |
ending | -0.002 |
ver | -0.002 |
ite | -0.002 |
Having | -0.002 |
ifying | -0.002 |
Token | thought |
Token ID | 1807 |
Feature activation | +4.27e-02 |
Pos logit contributions | |
pots | +0.115 |
ie | +0.105 |
ils | +0.103 |
isk | +0.103 |
ty | +0.103 |
Neg logit contributions | |
ite | -0.093 |
It | -0.086 |
Having | -0.083 |
� | -0.083 |
destruct | -0.082 |
Token | Spe |
Token ID | 2531 |
Feature activation | -4.65e-03 |
Pos logit contributions | |
pots | +0.049 |
ie | +0.048 |
fl | +0.045 |
rust | +0.044 |
ty | +0.044 |
Neg logit contributions | |
ite | -0.060 |
ending | -0.059 |
ver | -0.059 |
Having | -0.058 |
ifying | -0.056 |
Token | edy |
Token ID | 4716 |
Feature activation | -2.24e-03 |
Pos logit contributions | |
ite | +0.006 |
Having | +0.006 |
ending | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
rust | -0.005 |
fl | -0.005 |
ty | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
ver | +0.003 |
ite | +0.003 |
ending | +0.003 |
Having | +0.003 |
� | +0.003 |
Neg logit contributions | |
pots | -0.002 |
fl | -0.002 |
ie | -0.002 |
rust | -0.002 |
ger | -0.002 |
Token | So |
Token ID | 1406 |
Feature activation | +3.51e-02 |
Pos logit contributions | |
ie | +0.050 |
pots | +0.049 |
ty | +0.046 |
ils | +0.045 |
guys | +0.045 |
Neg logit contributions | |
ite | -0.018 |
ver | -0.017 |
Having | -0.017 |
Through | -0.016 |
Doing | -0.016 |
Token | we |
Token ID | 356 |
Feature activation | +3.59e-03 |
Pos logit contributions | |
ie | +0.023 |
pots | +0.023 |
rust | +0.022 |
fl | +0.022 |
ty | +0.022 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.015 |
ending | -0.015 |
ver | -0.015 |
ifying | -0.015 |
Token | can |
Token ID | 460 |
Feature activation | -8.33e-03 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
guys | +0.005 |
rust | +0.005 |
hunt | +0.005 |
Neg logit contributions | |
ite | -0.004 |
Having | -0.004 |
ending | -0.004 |
ver | -0.003 |
ifying | -0.003 |
Token | borrow |
Token ID | 8804 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
ite | +0.011 |
Having | +0.010 |
ending | +0.010 |
ver | +0.010 |
ifying | +0.010 |
Neg logit contributions | |
pots | -0.010 |
ie | -0.010 |
fl | -0.010 |
rust | -0.010 |
guys | -0.009 |
Token | his |
Token ID | 465 |
Feature activation | -2.65e-03 |
Pos logit contributions | |
ite | +0.013 |
ifying | +0.013 |
� | +0.012 |
Having | +0.012 |
ending | +0.012 |
Neg logit contributions | |
ie | -0.016 |
rust | -0.015 |
isk | -0.015 |
fl | -0.015 |
pots | -0.015 |
Token | mixer |
Token ID | 33938 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
ite | +0.003 |
Having | +0.003 |
ending | +0.003 |
ifying | +0.003 |
ver | +0.003 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
rust | -0.003 |
ty | -0.003 |
fl | -0.003 |
Token | ," |
Token ID | 553 |
Feature activation | +7.28e-02 |
Pos logit contributions | |
rust | +0.021 |
pots | +0.020 |
fl | +0.019 |
rob | +0.018 |
ie | +0.018 |
Neg logit contributions | |
ite | -0.025 |
ver | -0.024 |
� | -0.023 |
case | -0.022 |
ending | -0.021 |
Token | Sam |
Token ID | 3409 |
Feature activation | +2.24e-02 |
Pos logit contributions | |
pots | +0.109 |
guys | +0.107 |
ils | +0.106 |
ger | +0.105 |
hunt | +0.103 |
Neg logit contributions | |
ite | -0.073 |
Having | -0.073 |
� | -0.073 |
Doing | -0.072 |
It | -0.069 |
Token | said |
Token ID | 531 |
Feature activation | +3.33e-03 |
Pos logit contributions | |
pots | +0.030 |
fl | +0.029 |
guys | +0.028 |
cast | +0.028 |
ger | +0.028 |
Neg logit contributions | |
ver | -0.029 |
� | -0.029 |
ending | -0.026 |
ite | -0.025 |
Jimmy | -0.025 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
pots | +0.003 |
fl | +0.003 |
ie | +0.003 |
rob | +0.003 |
hunt | +0.003 |
Neg logit contributions | |
ver | -0.005 |
� | -0.005 |
ending | -0.005 |
ite | -0.005 |
Jimmy | -0.004 |
Token | " |
Token ID | 366 |
Feature activation | +6.32e-03 |
Pos logit contributions | |
ie | +0.028 |
pots | +0.027 |
ty | +0.026 |
guys | +0.026 |
rust | +0.025 |
Neg logit contributions | |
ite | -0.015 |
Having | -0.014 |
ver | -0.014 |
ending | -0.014 |
Doing | -0.013 |
Token | He |
Token ID | 1544 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
rust | +0.008 |
co | +0.008 |
fl | +0.008 |
Neg logit contributions | |
ite | -0.007 |
ending | -0.007 |
ifying | -0.007 |
Having | -0.006 |
ver | -0.006 |
Token | 'm |
Token ID | 1101 |
Feature activation | +2.50e-03 |
Pos logit contributions | |
ite | +0.008 |
Having | +0.008 |
ending | +0.008 |
ifying | +0.008 |
ver | +0.008 |
Neg logit contributions | |
ie | -0.011 |
pots | -0.011 |
fl | -0.010 |
rust | -0.010 |
hunt | -0.010 |
Token | looking |
Token ID | 2045 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
rust | +0.002 |
fl | +0.002 |
ty | +0.002 |
Neg logit contributions | |
ite | -0.004 |
Having | -0.004 |
ending | -0.004 |
ver | -0.003 |
ifying | -0.003 |
Token | for |
Token ID | 329 |
Feature activation | +2.09e-02 |
Pos logit contributions | |
pots | +0.006 |
co | +0.006 |
isk | +0.006 |
rust | +0.006 |
fl | +0.006 |
Neg logit contributions | |
ite | -0.021 |
� | -0.021 |
ending | -0.021 |
ifying | -0.021 |
Doing | -0.021 |
Token | some |
Token ID | 617 |
Feature activation | +1.56e-02 |
Pos logit contributions | |
ie | +0.032 |
cast | +0.032 |
ho | +0.031 |
fl | +0.031 |
co | +0.031 |
Neg logit contributions | |
� | -0.019 |
Having | -0.018 |
ending | -0.018 |
Through | -0.017 |
Its | -0.017 |
Token | cheese |
Token ID | 9891 |
Feature activation | +2.82e-02 |
Pos logit contributions | |
ie | +0.015 |
isk | +0.015 |
pots | +0.015 |
fl | +0.015 |
ty | +0.014 |
Neg logit contributions | |
ite | -0.023 |
ending | -0.022 |
ifying | -0.022 |
Having | -0.022 |
� | -0.022 |
Token | ," |
Token ID | 553 |
Feature activation | +7.21e-02 |
Pos logit contributions | |
isk | +0.030 |
rust | +0.029 |
ie | +0.029 |
fl | +0.029 |
pots | +0.029 |
Neg logit contributions | |
ite | -0.040 |
� | -0.038 |
case | -0.037 |
ver | -0.036 |
ending | -0.035 |
Token | replied |
Token ID | 8712 |
Feature activation | +3.65e-02 |
Pos logit contributions | |
pots | +0.126 |
guys | +0.116 |
cast | +0.115 |
ils | +0.114 |
co | +0.113 |
Neg logit contributions | |
� | -0.071 |
Doing | -0.061 |
It | -0.061 |
ite | -0.060 |
From | -0.058 |
Token | S |
Token ID | 311 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
pots | +0.044 |
cast | +0.039 |
ie | +0.039 |
co | +0.038 |
ils | +0.038 |
Neg logit contributions | |
� | -0.050 |
ite | -0.048 |
It | -0.047 |
ver | -0.047 |
Its | -0.047 |
Token | que |
Token ID | 4188 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
pots | +0.027 |
ie | +0.023 |
guys | +0.023 |
hunt | +0.023 |
rust | +0.023 |
Neg logit contributions | |
ite | -0.035 |
ending | -0.035 |
ver | -0.034 |
Having | -0.033 |
Doing | -0.032 |
Token | ak |
Token ID | 461 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
pots | +0.004 |
fl | +0.004 |
guys | +0.004 |
rust | +0.004 |
ie | +0.004 |
Neg logit contributions | |
ending | -0.001 |
ite | -0.001 |
Having | -0.001 |
ver | -0.001 |
earing | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +2.47e-02 |
Pos logit contributions | |
pots | +0.014 |
guys | +0.014 |
ger | +0.013 |
rob | +0.013 |
fl | +0.013 |
Neg logit contributions | |
ending | -0.021 |
ver | -0.021 |
ite | -0.020 |
� | -0.020 |
Having | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +9.03e-03 |
Pos logit contributions | |
ite | +0.013 |
ending | +0.012 |
ver | +0.011 |
� | +0.011 |
ifying | +0.011 |
Neg logit contributions | |
pots | -0.008 |
isk | -0.008 |
fl | -0.008 |
ie | -0.007 |
rust | -0.007 |
Token | What |
Token ID | 1867 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
pots | +0.013 |
S | +0.013 |
ie | +0.013 |
fl | +0.013 |
guys | +0.013 |
Neg logit contributions | |
ending | -0.010 |
ite | -0.010 |
Having | -0.009 |
igsaw | -0.009 |
ver | -0.009 |
Token | 's |
Token ID | 338 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
pots | +0.019 |
ie | +0.019 |
guys | +0.018 |
hunt | +0.018 |
rust | +0.017 |
Neg logit contributions | |
ite | -0.024 |
ifying | -0.024 |
Having | -0.023 |
ending | -0.023 |
igsaw | -0.023 |
Token | your |
Token ID | 534 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
pots | +0.038 |
ie | +0.037 |
rust | +0.036 |
fl | +0.036 |
ty | +0.035 |
Neg logit contributions | |
ite | -0.027 |
Having | -0.026 |
ending | -0.025 |
ifying | -0.025 |
ver | -0.024 |
Token | name |
Token ID | 1438 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
ie | +0.025 |
pots | +0.024 |
ty | +0.023 |
rust | +0.023 |
co | +0.023 |
Neg logit contributions | |
ite | -0.010 |
Having | -0.010 |
ending | -0.009 |
ifying | -0.009 |
ver | -0.009 |
Token | ?" |
Token ID | 1701 |
Feature activation | +7.05e-02 |
Pos logit contributions | |
pots | +0.037 |
bank | +0.036 |
isk | +0.035 |
cast | +0.034 |
ger | +0.034 |
Neg logit contributions | |
ite | -0.018 |
ver | -0.016 |
� | -0.016 |
case | -0.015 |
It | -0.014 |
Token | Bub |
Token ID | 19645 |
Feature activation | +8.93e-03 |
Pos logit contributions | |
pots | +0.096 |
isk | +0.094 |
co | +0.093 |
glob | +0.088 |
ty | +0.087 |
Neg logit contributions | |
� | -0.088 |
It | -0.085 |
Through | -0.084 |
Having | -0.083 |
ite | -0.082 |
Token | bles |
Token ID | 7689 |
Feature activation | -2.36e-03 |
Pos logit contributions | |
pots | +0.013 |
rust | +0.012 |
ger | +0.011 |
fl | +0.011 |
glob | +0.011 |
Neg logit contributions | |
ite | -0.010 |
ver | -0.010 |
ending | -0.010 |
Having | -0.010 |
erv | -0.009 |
Token | asked |
Token ID | 1965 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
ite | +0.003 |
ending | +0.003 |
ver | +0.003 |
Having | +0.003 |
� | +0.003 |
Neg logit contributions | |
pots | -0.003 |
fl | -0.002 |
guys | -0.002 |
ger | -0.002 |
isk | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +2.94e-02 |
Pos logit contributions | |
pots | +0.022 |
co | +0.021 |
rob | +0.021 |
fl | +0.021 |
ger | +0.020 |
Neg logit contributions | |
ver | -0.031 |
� | -0.029 |
Through | -0.027 |
ite | -0.027 |
ending | -0.027 |
Token |
|
Token ID | 198 |
Feature activation | +2.43e-02 |
Pos logit contributions | |
ie | +0.051 |
pots | +0.050 |
ty | +0.048 |
co | +0.047 |
guys | +0.047 |
Neg logit contributions | |
ite | -0.024 |
Having | -0.023 |
ver | -0.023 |
Through | -0.022 |
Doing | -0.022 |
Token | Thank |
Token ID | 10449 |
Feature activation | -5.34e-03 |
Pos logit contributions | |
fl | +0.027 |
ie | +0.027 |
rust | +0.027 |
pots | +0.027 |
ty | +0.027 |
Neg logit contributions | |
ite | -0.035 |
ver | -0.034 |
ending | -0.034 |
ifying | -0.033 |
igsaw | -0.033 |
Token | you |
Token ID | 345 |
Feature activation | +3.18e-03 |
Pos logit contributions | |
� | +0.004 |
ite | +0.004 |
ending | +0.004 |
itt | +0.003 |
Jimmy | +0.003 |
Neg logit contributions | |
pots | -0.010 |
cast | -0.010 |
bank | -0.009 |
rust | -0.009 |
glob | -0.009 |
Token | for |
Token ID | 329 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
pots | +0.004 |
fl | +0.004 |
please | +0.004 |
bank | +0.004 |
we | +0.004 |
Neg logit contributions | |
� | -0.004 |
ver | -0.004 |
glad | -0.004 |
case | -0.004 |
From | -0.004 |
Token | saving |
Token ID | 8914 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
pots | +0.041 |
cast | +0.041 |
ie | +0.039 |
fl | +0.037 |
guys | +0.037 |
Neg logit contributions | |
glad | -0.031 |
Having | -0.029 |
Despite | -0.027 |
ending | -0.027 |
Learning | -0.026 |
Token | me |
Token ID | 502 |
Feature activation | +1.33e-03 |
Pos logit contributions | |
umm | +0.041 |
cast | +0.041 |
rob | +0.040 |
rust | +0.040 |
pots | +0.040 |
Neg logit contributions | |
my | -0.027 |
� | -0.024 |
your | -0.020 |
My | -0.019 |
It | -0.019 |
Token | ," |
Token ID | 553 |
Feature activation | +6.99e-02 |
Pos logit contributions | |
pots | +0.001 |
fl | +0.001 |
guys | +0.001 |
please | +0.001 |
ones | +0.001 |
Neg logit contributions | |
ite | -0.002 |
ending | -0.002 |
� | -0.002 |
ver | -0.002 |
case | -0.002 |
Token | Tweet |
Token ID | 18752 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
pots | +0.118 |
cast | +0.114 |
guys | +0.111 |
ils | +0.111 |
urg | +0.110 |
Neg logit contributions | |
� | -0.063 |
Doing | -0.059 |
From | -0.058 |
It | -0.057 |
Having | -0.054 |
Token | ie |
Token ID | 494 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
pots | +0.015 |
guys | +0.014 |
fl | +0.013 |
ger | +0.013 |
glob | +0.013 |
Neg logit contributions | |
� | -0.015 |
ver | -0.015 |
ite | -0.014 |
Having | -0.014 |
Doing | -0.014 |
Token | said |
Token ID | 531 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
pots | +0.012 |
guys | +0.011 |
fl | +0.011 |
ie | +0.010 |
hunt | +0.010 |
Neg logit contributions | |
� | -0.015 |
ver | -0.015 |
ite | -0.015 |
Having | -0.015 |
ending | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
ver | +0.003 |
ending | +0.002 |
ite | +0.002 |
� | +0.002 |
Having | +0.002 |
Neg logit contributions | |
pots | -0.002 |
fl | -0.002 |
ie | -0.002 |
guys | -0.002 |
hunt | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -6.55e-03 |
Pos logit contributions | |
pots | +0.019 |
ils | +0.017 |
fl | +0.017 |
guys | +0.016 |
co | +0.016 |
Neg logit contributions | |
Having | -0.013 |
Having | -0.012 |
Since | -0.012 |
It | -0.012 |
glad | -0.011 |
Token | Let |
Token ID | 5756 |
Feature activation | +6.63e-03 |
Pos logit contributions | |
pots | +0.056 |
ie | +0.055 |
guys | +0.052 |
rust | +0.052 |
hunt | +0.052 |
Neg logit contributions | |
ite | -0.044 |
Having | -0.043 |
ending | -0.043 |
ifying | -0.041 |
Doing | -0.040 |
Token | 's |
Token ID | 338 |
Feature activation | -6.03e-03 |
Pos logit contributions | |
pots | +0.012 |
glob | +0.012 |
cast | +0.012 |
rust | +0.012 |
rob | +0.012 |
Neg logit contributions | |
� | -0.006 |
ending | -0.005 |
ite | -0.004 |
Having | -0.004 |
Doing | -0.004 |
Token | pitch |
Token ID | 7078 |
Feature activation | -1.86e-02 |
Pos logit contributions | |
ending | +0.010 |
Having | +0.010 |
ite | +0.010 |
ver | +0.010 |
igsaw | +0.010 |
Neg logit contributions | |
hunt | -0.005 |
pots | -0.005 |
ie | -0.005 |
guys | -0.005 |
ty | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | -2.60e-02 |
Pos logit contributions | |
ite | +0.028 |
Having | +0.026 |
ending | +0.026 |
ver | +0.026 |
ifying | +0.026 |
Neg logit contributions | |
pots | -0.020 |
ie | -0.019 |
rust | -0.018 |
fl | -0.018 |
ty | -0.018 |
Token | ball |
Token ID | 2613 |
Feature activation | -1.16e-03 |
Pos logit contributions | |
ending | +0.038 |
Having | +0.037 |
ver | +0.037 |
Doing | +0.036 |
ite | +0.036 |
Neg logit contributions | |
pots | -0.029 |
hunt | -0.028 |
b | -0.027 |
rust | -0.027 |
guys | -0.027 |
Token | ," |
Token ID | 553 |
Feature activation | +6.98e-02 |
Pos logit contributions | |
ite | +0.002 |
ending | +0.002 |
ver | +0.002 |
Having | +0.002 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rust | -0.001 |
fl | -0.001 |
ty | -0.001 |
Token | she |
Token ID | 673 |
Feature activation | +3.81e-03 |
Pos logit contributions | |
guys | +0.106 |
isk | +0.104 |
rob | +0.103 |
hunt | +0.101 |
ils | +0.100 |
Neg logit contributions | |
� | -0.078 |
It | -0.077 |
Through | -0.073 |
Having | -0.073 |
ite | -0.072 |
Token | said |
Token ID | 531 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
fl | +0.004 |
guys | +0.004 |
hunt | +0.004 |
Neg logit contributions | |
ver | -0.005 |
� | -0.005 |
ending | -0.005 |
ite | -0.005 |
Having | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +3.70e-02 |
Pos logit contributions | |
ver | +0.004 |
ending | +0.004 |
� | +0.004 |
ite | +0.004 |
Having | +0.004 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
guys | -0.002 |
rob | -0.002 |
fl | -0.002 |
Token | Suz |
Token ID | 22691 |
Feature activation | +1.64e-02 |
Pos logit contributions | |
ie | +0.050 |
guys | +0.049 |
pots | +0.048 |
hunt | +0.047 |
ty | +0.047 |
Neg logit contributions | |
Through | -0.042 |
ite | -0.042 |
Having | -0.042 |
� | -0.042 |
ver | -0.041 |
Token | ie |
Token ID | 494 |
Feature activation | -1.98e-02 |
Pos logit contributions | |
pots | +0.004 |
guys | +0.003 |
hunt | +0.003 |
rust | +0.002 |
fl | +0.001 |
Neg logit contributions | |
ite | -0.037 |
ending | -0.037 |
Having | -0.037 |
ver | -0.036 |
Doing | -0.036 |
Token | . |
Token ID | 13 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
pots | +0.022 |
rust | +0.021 |
guys | +0.020 |
ie | +0.019 |
ger | +0.019 |
Neg logit contributions | |
ite | -0.036 |
ver | -0.036 |
� | -0.036 |
ifying | -0.036 |
Having | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | +1.85e-02 |
Pos logit contributions | |
pots | +0.035 |
ie | +0.034 |
fl | +0.032 |
rust | +0.032 |
ty | +0.032 |
Neg logit contributions | |
ite | -0.024 |
ending | -0.023 |
Having | -0.023 |
ifying | -0.023 |
ver | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
ie | +0.027 |
pots | +0.027 |
ty | +0.026 |
rust | +0.026 |
fl | +0.025 |
Neg logit contributions | |
ite | -0.019 |
ifying | -0.019 |
ending | -0.018 |
Having | -0.018 |
ver | -0.018 |
Token | " |
Token ID | 1 |
Feature activation | +2.10e-02 |
Pos logit contributions | |
ie | +0.014 |
pots | +0.014 |
rust | +0.013 |
fl | +0.013 |
ty | +0.013 |
Neg logit contributions | |
ifying | -0.013 |
ite | -0.012 |
ver | -0.012 |
ending | -0.012 |
Having | -0.011 |
Token | Mom |
Token ID | 29252 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
pots | +0.025 |
ie | +0.024 |
fl | +0.024 |
rust | +0.023 |
ty | +0.023 |
Neg logit contributions | |
ite | -0.029 |
ending | -0.028 |
ver | -0.028 |
Having | -0.027 |
ifying | -0.027 |
Token | !" |
Token ID | 2474 |
Feature activation | +6.85e-02 |
Pos logit contributions | |
pots | +0.023 |
rust | +0.021 |
guys | +0.021 |
ger | +0.021 |
hunt | +0.020 |
Neg logit contributions | |
ite | -0.025 |
ver | -0.025 |
ending | -0.024 |
� | -0.024 |
Doing | -0.023 |
Token | Jan |
Token ID | 2365 |
Feature activation | +2.35e-02 |
Pos logit contributions | |
rob | +0.103 |
isk | +0.103 |
ty | +0.102 |
guys | +0.102 |
co | +0.101 |
Neg logit contributions | |
� | -0.078 |
ite | -0.077 |
Through | -0.073 |
It | -0.073 |
Having | -0.071 |
Token | ie |
Token ID | 494 |
Feature activation | +5.95e-03 |
Pos logit contributions | |
pots | +0.007 |
hunt | +0.006 |
guys | +0.005 |
rust | +0.005 |
fl | +0.004 |
Neg logit contributions | |
ite | -0.053 |
ending | -0.052 |
Having | -0.051 |
ver | -0.051 |
� | -0.050 |
Token | called |
Token ID | 1444 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
guys | +0.006 |
fl | +0.006 |
rust | +0.005 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.009 |
ver | -0.009 |
ending | -0.009 |
� | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +6.66e-03 |
Pos logit contributions | |
rob | +0.013 |
fl | +0.012 |
please | +0.012 |
ie | +0.012 |
ils | +0.011 |
Neg logit contributions | |
� | -0.017 |
ver | -0.016 |
erv | -0.015 |
Through | -0.015 |
case | -0.015 |
Token | " |
Token ID | 366 |
Feature activation | +4.33e-03 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
rust | +0.009 |
fl | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.007 |
ending | -0.007 |
ver | -0.006 |
ifying | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.43e-02 |
Pos logit contributions | |
pots | +0.037 |
ie | +0.037 |
guys | +0.035 |
rust | +0.035 |
fl | +0.035 |
Neg logit contributions | |
ite | -0.020 |
Having | -0.019 |
ending | -0.019 |
ver | -0.018 |
ifying | -0.018 |
Token | " |
Token ID | 1 |
Feature activation | +3.08e-02 |
Pos logit contributions | |
ie | +0.021 |
pots | +0.021 |
rust | +0.020 |
fl | +0.020 |
ty | +0.020 |
Neg logit contributions | |
ite | -0.015 |
ver | -0.014 |
ifying | -0.014 |
ending | -0.014 |
Having | -0.014 |
Token | Oh |
Token ID | 5812 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
ie | +0.043 |
pots | +0.043 |
fl | +0.041 |
rust | +0.041 |
ty | +0.040 |
Neg logit contributions | |
ite | -0.035 |
ending | -0.034 |
Having | -0.033 |
ver | -0.033 |
ifying | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | +1.23e-02 |
Pos logit contributions | |
pots | +0.021 |
hunt | +0.020 |
ie | +0.019 |
co | +0.019 |
please | +0.019 |
Neg logit contributions | |
ite | -0.017 |
ver | -0.017 |
� | -0.016 |
ifying | -0.016 |
ending | -0.016 |
Token | look |
Token ID | 804 |
Feature activation | +4.79e-03 |
Pos logit contributions | |
pots | +0.016 |
ie | +0.015 |
rust | +0.014 |
fl | +0.014 |
ty | +0.014 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.015 |
ending | -0.015 |
ver | -0.015 |
ifying | -0.015 |
Token | ," |
Token ID | 553 |
Feature activation | +6.81e-02 |
Pos logit contributions | |
pots | +0.006 |
bank | +0.006 |
hunt | +0.006 |
isk | +0.006 |
rust | +0.006 |
Neg logit contributions | |
ifying | -0.006 |
� | -0.006 |
ite | -0.006 |
ver | -0.006 |
ending | -0.006 |
Token | B |
Token ID | 347 |
Feature activation | +1.97e-02 |
Pos logit contributions | |
pots | +0.094 |
isk | +0.092 |
cast | +0.088 |
hunt | +0.087 |
co | +0.087 |
Neg logit contributions | |
� | -0.090 |
ite | -0.084 |
Doing | -0.077 |
Having | -0.077 |
It | -0.075 |
Token | ess |
Token ID | 408 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
pots | +0.027 |
hunt | +0.024 |
guys | +0.024 |
rust | +0.024 |
ie | +0.024 |
Neg logit contributions | |
ite | -0.025 |
ending | -0.025 |
Having | -0.024 |
ver | -0.024 |
Doing | -0.023 |
Token | ie |
Token ID | 494 |
Feature activation | +9.37e-03 |
Pos logit contributions | |
pots | +0.006 |
guys | +0.004 |
hunt | +0.004 |
ger | +0.002 |
fl | +0.002 |
Neg logit contributions | |
ending | -0.040 |
ite | -0.040 |
Having | -0.040 |
ver | -0.040 |
� | -0.039 |
Token | said |
Token ID | 531 |
Feature activation | -1.40e-03 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
guys | +0.009 |
fl | +0.008 |
hunt | +0.008 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.014 |
Having | -0.014 |
ver | -0.014 |
� | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | +1.16e-02 |
Pos logit contributions | |
ver | +0.002 |
� | +0.002 |
ending | +0.002 |
ite | +0.002 |
Having | +0.002 |
Neg logit contributions | |
pots | -0.002 |
rob | -0.001 |
ie | -0.001 |
guys | -0.001 |
hunt | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
bank | +0.005 |
isk | +0.005 |
ie | +0.005 |
please | +0.005 |
hunt | +0.005 |
Neg logit contributions | |
ite | -0.004 |
� | -0.004 |
It | -0.004 |
ifying | -0.004 |
Doing | -0.004 |
Token | valley |
Token ID | 19272 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
ie | +0.013 |
isk | +0.012 |
ty | +0.012 |
pots | +0.012 |
please | +0.011 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.014 |
ifying | -0.014 |
ending | -0.014 |
case | -0.014 |
Token | with |
Token ID | 351 |
Feature activation | +5.86e-03 |
Pos logit contributions | |
ite | +0.033 |
ver | +0.031 |
ending | +0.031 |
Having | +0.031 |
� | +0.030 |
Neg logit contributions | |
pots | -0.022 |
ie | -0.021 |
rust | -0.020 |
fl | -0.020 |
guys | -0.020 |
Token | pretty |
Token ID | 2495 |
Feature activation | -1.31e-03 |
Pos logit contributions | |
ie | +0.007 |
fl | +0.007 |
ty | +0.007 |
rust | +0.007 |
rob | +0.007 |
Neg logit contributions | |
ite | -0.007 |
ifying | -0.007 |
Having | -0.007 |
ending | -0.007 |
� | -0.007 |
Token | colors |
Token ID | 7577 |
Feature activation | -3.79e-03 |
Pos logit contributions | |
ite | +0.002 |
Having | +0.002 |
ending | +0.002 |
ifying | +0.002 |
ver | +0.002 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rust | -0.001 |
ty | -0.001 |
fl | -0.001 |
Token | ," |
Token ID | 553 |
Feature activation | +6.77e-02 |
Pos logit contributions | |
Having | +0.006 |
ending | +0.006 |
ite | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
rust | -0.003 |
fl | -0.003 |
ty | -0.003 |
Token | she |
Token ID | 673 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
isk | +0.107 |
cast | +0.097 |
co | +0.096 |
urg | +0.096 |
pots | +0.095 |
Neg logit contributions | |
� | -0.074 |
ite | -0.073 |
It | -0.072 |
Through | -0.067 |
Having | -0.065 |
Token | said |
Token ID | 531 |
Feature activation | +5.75e-03 |
Pos logit contributions | |
pots | +0.018 |
fl | +0.018 |
ie | +0.018 |
isk | +0.017 |
cast | +0.017 |
Neg logit contributions | |
ver | -0.022 |
ite | -0.021 |
� | -0.021 |
ending | -0.020 |
presses | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +3.79e-02 |
Pos logit contributions | |
ie | +0.005 |
pots | +0.005 |
fl | +0.005 |
guys | +0.004 |
ty | +0.004 |
Neg logit contributions | |
ver | -0.010 |
ending | -0.009 |
ite | -0.009 |
Having | -0.009 |
� | -0.009 |
Token | Bella |
Token ID | 39304 |
Feature activation | -7.52e-03 |
Pos logit contributions | |
ie | +0.050 |
pots | +0.048 |
ty | +0.046 |
isk | +0.045 |
co | +0.044 |
Neg logit contributions | |
ite | -0.046 |
ver | -0.045 |
Through | -0.045 |
Having | -0.044 |
ending | -0.044 |
Token | asked |
Token ID | 1965 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
ite | +0.010 |
Having | +0.010 |
ending | +0.010 |
ver | +0.010 |
ifying | +0.009 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
rust | -0.008 |
fl | -0.008 |
guys | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +2.03e-02 |
Pos logit contributions | |
pots | +0.045 |
ie | +0.044 |
rust | +0.042 |
fl | +0.042 |
ty | +0.042 |
Neg logit contributions | |
ite | -0.027 |
ending | -0.026 |
Having | -0.026 |
ifying | -0.026 |
ver | -0.025 |
Token | " |
Token ID | 1 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
pots | +0.028 |
ie | +0.028 |
rust | +0.026 |
fl | +0.026 |
ty | +0.026 |
Neg logit contributions | |
ite | -0.024 |
Having | -0.023 |
ending | -0.023 |
ver | -0.022 |
ifying | -0.022 |
Token | A |
Token ID | 32 |
Feature activation | +2.05e-02 |
Pos logit contributions | |
pots | +0.016 |
fl | +0.015 |
rust | +0.015 |
please | +0.015 |
co | +0.015 |
Neg logit contributions | |
ite | -0.013 |
ver | -0.013 |
igsaw | -0.013 |
ending | -0.013 |
ifying | -0.012 |
Token | shiny |
Token ID | 22441 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
pots | +0.024 |
ie | +0.024 |
rust | +0.022 |
guys | +0.022 |
hunt | +0.022 |
Neg logit contributions | |
ite | -0.028 |
Having | -0.027 |
ending | -0.027 |
ifying | -0.027 |
ver | -0.027 |
Token | key |
Token ID | 1994 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
ending | +0.018 |
Having | +0.018 |
ite | +0.018 |
ifying | +0.018 |
ver | +0.018 |
Neg logit contributions | |
pots | -0.015 |
ie | -0.015 |
guys | -0.014 |
rust | -0.014 |
for | -0.013 |
Token | ," |
Token ID | 553 |
Feature activation | +6.76e-02 |
Pos logit contributions | |
pots | +0.015 |
ie | +0.015 |
rust | +0.014 |
fl | +0.014 |
guys | +0.014 |
Neg logit contributions | |
ite | -0.024 |
ending | -0.023 |
ver | -0.023 |
Having | -0.023 |
ifying | -0.023 |
Token | Jan |
Token ID | 2365 |
Feature activation | +2.18e-02 |
Pos logit contributions | |
ger | +0.097 |
isk | +0.094 |
guys | +0.094 |
ty | +0.092 |
rob | +0.091 |
Neg logit contributions | |
� | -0.082 |
ite | -0.079 |
Having | -0.077 |
Using | -0.075 |
Through | -0.075 |
Token | ie |
Token ID | 494 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
pots | +0.007 |
hunt | +0.005 |
rust | +0.005 |
guys | +0.005 |
ger | +0.003 |
Neg logit contributions | |
ending | -0.049 |
ite | -0.049 |
Having | -0.048 |
ver | -0.048 |
Doing | -0.047 |
Token | answered |
Token ID | 9373 |
Feature activation | -8.78e-03 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
guys | +0.005 |
fl | +0.005 |
rust | +0.005 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.009 |
ending | -0.009 |
ver | -0.009 |
� | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
� | +0.013 |
ver | +0.013 |
Having | +0.012 |
ending | +0.012 |
ite | +0.012 |
Neg logit contributions | |
rob | -0.009 |
pots | -0.009 |
guys | -0.009 |
hunt | -0.009 |
fl | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +7.93e-03 |
Pos logit contributions | |
ie | +0.031 |
pots | +0.031 |
ty | +0.029 |
guys | +0.029 |
rust | +0.029 |
Neg logit contributions | |
ite | -0.020 |
Having | -0.020 |
ending | -0.020 |
ver | -0.019 |
Doing | -0.019 |
Token |
|
Token ID | 198 |
Feature activation | -3.49e-03 |
Pos logit contributions | |
ie | +0.004 |
pots | +0.004 |
S | +0.004 |
them | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ifying | -0.004 |
ending | -0.004 |
ite | -0.004 |
igsaw | -0.004 |
ver | -0.004 |
Token | " |
Token ID | 1 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ifying | +0.005 |
ending | +0.005 |
ite | +0.004 |
ver | +0.004 |
igsaw | +0.004 |
Neg logit contributions | |
ie | -0.004 |
pots | -0.004 |
S | -0.004 |
b | -0.004 |
them | -0.004 |
Token | Ch |
Token ID | 1925 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
pots | +0.016 |
rust | +0.015 |
co | +0.014 |
fl | +0.014 |
please | +0.014 |
Neg logit contributions | |
ver | -0.016 |
ite | -0.016 |
ending | -0.016 |
igsaw | -0.016 |
osity | -0.015 |
Token | ocolate |
Token ID | 9140 |
Feature activation | +4.88e-03 |
Pos logit contributions | |
ie | +0.007 |
pots | +0.006 |
ty | +0.006 |
isk | +0.006 |
co | +0.006 |
Neg logit contributions | |
ite | -0.006 |
ifying | -0.006 |
Having | -0.006 |
ending | -0.006 |
ver | -0.006 |
Token | cake |
Token ID | 12187 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.005 |
isk | +0.005 |
rust | +0.005 |
hunt | +0.005 |
Neg logit contributions | |
ite | -0.006 |
� | -0.006 |
ending | -0.006 |
ver | -0.006 |
Having | -0.006 |
Token | ," |
Token ID | 553 |
Feature activation | +6.68e-02 |
Pos logit contributions | |
isk | +0.020 |
pots | +0.018 |
rust | +0.018 |
ie | +0.017 |
please | +0.017 |
Neg logit contributions | |
ite | -0.022 |
� | -0.022 |
ending | -0.020 |
ver | -0.020 |
case | -0.020 |
Token | her |
Token ID | 607 |
Feature activation | +3.84e-03 |
Pos logit contributions | |
isk | +0.093 |
hunt | +0.091 |
guys | +0.088 |
ty | +0.087 |
bank | +0.087 |
Neg logit contributions | |
� | -0.081 |
Having | -0.080 |
Jimmy | -0.078 |
Doing | -0.077 |
ite | -0.076 |
Token | mom |
Token ID | 1995 |
Feature activation | +2.12e-02 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
hunt | +0.004 |
ty | +0.004 |
fl | +0.004 |
Neg logit contributions | |
ite | -0.005 |
Having | -0.005 |
ver | -0.005 |
ending | -0.005 |
ifying | -0.005 |
Token | replied |
Token ID | 8712 |
Feature activation | +4.41e-03 |
Pos logit contributions | |
pots | +0.026 |
guys | +0.026 |
ger | +0.025 |
hunt | +0.024 |
fl | +0.023 |
Neg logit contributions | |
� | -0.028 |
ver | -0.028 |
ending | -0.028 |
Having | -0.027 |
ite | -0.027 |
Token | . |
Token ID | 13 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
rob | +0.005 |
hunt | +0.005 |
fl | +0.005 |
pots | +0.004 |
guys | +0.004 |
Neg logit contributions | |
ver | -0.006 |
� | -0.006 |
Through | -0.006 |
erv | -0.006 |
earing | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
pots | +0.027 |
ie | +0.027 |
rust | +0.025 |
ty | +0.025 |
fl | +0.025 |
Neg logit contributions | |
ite | -0.017 |
Having | -0.017 |
ending | -0.017 |
ver | -0.016 |
ifying | -0.016 |
Token | to |
Token ID | 284 |
Feature activation | -9.74e-04 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
rust | +0.006 |
fl | +0.006 |
ty | +0.006 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.009 |
ending | -0.009 |
ver | -0.009 |
ifying | -0.009 |
Token | split |
Token ID | 6626 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
� | +0.001 |
Having | +0.001 |
ending | +0.001 |
ite | +0.001 |
ver | +0.001 |
Neg logit contributions | |
fl | -0.001 |
pots | -0.001 |
rob | -0.001 |
ie | -0.001 |
co | -0.001 |
Token | this |
Token ID | 428 |
Feature activation | +3.76e-03 |
Pos logit contributions | |
isk | +0.014 |
rust | +0.014 |
pots | +0.013 |
hunt | +0.013 |
please | +0.013 |
Neg logit contributions | |
ite | -0.013 |
� | -0.013 |
ifying | -0.013 |
Having | -0.012 |
igsaw | -0.012 |
Token | nut |
Token ID | 6701 |
Feature activation | +6.02e-03 |
Pos logit contributions | |
ie | +0.004 |
co | +0.004 |
isk | +0.004 |
pots | +0.004 |
please | +0.004 |
Neg logit contributions | |
ite | -0.005 |
� | -0.005 |
ifying | -0.005 |
ending | -0.004 |
ver | -0.004 |
Token | open |
Token ID | 1280 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
rust | +0.006 |
fl | +0.005 |
isk | +0.005 |
Neg logit contributions | |
ite | -0.009 |
ver | -0.009 |
ending | -0.009 |
� | -0.009 |
Having | -0.009 |
Token | ," |
Token ID | 553 |
Feature activation | +6.61e-02 |
Pos logit contributions | |
pots | +0.012 |
ie | +0.012 |
rust | +0.012 |
guys | +0.011 |
fl | +0.011 |
Neg logit contributions | |
ite | -0.020 |
ifying | -0.019 |
Having | -0.019 |
ver | -0.019 |
ending | -0.019 |
Token | said |
Token ID | 531 |
Feature activation | +3.45e-02 |
Pos logit contributions | |
co | +0.105 |
isk | +0.102 |
pots | +0.102 |
guys | +0.098 |
ger | +0.098 |
Neg logit contributions | |
� | -0.073 |
Doing | -0.069 |
It | -0.068 |
Having | -0.066 |
Having | -0.064 |
Token | Ros |
Token ID | 10018 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
co | +0.037 |
pots | +0.037 |
hunt | +0.035 |
cast | +0.034 |
isk | +0.034 |
Neg logit contributions | |
ver | -0.049 |
� | -0.048 |
It | -0.048 |
Through | -0.047 |
ite | -0.047 |
Token | ie |
Token ID | 494 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
pots | +0.006 |
hunt | +0.005 |
guys | +0.005 |
rust | +0.005 |
ger | +0.004 |
Neg logit contributions | |
ending | -0.022 |
ver | -0.022 |
ite | -0.022 |
Having | -0.022 |
enny | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
pots | +0.004 |
guys | +0.004 |
rob | +0.004 |
hunt | +0.004 |
ger | +0.004 |
Neg logit contributions | |
� | -0.006 |
ver | -0.006 |
ending | -0.006 |
ite | -0.006 |
Having | -0.006 |
Token | " |
Token ID | 366 |
Feature activation | +8.57e-03 |
Pos logit contributions | |
pots | +0.039 |
ie | +0.039 |
guys | +0.037 |
ty | +0.036 |
rust | +0.036 |
Neg logit contributions | |
ite | -0.019 |
Having | -0.019 |
ver | -0.018 |
ending | -0.018 |
Doing | -0.018 |
Token | 's |
Token ID | 338 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
rust | +0.006 |
guys | +0.006 |
ty | +0.006 |
Neg logit contributions | |
ite | -0.004 |
ending | -0.004 |
Having | -0.004 |
ver | -0.004 |
� | -0.004 |
Token | so |
Token ID | 523 |
Feature activation | +5.07e-03 |
Pos logit contributions | |
ie | +0.029 |
pots | +0.029 |
fl | +0.028 |
co | +0.027 |
glob | +0.027 |
Neg logit contributions | |
� | -0.028 |
Having | -0.028 |
Doing | -0.027 |
glad | -0.027 |
ifying | -0.027 |
Token | big |
Token ID | 1263 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
rust | +0.005 |
fl | +0.005 |
ty | +0.005 |
Neg logit contributions | |
ite | -0.008 |
Having | -0.008 |
ending | -0.008 |
ver | -0.007 |
ifying | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
pots | +0.021 |
ie | +0.020 |
rust | +0.019 |
fl | +0.019 |
isk | +0.019 |
Neg logit contributions | |
ite | -0.020 |
ending | -0.019 |
Having | -0.019 |
ver | -0.019 |
Doing | -0.019 |
Token | peaceful |
Token ID | 12309 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
ite | +0.017 |
Having | +0.016 |
� | +0.016 |
ending | +0.016 |
ifying | +0.016 |
Neg logit contributions | |
ie | -0.014 |
pots | -0.014 |
fl | -0.013 |
ty | -0.013 |
co | -0.012 |
Token | ," |
Token ID | 553 |
Feature activation | +6.60e-02 |
Pos logit contributions | |
isk | +0.020 |
pots | +0.020 |
ie | +0.019 |
rust | +0.019 |
S | +0.018 |
Neg logit contributions | |
ite | -0.027 |
� | -0.025 |
ending | -0.025 |
ver | -0.025 |
Doing | -0.024 |
Token | said |
Token ID | 531 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
pots | +0.087 |
co | +0.087 |
isk | +0.086 |
cast | +0.081 |
urg | +0.078 |
Neg logit contributions | |
� | -0.085 |
Having | -0.080 |
Doing | -0.080 |
ite | -0.078 |
Having | -0.076 |
Token | Benny |
Token ID | 44275 |
Feature activation | +7.51e-04 |
Pos logit contributions | |
co | +0.051 |
pots | +0.051 |
cast | +0.048 |
isk | +0.047 |
hunt | +0.046 |
Neg logit contributions | |
� | -0.055 |
It | -0.054 |
ver | -0.054 |
ite | -0.052 |
Through | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
pots | +0.001 |
guys | +0.001 |
ie | +0.001 |
rust | +0.001 |
fl | +0.001 |
Neg logit contributions | |
ver | -0.001 |
ite | -0.001 |
ending | -0.001 |
Having | -0.001 |
� | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
pots | +0.042 |
ie | +0.042 |
rust | +0.039 |
ty | +0.039 |
guys | +0.039 |
Neg logit contributions | |
ite | -0.021 |
Having | -0.021 |
ending | -0.020 |
ver | -0.020 |
Doing | -0.020 |
Token |
|
Token ID | 198 |
Feature activation | +5.16e-03 |
Pos logit contributions | |
pots | +0.034 |
ie | +0.033 |
rust | +0.032 |
guys | +0.032 |
fl | +0.032 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.016 |
ending | -0.016 |
ver | -0.015 |
Doing | -0.015 |
Token | skipping |
Token ID | 31017 |
Feature activation | -3.04e-03 |
Pos logit contributions | |
ite | +0.016 |
Having | +0.016 |
ending | +0.016 |
ifying | +0.016 |
ver | +0.015 |
Neg logit contributions | |
pots | -0.011 |
ie | -0.011 |
rust | -0.010 |
for | -0.010 |
ty | -0.010 |
Token | because |
Token ID | 780 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
ite | +0.005 |
ifying | +0.004 |
Having | +0.004 |
ending | +0.004 |
ver | +0.004 |
Neg logit contributions | |
pots | -0.003 |
ie | -0.003 |
rust | -0.003 |
hunt | -0.003 |
ty | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | -2.45e-03 |
Pos logit contributions | |
erv | +0.022 |
Having | +0.021 |
ending | +0.021 |
ver | +0.021 |
ite | +0.021 |
Neg logit contributions | |
ie | -0.021 |
for | -0.021 |
pots | -0.021 |
all | -0.020 |
them | -0.020 |
Token | 's |
Token ID | 338 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
ite | +0.003 |
Having | +0.003 |
ifying | +0.003 |
ending | +0.003 |
ver | +0.003 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
fl | -0.003 |
rust | -0.003 |
ty | -0.003 |
Token | fun |
Token ID | 1257 |
Feature activation | +1.18e-02 |
Pos logit contributions | |
pots | +0.019 |
ie | +0.019 |
guys | +0.018 |
fl | +0.018 |
rust | +0.017 |
Neg logit contributions | |
Having | -0.023 |
ite | -0.023 |
ending | -0.023 |
� | -0.023 |
ver | -0.023 |
Token | ," |
Token ID | 553 |
Feature activation | +6.57e-02 |
Pos logit contributions | |
pots | +0.012 |
isk | +0.012 |
ie | +0.011 |
rust | +0.011 |
S | +0.011 |
Neg logit contributions | |
ite | -0.017 |
ending | -0.016 |
� | -0.016 |
Having | -0.016 |
ver | -0.016 |
Token | explained |
Token ID | 4893 |
Feature activation | +2.87e-02 |
Pos logit contributions | |
pots | +0.088 |
guys | +0.086 |
hunt | +0.085 |
isk | +0.084 |
glob | +0.081 |
Neg logit contributions | |
� | -0.083 |
Having | -0.082 |
Doing | -0.079 |
Through | -0.077 |
Jimmy | -0.077 |
Token | Sus |
Token ID | 8932 |
Feature activation | -5.35e-03 |
Pos logit contributions | |
hunt | +0.039 |
please | +0.038 |
isk | +0.037 |
pots | +0.036 |
rob | +0.036 |
Neg logit contributions | |
� | -0.034 |
Through | -0.032 |
Jimmy | -0.032 |
It | -0.031 |
Since | -0.031 |
Token | ie |
Token ID | 494 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
ite | +0.013 |
ending | +0.013 |
Having | +0.013 |
ver | +0.013 |
ifying | +0.012 |
Neg logit contributions | |
pots | -0.001 |
rust | -0.000 |
hunt | -0.000 |
guys | -0.000 |
ie | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
ite | +0.013 |
ending | +0.013 |
Having | +0.013 |
ver | +0.013 |
ifying | +0.012 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.005 |
rust | -0.005 |
guys | -0.005 |
fl | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +7.78e-03 |
Pos logit contributions | |
pots | +0.017 |
ie | +0.017 |
rust | +0.016 |
S | +0.016 |
fl | +0.016 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.013 |
ifying | -0.013 |
Having | -0.013 |
ver | -0.012 |
Token | I |
Token ID | 40 |
Feature activation | -8.82e-03 |
Pos logit contributions | |
fl | +0.015 |
rust | +0.015 |
pots | +0.014 |
please | +0.014 |
we | +0.014 |
Neg logit contributions | |
ver | -0.020 |
ending | -0.020 |
ite | -0.019 |
igsaw | -0.019 |
earing | -0.019 |
Token | am |
Token ID | 716 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
ite | +0.010 |
Having | +0.009 |
ending | +0.009 |
ver | +0.009 |
ifying | +0.009 |
Neg logit contributions | |
pots | -0.013 |
ie | -0.013 |
rust | -0.012 |
fl | -0.012 |
ty | -0.012 |
Token | making |
Token ID | 1642 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
fl | +0.001 |
rust | +0.001 |
co | +0.001 |
Neg logit contributions | |
Having | -0.001 |
ending | -0.001 |
ite | -0.001 |
ver | -0.001 |
ifying | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +5.12e-03 |
Pos logit contributions | |
ie | +0.014 |
isk | +0.014 |
co | +0.014 |
pots | +0.014 |
glob | +0.013 |
Neg logit contributions | |
� | -0.014 |
ending | -0.013 |
igsaw | -0.012 |
Doing | -0.012 |
Having | -0.012 |
Token | cake |
Token ID | 12187 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
ie | +0.007 |
we | +0.006 |
fl | +0.006 |
pots | +0.006 |
co | +0.006 |
Neg logit contributions | |
ite | -0.006 |
� | -0.006 |
ifying | -0.006 |
igsaw | -0.006 |
case | -0.006 |
Token | ," |
Token ID | 553 |
Feature activation | +6.55e-02 |
Pos logit contributions | |
isk | +0.027 |
co | +0.024 |
pots | +0.024 |
ger | +0.024 |
bank | +0.023 |
Neg logit contributions | |
ite | -0.030 |
case | -0.029 |
� | -0.028 |
outage | -0.026 |
ver | -0.025 |
Token | said |
Token ID | 531 |
Feature activation | +4.09e-02 |
Pos logit contributions | |
co | +0.113 |
isk | +0.107 |
pots | +0.102 |
cast | +0.101 |
ger | +0.100 |
Neg logit contributions | |
� | -0.068 |
It | -0.062 |
Doing | -0.062 |
From | -0.058 |
Having | -0.058 |
Token | Ros |
Token ID | 10018 |
Feature activation | +1.05e-02 |
Pos logit contributions | |
co | +0.054 |
pots | +0.047 |
cast | +0.047 |
isk | +0.046 |
bank | +0.046 |
Neg logit contributions | |
It | -0.054 |
� | -0.052 |
ver | -0.051 |
Through | -0.051 |
Its | -0.050 |
Token | ie |
Token ID | 494 |
Feature activation | -7.52e-05 |
Pos logit contributions | |
pots | +0.005 |
hunt | +0.005 |
rust | +0.005 |
guys | +0.004 |
fl | +0.004 |
Neg logit contributions | |
ver | -0.020 |
ite | -0.020 |
ending | -0.020 |
enny | -0.020 |
Having | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +2.29e-02 |
Pos logit contributions | |
� | +0.000 |
ver | +0.000 |
ending | +0.000 |
ite | +0.000 |
Having | +0.000 |
Neg logit contributions | |
pots | -0.000 |
guys | -0.000 |
rob | -0.000 |
hunt | -0.000 |
ger | -0.000 |
Token | " |
Token ID | 366 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ie | +0.038 |
pots | +0.037 |
ty | +0.036 |
guys | +0.035 |
rust | +0.035 |
Neg logit contributions | |
Having | -0.020 |
ite | -0.019 |
ver | -0.019 |
Doing | -0.019 |
Through | -0.019 |
Token | 't |
Token ID | 470 |
Feature activation | -3.90e-03 |
Pos logit contributions | |
ite | +0.014 |
Having | +0.014 |
ifying | +0.013 |
ending | +0.013 |
ver | +0.013 |
Neg logit contributions | |
pots | -0.019 |
ie | -0.019 |
rust | -0.018 |
ty | -0.018 |
hunt | -0.018 |
Token | know |
Token ID | 760 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
ite | +0.004 |
ending | +0.003 |
ver | +0.003 |
� | +0.003 |
Having | +0.003 |
Neg logit contributions | |
pots | -0.006 |
fl | -0.006 |
ie | -0.006 |
glob | -0.006 |
rust | -0.006 |
Token | how |
Token ID | 703 |
Feature activation | +1.40e-03 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
rust | +0.009 |
fl | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.020 |
ending | -0.019 |
ver | -0.019 |
Having | -0.019 |
ifying | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | -1.85e-02 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
for | +0.001 |
them | +0.001 |
rust | +0.001 |
Neg logit contributions | |
ver | -0.003 |
Having | -0.003 |
igsaw | -0.003 |
ite | -0.003 |
ifying | -0.003 |
Token | swim |
Token ID | 9422 |
Feature activation | +1.90e-02 |
Pos logit contributions | |
ite | +0.020 |
� | +0.019 |
ver | +0.019 |
ending | +0.018 |
Having | +0.018 |
Neg logit contributions | |
pots | -0.027 |
fl | -0.026 |
isk | -0.025 |
glob | -0.025 |
ie | -0.025 |
Token | ," |
Token ID | 553 |
Feature activation | +6.55e-02 |
Pos logit contributions | |
pots | +0.024 |
isk | +0.024 |
por | +0.023 |
fl | +0.023 |
please | +0.023 |
Neg logit contributions | |
ite | -0.025 |
� | -0.024 |
ver | -0.023 |
ifying | -0.023 |
wins | -0.021 |
Token | replied |
Token ID | 8712 |
Feature activation | +3.06e-02 |
Pos logit contributions | |
pots | +0.115 |
urg | +0.110 |
cast | +0.108 |
ales | +0.106 |
isk | +0.105 |
Neg logit contributions | |
� | -0.058 |
It | -0.055 |
From | -0.052 |
Having | -0.051 |
ite | -0.050 |
Token | Lily |
Token ID | 20037 |
Feature activation | -5.54e-03 |
Pos logit contributions | |
co | +0.048 |
pots | +0.047 |
cast | +0.046 |
we | +0.045 |
isk | +0.045 |
Neg logit contributions | |
It | -0.030 |
� | -0.028 |
Its | -0.027 |
Mes | -0.026 |
Fasc | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | +1.74e-02 |
Pos logit contributions | |
ver | +0.008 |
� | +0.008 |
ending | +0.007 |
ite | +0.007 |
Having | +0.007 |
Neg logit contributions | |
pots | -0.006 |
rob | -0.006 |
guys | -0.006 |
ger | -0.006 |
hunt | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +1.79e-02 |
Pos logit contributions | |
ie | +0.030 |
pots | +0.030 |
guys | +0.029 |
ty | +0.028 |
rust | +0.028 |
Neg logit contributions | |
ite | -0.014 |
Having | -0.014 |
ver | -0.013 |
ending | -0.013 |
Doing | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | +8.80e-03 |
Pos logit contributions | |
pots | +0.032 |
ie | +0.031 |
guys | +0.030 |
rust | +0.030 |
fl | +0.030 |
Neg logit contributions | |
ite | -0.014 |
Having | -0.013 |
ending | -0.013 |
ver | -0.013 |
Doing | -0.012 |
Token | yourself |
Token ID | 3511 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
Jimmy | +0.004 |
� | +0.004 |
ite | +0.004 |
ifying | +0.004 |
Having | +0.003 |
Neg logit contributions | |
please | -0.006 |
rust | -0.006 |
pots | -0.006 |
isk | -0.006 |
hunt | -0.006 |
Token | before |
Token ID | 878 |
Feature activation | +2.02e-02 |
Pos logit contributions | |
ite | +0.032 |
ver | +0.030 |
� | +0.030 |
ending | +0.030 |
Having | +0.030 |
Neg logit contributions | |
pots | -0.021 |
fl | -0.020 |
rust | -0.020 |
ie | -0.020 |
guys | -0.019 |
Token | you |
Token ID | 345 |
Feature activation | +6.66e-03 |
Pos logit contributions | |
ie | +0.026 |
co | +0.025 |
fl | +0.025 |
pots | +0.025 |
isk | +0.025 |
Neg logit contributions | |
ite | -0.024 |
� | -0.023 |
Having | -0.023 |
ending | -0.023 |
ifying | -0.022 |
Token | go |
Token ID | 467 |
Feature activation | +2.49e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
fl | +0.007 |
rust | +0.007 |
ty | +0.006 |
Neg logit contributions | |
ite | -0.010 |
ifying | -0.009 |
� | -0.009 |
ver | -0.009 |
ending | -0.009 |
Token | home |
Token ID | 1363 |
Feature activation | +9.93e-03 |
Pos logit contributions | |
pots | +0.026 |
rust | +0.025 |
ie | +0.025 |
fl | +0.024 |
guys | +0.024 |
Neg logit contributions | |
ite | -0.037 |
ifying | -0.034 |
ending | -0.034 |
Having | -0.034 |
Doing | -0.033 |
Token | ," |
Token ID | 553 |
Feature activation | +6.53e-02 |
Pos logit contributions | |
pots | +0.011 |
rust | +0.010 |
fl | +0.010 |
guys | +0.010 |
isk | +0.010 |
Neg logit contributions | |
ite | -0.014 |
ver | -0.013 |
� | -0.013 |
case | -0.013 |
Doing | -0.013 |
Token | his |
Token ID | 465 |
Feature activation | +2.99e-02 |
Pos logit contributions | |
co | +0.116 |
isk | +0.108 |
pots | +0.097 |
ty | +0.096 |
glob | +0.096 |
Neg logit contributions | |
It | -0.062 |
From | -0.059 |
� | -0.058 |
Doing | -0.057 |
Having | -0.057 |
Token | mother |
Token ID | 2802 |
Feature activation | +6.39e-03 |
Pos logit contributions | |
rob | +0.053 |
hunt | +0.052 |
pots | +0.052 |
ty | +0.051 |
ils | +0.050 |
Neg logit contributions | |
ite | -0.018 |
glad | -0.017 |
erv | -0.015 |
endant | -0.015 |
young | -0.015 |
Token | said |
Token ID | 531 |
Feature activation | -5.65e-03 |
Pos logit contributions | |
pots | +0.008 |
guys | +0.008 |
fl | +0.008 |
ger | +0.008 |
hunt | +0.008 |
Neg logit contributions | |
ver | -0.008 |
� | -0.008 |
ending | -0.008 |
ite | -0.008 |
old | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
ver | +0.009 |
ending | +0.009 |
ite | +0.009 |
Having | +0.009 |
ifying | +0.009 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
fl | -0.005 |
guys | -0.004 |
hunt | -0.004 |
Token | " |
Token ID | 366 |
Feature activation | +4.78e-03 |
Pos logit contributions | |
ie | +0.021 |
pots | +0.021 |
co | +0.020 |
ty | +0.020 |
guys | +0.019 |
Neg logit contributions | |
Having | -0.023 |
ite | -0.023 |
Through | -0.023 |
Doing | -0.022 |
Having | -0.022 |
Token |
|
Token ID | 198 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
pots | +0.024 |
ie | +0.024 |
fl | +0.023 |
rust | +0.022 |
S | +0.022 |
Neg logit contributions | |
ite | -0.023 |
ending | -0.022 |
ifying | -0.021 |
ver | -0.021 |
Having | -0.021 |
Token |
|
Token ID | 198 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
ie | +0.031 |
pots | +0.030 |
them | +0.030 |
rust | +0.028 |
S | +0.028 |
Neg logit contributions | |
ite | -0.029 |
ifying | -0.029 |
ending | -0.027 |
ver | -0.026 |
osity | -0.026 |
Token | " |
Token ID | 1 |
Feature activation | +2.97e-02 |
Pos logit contributions | |
ie | +0.013 |
pots | +0.012 |
them | +0.012 |
co | +0.012 |
rust | +0.012 |
Neg logit contributions | |
ite | -0.016 |
ver | -0.016 |
ifying | -0.015 |
osity | -0.015 |
ending | -0.015 |
Token | Me |
Token ID | 5308 |
Feature activation | -2.66e-03 |
Pos logit contributions | |
pots | +0.039 |
ie | +0.039 |
rust | +0.036 |
guys | +0.036 |
hunt | +0.036 |
Neg logit contributions | |
ite | -0.036 |
Having | -0.036 |
ending | -0.035 |
ifying | -0.035 |
ver | -0.034 |
Token | ow |
Token ID | 322 |
Feature activation | +9.19e-03 |
Pos logit contributions | |
ite | +0.004 |
ver | +0.003 |
ending | +0.003 |
ifying | +0.003 |
Having | +0.003 |
Neg logit contributions | |
pots | -0.004 |
ie | -0.003 |
hunt | -0.003 |
rust | -0.003 |
guys | -0.003 |
Token | ," |
Token ID | 553 |
Feature activation | +6.52e-02 |
Pos logit contributions | |
pots | +0.010 |
hunt | +0.009 |
please | +0.009 |
fl | +0.009 |
rust | +0.009 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.013 |
ver | -0.013 |
ifying | -0.013 |
� | -0.013 |
Token | m |
Token ID | 285 |
Feature activation | +1.73e-02 |
Pos logit contributions | |
pots | +0.084 |
isk | +0.084 |
hunt | +0.084 |
guys | +0.081 |
glob | +0.081 |
Neg logit contributions | |
� | -0.083 |
Having | -0.080 |
Doing | -0.078 |
Jimmy | -0.077 |
Through | -0.077 |
Token | ew |
Token ID | 413 |
Feature activation | +1.78e-02 |
Pos logit contributions | |
ie | +0.024 |
pots | +0.023 |
rust | +0.023 |
ty | +0.022 |
co | +0.022 |
Neg logit contributions | |
Having | -0.019 |
ite | -0.019 |
ifying | -0.019 |
ending | -0.018 |
ver | -0.018 |
Token | ed |
Token ID | 276 |
Feature activation | +3.14e-02 |
Pos logit contributions | |
pots | +0.019 |
hunt | +0.018 |
guys | +0.017 |
rust | +0.016 |
glob | +0.016 |
Neg logit contributions | |
ending | -0.026 |
ite | -0.026 |
Having | -0.026 |
ver | -0.026 |
Jimmy | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
hunt | +0.042 |
pots | +0.042 |
isk | +0.041 |
rob | +0.040 |
guys | +0.039 |
Neg logit contributions | |
� | -0.037 |
Jimmy | -0.035 |
Having | -0.035 |
Through | -0.034 |
Since | -0.033 |
Token | cat |
Token ID | 3797 |
Feature activation | +6.37e-03 |
Pos logit contributions | |
ie | +0.020 |
pots | +0.019 |
cast | +0.018 |
ty | +0.018 |
fl | +0.017 |
Neg logit contributions | |
ite | -0.017 |
ifying | -0.017 |
Having | -0.016 |
� | -0.016 |
ending | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | -1.44e-03 |
Pos logit contributions | |
ite | +0.020 |
ifying | +0.019 |
Having | +0.019 |
� | +0.019 |
ver | +0.018 |
Neg logit contributions | |
ie | -0.017 |
pots | -0.016 |
hunt | -0.016 |
please | -0.016 |
ty | -0.015 |
Token | rest |
Token ID | 1334 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
ite | +0.002 |
ending | +0.002 |
Having | +0.002 |
ver | +0.002 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
rust | -0.002 |
fl | -0.002 |
guys | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | +1.76e-03 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.007 |
ending | +0.007 |
ver | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.011 |
ie | -0.011 |
rust | -0.010 |
ty | -0.010 |
fl | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | +6.75e-03 |
Pos logit contributions | |
ie | +0.002 |
pots | +0.002 |
fl | +0.002 |
guys | +0.002 |
rust | +0.002 |
Neg logit contributions | |
ite | -0.002 |
Having | -0.002 |
ifying | -0.002 |
igsaw | -0.002 |
ver | -0.002 |
Token | or |
Token ID | 393 |
Feature activation | +4.72e-03 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.007 |
fl | +0.007 |
hunt | +0.007 |
Neg logit contributions | |
ending | -0.009 |
ver | -0.009 |
ite | -0.009 |
Having | -0.009 |
ifying | -0.009 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
ie | +0.006 |
fl | +0.005 |
pots | +0.005 |
co | +0.005 |
ty | +0.005 |
Neg logit contributions | |
ite | -0.006 |
Having | -0.006 |
ifying | -0.006 |
ver | -0.006 |
� | -0.006 |
Token | ents |
Token ID | 658 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
Flying | +0.056 |
Having | +0.056 |
Fasc | +0.055 |
ver | +0.055 |
Jimmy | +0.054 |
Neg logit contributions | |
ie | -0.113 |
pots | -0.108 |
each | -0.100 |
please | -0.100 |
rust | -0.096 |
Token | onto |
Token ID | 4291 |
Feature activation | +3.68e-03 |
Pos logit contributions | |
ite | +0.028 |
ending | +0.027 |
Having | +0.027 |
ver | +0.027 |
ifying | +0.027 |
Neg logit contributions | |
pots | -0.014 |
ie | -0.014 |
guys | -0.012 |
fl | -0.012 |
rust | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
ie | +0.004 |
fl | +0.004 |
please | +0.004 |
pots | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ifying | -0.005 |
� | -0.005 |
Having | -0.004 |
ver | -0.004 |
ite | -0.004 |
Token | tree |
Token ID | 5509 |
Feature activation | -1.91e-03 |
Pos logit contributions | |
ie | +0.013 |
pots | +0.013 |
rust | +0.012 |
ty | +0.012 |
fl | +0.012 |
Neg logit contributions | |
ite | -0.013 |
ifying | -0.012 |
Having | -0.012 |
� | -0.012 |
case | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -7.69e-03 |
Pos logit contributions | |
ite | +0.003 |
ending | +0.003 |
ver | +0.003 |
ifying | +0.003 |
Having | +0.003 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
guys | -0.002 |
fl | -0.001 |
rust | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
ite | +0.002 |
Having | +0.002 |
ending | +0.002 |
ifying | +0.002 |
Doing | +0.002 |
Neg logit contributions | |
ie | -0.002 |
pots | -0.002 |
ty | -0.002 |
rust | -0.002 |
fl | -0.002 |
Token | look |
Token ID | 804 |
Feature activation | -4.14e-03 |
Pos logit contributions | |
pots | +0.012 |
ie | +0.012 |
hunt | +0.012 |
rust | +0.011 |
guys | +0.011 |
Neg logit contributions | |
ending | -0.024 |
ite | -0.024 |
ver | -0.023 |
ifying | -0.023 |
Having | -0.023 |
Token | at |
Token ID | 379 |
Feature activation | +2.33e-03 |
Pos logit contributions | |
ite | +0.006 |
ending | +0.006 |
Having | +0.006 |
ifying | +0.006 |
ver | +0.006 |
Neg logit contributions | |
pots | -0.004 |
rust | -0.004 |
ie | -0.004 |
fl | -0.004 |
hunt | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | -1.45e-02 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
fl | +0.002 |
ty | +0.002 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.003 |
ending | -0.003 |
ifying | -0.003 |
ver | -0.003 |
Token | or |
Token ID | 393 |
Feature activation | -3.85e-03 |
Pos logit contributions | |
ending | +0.021 |
ite | +0.021 |
Having | +0.021 |
ver | +0.021 |
ifying | +0.020 |
Neg logit contributions | |
pots | -0.015 |
ie | -0.015 |
rust | -0.014 |
fl | -0.014 |
guys | -0.014 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.72e-02 |
Pos logit contributions | |
Having | +0.005 |
ite | +0.004 |
ifying | +0.004 |
ending | +0.004 |
Doing | +0.004 |
Neg logit contributions | |
ie | -0.005 |
pots | -0.005 |
ty | -0.005 |
fl | -0.005 |
co | -0.005 |
Token | ents |
Token ID | 658 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
ver | +0.054 |
Having | +0.053 |
Fasc | +0.050 |
Doing | +0.050 |
Jimmy | +0.049 |
Neg logit contributions | |
ie | -0.116 |
pots | -0.108 |
please | -0.101 |
each | -0.100 |
rust | -0.099 |
Token | on |
Token ID | 319 |
Feature activation | +7.64e-03 |
Pos logit contributions | |
pots | +0.001 |
ie | +0.001 |
guys | +0.001 |
fl | +0.001 |
rust | +0.001 |
Neg logit contributions | |
ite | -0.002 |
ending | -0.002 |
ver | -0.002 |
Having | -0.002 |
ifying | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
ie | +0.008 |
pots | +0.008 |
fl | +0.007 |
ty | +0.007 |
rust | +0.007 |
Neg logit contributions | |
Having | -0.011 |
ite | -0.011 |
ifying | -0.011 |
ending | -0.011 |
ver | -0.011 |
Token | tree |
Token ID | 5509 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
ie | +0.010 |
isk | +0.010 |
urg | +0.010 |
S | +0.009 |
please | +0.009 |
Neg logit contributions | |
case | -0.009 |
� | -0.008 |
ifying | -0.008 |
ite | -0.008 |
Having | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +2.76e-03 |
Pos logit contributions | |
pots | +0.013 |
ie | +0.012 |
guys | +0.012 |
fl | +0.011 |
ty | +0.011 |
Neg logit contributions | |
ite | -0.028 |
ending | -0.027 |
Having | -0.027 |
ifying | -0.027 |
ver | -0.027 |
Token | take |
Token ID | 1011 |
Feature activation | +1.69e-04 |
Pos logit contributions | |
ite | +0.006 |
ending | +0.006 |
ifying | +0.006 |
Having | +0.006 |
ver | +0.006 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
hunt | -0.003 |
guys | -0.003 |
rust | -0.003 |
Token | one |
Token ID | 530 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ie | +0.000 |
pots | +0.000 |
rust | +0.000 |
isk | +0.000 |
fl | +0.000 |
Neg logit contributions | |
ite | -0.000 |
Having | -0.000 |
� | -0.000 |
ver | -0.000 |
ending | -0.000 |
Token | of |
Token ID | 286 |
Feature activation | -6.81e-03 |
Pos logit contributions | |
pots | +0.017 |
ie | +0.016 |
rust | +0.016 |
fl | +0.016 |
guys | +0.016 |
Neg logit contributions | |
ite | -0.015 |
ending | -0.014 |
Having | -0.014 |
ifying | -0.014 |
ver | -0.014 |
Token | the |
Token ID | 262 |
Feature activation | +6.83e-03 |
Pos logit contributions | |
ite | +0.011 |
ending | +0.011 |
Having | +0.011 |
ver | +0.010 |
ifying | +0.010 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.006 |
rust | -0.006 |
ty | -0.006 |
fl | -0.006 |
Token | or |
Token ID | 393 |
Feature activation | +1.59e-03 |
Pos logit contributions | |
ie | +0.008 |
ty | +0.008 |
pots | +0.008 |
isk | +0.008 |
fl | +0.008 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.009 |
ending | -0.008 |
ver | -0.008 |
ifying | -0.008 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.56e-02 |
Pos logit contributions | |
ie | +0.002 |
pots | +0.002 |
fl | +0.002 |
ty | +0.002 |
rust | +0.002 |
Neg logit contributions | |
ite | -0.002 |
Having | -0.002 |
ver | -0.002 |
ifying | -0.002 |
ending | -0.002 |
Token | ents |
Token ID | 658 |
Feature activation | -4.95e-03 |
Pos logit contributions | |
Having | +0.051 |
ver | +0.051 |
Jimmy | +0.050 |
Doing | +0.048 |
Flying | +0.048 |
Neg logit contributions | |
ie | -0.114 |
pots | -0.106 |
please | -0.100 |
rust | -0.098 |
bat | -0.097 |
Token | outside |
Token ID | 2354 |
Feature activation | +3.70e-03 |
Pos logit contributions | |
ite | +0.007 |
ver | +0.007 |
ending | +0.007 |
Having | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
fl | -0.005 |
guys | -0.005 |
rust | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.003 |
fl | +0.003 |
rust | +0.003 |
ty | +0.003 |
Neg logit contributions | |
ite | -0.006 |
Having | -0.005 |
ifying | -0.005 |
ver | -0.005 |
ending | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +2.08e-02 |
Pos logit contributions | |
ie | +0.017 |
fl | +0.017 |
pots | +0.016 |
isk | +0.015 |
ty | +0.015 |
Neg logit contributions | |
Having | -0.015 |
Jimmy | -0.014 |
ver | -0.014 |
ending | -0.014 |
� | -0.014 |
Token | walk |
Token ID | 2513 |
Feature activation | +4.47e-03 |
Pos logit contributions | |
pots | +0.024 |
ie | +0.024 |
rust | +0.022 |
ty | +0.022 |
fl | +0.022 |
Neg logit contributions | |
ite | -0.029 |
Having | -0.028 |
ending | -0.028 |
ver | -0.028 |
ifying | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | +3.85e-03 |
Pos logit contributions | |
ite | +0.017 |
ifying | +0.016 |
Having | +0.016 |
� | +0.015 |
ver | +0.015 |
Neg logit contributions | |
ie | -0.015 |
pots | -0.015 |
hunt | -0.014 |
ty | -0.014 |
please | -0.014 |
Token | rest |
Token ID | 1334 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
rust | +0.005 |
fl | +0.005 |
b | +0.005 |
Neg logit contributions | |
ending | -0.005 |
ite | -0.005 |
ver | -0.005 |
ifying | -0.005 |
Having | -0.005 |
Token | of |
Token ID | 286 |
Feature activation | -4.33e-03 |
Pos logit contributions | |
Having | +0.012 |
ending | +0.011 |
Fasc | +0.011 |
Jimmy | +0.011 |
Doing | +0.011 |
Neg logit contributions | |
ie | -0.019 |
pots | -0.018 |
for | -0.018 |
ty | -0.017 |
fl | -0.017 |
Token | the |
Token ID | 262 |
Feature activation | +9.75e-03 |
Pos logit contributions | |
ite | +0.007 |
ending | +0.007 |
Having | +0.007 |
ver | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.004 |
ie | -0.004 |
rust | -0.004 |
ty | -0.004 |
fl | -0.004 |
Token | or |
Token ID | 393 |
Feature activation | +6.36e-03 |
Pos logit contributions | |
ie | +0.013 |
pots | +0.013 |
rust | +0.012 |
fl | +0.012 |
b | +0.011 |
Neg logit contributions | |
ver | -0.013 |
ifying | -0.012 |
ending | -0.012 |
ite | -0.012 |
Having | -0.012 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.37e-02 |
Pos logit contributions | |
ie | +0.008 |
fl | +0.008 |
co | +0.008 |
ty | +0.008 |
pots | +0.008 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.007 |
ifying | -0.007 |
ver | -0.007 |
� | -0.007 |
Token | ents |
Token ID | 658 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
Having | +0.054 |
Jimmy | +0.053 |
Fasc | +0.052 |
ver | +0.052 |
Flying | +0.050 |
Neg logit contributions | |
ie | -0.109 |
pots | -0.103 |
each | -0.092 |
for | -0.092 |
rust | -0.091 |
Token | onto |
Token ID | 4291 |
Feature activation | -7.03e-03 |
Pos logit contributions | |
ite | +0.018 |
Having | +0.017 |
ending | +0.017 |
ver | +0.017 |
ifying | +0.017 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
rust | -0.009 |
fl | -0.008 |
ty | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +1.61e-03 |
Pos logit contributions | |
Having | +0.008 |
ifying | +0.008 |
igsaw | +0.007 |
ite | +0.007 |
� | +0.007 |
Neg logit contributions | |
ie | -0.010 |
fl | -0.009 |
guys | -0.009 |
please | -0.009 |
rust | -0.009 |
Token | tree |
Token ID | 5509 |
Feature activation | +1.79e-03 |
Pos logit contributions | |
ie | +0.002 |
pots | +0.002 |
fl | +0.002 |
rust | +0.002 |
guys | +0.002 |
Neg logit contributions | |
ite | -0.002 |
Having | -0.002 |
ifying | -0.002 |
ending | -0.002 |
ver | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +7.94e-03 |
Pos logit contributions | |
guys | +0.002 |
pots | +0.002 |
ie | +0.002 |
fl | +0.002 |
please | +0.002 |
Neg logit contributions | |
ite | -0.003 |
case | -0.003 |
ver | -0.003 |
� | -0.002 |
ending | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -3.76e-03 |
Pos logit contributions | |
ite | +0.017 |
Having | +0.017 |
ending | +0.017 |
Doing | +0.016 |
� | +0.016 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.016 |
guys | -0.016 |
rust | -0.015 |
fl | -0.015 |
Token | help |
Token ID | 1037 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
ite | +0.004 |
Having | +0.004 |
� | +0.004 |
ending | +0.004 |
ver | +0.004 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
fl | -0.005 |
rust | -0.005 |
ty | -0.005 |
Token | sort |
Token ID | 3297 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
rob | +0.002 |
fl | +0.002 |
cast | +0.002 |
pots | +0.002 |
glob | +0.002 |
Neg logit contributions | |
� | -0.002 |
Having | -0.002 |
Doing | -0.002 |
ver | -0.002 |
Through | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | -6.98e-03 |
Pos logit contributions | |
ite | +0.035 |
� | +0.033 |
Having | +0.033 |
ifying | +0.033 |
igsaw | +0.033 |
Neg logit contributions | |
hunt | -0.021 |
please | -0.020 |
isk | -0.020 |
ie | -0.020 |
pots | -0.020 |
Token | or |
Token ID | 393 |
Feature activation | -6.46e-03 |
Pos logit contributions | |
ite | +0.010 |
ending | +0.010 |
Having | +0.010 |
ver | +0.010 |
ifying | +0.010 |
Neg logit contributions | |
pots | -0.008 |
ie | -0.007 |
rust | -0.007 |
fl | -0.007 |
guys | -0.007 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.28e-02 |
Pos logit contributions | |
Having | +0.008 |
ite | +0.008 |
ver | +0.008 |
ending | +0.008 |
ifying | +0.008 |
Neg logit contributions | |
ie | -0.008 |
fl | -0.007 |
pots | -0.007 |
ty | -0.007 |
co | -0.007 |
Token | ents |
Token ID | 658 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
ver | +0.045 |
Having | +0.045 |
ending | +0.044 |
Doing | +0.043 |
Jimmy | +0.043 |
Neg logit contributions | |
ie | -0.111 |
pots | -0.106 |
please | -0.099 |
each | -0.098 |
rust | -0.098 |
Token | . |
Token ID | 13 |
Feature activation | -5.04e-03 |
Pos logit contributions | |
ite | +0.017 |
ver | +0.017 |
ending | +0.016 |
Having | +0.016 |
ifying | +0.016 |
Neg logit contributions | |
pots | -0.010 |
ie | -0.010 |
guys | -0.009 |
fl | -0.009 |
please | -0.009 |
Token | She |
Token ID | 1375 |
Feature activation | -7.61e-05 |
Pos logit contributions | |
ending | +0.007 |
ite | +0.007 |
ifying | +0.006 |
ver | +0.006 |
outage | +0.006 |
Neg logit contributions | |
pots | -0.006 |
S | -0.006 |
ie | -0.006 |
for | -0.006 |
fl | -0.006 |
Token | picked |
Token ID | 6497 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ite | +0.000 |
Having | +0.000 |
ending | +0.000 |
ver | +0.000 |
Doing | +0.000 |
Neg logit contributions | |
pots | -0.000 |
ie | -0.000 |
fl | -0.000 |
rust | -0.000 |
guys | -0.000 |
Token | up |
Token ID | 510 |
Feature activation | -1.67e-02 |
Pos logit contributions | |
Having | +0.018 |
ver | +0.018 |
� | +0.018 |
ite | +0.017 |
It | +0.017 |
Neg logit contributions | |
hunt | -0.014 |
ie | -0.013 |
isk | -0.013 |
pots | -0.013 |
rust | -0.013 |
Token | had |
Token ID | 550 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
guys | +0.004 |
ty | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ite | -0.005 |
igsaw | -0.005 |
ending | -0.005 |
Having | -0.005 |
Doing | -0.005 |
Token | not |
Token ID | 407 |
Feature activation | +1.89e-02 |
Pos logit contributions | |
ie | +0.017 |
pots | +0.017 |
fl | +0.016 |
rust | +0.016 |
ty | +0.016 |
Neg logit contributions | |
Having | -0.013 |
ver | -0.013 |
ite | -0.013 |
ending | -0.013 |
Doing | -0.012 |
Token | touched |
Token ID | 12615 |
Feature activation | +4.81e-04 |
Pos logit contributions | |
pots | +0.022 |
ie | +0.022 |
rust | +0.021 |
hunt | +0.020 |
guys | +0.020 |
Neg logit contributions | |
ite | -0.026 |
Having | -0.025 |
ending | -0.025 |
ver | -0.025 |
ifying | -0.025 |
Token | the |
Token ID | 262 |
Feature activation | +8.42e-03 |
Pos logit contributions | |
ie | +0.000 |
pots | +0.000 |
rust | +0.000 |
ty | +0.000 |
hunt | +0.000 |
Neg logit contributions | |
ite | -0.001 |
ifying | -0.001 |
Having | -0.001 |
ver | -0.001 |
ending | -0.001 |
Token | or |
Token ID | 393 |
Feature activation | +9.55e-03 |
Pos logit contributions | |
ie | +0.011 |
ty | +0.010 |
pots | +0.010 |
hunt | +0.010 |
isk | +0.010 |
Neg logit contributions | |
ite | -0.011 |
Having | -0.010 |
ifying | -0.010 |
case | -0.010 |
ending | -0.010 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.23e-02 |
Pos logit contributions | |
ie | +0.011 |
pots | +0.011 |
fl | +0.010 |
ty | +0.010 |
rust | +0.010 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ifying | -0.012 |
ver | -0.012 |
ending | -0.012 |
Token | ents |
Token ID | 658 |
Feature activation | -1.75e-02 |
Pos logit contributions | |
Having | +0.047 |
Jimmy | +0.047 |
ver | +0.045 |
Fasc | +0.045 |
Through | +0.044 |
Neg logit contributions | |
ie | -0.110 |
pots | -0.104 |
please | -0.098 |
rust | -0.096 |
each | -0.095 |
Token | . |
Token ID | 13 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
ite | +0.029 |
ending | +0.028 |
Having | +0.028 |
ver | +0.028 |
ifying | +0.028 |
Neg logit contributions | |
pots | -0.016 |
ie | -0.015 |
fl | -0.014 |
rust | -0.014 |
guys | -0.014 |
Token | They |
Token ID | 1119 |
Feature activation | +9.49e-04 |
Pos logit contributions | |
ending | +0.033 |
ite | +0.032 |
ver | +0.029 |
ended | +0.028 |
igsaw | +0.028 |
Neg logit contributions | |
pots | -0.014 |
S | -0.014 |
each | -0.013 |
them | -0.013 |
ones | -0.012 |
Token | hoped |
Token ID | 10719 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
fl | +0.001 |
ty | +0.001 |
rust | +0.001 |
Neg logit contributions | |
ite | -0.001 |
Having | -0.001 |
ver | -0.001 |
ifying | -0.001 |
ending | -0.001 |
Token | Mom |
Token ID | 11254 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ite | +0.016 |
Having | +0.015 |
ending | +0.015 |
ver | +0.015 |
ifying | +0.015 |
Neg logit contributions | |
pots | -0.013 |
ie | -0.013 |
fl | -0.012 |
rust | -0.012 |
ty | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +4.39e-03 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
ty | +0.004 |
for | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.007 |
ending | -0.007 |
ifying | -0.007 |
ver | -0.007 |
Token | me |
Token ID | 502 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
fl | +0.006 |
pots | +0.006 |
rob | +0.006 |
rust | +0.005 |
bank | +0.005 |
Neg logit contributions | |
Having | -0.005 |
Jimmy | -0.005 |
� | -0.005 |
Sharing | -0.005 |
presses | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -1.54e-02 |
Pos logit contributions | |
ite | +0.023 |
Having | +0.023 |
ending | +0.023 |
ver | +0.022 |
ifying | +0.022 |
Neg logit contributions | |
pots | -0.012 |
ie | -0.012 |
rust | -0.011 |
fl | -0.011 |
ty | -0.011 |
Token | The |
Token ID | 383 |
Feature activation | -6.48e-04 |
Pos logit contributions | |
ending | +0.022 |
ver | +0.021 |
ite | +0.020 |
ival | +0.020 |
osity | +0.020 |
Neg logit contributions | |
S | -0.021 |
Mitt | -0.017 |
Wh | -0.016 |
Chick | -0.015 |
pots | -0.015 |
Token | or |
Token ID | 393 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
ite | +0.001 |
Having | +0.001 |
ifying | +0.001 |
ending | +0.001 |
ver | +0.001 |
Neg logit contributions | |
ie | -0.001 |
pots | -0.001 |
ty | -0.001 |
rust | -0.001 |
fl | -0.001 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.15e-02 |
Pos logit contributions | |
ie | +0.002 |
pots | +0.002 |
ty | +0.002 |
fl | +0.002 |
rust | +0.002 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.002 |
ifying | -0.002 |
ending | -0.002 |
ver | -0.002 |
Token | ents |
Token ID | 658 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
Fasc | +0.051 |
Having | +0.050 |
ver | +0.049 |
Jimmy | +0.048 |
Through | +0.047 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.098 |
please | -0.093 |
each | -0.092 |
co | -0.090 |
Token | were |
Token ID | 547 |
Feature activation | +8.31e-03 |
Pos logit contributions | |
ite | +0.035 |
Having | +0.034 |
ending | +0.034 |
ifying | +0.033 |
ver | +0.033 |
Neg logit contributions | |
ie | -0.027 |
pots | -0.027 |
rust | -0.025 |
ty | -0.025 |
fl | -0.025 |
Token | very |
Token ID | 845 |
Feature activation | +1.84e-03 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
rust | +0.009 |
fl | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.012 |
Having | -0.011 |
ending | -0.011 |
ver | -0.011 |
ifying | -0.011 |
Token | important |
Token ID | 1593 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
ty | +0.002 |
guys | +0.002 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.003 |
ending | -0.002 |
ver | -0.002 |
ifying | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
ite | +0.024 |
ending | +0.023 |
Having | +0.023 |
ver | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
pots | -0.012 |
ie | -0.011 |
rust | -0.010 |
fl | -0.010 |
ty | -0.010 |
Token | at |
Token ID | 379 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
hunt | +0.003 |
please | +0.003 |
pots | +0.003 |
fl | +0.003 |
ty | +0.003 |
Neg logit contributions | |
ite | -0.005 |
ver | -0.005 |
ending | -0.004 |
ifying | -0.004 |
Through | -0.004 |
Token | all |
Token ID | 477 |
Feature activation | -2.20e-02 |
Pos logit contributions | |
ite | +0.025 |
Having | +0.024 |
ifying | +0.024 |
ver | +0.024 |
ending | +0.024 |
Neg logit contributions | |
pots | -0.016 |
ie | -0.016 |
rust | -0.015 |
guys | -0.015 |
fl | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | -9.63e-04 |
Pos logit contributions | |
ver | +0.042 |
ending | +0.042 |
ifying | +0.040 |
ite | +0.040 |
erv | +0.039 |
Neg logit contributions | |
ie | -0.019 |
pots | -0.017 |
for | -0.016 |
them | -0.015 |
fl | -0.015 |
Token | different |
Token ID | 1180 |
Feature activation | -7.60e-03 |
Pos logit contributions | |
ite | +0.002 |
Having | +0.001 |
ending | +0.001 |
ver | +0.001 |
ifying | +0.001 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rust | -0.001 |
fl | -0.001 |
ty | -0.001 |
Token | or |
Token ID | 393 |
Feature activation | -7.42e-03 |
Pos logit contributions | |
ite | +0.012 |
Having | +0.012 |
ending | +0.012 |
ifying | +0.012 |
ver | +0.012 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
ty | -0.006 |
rust | -0.006 |
hunt | -0.006 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.09e-02 |
Pos logit contributions | |
Having | +0.008 |
ifying | +0.008 |
ite | +0.008 |
Doing | +0.008 |
ver | +0.008 |
Neg logit contributions | |
ie | -0.010 |
ty | -0.010 |
pots | -0.009 |
co | -0.009 |
guys | -0.009 |
Token | ents |
Token ID | 658 |
Feature activation | -1.19e-02 |
Pos logit contributions | |
Having | +0.046 |
ver | +0.046 |
Fasc | +0.044 |
Jimmy | +0.044 |
Doing | +0.044 |
Neg logit contributions | |
ie | -0.106 |
pots | -0.100 |
please | -0.093 |
each | -0.093 |
rust | -0.093 |
Token | and |
Token ID | 290 |
Feature activation | -7.92e-03 |
Pos logit contributions | |
ite | +0.019 |
ending | +0.018 |
ver | +0.018 |
Having | +0.018 |
ifying | +0.018 |
Neg logit contributions | |
pots | -0.011 |
ie | -0.010 |
guys | -0.010 |
fl | -0.010 |
rust | -0.010 |
Token | adm |
Token ID | 6178 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
Having | +0.010 |
ite | +0.010 |
ifying | +0.010 |
ver | +0.010 |
Doing | +0.009 |
Neg logit contributions | |
ie | -0.010 |
ty | -0.009 |
guys | -0.009 |
pots | -0.009 |
co | -0.009 |
Token | iring |
Token ID | 3428 |
Feature activation | -6.32e-03 |
Pos logit contributions | |
ite | +0.005 |
Having | +0.005 |
ending | +0.005 |
ver | +0.005 |
ifying | +0.005 |
Neg logit contributions | |
ie | -0.005 |
pots | -0.005 |
rust | -0.005 |
fl | -0.005 |
ty | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | +1.60e-02 |
Pos logit contributions | |
ite | +0.009 |
Having | +0.009 |
ifying | +0.009 |
ver | +0.009 |
ending | +0.009 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
hunt | -0.006 |
ty | -0.006 |
guys | -0.006 |
Token | She |
Token ID | 1375 |
Feature activation | -9.69e-03 |
Pos logit contributions | |
pots | +0.008 |
S | +0.008 |
for | +0.007 |
them | +0.007 |
him | +0.007 |
Neg logit contributions | |
ending | -0.013 |
ite | -0.013 |
ifying | -0.012 |
ver | -0.012 |
Having | -0.011 |
Token | learned |
Token ID | 4499 |
Feature activation | -1.73e-02 |
Pos logit contributions | |
ite | +0.014 |
ending | +0.014 |
Having | +0.014 |
ver | +0.014 |
ifying | +0.014 |
Neg logit contributions | |
pots | -0.010 |
ie | -0.010 |
rust | -0.009 |
fl | -0.009 |
ty | -0.009 |
Token | that |
Token ID | 326 |
Feature activation | -4.62e-04 |
Pos logit contributions | |
ite | +0.033 |
ifying | +0.032 |
ending | +0.031 |
ver | +0.031 |
Having | +0.031 |
Neg logit contributions | |
pots | -0.013 |
ie | -0.012 |
rust | -0.011 |
for | -0.011 |
ty | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +4.29e-03 |
Pos logit contributions | |
ite | +0.001 |
ifying | +0.001 |
ending | +0.001 |
ver | +0.001 |
Having | +0.001 |
Neg logit contributions | |
pots | -0.000 |
ie | -0.000 |
rust | -0.000 |
fl | -0.000 |
guys | -0.000 |
Token | or |
Token ID | 393 |
Feature activation | +2.79e-03 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
rust | +0.005 |
fl | +0.004 |
guys | +0.004 |
Neg logit contributions | |
ite | -0.006 |
ending | -0.006 |
Having | -0.006 |
ifying | -0.006 |
ver | -0.006 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
rust | +0.003 |
for | +0.003 |
guys | +0.003 |
Neg logit contributions | |
ite | -0.004 |
ending | -0.004 |
ifying | -0.004 |
Having | -0.004 |
ver | -0.004 |
Token | ents |
Token ID | 658 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
Jimmy | +0.052 |
Fasc | +0.051 |
Having | +0.049 |
ver | +0.049 |
Jeremy | +0.047 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.099 |
each | -0.090 |
for | -0.088 |
rust | -0.088 |
Token | were |
Token ID | 547 |
Feature activation | +4.97e-03 |
Pos logit contributions | |
ite | +0.037 |
Having | +0.036 |
ending | +0.036 |
ver | +0.035 |
ifying | +0.035 |
Neg logit contributions | |
pots | -0.027 |
ie | -0.027 |
rust | -0.025 |
fl | -0.025 |
ty | -0.025 |
Token | not |
Token ID | 407 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
pots | +0.005 |
ie | +0.005 |
rust | +0.005 |
for | +0.005 |
ty | +0.005 |
Neg logit contributions | |
ite | -0.008 |
ending | -0.007 |
ifying | -0.007 |
Having | -0.007 |
ver | -0.007 |
Token | for |
Token ID | 329 |
Feature activation | +2.68e-02 |
Pos logit contributions | |
pots | +0.011 |
ie | +0.010 |
rust | +0.010 |
guys | +0.010 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.016 |
ending | -0.015 |
Having | -0.015 |
ifying | -0.015 |
ver | -0.015 |
Token | playing |
Token ID | 2712 |
Feature activation | +9.11e-03 |
Pos logit contributions | |
ie | +0.034 |
pots | +0.033 |
ty | +0.032 |
fl | +0.032 |
hunt | +0.031 |
Neg logit contributions | |
Having | -0.033 |
ending | -0.033 |
ite | -0.032 |
ver | -0.031 |
Doing | -0.030 |
Token | lo |
Token ID | 2376 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ite | +0.008 |
Having | +0.008 |
ver | +0.008 |
� | +0.008 |
ifying | +0.008 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
fl | -0.008 |
guys | -0.008 |
co | -0.008 |
Token | vel |
Token ID | 626 |
Feature activation | +1.77e-03 |
Pos logit contributions | |
Having | +0.013 |
ite | +0.013 |
ending | +0.012 |
outage | +0.012 |
Doing | +0.012 |
Neg logit contributions | |
for | -0.016 |
pots | -0.015 |
ie | -0.015 |
ty | -0.015 |
guys | -0.014 |
Token | ier |
Token ID | 959 |
Feature activation | -3.99e-03 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
hunt | +0.002 |
fl | +0.002 |
Neg logit contributions | |
ite | -0.002 |
ver | -0.002 |
ending | -0.002 |
ifying | -0.002 |
Having | -0.002 |
Token | than |
Token ID | 621 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
ite | +0.006 |
ending | +0.006 |
Having | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.004 |
ie | -0.004 |
rust | -0.004 |
ty | -0.004 |
fl | -0.003 |
Token | my |
Token ID | 616 |
Feature activation | -3.95e-02 |
Pos logit contributions | |
ite | +0.020 |
ending | +0.019 |
Having | +0.019 |
ver | +0.018 |
Doing | +0.018 |
Neg logit contributions | |
pots | -0.014 |
ie | -0.014 |
for | -0.013 |
guys | -0.013 |
rust | -0.013 |
Token | old |
Token ID | 1468 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
ending | +0.048 |
ite | +0.048 |
Having | +0.047 |
ver | +0.046 |
ifying | +0.046 |
Neg logit contributions | |
pots | -0.053 |
ie | -0.051 |
hunt | -0.049 |
rust | -0.049 |
guys | -0.049 |
Token | net |
Token ID | 2010 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
ite | +0.078 |
ending | +0.076 |
Having | +0.076 |
ver | +0.074 |
ifying | +0.074 |
Neg logit contributions | |
pots | -0.076 |
ie | -0.075 |
rust | -0.070 |
fl | -0.069 |
ty | -0.069 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.29e-03 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
fl | +0.002 |
co | +0.002 |
Neg logit contributions | |
ite | -0.003 |
ver | -0.003 |
ending | -0.003 |
� | -0.003 |
ifying | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ie | +0.003 |
pots | +0.003 |
fl | +0.003 |
rust | +0.003 |
S | +0.003 |
Neg logit contributions | |
ite | -0.003 |
ifying | -0.003 |
ending | -0.003 |
ver | -0.003 |
Having | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -2.47e-02 |
Pos logit contributions | |
ite | +0.007 |
ifying | +0.007 |
ending | +0.007 |
ver | +0.006 |
Having | +0.006 |
Neg logit contributions | |
ie | -0.007 |
ty | -0.007 |
pots | -0.007 |
them | -0.007 |
rust | -0.007 |
Token | M |
Token ID | 44 |
Feature activation | +1.20e-03 |
Pos logit contributions | |
ite | +0.041 |
ifying | +0.040 |
ver | +0.038 |
endant | +0.038 |
outage | +0.037 |
Neg logit contributions | |
ie | -0.023 |
ty | -0.023 |
them | -0.021 |
please | -0.021 |
rust | -0.020 |
Token | a |
Token ID | 257 |
Feature activation | +4.06e-03 |
Pos logit contributions | |
ver | +0.009 |
Through | +0.008 |
Having | +0.007 |
Jimmy | +0.007 |
� | +0.007 |
Neg logit contributions | |
ie | -0.010 |
please | -0.009 |
hunt | -0.009 |
ger | -0.009 |
bank | -0.009 |
Token | letter |
Token ID | 3850 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
ie | +0.006 |
pots | +0.006 |
fl | +0.005 |
ty | +0.005 |
rust | +0.005 |
Neg logit contributions | |
ite | -0.005 |
Having | -0.005 |
ending | -0.004 |
ifying | -0.004 |
ver | -0.004 |
Token | about |
Token ID | 546 |
Feature activation | -3.17e-04 |
Pos logit contributions | |
pots | +0.017 |
ie | +0.016 |
ger | +0.016 |
guys | +0.015 |
isk | +0.015 |
Neg logit contributions | |
ite | -0.024 |
ver | -0.023 |
ending | -0.023 |
ifying | -0.022 |
� | -0.022 |
Token | the |
Token ID | 262 |
Feature activation | +9.77e-03 |
Pos logit contributions | |
Having | +0.000 |
ite | +0.000 |
ifying | +0.000 |
ending | +0.000 |
Doing | +0.000 |
Neg logit contributions | |
ie | -0.000 |
pots | -0.000 |
ty | -0.000 |
guys | -0.000 |
co | -0.000 |
Token | or |
Token ID | 393 |
Feature activation | -7.51e-04 |
Pos logit contributions | |
ie | +0.013 |
pots | +0.012 |
ty | +0.012 |
bank | +0.012 |
isk | +0.012 |
Neg logit contributions | |
ite | -0.012 |
Having | -0.011 |
case | -0.011 |
� | -0.011 |
ifying | -0.010 |
Token | nam |
Token ID | 7402 |
Feature activation | -6.02e-02 |
Pos logit contributions | |
Having | +0.001 |
ver | +0.001 |
ifying | +0.001 |
Doing | +0.001 |
Jimmy | +0.001 |
Neg logit contributions | |
ie | -0.001 |
co | -0.001 |
pots | -0.001 |
ty | -0.001 |
fl | -0.001 |
Token | ents |
Token ID | 658 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
Having | +0.049 |
ver | +0.048 |
Fasc | +0.047 |
Jimmy | +0.047 |
Through | +0.046 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.097 |
please | -0.090 |
rust | -0.088 |
ty | -0.087 |
Token | and |
Token ID | 290 |
Feature activation | -7.44e-03 |
Pos logit contributions | |
ite | +0.024 |
Having | +0.023 |
ending | +0.023 |
ver | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
pots | -0.012 |
ie | -0.012 |
rust | -0.011 |
fl | -0.011 |
ty | -0.011 |
Token | asked |
Token ID | 1965 |
Feature activation | +4.74e-03 |
Pos logit contributions | |
Having | +0.010 |
ite | +0.010 |
ver | +0.009 |
ifying | +0.009 |
ending | +0.009 |
Neg logit contributions | |
ie | -0.009 |
pots | -0.008 |
ty | -0.008 |
co | -0.008 |
guys | -0.008 |
Token | for |
Token ID | 329 |
Feature activation | +6.79e-03 |
Pos logit contributions | |
rob | +0.006 |
hunt | +0.006 |
please | +0.006 |
rust | +0.006 |
fl | +0.006 |
Neg logit contributions | |
ver | -0.006 |
� | -0.006 |
Jimmy | -0.005 |
It | -0.005 |
Since | -0.005 |
Token | one |
Token ID | 530 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
fl | +0.009 |
ie | +0.009 |
isk | +0.008 |
bank | +0.008 |
co | +0.008 |
Neg logit contributions | |
Having | -0.008 |
ver | -0.008 |
ifying | -0.008 |
Jimmy | -0.008 |
ending | -0.008 |
Token | clock |
Token ID | 8801 |
Feature activation | +1.27e-02 |
Pos logit contributions | |
ite | +0.031 |
ending | +0.031 |
Having | +0.031 |
ver | +0.030 |
ifying | +0.029 |
Neg logit contributions | |
ie | -0.028 |
pots | -0.028 |
rust | -0.026 |
guys | -0.026 |
fl | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-05 |
Pos logit contributions | |
pots | +0.012 |
ie | +0.011 |
rust | +0.010 |
guys | +0.010 |
fl | +0.010 |
Neg logit contributions | |
ite | -0.021 |
ending | -0.020 |
Having | -0.020 |
ifying | -0.020 |
ver | -0.019 |
Token | It |
Token ID | 632 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
S | +0.000 |
pots | +0.000 |
him | +0.000 |
guys | +0.000 |
rust | +0.000 |
Neg logit contributions | |
ending | -0.000 |
ite | -0.000 |
ver | -0.000 |
ifying | -0.000 |
Having | -0.000 |
Token | was |
Token ID | 373 |
Feature activation | +8.58e-03 |
Pos logit contributions | |
ie | +0.015 |
pots | +0.015 |
rust | +0.014 |
fl | +0.014 |
ty | +0.014 |
Neg logit contributions | |
ite | -0.020 |
ending | -0.020 |
Having | -0.020 |
ifying | -0.020 |
ver | -0.020 |
Token | an |
Token ID | 281 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.007 |
fl | +0.007 |
ty | +0.007 |
Neg logit contributions | |
ite | -0.014 |
Having | -0.013 |
ending | -0.013 |
ver | -0.013 |
ifying | -0.013 |
Token | old |
Token ID | 1468 |
Feature activation | -6.00e-02 |
Pos logit contributions | |
ifying | +0.039 |
ver | +0.038 |
ite | +0.038 |
Having | +0.038 |
ending | +0.036 |
Neg logit contributions | |
ie | -0.025 |
pots | -0.024 |
guys | -0.022 |
for | -0.022 |
o | -0.022 |
Token | clock |
Token ID | 8801 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
ifying | +0.082 |
ver | +0.076 |
Having | +0.076 |
ending | +0.076 |
osity | +0.071 |
Neg logit contributions | |
pots | -0.079 |
sound | -0.078 |
for | -0.078 |
ie | -0.077 |
ones | -0.075 |
Token | and |
Token ID | 290 |
Feature activation | -8.41e-03 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
rust | +0.008 |
fl | +0.008 |
guys | +0.008 |
Neg logit contributions | |
ite | -0.017 |
ending | -0.016 |
Having | -0.016 |
ver | -0.016 |
ifying | -0.016 |
Token | it |
Token ID | 340 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
ending | +0.012 |
ite | +0.012 |
ifying | +0.012 |
Having | +0.012 |
ver | +0.012 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
rust | -0.009 |
fl | -0.008 |
for | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
pots | +0.014 |
ie | +0.014 |
rust | +0.013 |
fl | +0.013 |
ty | +0.012 |
Neg logit contributions | |
ite | -0.020 |
ending | -0.020 |
Having | -0.020 |
ifying | -0.020 |
ver | -0.020 |
Token | very |
Token ID | 845 |
Feature activation | +4.01e-03 |
Pos logit contributions | |
pots | +0.015 |
ie | +0.015 |
rust | +0.014 |
fl | +0.014 |
ty | +0.014 |
Neg logit contributions | |
ite | -0.028 |
Having | -0.027 |
ending | -0.027 |
ver | -0.027 |
ifying | -0.027 |
Token | too |
Token ID | 1165 |
Feature activation | -8.68e-03 |
Pos logit contributions | |
ite | +0.003 |
ifying | +0.003 |
ver | +0.003 |
Having | +0.003 |
ending | +0.002 |
Neg logit contributions | |
pots | -0.002 |
guys | -0.002 |
please | -0.002 |
ie | -0.002 |
rust | -0.002 |
Token | deep |
Token ID | 2769 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
ite | +0.016 |
Having | +0.015 |
ending | +0.015 |
ifying | +0.015 |
ver | +0.015 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
ty | -0.006 |
rust | -0.006 |
hunt | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
pots | +0.016 |
rust | +0.015 |
ie | +0.015 |
guys | +0.015 |
please | +0.014 |
Neg logit contributions | |
ifying | -0.022 |
ite | -0.022 |
� | -0.021 |
ending | -0.021 |
ver | -0.021 |
Token | She |
Token ID | 1375 |
Feature activation | -9.99e-03 |
Pos logit contributions | |
ite | +0.020 |
ifying | +0.020 |
ending | +0.020 |
outage | +0.019 |
Jimmy | +0.019 |
Neg logit contributions | |
pots | -0.020 |
S | -0.020 |
ie | -0.019 |
for | -0.019 |
fl | -0.019 |
Token | slowly |
Token ID | 6364 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
ite | +0.015 |
ending | +0.015 |
Having | +0.015 |
ifying | +0.015 |
ver | +0.014 |
Neg logit contributions | |
ie | -0.011 |
pots | -0.010 |
ty | -0.010 |
rust | -0.010 |
hunt | -0.009 |
Token | filled |
Token ID | 5901 |
Feature activation | -5.96e-02 |
Pos logit contributions | |
ite | +0.019 |
ending | +0.018 |
Having | +0.018 |
ver | +0.018 |
ifying | +0.017 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.017 |
fl | -0.016 |
guys | -0.016 |
rust | -0.016 |
Token | the |
Token ID | 262 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
ite | +0.101 |
Having | +0.100 |
ending | +0.099 |
ver | +0.097 |
ifying | +0.096 |
Neg logit contributions | |
pots | -0.049 |
ie | -0.049 |
rust | -0.044 |
fl | -0.044 |
guys | -0.044 |
Token | hole |
Token ID | 7604 |
Feature activation | -3.19e-02 |
Pos logit contributions | |
ver | +0.025 |
ending | +0.024 |
Whoever | +0.021 |
Jimmy | +0.021 |
osity | +0.021 |
Neg logit contributions | |
pots | -0.009 |
footprints | -0.007 |
sound | -0.007 |
hunt | -0.007 |
ones | -0.007 |
Token | with |
Token ID | 351 |
Feature activation | -1.76e-02 |
Pos logit contributions | |
ite | +0.050 |
ending | +0.049 |
Having | +0.049 |
ifying | +0.048 |
ver | +0.048 |
Neg logit contributions | |
ie | -0.031 |
pots | -0.031 |
rust | -0.029 |
ty | -0.028 |
fl | -0.027 |
Token | dirt |
Token ID | 13647 |
Feature activation | -2.40e-02 |
Pos logit contributions | |
Having | +0.025 |
ite | +0.024 |
ifying | +0.024 |
� | +0.024 |
ending | +0.023 |
Neg logit contributions | |
ie | -0.019 |
co | -0.018 |
guys | -0.018 |
fl | -0.018 |
ty | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -4.97e-03 |
Pos logit contributions | |
ite | +0.030 |
ending | +0.029 |
Having | +0.029 |
ver | +0.028 |
ifying | +0.028 |
Neg logit contributions | |
pots | -0.030 |
ie | -0.030 |
guys | -0.028 |
fl | -0.028 |
rust | -0.028 |
Token | he |
Token ID | 339 |
Feature activation | +2.04e-02 |
Pos logit contributions | |
Having | +0.001 |
ite | +0.001 |
ending | +0.001 |
ver | +0.001 |
ifying | +0.001 |
Neg logit contributions | |
ie | -0.001 |
pots | -0.001 |
fl | -0.001 |
ty | -0.001 |
guys | -0.001 |
Token | especially |
Token ID | 2592 |
Feature activation | +2.48e-03 |
Pos logit contributions | |
pots | +0.024 |
ie | +0.024 |
rust | +0.022 |
fl | +0.022 |
ty | +0.022 |
Neg logit contributions | |
ite | -0.028 |
Having | -0.027 |
ending | -0.027 |
ver | -0.027 |
ifying | -0.026 |
Token | liked |
Token ID | 8288 |
Feature activation | +8.29e-03 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
rust | +0.003 |
fl | +0.003 |
ty | +0.003 |
Neg logit contributions | |
ite | -0.003 |
ending | -0.003 |
Having | -0.003 |
ifying | -0.003 |
ver | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | -5.86e-03 |
Pos logit contributions | |
ie | +0.010 |
pots | +0.010 |
rust | +0.010 |
isk | +0.010 |
ty | +0.010 |
Neg logit contributions | |
Having | -0.010 |
ending | -0.010 |
ite | -0.010 |
ifying | -0.009 |
Doing | -0.009 |
Token | or |
Token ID | 393 |
Feature activation | +7.40e-03 |
Pos logit contributions | |
ite | +0.008 |
Having | +0.008 |
ending | +0.008 |
ver | +0.008 |
ifying | +0.008 |
Neg logit contributions | |
ie | -0.006 |
pots | -0.006 |
ty | -0.006 |
rust | -0.006 |
fl | -0.006 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.94e-02 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.007 |
fl | +0.007 |
ty | +0.007 |
Neg logit contributions | |
ite | -0.011 |
Having | -0.011 |
ending | -0.011 |
ver | -0.010 |
ifying | -0.010 |
Token | ents |
Token ID | 658 |
Feature activation | -2.16e-03 |
Pos logit contributions | |
Having | +0.045 |
ver | +0.045 |
Jimmy | +0.044 |
Doing | +0.043 |
Flying | +0.042 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.098 |
please | -0.092 |
rust | -0.090 |
each | -0.089 |
Token | he |
Token ID | 339 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
ite | +0.004 |
ver | +0.004 |
ending | +0.004 |
Having | +0.003 |
ifying | +0.003 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
fl | -0.002 |
guys | -0.002 |
rust | -0.002 |
Token | kept |
Token ID | 4030 |
Feature activation | +5.19e-03 |
Pos logit contributions | |
pots | +0.027 |
ie | +0.026 |
fl | +0.026 |
rust | +0.025 |
glob | +0.025 |
Neg logit contributions | |
Having | -0.017 |
� | -0.017 |
ver | -0.017 |
ite | -0.017 |
ending | -0.016 |
Token | around |
Token ID | 1088 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
ie | +0.005 |
pots | +0.005 |
fl | +0.005 |
guys | +0.005 |
rust | +0.005 |
Neg logit contributions | |
Having | -0.007 |
ifying | -0.007 |
ite | -0.007 |
ending | -0.007 |
� | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +4.71e-03 |
Pos logit contributions | |
isk | +0.017 |
rob | +0.017 |
ie | +0.017 |
pots | +0.017 |
fl | +0.017 |
Neg logit contributions | |
� | -0.022 |
ifying | -0.021 |
Having | -0.021 |
ago | -0.021 |
Doing | -0.020 |
Token | she |
Token ID | 673 |
Feature activation | -5.58e-03 |
Pos logit contributions | |
ite | +0.014 |
Having | +0.014 |
ending | +0.014 |
ver | +0.013 |
Doing | +0.013 |
Neg logit contributions | |
pots | -0.013 |
ie | -0.012 |
guys | -0.012 |
ty | -0.012 |
rust | -0.012 |
Token | could |
Token ID | 714 |
Feature activation | -9.45e-03 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.007 |
ending | +0.007 |
ver | +0.007 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
rust | -0.007 |
fl | -0.007 |
guys | -0.007 |
Token | carry |
Token ID | 3283 |
Feature activation | -1.31e-02 |
Pos logit contributions | |
ite | +0.015 |
Having | +0.015 |
ver | +0.015 |
ending | +0.015 |
� | +0.014 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.008 |
fl | -0.008 |
guys | -0.008 |
ty | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +6.27e-03 |
Pos logit contributions | |
� | +0.014 |
ite | +0.013 |
It | +0.013 |
Having | +0.013 |
ver | +0.013 |
Neg logit contributions | |
isk | -0.018 |
urg | -0.017 |
please | -0.017 |
bank | -0.017 |
hunt | -0.017 |
Token | or |
Token ID | 393 |
Feature activation | -2.32e-03 |
Pos logit contributions | |
ie | +0.007 |
pots | +0.007 |
ty | +0.007 |
rust | +0.007 |
fl | +0.007 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.008 |
ending | -0.008 |
ifying | -0.008 |
ver | -0.008 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.93e-02 |
Pos logit contributions | |
ite | +0.003 |
Having | +0.003 |
ifying | +0.003 |
ver | +0.003 |
ending | +0.003 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
fl | -0.002 |
ty | -0.002 |
co | -0.002 |
Token | ents |
Token ID | 658 |
Feature activation | -8.44e-03 |
Pos logit contributions | |
Having | +0.040 |
Jimmy | +0.039 |
ver | +0.039 |
ite | +0.037 |
Doing | +0.037 |
Neg logit contributions | |
ie | -0.110 |
pots | -0.105 |
rust | -0.099 |
fl | -0.097 |
ty | -0.096 |
Token | to |
Token ID | 284 |
Feature activation | -4.76e-03 |
Pos logit contributions | |
ite | +0.013 |
ver | +0.012 |
ending | +0.012 |
Having | +0.012 |
ifying | +0.012 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.008 |
guys | -0.008 |
fl | -0.008 |
rust | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +1.44e-03 |
Pos logit contributions | |
Having | +0.005 |
glad | +0.005 |
've | +0.005 |
ver | +0.005 |
Through | +0.005 |
Neg logit contributions | |
fl | -0.007 |
ie | -0.006 |
rob | -0.006 |
bat | -0.006 |
pots | -0.006 |
Token | place |
Token ID | 1295 |
Feature activation | -1.60e-02 |
Pos logit contributions | |
ie | +0.002 |
pots | +0.002 |
ty | +0.002 |
isk | +0.002 |
fl | +0.002 |
Neg logit contributions | |
ite | -0.002 |
Having | -0.002 |
ifying | -0.002 |
case | -0.002 |
� | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +8.79e-03 |
Pos logit contributions | |
ite | +0.024 |
ver | +0.023 |
Having | +0.022 |
ifying | +0.022 |
� | +0.022 |
Neg logit contributions | |
guys | -0.017 |
pots | -0.017 |
fl | -0.016 |
please | -0.016 |
ie | -0.016 |
Token | They |
Token ID | 1119 |
Feature activation | -1.05e-03 |
Pos logit contributions | |
ending | +0.037 |
ite | +0.036 |
rou | +0.033 |
aser | +0.032 |
osity | +0.032 |
Neg logit contributions | |
pots | -0.022 |
S | -0.021 |
them | -0.021 |
him | -0.020 |
each | -0.020 |
Token | reached |
Token ID | 4251 |
Feature activation | +5.72e-03 |
Pos logit contributions | |
ite | +0.001 |
Having | +0.001 |
ver | +0.001 |
ending | +0.001 |
ifying | +0.001 |
Neg logit contributions | |
ie | -0.001 |
pots | -0.001 |
fl | -0.001 |
rust | -0.001 |
guys | -0.001 |
Token | for |
Token ID | 329 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
ie | +0.005 |
please | +0.004 |
pots | +0.004 |
rust | +0.004 |
fl | +0.004 |
Neg logit contributions | |
ite | -0.010 |
ver | -0.009 |
Having | -0.009 |
ifying | -0.009 |
Through | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +6.38e-03 |
Pos logit contributions | |
ie | +0.006 |
fl | +0.006 |
isk | +0.005 |
please | +0.005 |
ty | +0.005 |
Neg logit contributions | |
Having | -0.005 |
ifying | -0.005 |
Jimmy | -0.004 |
ver | -0.004 |
Whoever | -0.004 |
Token | or |
Token ID | 393 |
Feature activation | -2.88e-03 |
Pos logit contributions | |
ie | +0.008 |
isk | +0.008 |
ty | +0.008 |
fl | +0.008 |
pots | +0.008 |
Neg logit contributions | |
ite | -0.008 |
Having | -0.007 |
ifying | -0.007 |
case | -0.007 |
ver | -0.007 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
ite | +0.004 |
Having | +0.004 |
ifying | +0.004 |
ver | +0.004 |
ending | +0.004 |
Neg logit contributions | |
ie | -0.004 |
pots | -0.004 |
fl | -0.003 |
rust | -0.003 |
ty | -0.003 |
Token | ents |
Token ID | 658 |
Feature activation | -1.58e-02 |
Pos logit contributions | |
Having | +0.045 |
ver | +0.045 |
Jimmy | +0.042 |
Doing | +0.042 |
Fasc | +0.041 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.101 |
rust | -0.091 |
ty | -0.091 |
please | -0.090 |
Token | and |
Token ID | 290 |
Feature activation | -2.15e-03 |
Pos logit contributions | |
ite | +0.023 |
ver | +0.022 |
ending | +0.022 |
Having | +0.022 |
ifying | +0.022 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.016 |
fl | -0.015 |
guys | -0.015 |
rust | -0.015 |
Token | tried |
Token ID | 3088 |
Feature activation | -3.96e-03 |
Pos logit contributions | |
ite | +0.003 |
Having | +0.003 |
ver | +0.003 |
ifying | +0.003 |
ending | +0.003 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.002 |
fl | -0.002 |
guys | -0.002 |
rust | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
Having | +0.005 |
ending | +0.005 |
ver | +0.005 |
ite | +0.005 |
ifying | +0.004 |
Neg logit contributions | |
ie | -0.005 |
pots | -0.005 |
guys | -0.005 |
ty | -0.005 |
fl | -0.005 |
Token | take |
Token ID | 1011 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
� | +0.003 |
Having | +0.003 |
ver | +0.002 |
Using | +0.002 |
ite | +0.002 |
Neg logit contributions | |
fl | -0.004 |
rob | -0.004 |
ie | -0.004 |
pots | -0.004 |
cast | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -2.99e-03 |
Pos logit contributions | |
rust | +0.010 |
god | +0.010 |
pots | +0.010 |
fl | +0.009 |
isk | +0.009 |
Neg logit contributions | |
ite | -0.010 |
� | -0.010 |
case | -0.010 |
Sharing | -0.009 |
football | -0.009 |
Token | He |
Token ID | 679 |
Feature activation | -7.65e-04 |
Pos logit contributions | |
ending | +0.004 |
ifying | +0.004 |
ite | +0.004 |
ver | +0.004 |
Having | +0.004 |
Neg logit contributions | |
pots | -0.004 |
S | -0.004 |
him | -0.004 |
guys | -0.004 |
hunt | -0.004 |
Token | had |
Token ID | 550 |
Feature activation | -1.34e-02 |
Pos logit contributions | |
ite | +0.001 |
ending | +0.001 |
ifying | +0.001 |
Having | +0.001 |
igsaw | +0.001 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
ty | -0.001 |
hunt | -0.001 |
guys | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | -3.90e-02 |
Pos logit contributions | |
ite | +0.024 |
ending | +0.024 |
ver | +0.023 |
igsaw | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
pots | -0.012 |
them | -0.010 |
each | -0.010 |
ones | -0.010 |
guys | -0.010 |
Token | big |
Token ID | 1263 |
Feature activation | -4.05e-02 |
Pos logit contributions | |
ending | +0.075 |
ver | +0.071 |
ite | +0.070 |
ifying | +0.069 |
Doing | +0.069 |
Neg logit contributions | |
pots | -0.032 |
guys | -0.027 |
b | -0.027 |
hunt | -0.027 |
ones | -0.026 |
Token | red |
Token ID | 2266 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
ending | +0.054 |
ver | +0.052 |
ifying | +0.052 |
Having | +0.052 |
ite | +0.052 |
Neg logit contributions | |
pots | -0.051 |
ie | -0.049 |
guys | -0.048 |
hunt | -0.047 |
for | -0.046 |
Token | ball |
Token ID | 2613 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
ending | +0.079 |
ver | +0.078 |
Having | +0.074 |
Doing | +0.072 |
osity | +0.070 |
Neg logit contributions | |
pots | -0.078 |
guys | -0.075 |
ie | -0.075 |
for | -0.073 |
ones | -0.073 |
Token | and |
Token ID | 290 |
Feature activation | -1.55e-02 |
Pos logit contributions | |
Having | +0.002 |
ite | +0.002 |
ending | +0.002 |
ver | +0.002 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rust | -0.001 |
ty | -0.001 |
hunt | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | -2.45e-02 |
Pos logit contributions | |
ending | +0.025 |
ite | +0.025 |
ifying | +0.025 |
igsaw | +0.024 |
ver | +0.024 |
Neg logit contributions | |
pots | -0.016 |
ie | -0.015 |
for | -0.014 |
guys | -0.014 |
b | -0.014 |
Token | bat |
Token ID | 7365 |
Feature activation | +3.24e-03 |
Pos logit contributions | |
ending | +0.047 |
ver | +0.044 |
Doing | +0.043 |
ite | +0.043 |
earing | +0.042 |
Neg logit contributions | |
pots | -0.021 |
b | -0.020 |
w | -0.019 |
ones | -0.019 |
rust | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | +2.46e-03 |
Pos logit contributions | |
pots | +0.004 |
fl | +0.004 |
rust | +0.003 |
ie | +0.003 |
god | +0.003 |
Neg logit contributions | |
ite | -0.005 |
ver | -0.004 |
Having | -0.004 |
case | -0.004 |
ending | -0.004 |
Token | time |
Token ID | 640 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ie | +0.003 |
pots | +0.003 |
rust | +0.003 |
fl | +0.003 |
guys | +0.003 |
Neg logit contributions | |
ite | -0.005 |
ending | -0.005 |
ver | -0.004 |
Having | -0.004 |
ifying | -0.004 |
Token | playing |
Token ID | 2712 |
Feature activation | +1.63e-03 |
Pos logit contributions | |
pots | +0.012 |
ie | +0.012 |
rust | +0.011 |
fl | +0.011 |
ty | +0.011 |
Neg logit contributions | |
ite | -0.020 |
Having | -0.020 |
ending | -0.020 |
ver | -0.019 |
ifying | -0.019 |
Token | with |
Token ID | 351 |
Feature activation | -6.62e-03 |
Pos logit contributions | |
pots | +0.002 |
please | +0.002 |
ie | +0.002 |
rust | +0.002 |
isk | +0.002 |
Neg logit contributions | |
ite | -0.002 |
� | -0.002 |
Having | -0.002 |
Jimmy | -0.002 |
igsaw | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | -1.52e-03 |
Pos logit contributions | |
Having | +0.011 |
ite | +0.011 |
Jimmy | +0.011 |
ifying | +0.011 |
� | +0.011 |
Neg logit contributions | |
guys | -0.005 |
pots | -0.005 |
ie | -0.005 |
hunt | -0.005 |
fl | -0.005 |
Token | or |
Token ID | 393 |
Feature activation | +4.26e-03 |
Pos logit contributions | |
ending | +0.002 |
ite | +0.002 |
Having | +0.002 |
ver | +0.002 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
fl | -0.002 |
rust | -0.002 |
ty | -0.002 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
co | +0.005 |
ie | +0.005 |
pots | +0.005 |
ty | +0.004 |
guys | +0.004 |
Neg logit contributions | |
Having | -0.006 |
ite | -0.005 |
ifying | -0.005 |
� | -0.005 |
Doing | -0.005 |
Token | ents |
Token ID | 658 |
Feature activation | -4.21e-03 |
Pos logit contributions | |
ver | +0.045 |
Having | +0.045 |
Doing | +0.043 |
Fasc | +0.043 |
Jimmy | +0.043 |
Neg logit contributions | |
ie | -0.103 |
pots | -0.095 |
please | -0.091 |
each | -0.088 |
ty | -0.087 |
Token | and |
Token ID | 290 |
Feature activation | +1.77e-03 |
Pos logit contributions | |
ite | +0.007 |
ver | +0.007 |
ending | +0.007 |
Having | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.004 |
ie | -0.003 |
guys | -0.003 |
rust | -0.003 |
fl | -0.003 |
Token | making |
Token ID | 1642 |
Feature activation | +3.61e-03 |
Pos logit contributions | |
ie | +0.002 |
guys | +0.002 |
pots | +0.002 |
isk | +0.002 |
co | +0.002 |
Neg logit contributions | |
Having | -0.002 |
� | -0.002 |
ite | -0.002 |
Using | -0.002 |
ver | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | -1.93e-03 |
Pos logit contributions | |
hunt | +0.004 |
pots | +0.004 |
ie | +0.004 |
fl | +0.004 |
rob | +0.004 |
Neg logit contributions | |
Having | -0.005 |
� | -0.005 |
ending | -0.005 |
Jimmy | -0.005 |
igsaw | -0.005 |
Token | special |
Token ID | 2041 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
ite | +0.003 |
ending | +0.003 |
Having | +0.003 |
ver | +0.003 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
rust | -0.002 |
fl | -0.002 |
ty | -0.002 |
Token | more |
Token ID | 517 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
ty | +0.007 |
rust | +0.007 |
for | +0.007 |
Neg logit contributions | |
ite | -0.006 |
ending | -0.006 |
Having | -0.006 |
ifying | -0.006 |
ver | -0.006 |
Token | careful |
Token ID | 8161 |
Feature activation | +4.43e-03 |
Pos logit contributions | |
ite | +0.013 |
ifying | +0.013 |
Having | +0.012 |
igsaw | +0.012 |
ver | +0.012 |
Neg logit contributions | |
pots | -0.015 |
for | -0.015 |
ie | -0.015 |
please | -0.014 |
ty | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -2.30e-02 |
Pos logit contributions | |
ie | +0.004 |
pots | +0.004 |
ty | +0.004 |
for | +0.004 |
fl | +0.003 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.007 |
ifying | -0.007 |
ending | -0.007 |
ver | -0.007 |
Token | The |
Token ID | 383 |
Feature activation | +7.33e-03 |
Pos logit contributions | |
ver | +0.031 |
ending | +0.030 |
ival | +0.030 |
ite | +0.030 |
Having | +0.029 |
Neg logit contributions | |
S | -0.031 |
Mitt | -0.027 |
Chick | -0.024 |
Wh | -0.024 |
Ros | -0.024 |
Token | or |
Token ID | 393 |
Feature activation | +2.43e-03 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.007 |
fl | +0.007 |
guys | +0.007 |
Neg logit contributions | |
ite | -0.011 |
ending | -0.010 |
Having | -0.010 |
ver | -0.010 |
ifying | -0.010 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.88e-02 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
fl | +0.003 |
ty | +0.003 |
rust | +0.003 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.003 |
ending | -0.003 |
ifying | -0.003 |
ver | -0.003 |
Token | ents |
Token ID | 658 |
Feature activation | -1.83e-02 |
Pos logit contributions | |
Fasc | +0.050 |
Having | +0.050 |
ver | +0.048 |
Jimmy | +0.047 |
Through | +0.046 |
Neg logit contributions | |
ie | -0.100 |
pots | -0.094 |
each | -0.087 |
please | -0.086 |
rust | -0.085 |
Token | are |
Token ID | 389 |
Feature activation | +5.29e-03 |
Pos logit contributions | |
ite | +0.026 |
Having | +0.025 |
ending | +0.025 |
ver | +0.025 |
ifying | +0.025 |
Neg logit contributions | |
pots | -0.020 |
ie | -0.020 |
rust | -0.018 |
fl | -0.018 |
ty | -0.018 |
Token | not |
Token ID | 407 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
rust | +0.006 |
ty | +0.006 |
fl | +0.006 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.007 |
ending | -0.007 |
ver | -0.007 |
ifying | -0.007 |
Token | toys |
Token ID | 14958 |
Feature activation | -2.17e-02 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
fl | +0.009 |
rust | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.013 |
ending | -0.012 |
Having | -0.012 |
ver | -0.012 |
ifying | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -8.67e-03 |
Pos logit contributions | |
ite | +0.035 |
ending | +0.034 |
Having | +0.034 |
ver | +0.034 |
ifying | +0.034 |
Neg logit contributions | |
pots | -0.020 |
ie | -0.020 |
rust | -0.018 |
fl | -0.018 |
ty | -0.017 |
Token | never |
Token ID | 1239 |
Feature activation | +5.54e-03 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
rust | +0.003 |
fl | +0.003 |
guys | +0.003 |
Neg logit contributions | |
ite | -0.004 |
Having | -0.004 |
ending | -0.003 |
ver | -0.003 |
ifying | -0.003 |
Token | played |
Token ID | 2826 |
Feature activation | +5.89e-04 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.006 |
ty | +0.006 |
fl | +0.006 |
rust | +0.006 |
Neg logit contributions | |
ite | -0.007 |
ending | -0.007 |
Having | -0.007 |
ver | -0.007 |
ifying | -0.007 |
Token | with |
Token ID | 351 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
fl | +0.001 |
rust | +0.001 |
hunt | +0.001 |
Neg logit contributions | |
ite | -0.001 |
Having | -0.001 |
ver | -0.001 |
ending | -0.001 |
ifying | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +7.10e-04 |
Pos logit contributions | |
Having | +0.018 |
ite | +0.018 |
ifying | +0.018 |
ver | +0.018 |
ending | +0.018 |
Neg logit contributions | |
ie | -0.014 |
fl | -0.013 |
rust | -0.013 |
pots | -0.013 |
hunt | -0.013 |
Token | or |
Token ID | 393 |
Feature activation | +9.26e-03 |
Pos logit contributions | |
ie | +0.001 |
pots | +0.001 |
ty | +0.001 |
rust | +0.001 |
fl | +0.001 |
Neg logit contributions | |
ite | -0.001 |
Having | -0.001 |
ending | -0.001 |
ifying | -0.001 |
ver | -0.001 |
Token | nam |
Token ID | 7402 |
Feature activation | -5.86e-02 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
fl | +0.009 |
rust | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ending | -0.013 |
ifying | -0.013 |
ver | -0.013 |
Token | ents |
Token ID | 658 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
ver | +0.044 |
Having | +0.044 |
Jimmy | +0.042 |
Fasc | +0.042 |
Through | +0.042 |
Neg logit contributions | |
ie | -0.104 |
pots | -0.098 |
please | -0.093 |
ty | -0.090 |
rust | -0.089 |
Token | again |
Token ID | 757 |
Feature activation | +2.31e-03 |
Pos logit contributions | |
ite | +0.030 |
ending | +0.029 |
ver | +0.029 |
Having | +0.029 |
ifying | +0.029 |
Neg logit contributions | |
pots | -0.023 |
ie | -0.022 |
fl | -0.021 |
rust | -0.021 |
guys | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | +4.11e-03 |
Pos logit contributions | |
pots | +0.003 |
guys | +0.002 |
rust | +0.002 |
ie | +0.002 |
rob | +0.002 |
Neg logit contributions | |
� | -0.003 |
Having | -0.003 |
ite | -0.003 |
ifying | -0.003 |
Doing | -0.003 |
Token | They |
Token ID | 1119 |
Feature activation | +6.52e-03 |
Pos logit contributions | |
S | +0.005 |
them | +0.004 |
isk | +0.004 |
him | +0.004 |
Mitt | +0.004 |
Neg logit contributions | |
ending | -0.007 |
ite | -0.007 |
ver | -0.006 |
ifying | -0.006 |
osity | -0.006 |
Token | still |
Token ID | 991 |
Feature activation | +4.86e-03 |
Pos logit contributions | |
pots | +0.010 |
fl | +0.010 |
ie | +0.010 |
rust | +0.009 |
guys | +0.009 |
Neg logit contributions | |
ite | -0.006 |
ver | -0.006 |
Having | -0.006 |
� | -0.006 |
ifying | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +9.43e-03 |
Pos logit contributions | |
fl | +0.014 |
ie | +0.014 |
rust | +0.014 |
please | +0.013 |
pots | +0.013 |
Neg logit contributions | |
ite | -0.018 |
ago | -0.017 |
� | -0.017 |
case | -0.017 |
ifying | -0.017 |
Token | but |
Token ID | 475 |
Feature activation | -1.28e-03 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
rust | +0.010 |
ty | +0.010 |
guys | +0.009 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.014 |
Having | -0.013 |
ver | -0.013 |
ifying | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | -4.50e-03 |
Pos logit contributions | |
ite | +0.001 |
ending | +0.001 |
Having | +0.001 |
ifying | +0.001 |
ver | +0.001 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
rust | -0.002 |
guys | -0.002 |
ty | -0.002 |
Token | hurt |
Token ID | 5938 |
Feature activation | +1.61e-02 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.007 |
ending | +0.007 |
igsaw | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
ie | -0.005 |
pots | -0.005 |
ty | -0.005 |
rust | -0.005 |
b | -0.004 |
Token | me |
Token ID | 502 |
Feature activation | -7.75e-03 |
Pos logit contributions | |
hunt | +0.021 |
rob | +0.021 |
cast | +0.021 |
pots | +0.021 |
please | +0.021 |
Neg logit contributions | |
� | -0.020 |
ite | -0.019 |
ifying | -0.018 |
It | -0.017 |
Jimmy | -0.016 |
Token | ," |
Token ID | 553 |
Feature activation | +4.59e-02 |
Pos logit contributions | |
ite | +0.012 |
ver | +0.011 |
� | +0.011 |
ending | +0.011 |
ifying | +0.011 |
Neg logit contributions | |
pots | -0.008 |
fl | -0.008 |
guys | -0.008 |
rust | -0.007 |
rob | -0.007 |
Token | Sam |
Token ID | 3409 |
Feature activation | +1.08e-02 |
Pos logit contributions | |
pots | +0.070 |
guys | +0.070 |
co | +0.069 |
ie | +0.069 |
isk | +0.069 |
Neg logit contributions | |
ite | -0.043 |
Having | -0.043 |
� | -0.041 |
Doing | -0.040 |
Through | -0.039 |
Token | said |
Token ID | 531 |
Feature activation | +2.72e-03 |
Pos logit contributions | |
rob | +0.016 |
fl | +0.016 |
pots | +0.016 |
cast | +0.015 |
guys | +0.015 |
Neg logit contributions | |
� | -0.013 |
ver | -0.012 |
earing | -0.011 |
Despite | -0.011 |
erv | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -4.37e-03 |
Pos logit contributions | |
rob | +0.003 |
fl | +0.003 |
pots | +0.003 |
isk | +0.003 |
hunt | +0.003 |
Neg logit contributions | |
ver | -0.004 |
� | -0.003 |
ending | -0.003 |
erv | -0.003 |
Through | -0.003 |
Token | sniff |
Token ID | 26300 |
Feature activation | +6.12e-04 |
Pos logit contributions | |
ite | +0.006 |
Having | +0.006 |
ending | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
rust | -0.005 |
fl | -0.005 |
ty | -0.005 |
Token | ling |
Token ID | 1359 |
Feature activation | -1.14e-03 |
Pos logit contributions | |
hunt | +0.001 |
pots | +0.001 |
isk | +0.001 |
bank | +0.001 |
please | +0.001 |
Neg logit contributions | |
ite | -0.001 |
ending | -0.001 |
ver | -0.001 |
ifying | -0.001 |
� | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
pots | +0.004 |
cast | +0.003 |
please | +0.003 |
ts | +0.003 |
bothering | +0.003 |
Neg logit contributions | |
ite | -0.003 |
� | -0.003 |
ending | -0.003 |
ver | -0.003 |
erv | -0.002 |
Token | you |
Token ID | 345 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
pots | +0.015 |
ie | +0.015 |
fl | +0.014 |
rust | +0.014 |
ty | +0.014 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ending | -0.013 |
ver | -0.013 |
ifying | -0.013 |
Token | 're |
Token ID | 821 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
ite | +0.018 |
Having | +0.017 |
ending | +0.017 |
ver | +0.017 |
� | +0.017 |
Neg logit contributions | |
pots | -0.018 |
co | -0.017 |
fl | -0.017 |
ie | -0.017 |
ty | -0.016 |
Token | so |
Token ID | 523 |
Feature activation | +8.97e-03 |
Pos logit contributions | |
pots | +0.023 |
co | +0.022 |
ie | +0.021 |
glob | +0.021 |
fl | +0.021 |
Neg logit contributions | |
Having | -0.020 |
glad | -0.020 |
� | -0.019 |
ending | -0.019 |
ite | -0.019 |
Token | pretty |
Token ID | 2495 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ie | +0.010 |
pots | +0.010 |
rust | +0.010 |
fl | +0.009 |
guys | +0.009 |
Neg logit contributions | |
ite | -0.013 |
ifying | -0.012 |
Having | -0.012 |
ending | -0.012 |
ver | -0.012 |
Token | !" |
Token ID | 2474 |
Feature activation | +4.50e-02 |
Pos logit contributions | |
ite | +0.020 |
ending | +0.019 |
� | +0.018 |
ver | +0.018 |
Having | +0.018 |
Neg logit contributions | |
pots | -0.014 |
isk | -0.013 |
ie | -0.013 |
rust | -0.013 |
hunt | -0.012 |
Token | said |
Token ID | 531 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
pots | +0.058 |
cast | +0.054 |
urg | +0.054 |
co | +0.053 |
isk | +0.053 |
Neg logit contributions | |
� | -0.058 |
Having | -0.056 |
ite | -0.055 |
Doing | -0.054 |
Through | -0.053 |
Token | Lily |
Token ID | 20037 |
Feature activation | -3.58e-03 |
Pos logit contributions | |
pots | +0.044 |
cast | +0.044 |
co | +0.042 |
fl | +0.041 |
we | +0.040 |
Neg logit contributions | |
� | -0.024 |
It | -0.024 |
ver | -0.024 |
Having | -0.022 |
Through | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ite | +0.006 |
ver | +0.006 |
� | +0.006 |
ending | +0.006 |
Having | +0.005 |
Neg logit contributions | |
pots | -0.003 |
guys | -0.003 |
ie | -0.003 |
fl | -0.003 |
ger | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +1.47e-02 |
Pos logit contributions | |
pots | +0.026 |
ie | +0.026 |
rust | +0.024 |
ty | +0.024 |
fl | +0.024 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.015 |
ending | -0.015 |
ver | -0.015 |
ifying | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | -4.03e-03 |
Pos logit contributions | |
pots | +0.024 |
ie | +0.024 |
rust | +0.023 |
fl | +0.023 |
guys | +0.023 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ending | -0.012 |
ver | -0.012 |
ifying | -0.012 |
Token | want |
Token ID | 765 |
Feature activation | -1.21e-03 |
Pos logit contributions | |
ite | +0.027 |
ending | +0.026 |
Having | +0.026 |
ifying | +0.026 |
igsaw | +0.025 |
Neg logit contributions | |
ie | -0.028 |
pots | -0.028 |
ty | -0.026 |
hunt | -0.026 |
rust | -0.026 |
Token | to |
Token ID | 284 |
Feature activation | -8.40e-03 |
Pos logit contributions | |
ite | +0.002 |
ending | +0.002 |
Having | +0.002 |
ifying | +0.001 |
� | +0.001 |
Neg logit contributions | |
ie | -0.001 |
pots | -0.001 |
rust | -0.001 |
fl | -0.001 |
isk | -0.001 |
Token | watch |
Token ID | 2342 |
Feature activation | +8.55e-03 |
Pos logit contributions | |
ite | +0.013 |
Having | +0.012 |
ending | +0.012 |
ver | +0.012 |
ifying | +0.012 |
Neg logit contributions | |
pots | -0.008 |
ie | -0.008 |
fl | -0.008 |
rust | -0.008 |
ty | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | -5.07e-03 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
rust | +0.010 |
fl | +0.010 |
isk | +0.009 |
Neg logit contributions | |
ite | -0.011 |
ifying | -0.011 |
ending | -0.011 |
Having | -0.011 |
� | -0.010 |
Token | sunrise |
Token ID | 40048 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ite | +0.007 |
ifying | +0.006 |
� | +0.006 |
Having | +0.006 |
ending | +0.006 |
Neg logit contributions | |
isk | -0.006 |
ie | -0.006 |
bank | -0.005 |
ty | -0.005 |
pots | -0.005 |
Token | ," |
Token ID | 553 |
Feature activation | +4.31e-02 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
isk | +0.010 |
rust | +0.010 |
guys | +0.009 |
Neg logit contributions | |
ite | -0.015 |
� | -0.015 |
ver | -0.014 |
ending | -0.014 |
case | -0.014 |
Token | Tim |
Token ID | 5045 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
pots | +0.047 |
ie | +0.045 |
guys | +0.043 |
rust | +0.043 |
fl | +0.042 |
Neg logit contributions | |
ite | -0.062 |
Having | -0.061 |
ending | -0.060 |
ver | -0.059 |
Doing | -0.059 |
Token | my |
Token ID | 1820 |
Feature activation | -3.44e-03 |
Pos logit contributions | |
pots | +0.016 |
rust | +0.015 |
guys | +0.015 |
hunt | +0.015 |
fl | +0.015 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.013 |
Having | -0.013 |
ver | -0.013 |
� | -0.013 |
Token | replied |
Token ID | 8712 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
ver | +0.005 |
ending | +0.005 |
Having | +0.005 |
ite | +0.005 |
� | +0.005 |
Neg logit contributions | |
pots | -0.004 |
fl | -0.003 |
ie | -0.003 |
guys | -0.003 |
rust | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +9.83e-04 |
Pos logit contributions | |
ver | +0.020 |
ite | +0.020 |
ending | +0.020 |
Having | +0.020 |
ifying | +0.019 |
Neg logit contributions | |
pots | -0.010 |
ie | -0.010 |
fl | -0.009 |
guys | -0.009 |
rust | -0.009 |
Token | |
Token ID | 220 |
Feature activation | -5.66e-03 |
Pos logit contributions | |
S | +0.001 |
pots | +0.001 |
them | +0.001 |
ie | +0.001 |
bank | +0.001 |
Neg logit contributions | |
ending | -0.001 |
ite | -0.001 |
ifying | -0.001 |
ver | -0.001 |
outage | -0.001 |
Token | That |
Token ID | 2504 |
Feature activation | -3.09e-02 |
Pos logit contributions | |
fl | +0.008 |
pots | +0.008 |
rust | +0.008 |
please | +0.007 |
co | +0.007 |
Neg logit contributions | |
igsaw | -0.007 |
ver | -0.007 |
ending | -0.007 |
osity | -0.007 |
earing | -0.007 |
Token | 's |
Token ID | 338 |
Feature activation | +9.84e-03 |
Pos logit contributions | |
igsaw | +0.044 |
ifying | +0.043 |
Having | +0.043 |
ending | +0.042 |
Jimmy | +0.042 |
Neg logit contributions | |
pots | -0.036 |
fl | -0.036 |
ie | -0.035 |
guys | -0.034 |
rust | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | -2.23e-02 |
Pos logit contributions | |
ie | +0.012 |
pots | +0.012 |
rust | +0.011 |
fl | +0.011 |
ty | +0.011 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ending | -0.013 |
ifying | -0.013 |
ver | -0.013 |
Token | flag |
Token ID | 6056 |
Feature activation | +8.78e-03 |
Pos logit contributions | |
ite | +0.023 |
Having | +0.022 |
ending | +0.022 |
ifying | +0.021 |
ver | +0.021 |
Neg logit contributions | |
ie | -0.034 |
pots | -0.034 |
ty | -0.032 |
fl | -0.032 |
rust | -0.032 |
Token | pole |
Token ID | 36869 |
Feature activation | +7.93e-03 |
Pos logit contributions | |
pots | +0.009 |
isk | +0.008 |
ie | +0.008 |
guys | +0.008 |
rust | +0.008 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.013 |
� | -0.013 |
ver | -0.013 |
ifying | -0.013 |
Token | ," |
Token ID | 553 |
Feature activation | +4.83e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
isk | +0.007 |
rust | +0.007 |
co | +0.006 |
Neg logit contributions | |
ite | -0.013 |
ending | -0.012 |
ver | -0.012 |
ifying | -0.012 |
� | -0.012 |
Token | said |
Token ID | 531 |
Feature activation | +2.30e-02 |
Pos logit contributions | |
pots | +0.059 |
guys | +0.056 |
co | +0.056 |
isk | +0.055 |
hunt | +0.055 |
Neg logit contributions | |
ite | -0.062 |
� | -0.062 |
Having | -0.062 |
Doing | -0.061 |
Jimmy | -0.059 |
Token | his |
Token ID | 465 |
Feature activation | -5.22e-03 |
Pos logit contributions | |
pots | +0.031 |
hunt | +0.031 |
cast | +0.030 |
fl | +0.030 |
co | +0.030 |
Neg logit contributions | |
ver | -0.025 |
ite | -0.025 |
Through | -0.024 |
Having | -0.024 |
Jimmy | -0.024 |
Token | mom |
Token ID | 1995 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.007 |
ending | +0.007 |
ver | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
ty | -0.005 |
rust | -0.005 |
fl | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
pots | +0.012 |
guys | +0.012 |
ger | +0.011 |
hunt | +0.011 |
rob | +0.010 |
Neg logit contributions | |
ver | -0.016 |
� | -0.016 |
ending | -0.016 |
ite | -0.016 |
Doing | -0.015 |
Token | " |
Token ID | 366 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
pots | +0.013 |
S | +0.013 |
ie | +0.013 |
rust | +0.013 |
fl | +0.013 |
Neg logit contributions | |
ite | -0.015 |
ending | -0.014 |
ifying | -0.014 |
Having | -0.014 |
ver | -0.013 |
Token | was |
Token ID | 373 |
Feature activation | +9.17e-03 |
Pos logit contributions | |
pots | +0.009 |
guys | +0.009 |
ger | +0.008 |
pies | +0.008 |
mel | +0.008 |
Neg logit contributions | |
� | -0.006 |
Having | -0.006 |
ver | -0.005 |
Through | -0.005 |
Although | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +5.92e-03 |
Pos logit contributions | |
pots | +0.010 |
guys | +0.010 |
ie | +0.010 |
cast | +0.010 |
ils | +0.009 |
Neg logit contributions | |
� | -0.013 |
Having | -0.013 |
Through | -0.012 |
glad | -0.012 |
ifying | -0.012 |
Token | grown |
Token ID | 7334 |
Feature activation | -3.64e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
rust | +0.007 |
fl | +0.007 |
ty | +0.007 |
Neg logit contributions | |
ite | -0.008 |
Having | -0.008 |
ending | -0.008 |
ver | -0.007 |
ifying | -0.007 |
Token | up |
Token ID | 510 |
Feature activation | +1.24e-02 |
Pos logit contributions | |
ite | +0.061 |
ending | +0.060 |
Having | +0.060 |
ver | +0.059 |
ifying | +0.058 |
Neg logit contributions | |
pots | -0.031 |
ie | -0.030 |
rust | -0.028 |
fl | -0.027 |
guys | -0.027 |
Token | asking |
Token ID | 4737 |
Feature activation | +3.92e-02 |
Pos logit contributions | |
ie | +0.013 |
pots | +0.013 |
rust | +0.012 |
fl | +0.012 |
ty | +0.012 |
Neg logit contributions | |
ite | -0.018 |
ending | -0.018 |
Having | -0.018 |
ver | -0.018 |
ifying | -0.018 |
Token | if |
Token ID | 611 |
Feature activation | +4.47e-02 |
Pos logit contributions | |
rob | +0.050 |
please | +0.045 |
pots | +0.045 |
hunt | +0.044 |
guys | +0.044 |
Neg logit contributions | |
� | -0.058 |
ver | -0.054 |
ending | -0.054 |
earing | -0.051 |
Through | -0.051 |
Token | she |
Token ID | 673 |
Feature activation | -6.81e-03 |
Pos logit contributions | |
pots | +0.066 |
glob | +0.066 |
rob | +0.065 |
hunt | +0.064 |
please | +0.063 |
Neg logit contributions | |
ending | -0.046 |
� | -0.045 |
ver | -0.045 |
Having | -0.043 |
ite | -0.043 |
Token | needed |
Token ID | 2622 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
ite | +0.009 |
Having | +0.009 |
ending | +0.009 |
ver | +0.008 |
ifying | +0.008 |
Neg logit contributions | |
pots | -0.008 |
ie | -0.008 |
rust | -0.008 |
fl | -0.008 |
ty | -0.008 |
Token | help |
Token ID | 1037 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
ie | +0.018 |
pots | +0.018 |
fl | +0.017 |
rust | +0.016 |
guys | +0.016 |
Neg logit contributions | |
ite | -0.026 |
ending | -0.026 |
Having | -0.025 |
ver | -0.025 |
ifying | -0.024 |
Token | . |
Token ID | 13 |
Feature activation | +2.39e-02 |
Pos logit contributions | |
rob | +0.022 |
please | +0.019 |
pots | +0.019 |
glob | +0.019 |
fl | +0.019 |
Neg logit contributions | |
� | -0.023 |
ending | -0.020 |
ver | -0.020 |
ite | -0.019 |
Having | -0.019 |
Token | The |
Token ID | 383 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
pots | +0.036 |
ie | +0.036 |
guys | +0.034 |
ty | +0.034 |
hunt | +0.034 |
Neg logit contributions | |
ite | -0.024 |
Having | -0.024 |
ending | -0.023 |
ver | -0.023 |
ifying | -0.022 |
Token | asked |
Token ID | 1965 |
Feature activation | +3.59e-03 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
fl | +0.002 |
guys | +0.002 |
Neg logit contributions | |
ite | -0.002 |
Having | -0.002 |
ending | -0.002 |
ver | -0.002 |
ifying | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | -6.42e-04 |
Pos logit contributions | |
fl | +0.005 |
rob | +0.005 |
pots | +0.005 |
please | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ver | -0.005 |
� | -0.004 |
Jimmy | -0.004 |
Having | -0.004 |
old | -0.004 |
Token | " |
Token ID | 366 |
Feature activation | +2.27e-02 |
Pos logit contributions | |
ver | +0.001 |
ite | +0.001 |
ending | +0.001 |
Having | +0.001 |
� | +0.001 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rob | -0.001 |
hunt | -0.001 |
guys | -0.001 |
Token | What |
Token ID | 2061 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
pots | +0.031 |
ie | +0.029 |
rust | +0.028 |
guys | +0.028 |
hunt | +0.027 |
Neg logit contributions | |
Having | -0.028 |
Jimmy | -0.027 |
ite | -0.027 |
ending | -0.026 |
ifying | -0.026 |
Token | 's |
Token ID | 338 |
Feature activation | +1.36e-02 |
Pos logit contributions | |
ifying | +0.008 |
igsaw | +0.008 |
Having | +0.008 |
uster | +0.008 |
osity | +0.008 |
Neg logit contributions | |
guys | -0.004 |
pots | -0.004 |
for | -0.004 |
hide | -0.004 |
hunt | -0.004 |
Token | wrong |
Token ID | 2642 |
Feature activation | +6.57e-03 |
Pos logit contributions | |
pots | +0.011 |
ie | +0.011 |
for | +0.010 |
ty | +0.010 |
rust | +0.010 |
Neg logit contributions | |
ite | -0.024 |
Having | -0.023 |
ending | -0.023 |
ver | -0.023 |
ifying | -0.023 |
Token | ?". |
Token ID | 43634 |
Feature activation | -8.86e-03 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.008 |
rob | +0.008 |
hunt | +0.008 |
Neg logit contributions | |
ite | -0.008 |
ver | -0.008 |
� | -0.008 |
ending | -0.008 |
Having | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ite | +0.009 |
ending | +0.009 |
ifying | +0.009 |
Having | +0.009 |
ver | +0.008 |
Neg logit contributions | |
pots | -0.013 |
ie | -0.013 |
rust | -0.013 |
ty | -0.012 |
guys | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -2.60e-02 |
Pos logit contributions | |
ifying | +0.020 |
ite | +0.019 |
endant | +0.019 |
ending | +0.019 |
osity | +0.019 |
Neg logit contributions | |
them | -0.021 |
ie | -0.020 |
him | -0.020 |
please | -0.020 |
pots | -0.020 |
Token | The |
Token ID | 464 |
Feature activation | -4.59e-03 |
Pos logit contributions | |
endant | +0.035 |
ifying | +0.032 |
fault | +0.032 |
ite | +0.032 |
outage | +0.031 |
Neg logit contributions | |
them | -0.032 |
god | -0.031 |
each | -0.031 |
please | -0.030 |
him | -0.030 |
Token | woman |
Token ID | 2415 |
Feature activation | -3.79e-03 |
Pos logit contributions | |
ite | +0.004 |
Having | +0.004 |
ending | +0.004 |
� | +0.004 |
Doing | +0.004 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
hunt | -0.007 |
guys | -0.007 |
ty | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | -9.89e-03 |
Pos logit contributions | |
ite | +0.002 |
ver | +0.002 |
ending | +0.002 |
Having | +0.002 |
ifying | +0.002 |
Neg logit contributions | |
pots | -0.002 |
ie | -0.002 |
fl | -0.002 |
guys | -0.002 |
rust | -0.002 |
Token | pulled |
Token ID | 5954 |
Feature activation | +7.04e-03 |
Pos logit contributions | |
ending | +0.015 |
ite | +0.015 |
ifying | +0.015 |
Having | +0.015 |
igsaw | +0.014 |
Neg logit contributions | |
pots | -0.010 |
ie | -0.010 |
rust | -0.010 |
ty | -0.009 |
hunt | -0.009 |
Token | it |
Token ID | 340 |
Feature activation | +2.50e-02 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
fl | +0.009 |
rust | +0.009 |
hunt | +0.009 |
Neg logit contributions | |
ite | -0.008 |
ending | -0.008 |
Having | -0.008 |
ver | -0.008 |
� | -0.008 |
Token | away |
Token ID | 1497 |
Feature activation | -2.87e-03 |
Pos logit contributions | |
pots | +0.027 |
ie | +0.026 |
rob | +0.025 |
please | +0.024 |
guys | +0.024 |
Neg logit contributions | |
ite | -0.037 |
ver | -0.037 |
ending | -0.036 |
� | -0.036 |
Having | -0.034 |
Token | from |
Token ID | 422 |
Feature activation | +1.65e-02 |
Pos logit contributions | |
ver | +0.004 |
ifying | +0.004 |
ending | +0.004 |
� | +0.004 |
ite | +0.004 |
Neg logit contributions | |
ie | -0.003 |
pots | -0.003 |
please | -0.003 |
guys | -0.003 |
rob | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +7.43e-03 |
Pos logit contributions | |
fl | +0.023 |
pots | +0.023 |
ie | +0.022 |
rust | +0.021 |
god | +0.021 |
Neg logit contributions | |
Having | -0.017 |
Balloon | -0.016 |
glad | -0.016 |
Whoever | -0.016 |
presses | -0.016 |
Token | tree |
Token ID | 5509 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
pots | +0.008 |
rust | +0.008 |
guys | +0.008 |
hunt | +0.008 |
ie | +0.007 |
Neg logit contributions | |
ending | -0.011 |
ver | -0.011 |
ite | -0.011 |
Having | -0.011 |
Doing | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +8.15e-03 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
rust | +0.003 |
fl | +0.003 |
guys | +0.003 |
Neg logit contributions | |
ite | -0.007 |
ending | -0.007 |
Having | -0.007 |
ver | -0.007 |
ifying | -0.007 |
Token | The |
Token ID | 383 |
Feature activation | +3.70e-03 |
Pos logit contributions | |
S | +0.010 |
him | +0.010 |
for | +0.010 |
pots | +0.010 |
them | +0.010 |
Neg logit contributions | |
ending | -0.010 |
ite | -0.010 |
ifying | -0.009 |
outage | -0.009 |
Having | -0.009 |
Token | car |
Token ID | 1097 |
Feature activation | -5.21e-03 |
Pos logit contributions | |
animals | +0.003 |
sound | +0.003 |
pots | +0.003 |
rust | +0.003 |
ones | +0.003 |
Neg logit contributions | |
ver | -0.007 |
ifying | -0.007 |
ending | -0.007 |
igsaw | -0.007 |
enny | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.007 |
ending | +0.007 |
ver | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
fl | -0.005 |
rust | -0.005 |
ty | -0.005 |
Token | time |
Token ID | 640 |
Feature activation | +6.05e-04 |
Pos logit contributions | |
pots | +0.022 |
ie | +0.022 |
rust | +0.020 |
ty | +0.020 |
fl | +0.020 |
Neg logit contributions | |
ite | -0.016 |
ending | -0.016 |
Having | -0.016 |
ifying | -0.015 |
ver | -0.015 |
Token | there |
Token ID | 612 |
Feature activation | +4.81e-03 |
Pos logit contributions | |
ie | +0.000 |
pots | +0.000 |
rust | +0.000 |
for | +0.000 |
fl | +0.000 |
Neg logit contributions | |
ite | -0.001 |
ifying | -0.001 |
Having | -0.001 |
ending | -0.001 |
Doing | -0.001 |
Token | was |
Token ID | 373 |
Feature activation | -1.05e-02 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
guys | +0.006 |
rust | +0.006 |
please | +0.006 |
Neg logit contributions | |
Having | -0.006 |
ite | -0.006 |
ver | -0.006 |
� | -0.006 |
Jimmy | -0.005 |
Token | an |
Token ID | 281 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
ite | +0.020 |
ending | +0.020 |
osity | +0.020 |
ver | +0.019 |
outage | +0.019 |
Neg logit contributions | |
pots | -0.008 |
him | -0.007 |
ie | -0.007 |
them | -0.007 |
for | -0.006 |
Token | adventurous |
Token ID | 39770 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
ite | +0.025 |
ending | +0.024 |
Having | +0.024 |
ver | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
pots | -0.021 |
ie | -0.021 |
rust | -0.019 |
fl | -0.019 |
ty | -0.019 |
Token | bear |
Token ID | 6842 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
ending | +0.023 |
Having | +0.023 |
ver | +0.023 |
ifying | +0.023 |
ite | +0.022 |
Neg logit contributions | |
ie | -0.017 |
pots | -0.017 |
guys | -0.016 |
b | -0.016 |
hunt | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +2.66e-03 |
Pos logit contributions | |
pots | +0.014 |
guys | +0.013 |
rust | +0.012 |
ie | +0.012 |
ger | +0.012 |
Neg logit contributions | |
ite | -0.014 |
ending | -0.014 |
ver | -0.013 |
Having | -0.013 |
ifying | -0.013 |
Token | One |
Token ID | 1881 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
rust | +0.004 |
S | +0.004 |
hunt | +0.004 |
Neg logit contributions | |
ending | -0.003 |
ite | -0.003 |
Having | -0.003 |
ifying | -0.003 |
ver | -0.003 |
Token | day |
Token ID | 1110 |
Feature activation | +1.25e-02 |
Pos logit contributions | |
ie | +0.011 |
pots | +0.010 |
rust | +0.010 |
ty | +0.010 |
fl | +0.010 |
Neg logit contributions | |
Having | -0.020 |
ifying | -0.020 |
ite | -0.020 |
ending | -0.020 |
ver | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | +6.95e-03 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.007 |
guys | +0.007 |
rust | +0.007 |
S | +0.006 |
Neg logit contributions | |
ite | -0.025 |
ending | -0.025 |
Having | -0.025 |
Doing | -0.024 |
ifying | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | +1.84e-02 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.008 |
rust | +0.007 |
fl | +0.007 |
ty | +0.007 |
Neg logit contributions | |
ite | -0.010 |
Having | -0.009 |
ending | -0.009 |
ver | -0.009 |
ifying | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
ie | +0.009 |
pots | +0.009 |
fl | +0.009 |
rust | +0.009 |
ty | +0.009 |
Neg logit contributions | |
ite | -0.013 |
Having | -0.013 |
ending | -0.013 |
ver | -0.012 |
ifying | -0.012 |
Token | couch |
Token ID | 18507 |
Feature activation | -4.51e-03 |
Pos logit contributions | |
Having | +0.012 |
case | +0.012 |
ite | +0.012 |
� | +0.012 |
Jimmy | +0.011 |
Neg logit contributions | |
ie | -0.017 |
pots | -0.016 |
rust | -0.016 |
fl | -0.016 |
bank | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -9.85e-03 |
Pos logit contributions | |
ite | +0.006 |
ver | +0.006 |
ending | +0.006 |
Having | +0.006 |
case | +0.006 |
Neg logit contributions | |
pots | -0.005 |
fl | -0.005 |
ie | -0.005 |
rust | -0.005 |
guys | -0.005 |
Token | open |
Token ID | 1280 |
Feature activation | -3.01e-04 |
Pos logit contributions | |
ite | +0.017 |
ending | +0.017 |
Having | +0.016 |
ver | +0.016 |
ifying | +0.016 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
hunt | -0.008 |
rust | -0.008 |
guys | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +3.90e-03 |
Pos logit contributions | |
ite | +0.000 |
ending | +0.000 |
Having | +0.000 |
ver | +0.000 |
ifying | +0.000 |
Neg logit contributions | |
pots | -0.000 |
ie | -0.000 |
rust | -0.000 |
fl | -0.000 |
ty | -0.000 |
Token | door |
Token ID | 3420 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
ie | +0.005 |
please | +0.005 |
pots | +0.005 |
isk | +0.005 |
rust | +0.005 |
Neg logit contributions | |
ite | -0.005 |
ifying | -0.005 |
Having | -0.005 |
case | -0.004 |
� | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.009 |
rust | +0.008 |
fl | +0.008 |
guys | +0.008 |
Neg logit contributions | |
ite | -0.023 |
ending | -0.022 |
Having | -0.022 |
ver | -0.022 |
ifying | -0.022 |
Token | a |
Token ID | 257 |
Feature activation | +3.30e-03 |
Pos logit contributions | |
fl | +0.018 |
cast | +0.017 |
bank | +0.016 |
rob | +0.016 |
ie | +0.016 |
Neg logit contributions | |
� | -0.013 |
Having | -0.013 |
Through | -0.013 |
It | -0.013 |
've | -0.013 |
Token | magical |
Token ID | 10883 |
Feature activation | +2.43e-03 |
Pos logit contributions | |
ie | +0.004 |
pots | +0.004 |
fl | +0.004 |
ty | +0.004 |
rust | +0.004 |
Neg logit contributions | |
ite | -0.004 |
Having | -0.004 |
ifying | -0.004 |
ending | -0.004 |
� | -0.004 |
Token | world |
Token ID | 995 |
Feature activation | -9.50e-03 |
Pos logit contributions | |
pots | +0.003 |
ie | +0.003 |
isk | +0.003 |
fl | +0.003 |
rust | +0.003 |
Neg logit contributions | |
ite | -0.003 |
igsaw | -0.003 |
Having | -0.003 |
case | -0.003 |
ifying | -0.003 |
Token | - |
Token ID | 532 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ite | +0.018 |
Having | +0.017 |
ending | +0.017 |
ver | +0.017 |
ifying | +0.017 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
rust | -0.006 |
fl | -0.006 |
ty | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
ie | +0.008 |
pots | +0.008 |
rust | +0.007 |
guys | +0.007 |
fl | +0.007 |
Neg logit contributions | |
ite | -0.017 |
ending | -0.016 |
ver | -0.016 |
ifying | -0.016 |
Having | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
pots | +0.020 |
ie | +0.019 |
guys | +0.019 |
rust | +0.019 |
S | +0.019 |
Neg logit contributions | |
ite | -0.016 |
ending | -0.016 |
Having | -0.015 |
ifying | -0.015 |
ver | -0.015 |
Token |
|
Token ID | 198 |
Feature activation | -5.26e-03 |
Pos logit contributions | |
ie | +0.017 |
pots | +0.017 |
ty | +0.016 |
them | +0.016 |
rust | +0.015 |
Neg logit contributions | |
ite | -0.014 |
ifying | -0.014 |
ending | -0.014 |
Having | -0.013 |
ver | -0.013 |
Token | " |
Token ID | 1 |
Feature activation | +2.16e-02 |
Pos logit contributions | |
ite | +0.006 |
ending | +0.006 |
ver | +0.006 |
igsaw | +0.006 |
Doing | +0.006 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.006 |
co | -0.006 |
ty | -0.006 |
guys | -0.006 |
Token | Very |
Token ID | 16371 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
pots | +0.026 |
ie | +0.026 |
rust | +0.024 |
ty | +0.024 |
fl | +0.024 |
Neg logit contributions | |
ite | -0.029 |
Having | -0.028 |
ending | -0.028 |
ifying | -0.027 |
ver | -0.027 |
Token | good |
Token ID | 922 |
Feature activation | +8.60e-03 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
isk | +0.002 |
fl | +0.002 |
ty | +0.002 |
Neg logit contributions | |
ver | -0.001 |
ite | -0.001 |
glad | -0.001 |
ending | -0.001 |
Having | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
pots | +0.012 |
isk | +0.011 |
bank | +0.010 |
hunt | +0.010 |
rust | +0.010 |
Neg logit contributions | |
ite | -0.011 |
ending | -0.010 |
ver | -0.009 |
ago | -0.009 |
outage | -0.009 |
Token | Ben |
Token ID | 3932 |
Feature activation | +2.06e-02 |
Pos logit contributions | |
ie | +0.018 |
pots | +0.018 |
guys | +0.017 |
S | +0.017 |
ty | +0.017 |
Neg logit contributions | |
ite | -0.021 |
ending | -0.021 |
Having | -0.021 |
ifying | -0.020 |
ver | -0.020 |
Token | !" |
Token ID | 2474 |
Feature activation | +3.17e-02 |
Pos logit contributions | |
pots | +0.027 |
rust | +0.026 |
isk | +0.024 |
guys | +0.024 |
co | +0.024 |
Neg logit contributions | |
� | -0.025 |
ite | -0.024 |
Doing | -0.022 |
ver | -0.021 |
earing | -0.021 |
Token | Miss |
Token ID | 4544 |
Feature activation | +1.55e-02 |
Pos logit contributions | |
pots | +0.036 |
ie | +0.036 |
rust | +0.034 |
fl | +0.033 |
ty | +0.033 |
Neg logit contributions | |
ite | -0.044 |
Having | -0.043 |
ending | -0.043 |
ver | -0.042 |
ifying | -0.042 |
Token | Lee |
Token ID | 5741 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
pots | +0.018 |
ie | +0.017 |
rust | +0.017 |
hunt | +0.016 |
guys | +0.016 |
Neg logit contributions | |
ite | -0.021 |
ver | -0.021 |
ending | -0.021 |
Having | -0.020 |
ifying | -0.020 |
Token | flew |
Token ID | 13112 |
Feature activation | -5.85e-03 |
Pos logit contributions | |
� | +0.025 |
ite | +0.025 |
ending | +0.024 |
Having | +0.023 |
ver | +0.023 |
Neg logit contributions | |
pots | -0.031 |
glob | -0.028 |
rob | -0.027 |
guys | -0.027 |
fl | -0.027 |
Token | away |
Token ID | 1497 |
Feature activation | -1.29e-02 |
Pos logit contributions | |
ite | +0.010 |
Having | +0.009 |
ver | +0.009 |
ifying | +0.009 |
ending | +0.009 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
fl | -0.005 |
guys | -0.004 |
hunt | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -2.36e-02 |
Pos logit contributions | |
ite | +0.015 |
ver | +0.015 |
Having | +0.014 |
ending | +0.014 |
ifying | +0.014 |
Neg logit contributions | |
pots | -0.018 |
ie | -0.017 |
guys | -0.017 |
fl | -0.016 |
isk | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -7.38e-04 |
Pos logit contributions | |
ite | +0.033 |
Having | +0.033 |
ending | +0.033 |
ver | +0.032 |
ifying | +0.032 |
Neg logit contributions | |
pots | -0.026 |
ie | -0.026 |
fl | -0.024 |
guys | -0.024 |
ty | -0.024 |
Token | Lily |
Token ID | 20037 |
Feature activation | -4.70e-03 |
Pos logit contributions | |
Having | +0.001 |
� | +0.001 |
ite | +0.001 |
Since | +0.001 |
ver | +0.001 |
Neg logit contributions | |
pots | -0.001 |
fl | -0.001 |
co | -0.001 |
hunt | -0.001 |
urg | -0.001 |
Token | was |
Token ID | 373 |
Feature activation | -5.89e-03 |
Pos logit contributions | |
ite | +0.007 |
Having | +0.006 |
ending | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.005 |
ie | -0.005 |
fl | -0.005 |
rust | -0.005 |
guys | -0.005 |
Token | sad |
Token ID | 6507 |
Feature activation | -8.35e-03 |
Pos logit contributions | |
ite | +0.009 |
ifying | +0.009 |
igsaw | +0.009 |
ending | +0.009 |
Having | +0.009 |
Neg logit contributions | |
rust | -0.006 |
ie | -0.006 |
pots | -0.006 |
for | -0.006 |
ty | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +5.17e-04 |
Pos logit contributions | |
ite | +0.013 |
ending | +0.013 |
Having | +0.013 |
ver | +0.013 |
ifying | +0.013 |
Neg logit contributions | |
pots | -0.008 |
ie | -0.007 |
fl | -0.007 |
rust | -0.007 |
guys | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +1.75e-02 |
Pos logit contributions | |
pots | +0.001 |
ie | +0.001 |
fl | +0.001 |
rust | +0.001 |
S | +0.001 |
Neg logit contributions | |
ite | -0.001 |
ending | -0.001 |
ifying | -0.001 |
Having | -0.001 |
ver | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -6.41e-05 |
Pos logit contributions | |
pots | +0.030 |
ie | +0.029 |
guys | +0.028 |
rust | +0.028 |
fl | +0.028 |
Neg logit contributions | |
ite | -0.014 |
Having | -0.014 |
ending | -0.014 |
ver | -0.014 |
Doing | -0.013 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | +4.50e-03 |
Pos logit contributions | |
ite | +0.000 |
ifying | +0.000 |
ver | +0.000 |
osity | +0.000 |
igsaw | +0.000 |
Neg logit contributions | |
ie | -0.000 |
ty | -0.000 |
co | -0.000 |
pots | -0.000 |
isk | -0.000 |
Token | make |
Token ID | 787 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
fl | +0.004 |
rust | +0.004 |
ty | +0.004 |
Neg logit contributions | |
ite | -0.005 |
Having | -0.005 |
ending | -0.005 |
ver | -0.005 |
ifying | -0.005 |
Token | you |
Token ID | 345 |
Feature activation | -1.22e-02 |
Pos logit contributions | |
pots | +0.008 |
fl | +0.008 |
ie | +0.008 |
hunt | +0.008 |
isk | +0.008 |
Neg logit contributions | |
� | -0.009 |
Having | -0.009 |
Jimmy | -0.008 |
ending | -0.008 |
Doing | -0.008 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.50e-02 |
Pos logit contributions | |
ite | +0.017 |
ending | +0.017 |
Having | +0.017 |
ifying | +0.017 |
ver | +0.016 |
Neg logit contributions | |
ie | -0.014 |
pots | -0.013 |
rust | -0.013 |
guys | -0.013 |
for | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -5.89e-03 |
Pos logit contributions | |
pots | +0.018 |
isk | +0.018 |
ty | +0.018 |
rust | +0.017 |
ie | +0.017 |
Neg logit contributions | |
ite | -0.018 |
Sharing | -0.018 |
Doing | -0.018 |
� | -0.017 |
Having | -0.017 |
Token | I |
Token ID | 314 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
ending | +0.008 |
ite | +0.008 |
igsaw | +0.007 |
Having | +0.007 |
ver | +0.007 |
Neg logit contributions | |
S | -0.008 |
him | -0.007 |
for | -0.007 |
pots | -0.007 |
fl | -0.007 |
Token | did |
Token ID | 750 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
ite | +0.020 |
ending | +0.020 |
ifying | +0.020 |
Having | +0.020 |
igsaw | +0.019 |
Neg logit contributions | |
ie | -0.018 |
pots | -0.017 |
ty | -0.016 |
rust | -0.016 |
fl | -0.016 |
Token | not |
Token ID | 407 |
Feature activation | +1.06e-02 |
Pos logit contributions | |
pots | +0.005 |
for | +0.005 |
ie | +0.005 |
them | +0.005 |
guys | +0.005 |
Neg logit contributions | |
ite | -0.008 |
ifying | -0.007 |
ending | -0.007 |
ver | -0.007 |
Having | -0.007 |
Token | know |
Token ID | 760 |
Feature activation | +9.55e-03 |
Pos logit contributions | |
pots | +0.017 |
fl | +0.017 |
rust | +0.016 |
ie | +0.015 |
cast | +0.015 |
Neg logit contributions | |
� | -0.010 |
ending | -0.010 |
Having | -0.010 |
ite | -0.010 |
Doing | -0.009 |
Token | you |
Token ID | 345 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
ie | +0.011 |
pots | +0.011 |
rust | +0.010 |
ty | +0.010 |
fl | +0.010 |
Neg logit contributions | |
ite | -0.014 |
Having | -0.013 |
ending | -0.013 |
ifying | -0.013 |
ver | -0.013 |
Token | would |
Token ID | 561 |
Feature activation | +7.53e-03 |
Pos logit contributions | |
ite | +0.031 |
Having | +0.030 |
ending | +0.030 |
ifying | +0.029 |
ver | +0.029 |
Neg logit contributions | |
ie | -0.023 |
pots | -0.023 |
guys | -0.021 |
ty | -0.021 |
rust | -0.021 |
Token | mind |
Token ID | 2000 |
Feature activation | -3.06e-03 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.009 |
fl | +0.009 |
rob | +0.009 |
glob | +0.008 |
Neg logit contributions | |
Having | -0.009 |
ite | -0.009 |
� | -0.009 |
ending | -0.009 |
ver | -0.009 |
Token | at |
Token ID | 379 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
ite | +0.000 |
ending | +0.000 |
Having | +0.000 |
ver | +0.000 |
ifying | +0.000 |
Neg logit contributions | |
pots | -0.000 |
ie | -0.000 |
rust | -0.000 |
fl | -0.000 |
ty | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | +3.65e-03 |
Pos logit contributions | |
ite | +0.021 |
ending | +0.020 |
Having | +0.020 |
ver | +0.020 |
ifying | +0.020 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.017 |
rust | -0.015 |
fl | -0.015 |
ty | -0.015 |
Token | umbrella |
Token ID | 25510 |
Feature activation | -8.51e-03 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
rust | +0.004 |
ty | +0.004 |
fl | +0.004 |
Neg logit contributions | |
ite | -0.005 |
Having | -0.005 |
ending | -0.005 |
ifying | -0.005 |
ver | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -6.23e-03 |
Pos logit contributions | |
ite | +0.012 |
ending | +0.012 |
ver | +0.012 |
� | +0.011 |
Having | +0.011 |
Neg logit contributions | |
pots | -0.009 |
guys | -0.009 |
ie | -0.009 |
please | -0.009 |
fl | -0.008 |
Token | She |
Token ID | 1375 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
ending | +0.007 |
ite | +0.007 |
ifying | +0.007 |
Having | +0.007 |
ver | +0.007 |
Neg logit contributions | |
pots | -0.009 |
S | -0.008 |
rust | -0.008 |
for | -0.008 |
them | -0.008 |
Token | realized |
Token ID | 6939 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
ite | +0.017 |
Having | +0.017 |
ending | +0.017 |
ver | +0.016 |
ifying | +0.016 |
Neg logit contributions | |
pots | -0.012 |
ie | -0.012 |
rust | -0.011 |
fl | -0.011 |
ty | -0.011 |
Token | Tom |
Token ID | 4186 |
Feature activation | -5.41e-03 |
Pos logit contributions | |
ite | +0.024 |
ifying | +0.024 |
ending | +0.023 |
Having | +0.023 |
ver | +0.022 |
Neg logit contributions | |
ie | -0.015 |
pots | -0.014 |
rust | -0.014 |
them | -0.014 |
ty | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | +9.61e-03 |
Pos logit contributions | |
ite | +0.008 |
ending | +0.007 |
Having | +0.007 |
ifying | +0.007 |
ver | +0.007 |
Neg logit contributions | |
ie | -0.006 |
pots | -0.006 |
ty | -0.006 |
rust | -0.006 |
fl | -0.006 |
Token | right |
Token ID | 826 |
Feature activation | +2.35e-03 |
Pos logit contributions | |
pots | +0.010 |
rust | +0.009 |
ie | +0.009 |
ty | +0.009 |
for | +0.008 |
Neg logit contributions | |
ite | -0.016 |
ending | -0.015 |
ifying | -0.015 |
Having | -0.015 |
ver | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | -3.73e-03 |
Pos logit contributions | |
pots | +0.002 |
ie | +0.002 |
rust | +0.002 |
guys | +0.002 |
hunt | +0.002 |
Neg logit contributions | |
ite | -0.004 |
ifying | -0.004 |
ending | -0.004 |
ver | -0.004 |
Having | -0.004 |
Token | She |
Token ID | 1375 |
Feature activation | -7.12e-03 |
Pos logit contributions | |
ending | +0.005 |
ite | +0.005 |
ifying | +0.005 |
Having | +0.005 |
ver | +0.005 |
Neg logit contributions | |
S | -0.004 |
pots | -0.004 |
rust | -0.004 |
him | -0.004 |
them | -0.004 |
Token | visit |
Token ID | 3187 |
Feature activation | -1.87e-02 |
Pos logit contributions | |
Having | +0.003 |
Having | +0.002 |
Jimmy | +0.002 |
've | +0.002 |
Doing | +0.002 |
Neg logit contributions | |
fl | -0.002 |
pots | -0.002 |
rust | -0.002 |
bat | -0.002 |
rob | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
Having | +0.022 |
� | +0.021 |
Doing | +0.021 |
ver | +0.021 |
Jimmy | +0.021 |
Neg logit contributions | |
fl | -0.027 |
rust | -0.026 |
rob | -0.025 |
pots | -0.024 |
bank | -0.024 |
Token | but |
Token ID | 475 |
Feature activation | -6.66e-03 |
Pos logit contributions | |
ite | +0.026 |
ending | +0.025 |
ifying | +0.024 |
ver | +0.024 |
Having | +0.024 |
Neg logit contributions | |
pots | -0.016 |
ie | -0.016 |
rust | -0.015 |
ty | -0.014 |
for | -0.014 |
Token | Lily |
Token ID | 20037 |
Feature activation | -8.89e-03 |
Pos logit contributions | |
ite | +0.010 |
ending | +0.010 |
Having | +0.010 |
ifying | +0.010 |
ver | +0.010 |
Neg logit contributions | |
ie | -0.007 |
pots | -0.007 |
for | -0.006 |
rust | -0.006 |
ty | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | -4.99e-03 |
Pos logit contributions | |
ite | +0.011 |
Having | +0.011 |
ver | +0.011 |
ending | +0.011 |
Doing | +0.010 |
Neg logit contributions | |
pots | -0.011 |
ie | -0.011 |
rust | -0.011 |
fl | -0.011 |
guys | -0.010 |
Token | too |
Token ID | 1165 |
Feature activation | -6.28e-03 |
Pos logit contributions | |
ite | +0.009 |
igsaw | +0.009 |
ending | +0.008 |
ifying | +0.008 |
osity | +0.008 |
Neg logit contributions | |
all | -0.005 |
for | -0.005 |
even | -0.004 |
b | -0.004 |
them | -0.004 |
Token | sick |
Token ID | 6639 |
Feature activation | +3.24e-03 |
Pos logit contributions | |
ite | +0.009 |
ifying | +0.009 |
ending | +0.008 |
Having | +0.008 |
osity | +0.008 |
Neg logit contributions | |
ie | -0.007 |
pots | -0.007 |
rust | -0.007 |
b | -0.007 |
ty | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | +3.62e-03 |
Pos logit contributions | |
pots | +0.004 |
ie | +0.004 |
rust | +0.004 |
fl | +0.004 |
please | +0.003 |
Neg logit contributions | |
ite | -0.004 |
ending | -0.004 |
ver | -0.004 |
� | -0.004 |
Doing | -0.004 |
Token | play |
Token ID | 711 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
rob | +0.006 |
fl | +0.006 |
pots | +0.005 |
glob | +0.005 |
cast | +0.005 |
Neg logit contributions | |
� | -0.004 |
have | -0.003 |
Having | -0.003 |
case | -0.003 |
've | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
fl | +0.005 |
pots | +0.005 |
rust | +0.005 |
ie | +0.005 |
ho | +0.005 |
Neg logit contributions | |
case | -0.004 |
� | -0.004 |
ver | -0.004 |
Having | -0.004 |
Jimmy | -0.004 |
Token | Emma |
Token ID | 18966 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
ite | +0.017 |
ending | +0.016 |
ifying | +0.015 |
ver | +0.015 |
outage | +0.014 |
Neg logit contributions | |
pots | -0.013 |
S | -0.012 |
for | -0.012 |
ie | -0.012 |
isk | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -1.51e-02 |
Pos logit contributions | |
pots | +0.018 |
ie | +0.018 |
rust | +0.016 |
fl | +0.016 |
ty | +0.016 |
Neg logit contributions | |
ite | -0.032 |
Having | -0.031 |
ending | -0.031 |
ver | -0.031 |
ifying | -0.030 |
Token | a |
Token ID | 257 |
Feature activation | -3.80e-04 |
Pos logit contributions | |
ite | +0.022 |
ending | +0.022 |
ver | +0.022 |
Having | +0.022 |
ifying | +0.021 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.015 |
rust | -0.015 |
fl | -0.015 |
guys | -0.014 |
Token | drain |
Token ID | 14782 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
ending | +0.001 |
ver | +0.001 |
ite | +0.001 |
Having | +0.001 |
Doing | +0.001 |
Neg logit contributions | |
pots | -0.000 |
rust | -0.000 |
ie | -0.000 |
guys | -0.000 |
hunt | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | -1.50e-02 |
Pos logit contributions | |
ite | +0.002 |
ifying | +0.002 |
Having | +0.002 |
ending | +0.002 |
ver | +0.002 |
Neg logit contributions | |
ie | -0.001 |
pots | -0.001 |
fl | -0.001 |
guys | -0.001 |
ty | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | -8.38e-03 |
Pos logit contributions | |
ending | +0.017 |
ite | +0.016 |
igsaw | +0.014 |
Having | +0.014 |
ver | +0.013 |
Neg logit contributions | |
pots | -0.024 |
S | -0.024 |
them | -0.023 |
for | -0.021 |
him | -0.021 |
Token | are |
Token ID | 389 |
Feature activation | -5.64e-03 |
Pos logit contributions | |
ending | +0.015 |
ite | +0.014 |
igsaw | +0.014 |
Having | +0.014 |
ver | +0.014 |
Neg logit contributions | |
pots | -0.008 |
rust | -0.007 |
hunt | -0.007 |
guys | -0.007 |
b | -0.007 |
Token | curious |
Token ID | 11040 |
Feature activation | +4.42e-04 |
Pos logit contributions | |
ite | +0.008 |
ending | +0.008 |
Having | +0.008 |
ver | +0.007 |
ifying | +0.007 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.006 |
rust | -0.006 |
fl | -0.006 |
ty | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -1.39e-02 |
Pos logit contributions | |
pots | +0.000 |
ie | +0.000 |
rust | +0.000 |
fl | +0.000 |
ty | +0.000 |
Neg logit contributions | |
ite | -0.001 |
Having | -0.001 |
ending | -0.001 |
ver | -0.001 |
ifying | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -8.62e-03 |
Pos logit contributions | |
ending | +0.017 |
ite | +0.017 |
Having | +0.016 |
igsaw | +0.016 |
ifying | +0.016 |
Neg logit contributions | |
pots | -0.019 |
S | -0.018 |
fl | -0.018 |
them | -0.018 |
rust | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
ifying | +0.010 |
ite | +0.010 |
ending | +0.010 |
Having | +0.009 |
ver | +0.009 |
Neg logit contributions | |
pots | -0.012 |
ie | -0.012 |
them | -0.011 |
rust | -0.011 |
ty | -0.011 |
Token | " |
Token ID | 1 |
Feature activation | +1.42e-02 |
Pos logit contributions | |
igsaw | +0.038 |
osity | +0.037 |
ending | +0.037 |
fault | +0.036 |
ifying | +0.036 |
Neg logit contributions | |
pots | -0.028 |
them | -0.026 |
each | -0.025 |
co | -0.024 |
ty | -0.024 |
Token | time |
Token ID | 640 |
Feature activation | -1.35e-02 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
ty | +0.005 |
hunt | +0.005 |
guys | +0.005 |
Neg logit contributions | |
ite | -0.006 |
ending | -0.006 |
ifying | -0.006 |
Having | -0.005 |
osity | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
ifying | +0.026 |
Having | +0.026 |
ending | +0.026 |
ite | +0.026 |
Doing | +0.025 |
Neg logit contributions | |
ie | -0.008 |
pots | -0.008 |
for | -0.007 |
S | -0.007 |
fl | -0.007 |
Token | there |
Token ID | 612 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
ending | +0.024 |
igsaw | +0.024 |
ite | +0.023 |
Having | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
ie | -0.013 |
pots | -0.013 |
for | -0.013 |
rust | -0.011 |
them | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
ite | +0.022 |
ending | +0.021 |
Having | +0.021 |
ifying | +0.021 |
ver | +0.021 |
Neg logit contributions | |
pots | -0.015 |
ie | -0.015 |
rust | -0.014 |
fl | -0.014 |
ty | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
ending | +0.031 |
osity | +0.031 |
ite | +0.030 |
ifying | +0.030 |
outage | +0.029 |
Neg logit contributions | |
pots | -0.010 |
for | -0.009 |
him | -0.008 |
all | -0.008 |
ie | -0.007 |
Token | kind |
Token ID | 1611 |
Feature activation | -3.17e-02 |
Pos logit contributions | |
ending | +0.024 |
ifying | +0.024 |
ite | +0.023 |
ver | +0.023 |
Having | +0.023 |
Neg logit contributions | |
pots | -0.017 |
ie | -0.016 |
b | -0.016 |
rust | -0.016 |
guys | -0.016 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.90e-03 |
Pos logit contributions | |
ifying | +0.047 |
Having | +0.047 |
ending | +0.046 |
ver | +0.046 |
ite | +0.045 |
Neg logit contributions | |
ie | -0.035 |
pots | -0.034 |
rust | -0.032 |
guys | -0.032 |
ty | -0.031 |
Token | named |
Token ID | 3706 |
Feature activation | +9.35e-03 |
Pos logit contributions | |
pots | +0.002 |
rust | +0.002 |
guys | +0.002 |
ie | +0.002 |
fl | +0.002 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.002 |
ending | -0.002 |
Doing | -0.002 |
� | -0.002 |
Token | Lily |
Token ID | 20037 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
ie | +0.012 |
fl | +0.012 |
rust | +0.012 |
pots | +0.012 |
bank | +0.012 |
Neg logit contributions | |
ite | -0.011 |
ver | -0.011 |
Having | -0.010 |
ending | -0.010 |
ifying | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +6.23e-03 |
Pos logit contributions | |
ite | +0.020 |
ending | +0.019 |
Having | +0.019 |
ver | +0.019 |
ifying | +0.019 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
rust | -0.006 |
fl | -0.006 |
ty | -0.006 |
Token | She |
Token ID | 1375 |
Feature activation | +2.67e-03 |
Pos logit contributions | |
ie | +0.009 |
pots | +0.009 |
ty | +0.009 |
fl | +0.009 |
rust | +0.009 |
Neg logit contributions | |
ite | -0.007 |
Having | -0.006 |
ending | -0.006 |
ver | -0.006 |
ifying | -0.006 |
Token | says |
Token ID | 1139 |
Feature activation | +6.47e-03 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
rust | +0.005 |
fl | +0.005 |
ty | +0.005 |
Neg logit contributions | |
ite | -0.010 |
ifying | -0.010 |
ending | -0.009 |
Having | -0.009 |
ver | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | -9.29e-03 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
hunt | +0.006 |
fl | +0.006 |
isk | +0.006 |
Neg logit contributions | |
ver | -0.010 |
ite | -0.009 |
ending | -0.009 |
� | -0.009 |
Having | -0.009 |
Token | smart |
Token ID | 4451 |
Feature activation | -7.56e-03 |
Pos logit contributions | |
ite | +0.015 |
ending | +0.014 |
ifying | +0.014 |
ver | +0.014 |
igsaw | +0.014 |
Neg logit contributions | |
pots | -0.009 |
ie | -0.009 |
rust | -0.009 |
b | -0.009 |
ty | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ite | +0.013 |
ending | +0.013 |
Having | +0.013 |
ver | +0.013 |
ifying | +0.013 |
Neg logit contributions | |
pots | -0.006 |
ie | -0.006 |
rust | -0.005 |
fl | -0.005 |
hunt | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
ending | +0.020 |
ite | +0.019 |
osity | +0.018 |
ifying | +0.018 |
igsaw | +0.018 |
Neg logit contributions | |
pots | -0.014 |
S | -0.013 |
them | -0.013 |
for | -0.012 |
b | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -3.31e-02 |
Pos logit contributions | |
ending | +0.014 |
ite | +0.014 |
ifying | +0.014 |
ver | +0.014 |
Having | +0.013 |
Neg logit contributions | |
pots | -0.016 |
ie | -0.016 |
them | -0.015 |
ty | -0.015 |
rust | -0.015 |
Token | " |
Token ID | 1 |
Feature activation | -6.22e-03 |
Pos logit contributions | |
ending | +0.054 |
osity | +0.053 |
ver | +0.052 |
igsaw | +0.052 |
ite | +0.051 |
Neg logit contributions | |
ie | -0.032 |
pots | -0.032 |
them | -0.030 |
each | -0.030 |
ty | -0.029 |
Token | Right |
Token ID | 11028 |
Feature activation | -7.58e-03 |
Pos logit contributions | |
ver | +0.009 |
ite | +0.009 |
igsaw | +0.009 |
ending | +0.009 |
ifying | +0.008 |
Neg logit contributions | |
pots | -0.007 |
co | -0.007 |
rust | -0.007 |
please | -0.007 |
fl | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
glad | +0.007 |
Jimmy | +0.007 |
ite | +0.007 |
ago | +0.007 |
� | +0.007 |
Neg logit contributions | |
isk | -0.012 |
rob | -0.011 |
rust | -0.011 |
bank | -0.011 |
hunt | -0.011 |
Token | Ben |
Token ID | 3932 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
ending | +0.025 |
ite | +0.025 |
ver | +0.023 |
Having | +0.023 |
ifying | +0.023 |
Neg logit contributions | |
pots | -0.014 |
for | -0.014 |
ie | -0.013 |
b | -0.013 |
o | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -2.04e-02 |
Pos logit contributions | |
ite | +0.002 |
� | +0.002 |
ver | +0.002 |
Doing | +0.002 |
ending | +0.002 |
Neg logit contributions | |
pots | -0.001 |
rust | -0.001 |
ie | -0.001 |
guys | -0.001 |
fl | -0.001 |
Token | long |
Token ID | 890 |
Feature activation | +5.74e-03 |
Pos logit contributions | |
pots | +0.004 |
hunt | +0.004 |
rust | +0.004 |
ie | +0.004 |
guys | +0.004 |
Neg logit contributions | |
ending | -0.007 |
ite | -0.007 |
Doing | -0.006 |
Having | -0.006 |
ifying | -0.006 |
Token | time |
Token ID | 640 |
Feature activation | +9.96e-03 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
hunt | +0.007 |
guys | +0.006 |
ty | +0.006 |
Neg logit contributions | |
ending | -0.008 |
ite | -0.008 |
ifying | -0.008 |
Doing | -0.008 |
Having | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
rust | +0.008 |
fl | +0.008 |
ty | +0.008 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.016 |
ending | -0.016 |
ver | -0.015 |
ifying | -0.015 |
Token | but |
Token ID | 475 |
Feature activation | +6.45e-03 |
Pos logit contributions | |
Having | +0.019 |
ver | +0.018 |
ite | +0.018 |
Through | +0.018 |
ending | +0.018 |
Neg logit contributions | |
ie | -0.015 |
fl | -0.013 |
pots | -0.013 |
guys | -0.013 |
ty | -0.013 |
Token | couldn |
Token ID | 3521 |
Feature activation | -3.53e-02 |
Pos logit contributions | |
pots | +0.007 |
ie | +0.007 |
rust | +0.007 |
fl | +0.007 |
ty | +0.007 |
Neg logit contributions | |
ite | -0.009 |
Having | -0.009 |
ending | -0.009 |
ver | -0.009 |
ifying | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | -3.13e-02 |
Pos logit contributions | |
ite | +0.057 |
osity | +0.055 |
ifying | +0.055 |
endant | +0.054 |
rou | +0.053 |
Neg logit contributions | |
them | -0.036 |
him | -0.033 |
S | -0.032 |
all | -0.031 |
ie | -0.030 |
Token | find |
Token ID | 1064 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
� | +0.044 |
ver | +0.043 |
Having | +0.041 |
ending | +0.040 |
've | +0.040 |
Neg logit contributions | |
pots | -0.037 |
fl | -0.036 |
rob | -0.036 |
ie | -0.035 |
co | -0.033 |
Token | it |
Token ID | 340 |
Feature activation | +8.75e-03 |
Pos logit contributions | |
co | +0.006 |
please | +0.006 |
isk | +0.006 |
fl | +0.006 |
rust | +0.006 |
Neg logit contributions | |
ite | -0.004 |
ver | -0.003 |
Having | -0.003 |
ifying | -0.003 |
It | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
rob | +0.010 |
pots | +0.010 |
please | +0.010 |
fl | +0.010 |
co | +0.010 |
Neg logit contributions | |
ver | -0.012 |
� | -0.012 |
ite | -0.011 |
ending | -0.011 |
case | -0.011 |
Token | Jane |
Token ID | 12091 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
ite | +0.027 |
ending | +0.026 |
ifying | +0.025 |
outage | +0.023 |
Having | +0.023 |
Neg logit contributions | |
pots | -0.024 |
S | -0.022 |
them | -0.022 |
for | -0.021 |
bank | -0.021 |
Token | was |
Token ID | 373 |
Feature activation | -7.98e-03 |
Pos logit contributions | |
ite | +0.013 |
ver | +0.013 |
Having | +0.013 |
ending | +0.013 |
� | +0.013 |
Neg logit contributions | |
pots | -0.014 |
fl | -0.013 |
ie | -0.013 |
guys | -0.013 |
rust | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +2.80e-02 |
Pos logit contributions | |
ite | +0.006 |
ending | +0.006 |
Having | +0.006 |
ver | +0.006 |
ifying | +0.006 |
Neg logit contributions | |
pots | -0.004 |
ie | -0.004 |
rust | -0.004 |
fl | -0.004 |
guys | -0.004 |
Token | play |
Token ID | 711 |
Feature activation | +9.21e-03 |
Pos logit contributions | |
pots | +0.027 |
ie | +0.027 |
rust | +0.024 |
fl | +0.024 |
ty | +0.024 |
Neg logit contributions | |
ite | -0.044 |
Having | -0.043 |
ending | -0.043 |
ver | -0.042 |
ifying | -0.042 |
Token | in |
Token ID | 287 |
Feature activation | -1.00e-03 |
Pos logit contributions | |
ho | +0.013 |
isk | +0.013 |
mel | +0.013 |
ie | +0.013 |
fl | +0.013 |
Neg logit contributions | |
football | -0.010 |
soccer | -0.009 |
ite | -0.008 |
Jimmy | -0.008 |
Through | -0.008 |
Token | their |
Token ID | 511 |
Feature activation | +6.18e-03 |
Pos logit contributions | |
ite | +0.002 |
Having | +0.001 |
ending | +0.001 |
ifying | +0.001 |
ver | +0.001 |
Neg logit contributions | |
pots | -0.001 |
ie | -0.001 |
rust | -0.001 |
fl | -0.001 |
ty | -0.001 |
Token | room |
Token ID | 2119 |
Feature activation | +2.26e-02 |
Pos logit contributions | |
pots | +0.008 |
ie | +0.007 |
fl | +0.007 |
hunt | +0.007 |
rust | +0.007 |
Neg logit contributions | |
ending | -0.008 |
ver | -0.008 |
ite | -0.008 |
Having | -0.008 |
ifying | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -3.54e-02 |
Pos logit contributions | |
fl | +0.027 |
please | +0.026 |
rob | +0.026 |
ger | +0.025 |
rust | +0.025 |
Neg logit contributions | |
ver | -0.029 |
case | -0.028 |
ite | -0.027 |
ago | -0.026 |
erv | -0.026 |
Token | They |
Token ID | 1119 |
Feature activation | +1.39e-02 |
Pos logit contributions | |
ending | +0.069 |
ite | +0.066 |
ended | +0.062 |
ver | +0.061 |
outage | +0.061 |
Neg logit contributions | |
pots | -0.031 |
them | -0.029 |
for | -0.027 |
each | -0.026 |
him | -0.025 |
Token | had |
Token ID | 550 |
Feature activation | +3.86e-03 |
Pos logit contributions | |
fl | +0.020 |
pots | +0.019 |
ie | +0.019 |
rust | +0.019 |
ty | +0.018 |
Neg logit contributions | |
ite | -0.015 |
ver | -0.015 |
Having | -0.015 |
� | -0.014 |
ifying | -0.014 |
Token | many |
Token ID | 867 |
Feature activation | +3.12e-03 |
Pos logit contributions | |
ie | +0.005 |
ty | +0.005 |
fl | +0.005 |
pots | +0.005 |
rust | +0.005 |
Neg logit contributions | |
Having | -0.005 |
ite | -0.005 |
ifying | -0.004 |
Jimmy | -0.004 |
ver | -0.004 |
Token | toys |
Token ID | 14958 |
Feature activation | +4.57e-03 |
Pos logit contributions | |
fl | +0.004 |
isk | +0.004 |
please | +0.004 |
bank | +0.004 |
ty | +0.004 |
Neg logit contributions | |
ite | -0.003 |
Having | -0.003 |
Through | -0.003 |
ending | -0.003 |
igsaw | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
ie | +0.005 |
pots | +0.005 |
fl | +0.005 |
please | +0.005 |
rust | +0.005 |
Neg logit contributions | |
ite | -0.006 |
ver | -0.006 |
ending | -0.006 |
Having | -0.006 |
ifying | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +4.91e-03 |
Pos logit contributions | |
pots | +0.006 |
ie | +0.006 |
rust | +0.006 |
ty | +0.006 |
fl | +0.006 |
Neg logit contributions | |
ite | -0.012 |
Having | -0.012 |
ending | -0.012 |
ver | -0.012 |
ifying | -0.012 |
Token | They |
Token ID | 1119 |
Feature activation | +2.12e-05 |
Pos logit contributions | |
S | +0.006 |
pots | +0.006 |
them | +0.005 |
fl | +0.005 |
isk | +0.005 |
Neg logit contributions | |
ite | -0.007 |
ending | -0.007 |
ifying | -0.007 |
ver | -0.007 |
Having | -0.006 |
Token | made |
Token ID | 925 |
Feature activation | -2.12e-02 |
Pos logit contributions | |
pots | +0.000 |
fl | +0.000 |
ie | +0.000 |
ty | +0.000 |
guys | +0.000 |
Neg logit contributions | |
ver | -0.000 |
ite | -0.000 |
Having | -0.000 |
� | -0.000 |
Doing | -0.000 |
Token | their |
Token ID | 511 |
Feature activation | -5.85e-03 |
Pos logit contributions | |
Having | +0.027 |
ite | +0.026 |
ending | +0.026 |
ver | +0.025 |
Doing | +0.025 |
Neg logit contributions | |
ie | -0.025 |
pots | -0.024 |
fl | -0.023 |
hunt | -0.023 |
co | -0.023 |
Token | w |
Token ID | 266 |
Feature activation | +9.91e-03 |
Pos logit contributions | |
ite | +0.008 |
ending | +0.008 |
Having | +0.008 |
ver | +0.008 |
ifying | +0.008 |
Neg logit contributions | |
pots | -0.007 |
ie | -0.007 |
rust | -0.006 |
fl | -0.006 |
guys | -0.006 |
Token | agons |
Token ID | 34765 |
Feature activation | -3.15e-02 |
Pos logit contributions | |
pots | +0.010 |
ie | +0.010 |
rust | +0.009 |
ty | +0.009 |
fl | +0.009 |
Neg logit contributions | |
ite | -0.015 |
Having | -0.015 |
ending | -0.015 |
ver | -0.015 |
ifying | -0.015 |
Token | look |
Token ID | 804 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ite | +0.045 |
Having | +0.044 |
ending | +0.044 |
ver | +0.043 |
ifying | +0.043 |
Neg logit contributions | |
pots | -0.034 |
ie | -0.034 |
fl | -0.031 |
rust | -0.031 |
ty | -0.031 |
Token | like |
Token ID | 588 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ifying | +0.007 |
ver | +0.007 |
Having | +0.007 |
� | +0.007 |
ite | +0.007 |
Neg logit contributions | |
fl | -0.007 |
pots | -0.007 |
ie | -0.007 |
bank | -0.006 |
isk | -0.006 |
Token | rockets |
Token ID | 20293 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ite | +0.018 |
Having | +0.018 |
ending | +0.018 |
ver | +0.017 |
ifying | +0.017 |
Neg logit contributions | |
ie | -0.014 |
pots | -0.014 |
rust | -0.013 |
fl | -0.013 |
ty | -0.013 |
Token | and |
Token ID | 290 |
Feature activation | +9.80e-03 |
Pos logit contributions | |
ite | +0.016 |
Having | +0.015 |
ending | +0.015 |
ver | +0.015 |
ifying | +0.015 |
Neg logit contributions | |
pots | -0.014 |
ie | -0.014 |
rust | -0.013 |
fl | -0.013 |
ty | -0.013 |
Token | trains |
Token ID | 13404 |
Feature activation | +1.94e-03 |
Pos logit contributions | |
pots | +0.009 |
ie | +0.009 |
rust | +0.008 |
fl | +0.008 |
ty | +0.008 |
Neg logit contributions | |
ite | -0.016 |
Having | -0.016 |
ending | -0.016 |
ver | -0.015 |
ifying | -0.015 |