Token | share |
Token ID | 2648 |
Feature activation | +5.12e-03 |
Pos logit contributions | |
ores | +0.012 |
us | +0.011 |
om | +0.011 |
ill | +0.011 |
ubs | +0.010 |
Neg logit contributions | |
Deal | -0.015 |
nam | -0.014 |
guys | -0.012 |
smartest | -0.011 |
simplest | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | -1.35e-03 |
Pos logit contributions | |
nam | +0.011 |
Deal | +0.011 |
guys | +0.009 |
simplest | +0.009 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
anging | -0.005 |
Matt | -0.005 |
Token | be |
Token ID | 307 |
Feature activation | +6.73e-03 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
ill | +0.002 |
ubs | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.001 |
simplest | -0.001 |
Token | kind |
Token ID | 1611 |
Feature activation | +4.67e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.010 |
cient | +0.009 |
smartest | +0.009 |
Neg logit contributions | |
ores | -0.010 |
om | -0.009 |
ubs | -0.009 |
us | -0.009 |
it | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -7.79e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.009 |
simplest | +0.009 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
om | -0.004 |
ubs | -0.003 |
ill | -0.003 |
Token | each |
Token ID | 1123 |
Feature activation | +2.82e-02 |
Pos logit contributions | |
them | +0.009 |
it | +0.009 |
ubs | +0.009 |
their | +0.008 |
ores | +0.008 |
Neg logit contributions | |
Deal | -0.016 |
nam | -0.014 |
smartest | -0.013 |
strongest | -0.013 |
nic | -0.013 |
Token | other |
Token ID | 584 |
Feature activation | +6.04e-03 |
Pos logit contributions | |
Deal | +0.046 |
nam | +0.042 |
guys | +0.033 |
smartest | +0.031 |
cient | +0.030 |
Neg logit contributions | |
ores | -0.045 |
us | -0.045 |
ubs | -0.044 |
om | -0.044 |
ill | -0.043 |
Token | ." |
Token ID | 526 |
Feature activation | +1.09e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
om | -0.006 |
Matt | -0.006 |
ill | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +5.24e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
Please | +0.002 |
Really | +0.002 |
Sorry | +0.002 |
Neg logit contributions | |
ores | -0.001 |
ine | -0.001 |
us | -0.001 |
anging | -0.001 |
om | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +4.12e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
Fine | +0.008 |
Really | +0.008 |
Okay | +0.008 |
Neg logit contributions | |
ores | -0.006 |
anging | -0.005 |
ine | -0.005 |
ill | -0.005 |
om | -0.005 |
Token | L |
Token ID | 43 |
Feature activation | +2.26e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
Fine | +0.005 |
Okay | +0.005 |
guys | +0.005 |
Neg logit contributions | |
ores | -0.006 |
om | -0.006 |
us | -0.006 |
int | -0.006 |
ill | -0.006 |
Token | share |
Token ID | 2648 |
Feature activation | +5.97e-03 |
Pos logit contributions | |
us | +0.010 |
ores | +0.010 |
om | +0.010 |
anging | +0.009 |
int | +0.009 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.007 |
guys | -0.006 |
simplest | -0.005 |
Sorry | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +1.31e-03 |
Pos logit contributions | |
nam | +0.012 |
Deal | +0.011 |
guys | +0.010 |
songs | +0.009 |
games | +0.008 |
Neg logit contributions | |
ores | -0.008 |
anging | -0.008 |
itched | -0.007 |
Matt | -0.007 |
us | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +7.00e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ill | -0.002 |
ubs | -0.002 |
Token | kind |
Token ID | 1611 |
Feature activation | +5.79e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.008 |
cient | +0.008 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
om | -0.011 |
ubs | -0.011 |
ill | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -5.73e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
guys | +0.010 |
smartest | +0.009 |
simplest | +0.009 |
Neg logit contributions | |
ores | -0.007 |
us | -0.006 |
om | -0.006 |
Matt | -0.006 |
ubs | -0.006 |
Token | each |
Token ID | 1123 |
Feature activation | +2.77e-02 |
Pos logit contributions | |
ores | +0.009 |
us | +0.008 |
ubs | +0.008 |
om | +0.008 |
Josh | +0.008 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.007 |
smartest | -0.007 |
strongest | -0.007 |
Token | other |
Token ID | 584 |
Feature activation | +6.45e-03 |
Pos logit contributions | |
Deal | +0.038 |
nam | +0.035 |
guys | +0.028 |
smartest | +0.025 |
strongest | +0.024 |
Neg logit contributions | |
ores | -0.052 |
us | -0.050 |
om | -0.050 |
ubs | -0.048 |
ill | -0.048 |
Token | . |
Token ID | 13 |
Feature activation | +3.05e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
Matt | -0.009 |
om | -0.009 |
Matt | -0.009 |
Token | Do |
Token ID | 2141 |
Feature activation | -6.39e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
simplest | +0.004 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.004 |
ubs | -0.004 |
ill | -0.004 |
Token | you |
Token ID | 345 |
Feature activation | -8.05e-03 |
Pos logit contributions | |
ores | +0.009 |
us | +0.009 |
om | +0.009 |
� | +0.009 |
uts | +0.009 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.010 |
guys | -0.008 |
smartest | -0.008 |
strongest | -0.008 |
Token | understand |
Token ID | 1833 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
ores | +0.010 |
us | +0.010 |
om | +0.009 |
Matt | +0.009 |
uts | +0.009 |
Neg logit contributions | |
Deal | -0.016 |
nam | -0.016 |
guys | -0.014 |
smartest | -0.013 |
simplest | -0.013 |
Token | be |
Token ID | 307 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
ores | +0.009 |
us | +0.009 |
om | +0.009 |
ubs | +0.008 |
ill | +0.008 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.008 |
guys | -0.007 |
smartest | -0.006 |
simplest | -0.006 |
Token | kind |
Token ID | 1611 |
Feature activation | +8.09e-03 |
Pos logit contributions | |
Deal | +0.017 |
nam | +0.017 |
guys | +0.014 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.018 |
us | -0.018 |
om | -0.017 |
ill | -0.017 |
uts | -0.017 |
Token | and |
Token ID | 290 |
Feature activation | +9.08e-03 |
Pos logit contributions | |
Deal | +0.021 |
nam | +0.021 |
guys | +0.018 |
smartest | +0.018 |
strongest | +0.017 |
Neg logit contributions | |
ores | -0.005 |
us | -0.004 |
om | -0.004 |
ill | -0.004 |
ubs | -0.004 |
Token | friendly |
Token ID | 8030 |
Feature activation | +7.34e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.009 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.016 |
om | -0.015 |
us | -0.014 |
� | -0.014 |
int | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -3.48e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.010 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.011 |
us | -0.010 |
om | -0.010 |
ill | -0.010 |
ubs | -0.010 |
Token | each |
Token ID | 1123 |
Feature activation | +2.71e-02 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
ubs | +0.003 |
ill | +0.003 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.006 |
strongest | -0.006 |
Token | other |
Token ID | 584 |
Feature activation | +7.78e-03 |
Pos logit contributions | |
Deal | +0.039 |
nam | +0.036 |
guys | +0.028 |
smartest | +0.026 |
strongest | +0.025 |
Neg logit contributions | |
ores | -0.049 |
us | -0.048 |
om | -0.047 |
ubs | -0.046 |
ill | -0.046 |
Token | too |
Token ID | 1165 |
Feature activation | +6.37e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.010 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
om | -0.011 |
ill | -0.011 |
ubs | -0.011 |
Token | ?" |
Token ID | 1701 |
Feature activation | -3.93e-04 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.007 |
smartest | +0.007 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.011 |
om | -0.011 |
us | -0.011 |
ubs | -0.010 |
ill | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +2.22e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
anging | +0.001 |
ine | +0.000 |
ge | +0.000 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
Please | -0.001 |
Really | -0.001 |
Fine | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
Really | +0.003 |
OK | +0.003 |
Fine | +0.003 |
Neg logit contributions | |
ores | -0.003 |
anging | -0.003 |
ill | -0.003 |
ine | -0.003 |
int | -0.002 |
Token | need |
Token ID | 761 |
Feature activation | +1.84e-03 |
Pos logit contributions | |
ores | +0.009 |
om | +0.009 |
us | +0.009 |
� | +0.009 |
s | +0.008 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
guys | -0.010 |
smartest | -0.010 |
strongest | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | +4.52e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | be |
Token ID | 307 |
Feature activation | +7.39e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.004 |
simplest | +0.004 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.008 |
ill | -0.007 |
anging | -0.007 |
Token | nice |
Token ID | 3621 |
Feature activation | +2.56e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.010 |
cient | +0.010 |
Neg logit contributions | |
ores | -0.011 |
us | -0.010 |
om | -0.010 |
ubs | -0.010 |
� | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -1.77e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
simplest | +0.005 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
Matt | -0.002 |
ubs | -0.002 |
Token | each |
Token ID | 1123 |
Feature activation | +2.69e-02 |
Pos logit contributions | |
ores | +0.002 |
ubs | +0.002 |
us | +0.002 |
Josh | +0.002 |
om | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.002 |
Token | other |
Token ID | 584 |
Feature activation | +7.53e-03 |
Pos logit contributions | |
Deal | +0.042 |
nam | +0.040 |
guys | +0.031 |
smartest | +0.029 |
simplest | +0.028 |
Neg logit contributions | |
ores | -0.045 |
us | -0.044 |
om | -0.043 |
ubs | -0.042 |
ill | -0.042 |
Token | . |
Token ID | 13 |
Feature activation | +5.84e-03 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.016 |
guys | +0.014 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
om | -0.007 |
ill | -0.007 |
Matt | -0.007 |
Token | You |
Token ID | 921 |
Feature activation | -6.28e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.008 |
� | -0.008 |
Josh | -0.007 |
Token | need |
Token ID | 761 |
Feature activation | +2.45e-03 |
Pos logit contributions | |
ores | +0.008 |
� | +0.008 |
om | +0.008 |
us | +0.008 |
s | +0.007 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.012 |
guys | -0.009 |
smartest | -0.009 |
strongest | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | +4.69e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.002 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | share |
Token ID | 2648 |
Feature activation | +8.56e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.003 |
om | +0.003 |
ill | +0.003 |
� | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +1.94e-05 |
Pos logit contributions | |
nam | +0.016 |
Deal | +0.016 |
guys | +0.014 |
simplest | +0.012 |
nic | +0.012 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
om | -0.011 |
anging | -0.011 |
Matt | -0.010 |
Token | be |
Token ID | 307 |
Feature activation | +9.16e-03 |
Pos logit contributions | |
Deal | +0.000 |
nam | +0.000 |
guys | +0.000 |
smartest | +0.000 |
simplest | +0.000 |
Neg logit contributions | |
ores | -0.000 |
us | -0.000 |
om | -0.000 |
anging | -0.000 |
ill | -0.000 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.016 |
us | -0.015 |
om | -0.015 |
ubs | -0.014 |
ill | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -4.36e-04 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
om | -0.006 |
ubs | -0.005 |
ill | -0.005 |
Token | each |
Token ID | 1123 |
Feature activation | +2.67e-02 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
it | +0.001 |
them | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
guys | -0.001 |
Token | other |
Token ID | 584 |
Feature activation | +8.35e-03 |
Pos logit contributions | |
Deal | +0.039 |
nam | +0.037 |
guys | +0.029 |
smartest | +0.027 |
strongest | +0.025 |
Neg logit contributions | |
ores | -0.048 |
us | -0.047 |
om | -0.046 |
ubs | -0.045 |
ill | -0.044 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.13e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.014 |
guys | +0.011 |
smartest | +0.011 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.012 |
us | -0.012 |
om | -0.011 |
ill | -0.011 |
� | -0.011 |
Token | Mom |
Token ID | 11254 |
Feature activation | -2.71e-03 |
Pos logit contributions | |
nam | +0.004 |
Deal | +0.003 |
Sorry | +0.003 |
guys | +0.002 |
smartest | +0.002 |
Neg logit contributions | |
us | -0.004 |
ores | -0.003 |
ork | -0.003 |
uts | -0.003 |
om | -0.003 |
Token | said |
Token ID | 531 |
Feature activation | +2.55e-03 |
Pos logit contributions | |
ores | +0.004 |
ork | +0.004 |
ubs | +0.004 |
alks | +0.004 |
acks | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.003 |
nic | -0.003 |
smartest | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | -9.79e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.003 |
Matt | -0.003 |
us | -0.003 |
ubs | -0.003 |
om | -0.003 |
Token | you |
Token ID | 345 |
Feature activation | -5.48e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.014 |
guys | +0.012 |
smartest | +0.011 |
cient | +0.010 |
Neg logit contributions | |
ores | -0.015 |
om | -0.014 |
� | -0.014 |
us | -0.014 |
ill | -0.013 |
Token | can |
Token ID | 460 |
Feature activation | +3.04e-03 |
Pos logit contributions | |
ores | +0.007 |
om | +0.007 |
� | +0.007 |
us | +0.007 |
ill | +0.007 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.010 |
guys | -0.008 |
smartest | -0.008 |
strongest | -0.008 |
Token | be |
Token ID | 307 |
Feature activation | +9.29e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
ubs | -0.005 |
ill | -0.005 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.53e-03 |
Pos logit contributions | |
Deal | +0.018 |
nam | +0.017 |
guys | +0.014 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.013 |
us | -0.012 |
om | -0.012 |
ubs | -0.011 |
ill | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -3.16e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.005 |
us | -0.004 |
Matt | -0.004 |
itched | -0.004 |
om | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.63e-02 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
Josh | +0.004 |
ubs | +0.004 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.005 |
simplest | -0.004 |
Token | other |
Token ID | 584 |
Feature activation | +9.67e-03 |
Pos logit contributions | |
Deal | +0.041 |
nam | +0.039 |
guys | +0.030 |
smartest | +0.028 |
simplest | +0.028 |
Neg logit contributions | |
us | -0.044 |
om | -0.043 |
ores | -0.043 |
ubs | -0.041 |
ill | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | +5.11e-03 |
Pos logit contributions | |
Deal | +0.019 |
nam | +0.018 |
guys | +0.016 |
smartest | +0.014 |
strongest | +0.014 |
Neg logit contributions | |
ores | -0.013 |
us | -0.012 |
om | -0.012 |
ubs | -0.011 |
Matt | -0.011 |
Token | That |
Token ID | 1320 |
Feature activation | -9.65e-04 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
cient | +0.007 |
Neg logit contributions | |
ores | -0.007 |
� | -0.007 |
om | -0.006 |
us | -0.006 |
Josh | -0.006 |
Token | is |
Token ID | 318 |
Feature activation | +6.13e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.001 |
strongest | -0.001 |
Token | fair |
Token ID | 3148 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
cient | +0.010 |
smartest | +0.010 |
Neg logit contributions | |
ores | -0.007 |
� | -0.006 |
om | -0.006 |
us | -0.006 |
Josh | -0.005 |
Token | share |
Token ID | 2648 |
Feature activation | +7.11e-03 |
Pos logit contributions | |
ores | +0.008 |
us | +0.008 |
om | +0.008 |
anging | +0.007 |
int | +0.007 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.008 |
guys | -0.007 |
smartest | -0.006 |
simplest | -0.006 |
Token | and |
Token ID | 290 |
Feature activation | -7.38e-04 |
Pos logit contributions | |
nam | +0.015 |
Deal | +0.014 |
guys | +0.013 |
fart | +0.011 |
simplest | +0.011 |
Neg logit contributions | |
ores | -0.009 |
us | -0.008 |
anging | -0.008 |
Matt | -0.007 |
ill | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +6.74e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.53e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.008 |
cient | +0.008 |
Neg logit contributions | |
ores | -0.011 |
om | -0.010 |
us | -0.010 |
ubs | -0.010 |
� | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -2.84e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
Matt | -0.004 |
int | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
ores | +0.003 |
ubs | +0.003 |
it | +0.003 |
us | +0.003 |
om | +0.003 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
nic | -0.004 |
Token | other |
Token ID | 584 |
Feature activation | +7.40e-03 |
Pos logit contributions | |
Deal | +0.041 |
nam | +0.038 |
guys | +0.030 |
smartest | +0.028 |
simplest | +0.027 |
Neg logit contributions | |
us | -0.044 |
ores | -0.044 |
om | -0.043 |
ubs | -0.042 |
s | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | +3.66e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.011 |
us | -0.011 |
om | -0.010 |
Matt | -0.010 |
ill | -0.010 |
Token | You |
Token ID | 921 |
Feature activation | -8.38e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.005 |
om | -0.005 |
us | -0.005 |
� | -0.005 |
ubs | -0.005 |
Token | are |
Token ID | 389 |
Feature activation | +5.28e-03 |
Pos logit contributions | |
� | +0.012 |
ores | +0.012 |
om | +0.012 |
us | +0.011 |
s | +0.011 |
Neg logit contributions | |
Deal | -0.015 |
nam | -0.014 |
smartest | -0.011 |
guys | -0.011 |
simplest | -0.011 |
Token | twins |
Token ID | 20345 |
Feature activation | +1.66e-02 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.010 |
Okay | +0.009 |
guys | +0.009 |
cient | +0.009 |
Neg logit contributions | |
ores | -0.006 |
� | -0.005 |
it | -0.005 |
us | -0.005 |
om | -0.005 |
Token | share |
Token ID | 2648 |
Feature activation | +6.77e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
om | -0.006 |
ill | -0.005 |
ubs | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -3.20e-03 |
Pos logit contributions | |
nam | +0.014 |
Deal | +0.014 |
guys | +0.012 |
fart | +0.011 |
simplest | +0.011 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.007 |
Matt | -0.007 |
anging | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +6.47e-03 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
om | +0.005 |
ill | +0.005 |
ubs | +0.005 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.004 |
guys | -0.004 |
smartest | -0.003 |
simplest | -0.003 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
guys | +0.009 |
cient | +0.008 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.010 |
om | -0.009 |
ubs | -0.009 |
us | -0.009 |
� | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -4.78e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.005 |
us | -0.004 |
om | -0.004 |
Matt | -0.004 |
ubs | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.62e-02 |
Pos logit contributions | |
them | +0.005 |
it | +0.005 |
ubs | +0.005 |
ores | +0.005 |
their | +0.005 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
nic | -0.008 |
Token | other |
Token ID | 584 |
Feature activation | +7.56e-03 |
Pos logit contributions | |
Deal | +0.039 |
nam | +0.037 |
guys | +0.029 |
smartest | +0.027 |
simplest | +0.026 |
Neg logit contributions | |
ores | -0.046 |
us | -0.044 |
om | -0.044 |
ubs | -0.043 |
ill | -0.043 |
Token | ." |
Token ID | 526 |
Feature activation | -7.22e-04 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
guys | +0.012 |
smartest | +0.011 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.011 |
us | -0.010 |
om | -0.010 |
Matt | -0.010 |
ubs | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +3.68e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
ine | +0.001 |
anging | +0.001 |
acks | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
Sorry | -0.001 |
Really | -0.001 |
Please | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +2.19e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
Sorry | +0.006 |
Okay | +0.006 |
Really | +0.006 |
Neg logit contributions | |
ores | -0.004 |
ill | -0.004 |
int | -0.004 |
ine | -0.004 |
anging | -0.004 |
Token | She |
Token ID | 3347 |
Feature activation | +7.63e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
Okay | +0.003 |
Fine | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
int | -0.003 |
ill | -0.003 |
Token | ? |
Token ID | 30 |
Feature activation | +1.59e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
ubs | -0.005 |
ill | -0.005 |
Token | Why |
Token ID | 4162 |
Feature activation | +7.79e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
Sorry | +0.001 |
guys | +0.001 |
smartest | +0.001 |
Neg logit contributions | |
ores | -0.003 |
ubs | -0.003 |
int | -0.003 |
ill | -0.003 |
us | -0.003 |
Token | are |
Token ID | 389 |
Feature activation | -9.95e-04 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.016 |
us | -0.015 |
om | -0.015 |
int | -0.015 |
ubs | -0.014 |
Token | you |
Token ID | 345 |
Feature activation | -6.95e-04 |
Pos logit contributions | |
ores | +0.002 |
us | +0.001 |
om | +0.001 |
� | +0.001 |
Josh | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | hurting |
Token ID | 21530 |
Feature activation | +5.67e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
acks | +0.001 |
ork | +0.001 |
ill | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | each |
Token ID | 1123 |
Feature activation | +2.61e-02 |
Pos logit contributions | |
nam | +0.010 |
Deal | +0.010 |
guys | +0.008 |
smartest | +0.008 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.008 |
om | -0.008 |
int | -0.008 |
us | -0.008 |
anging | -0.007 |
Token | other |
Token ID | 584 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
Deal | +0.033 |
nam | +0.031 |
guys | +0.024 |
smartest | +0.021 |
strongest | +0.021 |
Neg logit contributions | |
ores | -0.053 |
us | -0.050 |
om | -0.049 |
ill | -0.048 |
int | -0.048 |
Token | ? |
Token ID | 30 |
Feature activation | +2.93e-03 |
Pos logit contributions | |
Deal | +0.028 |
nam | +0.027 |
guys | +0.024 |
smartest | +0.023 |
strongest | +0.022 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
om | -0.007 |
ubs | -0.007 |
ill | -0.007 |
Token | You |
Token ID | 921 |
Feature activation | -5.97e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
Sorry | +0.003 |
guys | +0.002 |
smartest | +0.002 |
Neg logit contributions | |
ores | -0.006 |
ubs | -0.006 |
int | -0.006 |
us | -0.005 |
ill | -0.005 |
Token | should |
Token ID | 815 |
Feature activation | -6.42e-03 |
Pos logit contributions | |
ores | +0.010 |
us | +0.009 |
om | +0.009 |
ubs | +0.009 |
ill | +0.009 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.007 |
smartest | -0.007 |
strongest | -0.007 |
Token | share |
Token ID | 2648 |
Feature activation | +7.27e-03 |
Pos logit contributions | |
us | +0.011 |
ores | +0.011 |
om | +0.011 |
int | +0.010 |
anging | +0.010 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.008 |
Sorry | -0.007 |
smartest | -0.007 |
Token | You |
Token ID | 921 |
Feature activation | -7.28e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.007 |
om | -0.006 |
� | -0.006 |
us | -0.006 |
ubs | -0.006 |
Token | should |
Token ID | 815 |
Feature activation | -6.67e-03 |
Pos logit contributions | |
ores | +0.011 |
om | +0.010 |
us | +0.010 |
� | +0.010 |
s | +0.010 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
guys | -0.010 |
smartest | -0.010 |
strongest | -0.009 |
Token | be |
Token ID | 307 |
Feature activation | +9.64e-03 |
Pos logit contributions | |
ores | +0.012 |
us | +0.012 |
om | +0.012 |
ill | +0.011 |
ubs | +0.011 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.007 |
smartest | -0.007 |
simplest | -0.006 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.65e-03 |
Pos logit contributions | |
Deal | +0.018 |
nam | +0.017 |
guys | +0.017 |
cient | +0.015 |
ode | +0.014 |
Neg logit contributions | |
ores | -0.012 |
late | -0.011 |
their | -0.011 |
and | -0.011 |
it | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -3.35e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.009 |
simplest | +0.008 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
om | -0.004 |
Matt | -0.004 |
ubs | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
it | +0.003 |
ores | +0.003 |
ubs | +0.003 |
them | +0.003 |
om | +0.003 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
smartest | -0.006 |
nic | -0.006 |
strongest | -0.006 |
Token | other |
Token ID | 584 |
Feature activation | +6.56e-03 |
Pos logit contributions | |
Deal | +0.046 |
nam | +0.043 |
guys | +0.034 |
smartest | +0.033 |
nic | +0.033 |
Neg logit contributions | |
om | -0.037 |
s | -0.036 |
us | -0.036 |
ubs | -0.036 |
and | -0.035 |
Token | ." |
Token ID | 526 |
Feature activation | +6.07e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.009 |
us | -0.008 |
om | -0.008 |
Matt | -0.008 |
ill | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
Sorry | +0.011 |
guys | +0.011 |
simplest | +0.011 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
ine | -0.005 |
anging | -0.005 |
om | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | +4.39e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.013 |
OK | +0.011 |
Okay | +0.011 |
Fine | +0.011 |
Neg logit contributions | |
ores | -0.007 |
anging | -0.007 |
ill | -0.007 |
ine | -0.007 |
om | -0.006 |
Token | Anna |
Token ID | 31160 |
Feature activation | -3.11e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.006 |
om | -0.006 |
us | -0.006 |
ubs | -0.005 |
ill | -0.005 |
Token | share |
Token ID | 2648 |
Feature activation | +6.71e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.006 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.009 |
om | -0.009 |
us | -0.009 |
ubs | -0.009 |
ill | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -3.04e-03 |
Pos logit contributions | |
nam | +0.014 |
Deal | +0.014 |
guys | +0.012 |
simplest | +0.011 |
fart | +0.011 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
Matt | -0.007 |
anging | -0.007 |
om | -0.007 |
Token | be |
Token ID | 307 |
Feature activation | +6.40e-03 |
Pos logit contributions | |
ores | +0.005 |
us | +0.005 |
om | +0.005 |
ubs | +0.005 |
ill | +0.005 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.004 |
smartest | -0.003 |
strongest | -0.003 |
Token | nice |
Token ID | 3621 |
Feature activation | +3.75e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.009 |
cient | +0.009 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.009 |
om | -0.009 |
ubs | -0.009 |
late | -0.008 |
their | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -5.66e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
om | -0.004 |
Matt | -0.004 |
ill | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.59e-02 |
Pos logit contributions | |
ubs | +0.006 |
ores | +0.006 |
it | +0.006 |
them | +0.006 |
Josh | +0.006 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.011 |
smartest | -0.009 |
strongest | -0.009 |
nic | -0.009 |
Token | other |
Token ID | 584 |
Feature activation | +6.75e-03 |
Pos logit contributions | |
Deal | +0.041 |
nam | +0.038 |
guys | +0.030 |
smartest | +0.028 |
simplest | +0.027 |
Neg logit contributions | |
us | -0.043 |
ores | -0.042 |
om | -0.042 |
ubs | -0.041 |
s | -0.039 |
Token | ." |
Token ID | 526 |
Feature activation | +4.10e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.014 |
guys | +0.012 |
smartest | +0.012 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
om | -0.007 |
ill | -0.006 |
Matt | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +6.19e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
Sorry | +0.007 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.005 |
anging | -0.004 |
ine | -0.004 |
hovering | -0.004 |
om | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
OK | +0.009 |
Sorry | +0.009 |
guys | +0.009 |
Neg logit contributions | |
anging | -0.007 |
ine | -0.006 |
ores | -0.006 |
ill | -0.006 |
int | -0.006 |
Token | L |
Token ID | 43 |
Feature activation | +2.14e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
Okay | +0.004 |
OK | +0.004 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
om | -0.005 |
anging | -0.005 |
int | -0.005 |
uts | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +5.64e-03 |
Pos logit contributions | |
us | +0.007 |
ores | +0.007 |
uts | +0.006 |
om | +0.006 |
ork | +0.006 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.008 |
guys | -0.007 |
smartest | -0.006 |
simplest | -0.006 |
Token | m |
Token ID | 285 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.008 |
om | -0.008 |
us | -0.008 |
� | -0.008 |
s | -0.007 |
Token | ama |
Token ID | 1689 |
Feature activation | +7.89e-03 |
Pos logit contributions | |
Deal | +0.031 |
nam | +0.028 |
guys | +0.024 |
smartest | +0.024 |
cient | +0.024 |
Neg logit contributions | |
ores | -0.018 |
ill | -0.016 |
ubs | -0.016 |
acks | -0.015 |
int | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | -2.29e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.011 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.011 |
acks | -0.011 |
irs | -0.011 |
int | -0.010 |
ork | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +9.37e-04 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
ill | +0.002 |
ubs | +0.002 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
Token | pap |
Token ID | 20461 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
om | -0.001 |
us | -0.001 |
� | -0.001 |
s | -0.001 |
Token | a |
Token ID | 64 |
Feature activation | +5.51e-03 |
Pos logit contributions | |
Deal | +0.058 |
nam | +0.054 |
guys | +0.048 |
smartest | +0.046 |
strongest | +0.044 |
Neg logit contributions | |
ores | -0.027 |
om | -0.023 |
ubs | -0.023 |
Matt | -0.022 |
ill | -0.022 |
Token | who |
Token ID | 508 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
ill | -0.005 |
ubs | -0.005 |
Token | loved |
Token ID | 6151 |
Feature activation | -6.86e-04 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
om | +0.006 |
ill | +0.006 |
ubs | +0.006 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | each |
Token ID | 1123 |
Feature activation | +1.53e-02 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | other |
Token ID | 584 |
Feature activation | +3.71e-03 |
Pos logit contributions | |
Deal | +0.023 |
nam | +0.022 |
guys | +0.017 |
smartest | +0.016 |
simplest | +0.015 |
Neg logit contributions | |
ores | -0.026 |
us | -0.026 |
om | -0.025 |
ubs | -0.024 |
ill | -0.024 |
Token | you |
Token ID | 345 |
Feature activation | -3.38e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.002 |
om | -0.002 |
ubs | -0.002 |
ill | -0.002 |
Token | are |
Token ID | 389 |
Feature activation | +5.72e-03 |
Pos logit contributions | |
� | +0.005 |
us | +0.004 |
ores | +0.004 |
om | +0.004 |
s | +0.004 |
Neg logit contributions | |
nam | -0.006 |
Deal | -0.006 |
smartest | -0.005 |
guys | -0.005 |
strongest | -0.005 |
Token | lucky |
Token ID | 9670 |
Feature activation | -6.98e-04 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
guys | +0.008 |
smartest | +0.008 |
simplest | +0.008 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.008 |
ubs | -0.007 |
� | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | have |
Token ID | 423 |
Feature activation | +4.05e-04 |
Pos logit contributions | |
ores | +0.003 |
us | +0.003 |
om | +0.003 |
ubs | +0.003 |
ill | +0.003 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.002 |
strongest | -0.002 |
Token | each |
Token ID | 1123 |
Feature activation | +2.58e-02 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.000 |
� | -0.000 |
Token | other |
Token ID | 584 |
Feature activation | +6.28e-03 |
Pos logit contributions | |
Deal | +0.044 |
nam | +0.042 |
guys | +0.033 |
smartest | +0.031 |
cient | +0.031 |
Neg logit contributions | |
us | -0.039 |
om | -0.038 |
ores | -0.036 |
and | -0.036 |
� | -0.036 |
Token | ." |
Token ID | 526 |
Feature activation | +5.41e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
guys | +0.011 |
smartest | +0.011 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.007 |
us | -0.006 |
om | -0.006 |
ubs | -0.006 |
ill | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +5.17e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.009 |
Please | +0.007 |
Really | +0.007 |
OK | +0.007 |
Neg logit contributions | |
ores | -0.008 |
ine | -0.007 |
anging | -0.007 |
ake | -0.007 |
iced | -0.007 |
Token |
|
Token ID | 198 |
Feature activation | +4.38e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
Really | +0.007 |
OK | +0.007 |
Okay | +0.007 |
Neg logit contributions | |
ores | -0.007 |
anging | -0.006 |
ine | -0.006 |
int | -0.006 |
ill | -0.006 |
Token | L |
Token ID | 43 |
Feature activation | +2.24e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
Okay | +0.005 |
Fine | +0.004 |
OK | +0.004 |
Neg logit contributions | |
ores | -0.008 |
int | -0.008 |
om | -0.007 |
us | -0.007 |
Matt | -0.007 |
Token | We |
Token ID | 775 |
Feature activation | -8.14e-03 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.016 |
guys | +0.013 |
smartest | +0.012 |
strongest | +0.012 |
Neg logit contributions | |
ores | -0.010 |
� | -0.009 |
om | -0.009 |
us | -0.009 |
Josh | -0.008 |
Token | will |
Token ID | 481 |
Feature activation | +7.11e-03 |
Pos logit contributions | |
ores | +0.011 |
om | +0.011 |
� | +0.011 |
s | +0.011 |
us | +0.011 |
Neg logit contributions | |
nam | -0.014 |
Deal | -0.014 |
guys | -0.011 |
smartest | -0.011 |
strongest | -0.011 |
Token | be |
Token ID | 307 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.011 |
us | -0.011 |
om | -0.011 |
ubs | -0.010 |
ill | -0.010 |
Token | nice |
Token ID | 3621 |
Feature activation | +1.73e-03 |
Pos logit contributions | |
Deal | +0.020 |
nam | +0.019 |
guys | +0.016 |
cient | +0.015 |
smartest | +0.015 |
Neg logit contributions | |
ores | -0.015 |
us | -0.014 |
om | -0.014 |
ubs | -0.013 |
ill | -0.013 |
Token | to |
Token ID | 284 |
Feature activation | -1.63e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.003 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
Matt | -0.002 |
ubs | -0.002 |
Token | each |
Token ID | 1123 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
ores | +0.002 |
it | +0.002 |
them | +0.002 |
us | +0.002 |
� | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
simplest | -0.003 |
Token | other |
Token ID | 584 |
Feature activation | +7.52e-03 |
Pos logit contributions | |
Deal | +0.044 |
nam | +0.042 |
guys | +0.033 |
smartest | +0.032 |
strongest | +0.031 |
Neg logit contributions | |
us | -0.039 |
ores | -0.038 |
s | -0.037 |
om | -0.037 |
ubs | -0.037 |
Token | ." |
Token ID | 526 |
Feature activation | +2.88e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.009 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.012 |
us | -0.012 |
om | -0.011 |
Matt | -0.011 |
ubs | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | +3.21e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
Sorry | +0.005 |
OK | +0.005 |
Okay | +0.005 |
Neg logit contributions | |
ge | -0.003 |
us | -0.003 |
ores | -0.003 |
ine | -0.003 |
anging | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +3.30e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
Sorry | +0.005 |
OK | +0.005 |
Really | +0.005 |
Neg logit contributions | |
anging | -0.003 |
ill | -0.003 |
ge | -0.003 |
ores | -0.003 |
int | -0.003 |
Token | Mom |
Token ID | 29252 |
Feature activation | -3.40e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
Okay | +0.004 |
Sorry | +0.003 |
OK | +0.003 |
Neg logit contributions | |
ores | -0.006 |
int | -0.005 |
anging | -0.005 |
om | -0.005 |
ubs | -0.005 |
Token | share |
Token ID | 2648 |
Feature activation | +5.42e-03 |
Pos logit contributions | |
ores | +0.011 |
us | +0.011 |
om | +0.011 |
int | +0.010 |
ill | +0.010 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.008 |
Sorry | -0.007 |
smartest | -0.007 |
Token | and |
Token ID | 290 |
Feature activation | +8.23e-04 |
Pos logit contributions | |
nam | +0.011 |
Deal | +0.010 |
guys | +0.010 |
songs | +0.008 |
fart | +0.008 |
Neg logit contributions | |
ores | -0.007 |
us | -0.006 |
anging | -0.006 |
int | -0.006 |
itched | -0.006 |
Token | be |
Token ID | 307 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ill | -0.001 |
ubs | -0.001 |
Token | nice |
Token ID | 3621 |
Feature activation | +4.62e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.009 |
cient | +0.009 |
Neg logit contributions | |
ores | -0.013 |
om | -0.013 |
us | -0.013 |
ubs | -0.012 |
� | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | -3.33e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.008 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
Matt | -0.005 |
int | -0.004 |
Token | each |
Token ID | 1123 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
ores | +0.004 |
ubs | +0.004 |
us | +0.004 |
om | +0.004 |
Josh | +0.004 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.005 |
nic | -0.005 |
Token | other |
Token ID | 584 |
Feature activation | +7.21e-03 |
Pos logit contributions | |
Deal | +0.038 |
nam | +0.035 |
guys | +0.028 |
smartest | +0.026 |
simplest | +0.024 |
Neg logit contributions | |
ores | -0.046 |
us | -0.045 |
om | -0.044 |
ubs | -0.043 |
ill | -0.042 |
Token | ." |
Token ID | 526 |
Feature activation | +7.28e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.013 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.010 |
us | -0.010 |
om | -0.010 |
Matt | -0.009 |
ill | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +4.19e-03 |
Pos logit contributions | |
nam | +0.015 |
Deal | +0.014 |
Sorry | +0.013 |
Really | +0.011 |
guys | +0.011 |
Neg logit contributions | |
ores | -0.009 |
anging | -0.008 |
ine | -0.008 |
us | -0.008 |
int | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +1.53e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.007 |
Really | +0.006 |
Fine | +0.006 |
OK | +0.006 |
Neg logit contributions | |
ores | -0.006 |
anging | -0.005 |
int | -0.005 |
ill | -0.005 |
ine | -0.005 |
Token | Anna |
Token ID | 31160 |
Feature activation | -4.22e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
Okay | +0.002 |
Fine | +0.002 |
OK | +0.002 |
Neg logit contributions | |
ores | -0.003 |
int | -0.003 |
anging | -0.003 |
om | -0.003 |
acks | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +2.80e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.004 |
Matt | -0.004 |
om | -0.004 |
us | -0.004 |
ubs | -0.004 |
Token | still |
Token ID | 991 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.004 |
ill | -0.004 |
ubs | -0.004 |
Token | be |
Token ID | 307 |
Feature activation | +4.91e-03 |
Pos logit contributions | |
Deal | +0.025 |
nam | +0.024 |
guys | +0.021 |
smartest | +0.019 |
strongest | +0.018 |
Neg logit contributions | |
ores | -0.023 |
us | -0.023 |
om | -0.022 |
Matt | -0.021 |
ill | -0.021 |
Token | nice |
Token ID | 3621 |
Feature activation | +2.73e-03 |
Pos logit contributions | |
nam | +0.008 |
Deal | +0.007 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
int | -0.008 |
ill | -0.008 |
om | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -2.61e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
simplest | +0.005 |
Neg logit contributions | |
ores | -0.003 |
us | -0.002 |
Matt | -0.002 |
om | -0.002 |
itched | -0.002 |
Token | each |
Token ID | 1123 |
Feature activation | +2.57e-02 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
ubs | +0.004 |
om | +0.004 |
Josh | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.004 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
Token | other |
Token ID | 584 |
Feature activation | +7.89e-03 |
Pos logit contributions | |
Deal | +0.040 |
nam | +0.037 |
guys | +0.029 |
smartest | +0.027 |
simplest | +0.026 |
Neg logit contributions | |
ores | -0.043 |
us | -0.043 |
om | -0.042 |
ubs | -0.041 |
ill | -0.040 |
Token | . |
Token ID | 13 |
Feature activation | +3.81e-03 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.016 |
guys | +0.014 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.009 |
us | -0.009 |
Matt | -0.008 |
om | -0.008 |
ubs | -0.008 |
Token | Mia |
Token ID | 32189 |
Feature activation | +7.90e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
� | -0.005 |
ubs | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +5.10e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
guys | +0.011 |
smartest | +0.010 |
simplest | +0.010 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
ubs | -0.011 |
om | -0.011 |
ill | -0.011 |
Token | you |
Token ID | 345 |
Feature activation | -5.46e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.004 |
Neg logit contributions | |
us | -0.010 |
ores | -0.010 |
om | -0.010 |
itched | -0.010 |
ubs | -0.009 |
Token | happy |
Token ID | 3772 |
Feature activation | -1.97e-03 |
Pos logit contributions | |
nam | +0.005 |
Deal | +0.005 |
smartest | +0.004 |
strongest | +0.004 |
happiest | +0.004 |
Neg logit contributions | |
us | -0.006 |
ork | -0.006 |
om | -0.006 |
acks | -0.006 |
udge | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | -2.86e-03 |
Pos logit contributions | |
us | +0.002 |
ores | +0.002 |
om | +0.002 |
ubs | +0.002 |
irs | +0.002 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.003 |
songs | -0.003 |
smartest | -0.003 |
Token | be |
Token ID | 307 |
Feature activation | +1.11e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
ubs | +0.004 |
anging | +0.004 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.004 |
guys | -0.004 |
smartest | -0.004 |
Sorry | -0.003 |
Token | married |
Token ID | 6405 |
Feature activation | +6.60e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
int | -0.002 |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ork | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | +3.46e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.014 |
guys | +0.013 |
smartest | +0.012 |
strongest | +0.012 |
Neg logit contributions | |
ores | -0.006 |
om | -0.006 |
ubs | -0.006 |
us | -0.006 |
anging | -0.006 |
Token | each |
Token ID | 1123 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ill | -0.003 |
ubs | -0.003 |
Token | other |
Token ID | 584 |
Feature activation | +8.14e-03 |
Pos logit contributions | |
Deal | +0.030 |
nam | +0.027 |
guys | +0.022 |
smartest | +0.020 |
strongest | +0.019 |
Neg logit contributions | |
ores | -0.054 |
om | -0.051 |
us | -0.051 |
uts | -0.050 |
ubs | -0.049 |
Token | . |
Token ID | 13 |
Feature activation | -8.29e-04 |
Pos logit contributions | |
Deal | +0.017 |
nam | +0.016 |
guys | +0.015 |
smartest | +0.013 |
songs | +0.013 |
Neg logit contributions | |
ores | -0.010 |
Matt | -0.009 |
us | -0.009 |
ubs | -0.009 |
om | -0.009 |
Token | They |
Token ID | 1119 |
Feature activation | +4.75e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.002 |
simplest | -0.001 |
Token | were |
Token ID | 547 |
Feature activation | +3.80e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.007 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.007 |
� | -0.006 |
us | -0.006 |
om | -0.006 |
ill | -0.006 |
Token | now |
Token ID | 783 |
Feature activation | +7.43e-04 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
happiest | +0.005 |
Neg logit contributions | |
us | -0.006 |
ork | -0.006 |
om | -0.006 |
ores | -0.006 |
acks | -0.006 |
Token | share |
Token ID | 2648 |
Feature activation | +8.51e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.006 |
smartest | +0.006 |
cient | +0.006 |
Neg logit contributions | |
ores | -0.009 |
ubs | -0.008 |
ill | -0.008 |
us | -0.008 |
om | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -4.13e-03 |
Pos logit contributions | |
nam | +0.016 |
Deal | +0.016 |
guys | +0.013 |
fart | +0.011 |
smartest | +0.011 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
Matt | -0.011 |
anging | -0.011 |
itched | -0.011 |
Token | be |
Token ID | 307 |
Feature activation | +7.32e-03 |
Pos logit contributions | |
ores | +0.008 |
us | +0.007 |
om | +0.007 |
ill | +0.007 |
anging | +0.007 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.004 |
simplest | -0.004 |
Token | nice |
Token ID | 3621 |
Feature activation | +6.12e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
guys | +0.010 |
cient | +0.009 |
smartest | +0.009 |
Neg logit contributions | |
ores | -0.011 |
om | -0.011 |
ubs | -0.011 |
us | -0.011 |
� | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -4.72e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.009 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
itched | -0.007 |
Matt | -0.007 |
om | -0.007 |
Token | each |
Token ID | 1123 |
Feature activation | +2.56e-02 |
Pos logit contributions | |
them | +0.007 |
ubs | +0.007 |
it | +0.006 |
ores | +0.006 |
their | +0.006 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.008 |
smartest | -0.007 |
strongest | -0.006 |
nic | -0.006 |
Token | other |
Token ID | 584 |
Feature activation | +6.84e-03 |
Pos logit contributions | |
Deal | +0.038 |
nam | +0.036 |
guys | +0.028 |
smartest | +0.026 |
simplest | +0.025 |
Neg logit contributions | |
ores | -0.045 |
us | -0.044 |
om | -0.043 |
ubs | -0.042 |
ill | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | +4.66e-04 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
om | -0.009 |
Matt | -0.009 |
ubs | -0.008 |
Token | If |
Token ID | 1002 |
Feature activation | +7.94e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | you |
Token ID | 345 |
Feature activation | -6.64e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.010 |
cient | +0.010 |
Neg logit contributions | |
ores | -0.012 |
it | -0.011 |
us | -0.011 |
� | -0.011 |
Josh | -0.011 |
Token | don |
Token ID | 836 |
Feature activation | -6.18e-03 |
Pos logit contributions | |
ores | +0.010 |
om | +0.010 |
us | +0.010 |
ill | +0.010 |
� | +0.009 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
Token | share |
Token ID | 2648 |
Feature activation | +5.79e-03 |
Pos logit contributions | |
ores | +0.011 |
us | +0.010 |
om | +0.010 |
ill | +0.010 |
int | +0.010 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.008 |
guys | -0.006 |
smartest | -0.005 |
simplest | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -2.26e-03 |
Pos logit contributions | |
nam | +0.012 |
Deal | +0.012 |
guys | +0.010 |
simplest | +0.009 |
fart | +0.009 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
anging | -0.006 |
om | -0.006 |
Matt | -0.006 |
Token | be |
Token ID | 307 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
ill | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.003 |
simplest | -0.002 |
Token | kind |
Token ID | 1611 |
Feature activation | +5.21e-03 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.011 |
cient | +0.010 |
smartest | +0.010 |
Neg logit contributions | |
ores | -0.012 |
om | -0.012 |
us | -0.011 |
ubs | -0.011 |
� | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -7.10e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.010 |
smartest | +0.009 |
strongest | +0.009 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
Matt | -0.005 |
ill | -0.005 |
Token | each |
Token ID | 1123 |
Feature activation | +2.55e-02 |
Pos logit contributions | |
ores | +0.009 |
ubs | +0.009 |
us | +0.009 |
it | +0.009 |
om | +0.009 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
smartest | -0.010 |
guys | -0.010 |
nic | -0.010 |
Token | other |
Token ID | 584 |
Feature activation | +5.36e-03 |
Pos logit contributions | |
Deal | +0.039 |
nam | +0.037 |
guys | +0.029 |
smartest | +0.027 |
simplest | +0.026 |
Neg logit contributions | |
ores | -0.043 |
us | -0.043 |
om | -0.042 |
ubs | -0.041 |
ill | -0.040 |
Token | . |
Token ID | 13 |
Feature activation | -3.19e-04 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
om | -0.007 |
Matt | -0.007 |
ill | -0.006 |
Token | You |
Token ID | 921 |
Feature activation | -9.59e-03 |
Pos logit contributions | |
ores | +0.000 |
us | +0.000 |
om | +0.000 |
ubs | +0.000 |
ill | +0.000 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.000 |
smartest | -0.000 |
strongest | -0.000 |
Token | are |
Token ID | 389 |
Feature activation | +5.99e-03 |
Pos logit contributions | |
� | +0.013 |
ores | +0.013 |
om | +0.013 |
s | +0.013 |
us | +0.013 |
Neg logit contributions | |
Deal | -0.018 |
nam | -0.017 |
smartest | -0.013 |
guys | -0.013 |
Okay | -0.013 |
Token | brothers |
Token ID | 9397 |
Feature activation | +1.82e-02 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
guys | +0.010 |
Okay | +0.009 |
cient | +0.009 |
Neg logit contributions | |
ores | -0.007 |
� | -0.007 |
us | -0.007 |
om | -0.006 |
it | -0.006 |
Token | could |
Token ID | 714 |
Feature activation | +5.09e-03 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
om | +0.006 |
� | +0.006 |
ubs | +0.006 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.006 |
strongest | -0.006 |
Token | have |
Token ID | 423 |
Feature activation | +8.39e-04 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
om | -0.007 |
ill | -0.006 |
ubs | -0.006 |
Token | hurt |
Token ID | 5938 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | yourself |
Token ID | 3511 |
Feature activation | +9.32e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.003 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.008 |
om | -0.007 |
us | -0.007 |
int | -0.007 |
ill | -0.007 |
Token | or |
Token ID | 393 |
Feature activation | +9.82e-03 |
Pos logit contributions | |
nam | +0.018 |
Deal | +0.017 |
guys | +0.015 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.013 |
Matt | -0.013 |
us | -0.012 |
Matt | -0.012 |
Josh | -0.012 |
Token | each |
Token ID | 1123 |
Feature activation | +2.53e-02 |
Pos logit contributions | |
Deal | +0.019 |
nam | +0.016 |
guys | +0.014 |
smartest | +0.014 |
simplest | +0.013 |
Neg logit contributions | |
ores | -0.013 |
om | -0.012 |
us | -0.012 |
ubs | -0.012 |
� | -0.012 |
Token | other |
Token ID | 584 |
Feature activation | +6.81e-03 |
Pos logit contributions | |
Deal | +0.035 |
nam | +0.033 |
guys | +0.026 |
smartest | +0.024 |
strongest | +0.022 |
Neg logit contributions | |
ores | -0.047 |
us | -0.045 |
om | -0.045 |
ubs | -0.043 |
ill | -0.043 |
Token | . |
Token ID | 13 |
Feature activation | +4.54e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.014 |
guys | +0.012 |
smartest | +0.011 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
om | -0.007 |
ill | -0.007 |
Matt | -0.007 |
Token | You |
Token ID | 921 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.007 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.007 |
us | -0.007 |
om | -0.007 |
ubs | -0.007 |
� | -0.007 |
Token | should |
Token ID | 815 |
Feature activation | -6.16e-03 |
Pos logit contributions | |
ores | +0.005 |
om | +0.005 |
us | +0.005 |
� | +0.005 |
s | +0.005 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.005 |
smartest | -0.005 |
strongest | -0.005 |
Token | have |
Token ID | 423 |
Feature activation | +3.46e-03 |
Pos logit contributions | |
ores | +0.010 |
us | +0.009 |
om | +0.009 |
ill | +0.009 |
int | +0.009 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.010 |
guys | -0.008 |
smartest | -0.007 |
simplest | -0.007 |
Token | feels |
Token ID | 5300 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
Deal | +0.004 |
guys | +0.004 |
nam | +0.004 |
nic | +0.003 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
ubs | -0.003 |
us | -0.003 |
ork | -0.003 |
anging | -0.003 |
Token | even |
Token ID | 772 |
Feature activation | +4.70e-03 |
Pos logit contributions | |
nam | +0.016 |
Deal | +0.016 |
smartest | +0.013 |
guys | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
om | -0.016 |
ill | -0.015 |
us | -0.015 |
Matt | -0.015 |
ork | -0.015 |
Token | happier |
Token ID | 23030 |
Feature activation | +3.74e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
ill | -0.005 |
ubs | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.005 |
Please | +0.005 |
smartest | +0.005 |
Neg logit contributions | |
irs | -0.005 |
om | -0.005 |
ork | -0.005 |
ores | -0.005 |
Matt | -0.005 |
Token | p |
Token ID | 279 |
Feature activation | +5.07e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
ubs | -0.002 |
ill | -0.002 |
Token | rou |
Token ID | 472 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
cient | +0.007 |
nic | +0.007 |
Sorry | +0.006 |
Neg logit contributions | |
� | -0.008 |
aid | -0.007 |
Josh | -0.006 |
Kat | -0.006 |
Judy | -0.006 |
Token | der |
Token ID | 1082 |
Feature activation | -9.46e-03 |
Pos logit contributions | |
ores | +0.048 |
ill | +0.048 |
Matt | +0.047 |
aid | +0.046 |
ine | +0.046 |
Neg logit contributions | |
Deal | -0.061 |
nam | -0.051 |
guys | -0.049 |
Fine | -0.041 |
smartest | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
Matt | +0.011 |
aid | +0.011 |
ork | +0.011 |
ores | +0.011 |
om | +0.011 |
Neg logit contributions | |
Deal | -0.019 |
nam | -0.017 |
strongest | -0.014 |
smartest | -0.014 |
simplest | -0.013 |
Token | He |
Token ID | 679 |
Feature activation | +5.67e-03 |
Pos logit contributions | |
ge | +0.002 |
anging | +0.002 |
itched | +0.002 |
contact | +0.002 |
ores | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
Sorry | -0.002 |
Really | -0.002 |
Okay | -0.002 |
Token | displays |
Token ID | 11298 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
ubs | -0.009 |
ill | -0.009 |
om | -0.009 |
Token | his |
Token ID | 465 |
Feature activation | -3.12e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.002 |
smartest | +0.002 |
brav | +0.002 |
Neg logit contributions | |
us | -0.001 |
ores | -0.001 |
anging | -0.001 |
uts | -0.001 |
ubs | -0.001 |
Token | sailed |
Token ID | 33835 |
Feature activation | +3.33e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.006 |
uts | -0.005 |
ubs | -0.005 |
ork | -0.005 |
us | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | +8.92e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.005 |
uts | -0.004 |
us | -0.004 |
om | -0.004 |
ubs | -0.004 |
Token | days |
Token ID | 1528 |
Feature activation | -8.58e-04 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.015 |
guys | +0.013 |
smartest | +0.012 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.013 |
us | -0.013 |
om | -0.013 |
ill | -0.012 |
ubs | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | -5.18e-04 |
Pos logit contributions | |
ores | +0.001 |
Matt | +0.001 |
ork | +0.001 |
Jud | +0.001 |
ill | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
strongest | -0.001 |
fastest | -0.001 |
Token | exploring |
Token ID | 13504 |
Feature activation | -2.81e-03 |
Pos logit contributions | |
ores | +0.001 |
ork | +0.001 |
uts | +0.001 |
us | +0.001 |
irs | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
strongest | -0.001 |
guys | -0.001 |
smartest | -0.001 |
Token | unch |
Token ID | 16258 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
ores | +0.004 |
uts | +0.004 |
om | +0.004 |
us | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
Token | arted |
Token ID | 19112 |
Feature activation | -1.16e-03 |
Pos logit contributions | |
us | +0.049 |
ores | +0.049 |
ork | +0.048 |
� | +0.048 |
aid | +0.048 |
Neg logit contributions | |
nam | -0.051 |
Deal | -0.051 |
guys | -0.040 |
Fine | -0.038 |
smartest | -0.037 |
Token | waters |
Token ID | 10150 |
Feature activation | +5.65e-04 |
Pos logit contributions | |
ores | +0.002 |
ill | +0.002 |
us | +0.002 |
uts | +0.002 |
Matt | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
guys | -0.002 |
nam | -0.002 |
smartest | -0.002 |
strongest | -0.001 |
Token | until |
Token ID | 1566 |
Feature activation | -9.27e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
songs | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
Matt | -0.001 |
Kat | -0.001 |
Jud | -0.001 |
Token | he |
Token ID | 339 |
Feature activation | -3.27e-03 |
Pos logit contributions | |
us | +0.012 |
om | +0.012 |
uts | +0.012 |
udge | +0.012 |
oing | +0.012 |
Neg logit contributions | |
nam | -0.017 |
Deal | -0.016 |
guys | -0.015 |
strongest | -0.014 |
wind | -0.014 |
Token | came |
Token ID | 1625 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ores | +0.005 |
ubs | +0.005 |
om | +0.005 |
uts | +0.005 |
us | +0.005 |
Neg logit contributions | |
Deal | -0.005 |
guys | -0.004 |
nam | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | -2.75e-03 |
Pos logit contributions | |
us | +0.004 |
ork | +0.003 |
irs | +0.003 |
udge | +0.003 |
old | +0.003 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.003 |
happiest | -0.003 |
strongest | -0.003 |
nic | -0.003 |
Token | nothing |
Token ID | 2147 |
Feature activation | +7.75e-03 |
Pos logit contributions | |
us | +0.003 |
om | +0.003 |
ores | +0.003 |
ork | +0.003 |
udge | +0.003 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.005 |
smartest | -0.005 |
strongest | -0.005 |
guys | -0.004 |
Token | made |
Token ID | 925 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
Deal | +0.013 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
ores | -0.012 |
us | -0.011 |
om | -0.011 |
ubs | -0.011 |
Matt | -0.011 |
Token | it |
Token ID | 340 |
Feature activation | +8.13e-03 |
Pos logit contributions | |
us | +0.018 |
om | +0.017 |
oing | +0.017 |
uts | +0.017 |
anging | +0.017 |
Neg logit contributions | |
guys | -0.021 |
Deal | -0.020 |
nam | -0.019 |
matter | -0.018 |
smartest | -0.017 |
Token | p |
Token ID | 279 |
Feature activation | -6.00e-04 |
Pos logit contributions | |
nam | +0.011 |
Deal | +0.010 |
strongest | +0.009 |
smartest | +0.009 |
guys | +0.009 |
Neg logit contributions | |
us | -0.015 |
Matt | -0.014 |
om | -0.014 |
ores | -0.014 |
udge | -0.014 |
Token | rou |
Token ID | 472 |
Feature activation | -2.90e-02 |
Pos logit contributions | |
Josh | +0.001 |
� | +0.001 |
Andrew | +0.001 |
on | +0.001 |
aid | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
cient | -0.001 |
nic | -0.001 |
smartest | -0.001 |
Token | der |
Token ID | 1082 |
Feature activation | -9.00e-03 |
Pos logit contributions | |
ores | +0.043 |
us | +0.041 |
Matt | +0.041 |
om | +0.041 |
Josh | +0.041 |
Neg logit contributions | |
Deal | -0.050 |
nam | -0.041 |
guys | -0.040 |
smartest | -0.034 |
strongest | -0.034 |
Token | . |
Token ID | 13 |
Feature activation | +3.48e-03 |
Pos logit contributions | |
om | +0.011 |
Matt | +0.011 |
ores | +0.011 |
ork | +0.011 |
Josh | +0.011 |
Neg logit contributions | |
Deal | -0.017 |
nam | -0.014 |
strongest | -0.014 |
smartest | -0.014 |
simplest | -0.013 |
Token | |
Token ID | 220 |
Feature activation | -4.18e-04 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
Sorry | +0.005 |
Really | +0.005 |
nic | +0.005 |
Neg logit contributions | |
us | -0.004 |
ubs | -0.004 |
ores | -0.004 |
ge | -0.004 |
om | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +1.56e-03 |
Pos logit contributions | |
product | +0.001 |
int | +0.001 |
ine | +0.001 |
ge | +0.000 |
ores | +0.000 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
cient | -0.001 |
Sorry | -0.001 |
smartest | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | -1.30e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.002 |
Okay | +0.002 |
Really | +0.002 |
Bug | +0.002 |
Neg logit contributions | |
ores | -0.002 |
anging | -0.002 |
ays | -0.002 |
om | -0.002 |
ine | -0.002 |
Token | hunger |
Token ID | 16460 |
Feature activation | +2.39e-03 |
Pos logit contributions | |
ores | +0.002 |
ill | +0.001 |
om | +0.001 |
us | +0.001 |
Matt | +0.001 |
Neg logit contributions | |
nam | -0.002 |
Deal | -0.002 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | or |
Token ID | 393 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
Deal | +0.005 |
guys | +0.004 |
nam | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
Matt | -0.003 |
om | -0.003 |
ores | -0.003 |
us | -0.003 |
itched | -0.003 |
Token | eat |
Token ID | 4483 |
Feature activation | -7.90e-03 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
ubs | +0.002 |
ill | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | things |
Token ID | 1243 |
Feature activation | -3.95e-03 |
Pos logit contributions | |
Matt | +0.012 |
om | +0.011 |
ill | +0.011 |
ores | +0.011 |
anging | +0.011 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.013 |
guys | -0.012 |
strongest | -0.010 |
smartest | -0.010 |
Token | that |
Token ID | 326 |
Feature activation | -9.08e-03 |
Pos logit contributions | |
Matt | +0.005 |
om | +0.005 |
ine | +0.005 |
ores | +0.005 |
Jud | +0.005 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.007 |
guys | -0.007 |
strongest | -0.006 |
smartest | -0.006 |
Token | aren |
Token ID | 3588 |
Feature activation | -2.67e-02 |
Pos logit contributions | |
ores | +0.015 |
us | +0.014 |
om | +0.014 |
ubs | +0.014 |
ill | +0.014 |
Neg logit contributions | |
Deal | -0.015 |
nam | -0.014 |
guys | -0.011 |
smartest | -0.010 |
strongest | -0.010 |
Token | 't |
Token ID | 470 |
Feature activation | +1.97e-03 |
Pos logit contributions | |
om | +0.044 |
ores | +0.042 |
ine | +0.041 |
us | +0.041 |
aid | +0.040 |
Neg logit contributions | |
Deal | -0.040 |
nam | -0.035 |
guys | -0.034 |
smartest | -0.031 |
strongest | -0.031 |
Token | good |
Token ID | 922 |
Feature activation | +2.81e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ill | -0.003 |
Matt | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | +2.24e-03 |
Pos logit contributions | |
Deal | +0.006 |
guys | +0.005 |
nam | +0.005 |
smartest | +0.005 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.003 |
Matt | -0.003 |
om | -0.003 |
us | -0.003 |
ine | -0.003 |
Token | him |
Token ID | 683 |
Feature activation | -1.22e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
ill | -0.003 |
us | -0.003 |
int | -0.002 |
Token | like |
Token ID | 588 |
Feature activation | +1.96e-04 |
Pos logit contributions | |
Matt | +0.002 |
ores | +0.001 |
om | +0.001 |
Matt | +0.001 |
Josh | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
strongest | -0.002 |
smartest | -0.002 |
Token | they |
Token ID | 484 |
Feature activation | -2.90e-03 |
Pos logit contributions | |
us | +0.002 |
ork | +0.002 |
acks | +0.002 |
irs | +0.002 |
itched | +0.002 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.002 |
chard | -0.002 |
guys | -0.002 |
nic | -0.002 |
Token | both |
Token ID | 1111 |
Feature activation | +6.65e-03 |
Pos logit contributions | |
ores | +0.005 |
us | +0.005 |
uts | +0.005 |
ork | +0.005 |
om | +0.005 |
Neg logit contributions | |
nam | -0.004 |
Deal | -0.004 |
guys | -0.003 |
smartest | -0.003 |
cient | -0.003 |
Token | looked |
Token ID | 3114 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.011 |
us | -0.011 |
ork | -0.011 |
ubs | -0.011 |
uts | -0.011 |
Token | around |
Token ID | 1088 |
Feature activation | +7.95e-04 |
Pos logit contributions | |
nam | +0.005 |
Deal | +0.005 |
guys | +0.004 |
nic | +0.004 |
smartest | +0.004 |
Neg logit contributions | |
us | -0.005 |
Matt | -0.005 |
uts | -0.005 |
ork | -0.005 |
ill | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | +2.39e-04 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
most | +0.001 |
Please | +0.001 |
Neg logit contributions | |
uts | -0.001 |
us | -0.001 |
acks | -0.001 |
ubs | -0.001 |
ork | -0.001 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.65e-02 |
Pos logit contributions | |
nam | +0.000 |
Deal | +0.000 |
simplest | +0.000 |
smartest | +0.000 |
matter | +0.000 |
Neg logit contributions | |
uts | -0.000 |
us | -0.000 |
om | -0.000 |
ork | -0.000 |
ata | -0.000 |
Token | ement |
Token ID | 972 |
Feature activation | -5.43e-03 |
Pos logit contributions | |
ores | +0.043 |
om | +0.041 |
us | +0.039 |
ubs | +0.039 |
ine | +0.039 |
Neg logit contributions | |
Deal | -0.043 |
nam | -0.037 |
guys | -0.033 |
nic | -0.029 |
smartest | -0.029 |
Token | . |
Token ID | 13 |
Feature activation | +1.66e-03 |
Pos logit contributions | |
ores | +0.008 |
Matt | +0.008 |
ork | +0.008 |
acks | +0.008 |
irs | +0.008 |
Neg logit contributions | |
nam | -0.007 |
Deal | -0.007 |
guys | -0.007 |
songs | -0.006 |
cheeks | -0.006 |
Token | The |
Token ID | 383 |
Feature activation | +3.56e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
Sorry | +0.002 |
Really | +0.002 |
Please | +0.002 |
Neg logit contributions | |
us | -0.002 |
ubs | -0.002 |
ge | -0.002 |
ores | -0.002 |
itched | -0.002 |
Token | lake |
Token ID | 13546 |
Feature activation | -1.74e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
om | -0.006 |
ubs | -0.005 |
ill | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | +3.28e-03 |
Pos logit contributions | |
us | +0.003 |
ubs | +0.003 |
ores | +0.003 |
irs | +0.003 |
anging | +0.003 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
nic | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +6.54e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
us | -0.001 |
om | -0.001 |
ores | -0.001 |
ubs | -0.001 |
anging | -0.001 |
Token | girl |
Token ID | 2576 |
Feature activation | +3.52e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.008 |
smartest | +0.007 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.011 |
us | -0.010 |
om | -0.010 |
ubs | -0.010 |
ill | -0.010 |
Token | felt |
Token ID | 2936 |
Feature activation | +8.84e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
nic | +0.004 |
smartest | +0.004 |
guys | +0.004 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
ubs | -0.006 |
irs | -0.006 |
uts | -0.006 |
Token | even |
Token ID | 772 |
Feature activation | +7.42e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.014 |
smartest | +0.011 |
strongest | +0.011 |
guys | +0.010 |
Neg logit contributions | |
om | -0.014 |
us | -0.014 |
Matt | -0.014 |
ill | -0.013 |
uts | -0.013 |
Token | p |
Token ID | 279 |
Feature activation | +5.78e-03 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.013 |
guys | +0.012 |
smartest | +0.011 |
simplest | +0.010 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
om | -0.009 |
ill | -0.009 |
ubs | -0.009 |
Token | rou |
Token ID | 472 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
cient | +0.007 |
nic | +0.007 |
smartest | +0.007 |
Neg logit contributions | |
aid | -0.009 |
Josh | -0.008 |
� | -0.008 |
Judy | -0.008 |
Jud | -0.008 |
Token | der |
Token ID | 1082 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
ores | +0.038 |
Matt | +0.037 |
Josh | +0.037 |
aid | +0.037 |
ill | +0.036 |
Neg logit contributions | |
Deal | -0.046 |
nam | -0.037 |
guys | -0.036 |
Fine | -0.031 |
smartest | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | -6.36e-04 |
Pos logit contributions | |
aid | +0.015 |
ork | +0.014 |
om | +0.014 |
Josh | +0.014 |
Matt | +0.014 |
Neg logit contributions | |
Deal | -0.021 |
nam | -0.018 |
strongest | -0.017 |
smartest | -0.017 |
simplest | -0.016 |
Token | She |
Token ID | 1375 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
us | +0.001 |
ores | +0.001 |
ge | +0.001 |
ubs | +0.001 |
om | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
Sorry | -0.001 |
Really | -0.001 |
Okay | -0.001 |
Token | was |
Token ID | 373 |
Feature activation | +7.17e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
nic | +0.008 |
guys | +0.008 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.015 |
us | -0.014 |
ubs | -0.014 |
uts | -0.013 |
om | -0.013 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.40e-04 |
Pos logit contributions | |
nam | +0.008 |
Deal | +0.007 |
smartest | +0.006 |
happiest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
us | -0.015 |
ork | -0.015 |
s | -0.014 |
acks | -0.014 |
irs | -0.014 |
Token | little |
Token ID | 1310 |
Feature activation | +8.86e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
� | -0.002 |
int | -0.002 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.51e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.019 |
us | -0.018 |
om | -0.018 |
ill | -0.018 |
ubs | -0.018 |
Token | looked |
Token ID | 3114 |
Feature activation | +4.22e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
nic | +0.002 |
smartest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.002 |
ubs | -0.002 |
uts | -0.002 |
om | -0.002 |
Token | up |
Token ID | 510 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
nam | +0.007 |
Deal | +0.007 |
guys | +0.006 |
nic | +0.006 |
smartest | +0.006 |
Neg logit contributions | |
us | -0.006 |
uts | -0.006 |
Matt | -0.006 |
ores | -0.006 |
om | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | +2.74e-03 |
Pos logit contributions | |
us | +0.002 |
Matt | +0.002 |
ores | +0.002 |
uts | +0.002 |
irs | +0.002 |
Neg logit contributions | |
nam | -0.002 |
Deal | -0.002 |
nic | -0.002 |
wind | -0.002 |
guys | -0.002 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.62e-02 |
Pos logit contributions | |
nam | +0.004 |
Deal | +0.004 |
simplest | +0.003 |
guys | +0.003 |
matter | +0.003 |
Neg logit contributions | |
us | -0.005 |
uts | -0.005 |
om | -0.005 |
ores | -0.004 |
anging | -0.004 |
Token | ement |
Token ID | 972 |
Feature activation | -7.40e-03 |
Pos logit contributions | |
ores | +0.038 |
om | +0.036 |
us | +0.035 |
ubs | +0.035 |
ine | +0.034 |
Neg logit contributions | |
Deal | -0.048 |
nam | -0.043 |
guys | -0.037 |
smartest | -0.034 |
nic | -0.033 |
Token | and |
Token ID | 290 |
Feature activation | -2.32e-03 |
Pos logit contributions | |
ores | +0.011 |
Matt | +0.011 |
us | +0.011 |
irs | +0.011 |
ork | +0.011 |
Neg logit contributions | |
nam | -0.011 |
Deal | -0.010 |
guys | -0.009 |
cheeks | -0.009 |
songs | -0.009 |
Token | said |
Token ID | 531 |
Feature activation | +4.85e-03 |
Pos logit contributions | |
us | +0.004 |
om | +0.004 |
ores | +0.004 |
uts | +0.003 |
ork | +0.003 |
Neg logit contributions | |
nam | -0.004 |
Deal | -0.004 |
smartest | -0.003 |
nic | -0.003 |
happiest | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | +4.95e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.009 |
guys | +0.007 |
smartest | +0.007 |
cient | +0.007 |
Neg logit contributions | |
ores | -0.007 |
us | -0.006 |
ubs | -0.006 |
om | -0.006 |
ill | -0.006 |
Token | " |
Token ID | 366 |
Feature activation | +5.80e-03 |
Pos logit contributions | |
nam | +0.007 |
Deal | +0.006 |
Really | +0.005 |
cient | +0.005 |
guys | +0.005 |
Neg logit contributions | |
us | -0.009 |
ubs | -0.009 |
udge | -0.009 |
ores | -0.009 |
acks | -0.009 |
Token | The |
Token ID | 383 |
Feature activation | -2.22e-04 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
Sorry | +0.004 |
guys | +0.004 |
Really | +0.004 |
Neg logit contributions | |
ubs | -0.005 |
ores | -0.005 |
us | -0.004 |
anging | -0.004 |
ge | -0.004 |
Token | boy |
Token ID | 2933 |
Feature activation | +1.25e-03 |
Pos logit contributions | |
ores | +0.000 |
us | +0.000 |
om | +0.000 |
ubs | +0.000 |
ill | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
guys | -0.000 |
smartest | -0.000 |
strongest | -0.000 |
Token | looked |
Token ID | 3114 |
Feature activation | +3.30e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
nic | +0.001 |
smartest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
ubs | -0.002 |
us | -0.002 |
irs | -0.002 |
alks | -0.002 |
Token | up |
Token ID | 510 |
Feature activation | -1.65e-03 |
Pos logit contributions | |
nam | +0.005 |
Deal | +0.005 |
nic | +0.004 |
guys | +0.004 |
smartest | +0.004 |
Neg logit contributions | |
us | -0.005 |
uts | -0.005 |
Matt | -0.005 |
ores | -0.005 |
ork | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | +4.63e-03 |
Pos logit contributions | |
us | +0.003 |
irs | +0.003 |
ores | +0.003 |
wen | +0.002 |
uts | +0.002 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.002 |
nic | -0.002 |
wind | -0.002 |
most | -0.002 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.58e-02 |
Pos logit contributions | |
nam | +0.006 |
Deal | +0.006 |
wind | +0.005 |
matter | +0.005 |
simplest | +0.005 |
Neg logit contributions | |
us | -0.009 |
uts | -0.009 |
ores | -0.008 |
om | -0.008 |
anging | -0.008 |
Token | ement |
Token ID | 972 |
Feature activation | -7.76e-03 |
Pos logit contributions | |
ores | +0.041 |
om | +0.039 |
ubs | +0.038 |
� | +0.037 |
us | +0.037 |
Neg logit contributions | |
Deal | -0.043 |
nam | -0.037 |
guys | -0.032 |
smartest | -0.029 |
nic | -0.028 |
Token | ! |
Token ID | 0 |
Feature activation | +5.16e-04 |
Pos logit contributions | |
irs | +0.013 |
ores | +0.013 |
izz | +0.013 |
ork | +0.013 |
Jud | +0.012 |
Neg logit contributions | |
nam | -0.010 |
Deal | -0.008 |
cheeks | -0.008 |
songs | -0.008 |
guys | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -3.56e-04 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
Sorry | +0.001 |
Really | +0.001 |
Helic | +0.001 |
Neg logit contributions | |
ores | -0.001 |
ubs | -0.001 |
us | -0.001 |
ge | -0.001 |
ine | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -2.49e-03 |
Pos logit contributions | |
ays | +0.001 |
anging | +0.000 |
ores | +0.000 |
fault | +0.000 |
theirs | +0.000 |
Neg logit contributions | |
Deal | -0.001 |
Please | -0.000 |
OK | -0.000 |
Okay | -0.000 |
Tree | -0.000 |
Token | He |
Token ID | 1544 |
Feature activation | +7.35e-03 |
Pos logit contributions | |
ores | +0.004 |
ays | +0.004 |
fault | +0.004 |
om | +0.004 |
int | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.003 |
Okay | -0.003 |
Please | -0.003 |
Fine | -0.003 |
Token | scary |
Token ID | 14343 |
Feature activation | -4.90e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
us | -0.006 |
ores | -0.006 |
om | -0.006 |
Matt | -0.006 |
ill | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
ores | +0.005 |
om | +0.005 |
Matt | +0.005 |
us | +0.005 |
ubs | +0.005 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.010 |
guys | -0.009 |
smartest | -0.009 |
strongest | -0.008 |
Token | but |
Token ID | 475 |
Feature activation | -2.28e-03 |
Pos logit contributions | |
Deal | +0.019 |
nam | +0.019 |
guys | +0.017 |
smartest | +0.014 |
strongest | +0.014 |
Neg logit contributions | |
us | -0.020 |
ores | -0.019 |
om | -0.019 |
anging | -0.018 |
ubs | -0.018 |
Token | sometimes |
Token ID | 3360 |
Feature activation | -1.26e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.002 |
� | +0.002 |
om | +0.002 |
it | +0.002 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.004 |
guys | -0.004 |
smartest | -0.004 |
simplest | -0.004 |
Token | things |
Token ID | 1243 |
Feature activation | +1.98e-03 |
Pos logit contributions | |
ores | +0.002 |
� | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.002 |
simplest | -0.002 |
Token | aren |
Token ID | 3588 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ill | -0.003 |
ubs | -0.003 |
Token | 't |
Token ID | 470 |
Feature activation | +2.32e-03 |
Pos logit contributions | |
om | +0.040 |
ores | +0.039 |
us | +0.039 |
udge | +0.038 |
Matt | +0.037 |
Neg logit contributions | |
Deal | -0.039 |
nam | -0.036 |
guys | -0.035 |
smartest | -0.032 |
strongest | -0.032 |
Token | always |
Token ID | 1464 |
Feature activation | +3.13e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
ill | -0.003 |
Matt | -0.003 |
Token | what |
Token ID | 644 |
Feature activation | +4.84e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
us | -0.005 |
om | -0.005 |
ores | -0.005 |
Matt | -0.005 |
ill | -0.005 |
Token | they |
Token ID | 484 |
Feature activation | +2.31e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
guys | +0.006 |
smartest | +0.006 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.008 |
ill | -0.007 |
ubs | -0.007 |
Token | seem |
Token ID | 1283 |
Feature activation | +5.70e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ubs | -0.003 |
ill | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -1.85e-03 |
Pos logit contributions | |
ubs | +0.009 |
om | +0.009 |
ores | +0.009 |
us | +0.009 |
izz | +0.009 |
Neg logit contributions | |
guys | -0.009 |
Deal | -0.008 |
nam | -0.008 |
songs | -0.008 |
ter | -0.007 |
Token | Tiger |
Token ID | 17030 |
Feature activation | +6.55e-03 |
Pos logit contributions | |
ores | +0.003 |
ill | +0.003 |
ubs | +0.003 |
us | +0.002 |
anging | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.003 |
cient | -0.002 |
Sorry | -0.002 |
Token | looked |
Token ID | 3114 |
Feature activation | +2.22e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.008 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.011 |
ubs | -0.010 |
irs | -0.010 |
us | -0.010 |
ill | -0.010 |
Token | around |
Token ID | 1088 |
Feature activation | -7.28e-04 |
Pos logit contributions | |
nam | +0.004 |
Deal | +0.003 |
guys | +0.003 |
nic | +0.003 |
smartest | +0.003 |
Neg logit contributions | |
uts | -0.003 |
us | -0.003 |
Matt | -0.003 |
ork | -0.003 |
om | -0.003 |
Token | in |
Token ID | 287 |
Feature activation | +5.98e-04 |
Pos logit contributions | |
uts | +0.001 |
us | +0.001 |
ubs | +0.001 |
ores | +0.001 |
om | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
songs | -0.001 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
smartest | +0.001 |
guys | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
uts | -0.001 |
us | -0.001 |
om | -0.001 |
ores | -0.001 |
ork | -0.001 |
Token | ement |
Token ID | 972 |
Feature activation | -9.62e-03 |
Pos logit contributions | |
ores | +0.038 |
om | +0.037 |
� | +0.035 |
us | +0.035 |
ubs | +0.035 |
Neg logit contributions | |
Deal | -0.045 |
nam | -0.039 |
guys | -0.036 |
smartest | -0.032 |
nic | -0.031 |
Token | and |
Token ID | 290 |
Feature activation | -4.61e-03 |
Pos logit contributions | |
ores | +0.015 |
irs | +0.015 |
izz | +0.015 |
us | +0.015 |
Matt | +0.015 |
Neg logit contributions | |
nam | -0.013 |
Deal | -0.012 |
guys | -0.011 |
cheeks | -0.011 |
songs | -0.011 |
Token | he |
Token ID | 339 |
Feature activation | +3.69e-03 |
Pos logit contributions | |
ores | +0.007 |
om | +0.007 |
uts | +0.007 |
ubs | +0.007 |
ork | +0.007 |
Neg logit contributions | |
nam | -0.008 |
Deal | -0.007 |
guys | -0.006 |
smartest | -0.006 |
strongest | -0.006 |
Token | knew |
Token ID | 2993 |
Feature activation | -2.33e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
nic | +0.004 |
smartest | +0.004 |
Neg logit contributions | |
ores | -0.007 |
ubs | -0.006 |
us | -0.006 |
uts | -0.006 |
om | -0.006 |
Token | he |
Token ID | 339 |
Feature activation | -8.72e-03 |
Pos logit contributions | |
om | +0.003 |
acks | +0.003 |
oing | +0.003 |
ores | +0.003 |
ill | +0.003 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
brav | -0.004 |
Token | both |
Token ID | 1111 |
Feature activation | +6.01e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ubs | -0.003 |
ill | -0.003 |
Token | looked |
Token ID | 3114 |
Feature activation | +2.28e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
strongest | +0.007 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
om | -0.009 |
ubs | -0.009 |
ill | -0.009 |
Token | at |
Token ID | 379 |
Feature activation | +9.90e-05 |
Pos logit contributions | |
nam | +0.004 |
Deal | +0.004 |
guys | +0.004 |
smartest | +0.003 |
nic | +0.003 |
Neg logit contributions | |
us | -0.003 |
uts | -0.003 |
Matt | -0.003 |
ores | -0.003 |
ork | -0.003 |
Token | it |
Token ID | 340 |
Feature activation | +5.11e-03 |
Pos logit contributions | |
nam | +0.000 |
Deal | +0.000 |
guys | +0.000 |
smartest | +0.000 |
strongest | +0.000 |
Neg logit contributions | |
us | -0.000 |
uts | -0.000 |
ores | -0.000 |
anging | -0.000 |
oing | -0.000 |
Token | in |
Token ID | 287 |
Feature activation | +1.18e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
head | +0.007 |
fart | +0.007 |
Neg logit contributions | |
us | -0.008 |
ores | -0.008 |
Matt | -0.008 |
izz | -0.007 |
David | -0.007 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.57e-02 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
matter | +0.001 |
simplest | +0.001 |
guys | +0.001 |
Neg logit contributions | |
us | -0.002 |
ores | -0.002 |
uts | -0.002 |
to | -0.002 |
anging | -0.002 |
Token | ement |
Token ID | 972 |
Feature activation | -9.17e-03 |
Pos logit contributions | |
ores | +0.039 |
om | +0.037 |
� | +0.036 |
us | +0.036 |
ubs | +0.036 |
Neg logit contributions | |
Deal | -0.045 |
nam | -0.038 |
guys | -0.035 |
smartest | -0.030 |
nic | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e-03 |
Pos logit contributions | |
izz | +0.016 |
Jud | +0.016 |
irs | +0.016 |
Kelly | +0.015 |
ores | +0.015 |
Neg logit contributions | |
nam | -0.011 |
Deal | -0.010 |
guys | -0.009 |
songs | -0.009 |
cheeks | -0.009 |
Token | It |
Token ID | 632 |
Feature activation | -4.71e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
Sorry | +0.002 |
Really | +0.002 |
Helic | +0.002 |
Neg logit contributions | |
us | -0.002 |
ge | -0.002 |
ores | -0.002 |
ubs | -0.002 |
anging | -0.002 |
Token | was |
Token ID | 373 |
Feature activation | +1.86e-03 |
Pos logit contributions | |
ores | +0.007 |
us | +0.007 |
ubs | +0.007 |
anging | +0.007 |
om | +0.007 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.006 |
strongest | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | -1.50e-03 |
Pos logit contributions | |
nam | +0.003 |
Deal | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
coolest | +0.002 |
Neg logit contributions | |
us | -0.004 |
oing | -0.003 |
anging | -0.003 |
acks | -0.003 |
ork | -0.003 |
Token | 't |
Token ID | 470 |
Feature activation | +1.09e-03 |
Pos logit contributions | |
ores | +0.028 |
om | +0.028 |
us | +0.027 |
ill | +0.027 |
ubs | +0.026 |
Neg logit contributions | |
Deal | -0.028 |
nam | -0.027 |
guys | -0.025 |
Sorry | -0.022 |
smartest | -0.022 |
Token | chew |
Token ID | 34722 |
Feature activation | +2.70e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ubs | -0.002 |
ill | -0.002 |
Token | on |
Token ID | 319 |
Feature activation | -3.14e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
strongest | +0.004 |
smartest | +0.004 |
Neg logit contributions | |
ores | -0.004 |
Matt | -0.004 |
ill | -0.004 |
om | -0.003 |
Matt | -0.003 |
Token | things |
Token ID | 1243 |
Feature activation | -5.62e-03 |
Pos logit contributions | |
ores | +0.004 |
ill | +0.004 |
us | +0.004 |
Matt | +0.004 |
om | +0.004 |
Neg logit contributions | |
nam | -0.006 |
Deal | -0.006 |
guys | -0.005 |
strongest | -0.005 |
smartest | -0.004 |
Token | that |
Token ID | 326 |
Feature activation | -7.69e-03 |
Pos logit contributions | |
Matt | +0.008 |
om | +0.008 |
ores | +0.008 |
us | +0.008 |
itched | +0.008 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.010 |
guys | -0.009 |
smartest | -0.008 |
strongest | -0.007 |
Token | aren |
Token ID | 3588 |
Feature activation | -2.56e-02 |
Pos logit contributions | |
ores | +0.014 |
us | +0.013 |
om | +0.013 |
ubs | +0.013 |
ill | +0.013 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | +2.88e-03 |
Pos logit contributions | |
om | +0.043 |
ores | +0.042 |
us | +0.042 |
udge | +0.040 |
oing | +0.040 |
Neg logit contributions | |
Deal | -0.035 |
nam | -0.032 |
guys | -0.031 |
smartest | -0.029 |
strongest | -0.029 |
Token | yours |
Token ID | 12431 |
Feature activation | -1.41e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.004 |
strongest | +0.003 |
smartest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
om | -0.005 |
us | -0.005 |
Matt | -0.004 |
ill | -0.004 |
Token | without |
Token ID | 1231 |
Feature activation | +1.49e-03 |
Pos logit contributions | |
ores | +0.002 |
om | +0.002 |
Matt | +0.002 |
us | +0.002 |
int | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | asking |
Token ID | 4737 |
Feature activation | +2.29e-03 |
Pos logit contributions | |
nam | +0.003 |
Deal | +0.003 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.002 |
ill | -0.002 |
om | -0.002 |
ork | -0.002 |
Matt | -0.002 |
Token | first |
Token ID | 717 |
Feature activation | +1.93e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
ill | -0.003 |
ubs | -0.003 |
Token | reward |
Token ID | 6721 |
Feature activation | +5.84e-03 |
Pos logit contributions | |
ores | +0.007 |
us | +0.006 |
om | +0.006 |
ubs | +0.006 |
uts | +0.006 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.004 |
simplest | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.008 |
om | -0.007 |
Matt | -0.007 |
ubs | -0.007 |
anging | -0.007 |
Token | It |
Token ID | 632 |
Feature activation | +1.66e-04 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
Sorry | +0.005 |
guys | +0.005 |
Really | +0.004 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
ubs | -0.004 |
om | -0.004 |
anging | -0.004 |
Token | was |
Token ID | 373 |
Feature activation | +3.35e-03 |
Pos logit contributions | |
Deal | +0.000 |
nam | +0.000 |
guys | +0.000 |
smartest | +0.000 |
strongest | +0.000 |
Neg logit contributions | |
ores | -0.000 |
us | -0.000 |
ubs | -0.000 |
om | -0.000 |
Matt | -0.000 |
Token | ch |
Token ID | 442 |
Feature activation | +2.93e-04 |
Pos logit contributions | |
nam | +0.005 |
Deal | +0.005 |
smartest | +0.004 |
strongest | +0.004 |
nic | +0.004 |
Neg logit contributions | |
us | -0.005 |
uts | -0.005 |
oing | -0.005 |
s | -0.005 |
acks | -0.005 |
Token | ocol |
Token ID | 4668 |
Feature activation | -2.55e-02 |
Pos logit contributions | |
Deal | +0.000 |
nam | +0.000 |
guys | +0.000 |
smartest | +0.000 |
strongest | +0.000 |
Neg logit contributions | |
ores | -0.000 |
us | -0.000 |
Matt | -0.000 |
Josh | -0.000 |
om | -0.000 |
Token | ates |
Token ID | 689 |
Feature activation | +5.26e-03 |
Pos logit contributions | |
ores | +0.047 |
om | +0.043 |
int | +0.043 |
ubs | +0.043 |
� | +0.043 |
Neg logit contributions | |
Deal | -0.036 |
nam | -0.033 |
guys | -0.026 |
smartest | -0.023 |
simplest | -0.022 |
Token | and |
Token ID | 290 |
Feature activation | -1.75e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
strongest | +0.008 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.006 |
Matt | -0.006 |
Jud | -0.006 |
ubs | -0.006 |
aid | -0.006 |
Token | sweets |
Token ID | 42402 |
Feature activation | +2.18e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.002 |
om | +0.002 |
ill | +0.002 |
ubs | +0.002 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.003 |
guys | -0.003 |
smartest | -0.002 |
strongest | -0.002 |
Token | ! |
Token ID | 0 |
Feature activation | +3.17e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.002 |
om | -0.002 |
us | -0.002 |
ubs | -0.002 |
Matt | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -3.05e-03 |
Pos logit contributions | |
nam | +0.006 |
Deal | +0.005 |
Sorry | +0.005 |
Really | +0.004 |
Please | +0.004 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
ubs | -0.004 |
anging | -0.004 |
itched | -0.004 |
Token | ly |
Token ID | 306 |
Feature activation | +2.53e-03 |
Pos logit contributions | |
ores | +0.002 |
om | +0.002 |
Matt | +0.002 |
aid | +0.002 |
us | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +5.66e-03 |
Pos logit contributions | |
nam | +0.005 |
Deal | +0.005 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
Matt | -0.003 |
ubs | -0.003 |
om | -0.003 |
Token | Jill |
Token ID | 22772 |
Feature activation | -5.19e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
Sorry | +0.008 |
Okay | +0.008 |
Really | +0.007 |
Neg logit contributions | |
us | -0.008 |
ores | -0.007 |
ge | -0.007 |
oing | -0.007 |
itched | -0.007 |
Token | nodded |
Token ID | 14464 |
Feature activation | +4.72e-03 |
Pos logit contributions | |
ores | +0.010 |
us | +0.009 |
ubs | +0.009 |
om | +0.009 |
alks | +0.008 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.007 |
nic | -0.006 |
guys | -0.005 |
Okay | -0.005 |
Token | in |
Token ID | 287 |
Feature activation | +3.67e-04 |
Pos logit contributions | |
nam | +0.009 |
Deal | +0.008 |
guys | +0.007 |
nic | +0.007 |
Please | +0.007 |
Neg logit contributions | |
us | -0.007 |
ubs | -0.006 |
ores | -0.006 |
om | -0.006 |
enn | -0.006 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.53e-02 |
Pos logit contributions | |
nam | +0.000 |
Deal | +0.000 |
simplest | +0.000 |
guys | +0.000 |
matter | +0.000 |
Neg logit contributions | |
us | -0.001 |
om | -0.001 |
uts | -0.001 |
ores | -0.001 |
ork | -0.001 |
Token | ement |
Token ID | 972 |
Feature activation | -8.51e-03 |
Pos logit contributions | |
ores | +0.038 |
om | +0.037 |
� | +0.036 |
us | +0.036 |
ubs | +0.035 |
Neg logit contributions | |
Deal | -0.044 |
nam | -0.038 |
guys | -0.033 |
nic | -0.030 |
Fine | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | +1.50e-03 |
Pos logit contributions | |
ores | +0.014 |
irs | +0.014 |
Matt | +0.014 |
izz | +0.013 |
us | +0.013 |
Neg logit contributions | |
nam | -0.012 |
Deal | -0.011 |
cheeks | -0.010 |
songs | -0.009 |
guys | -0.009 |
Token | |
Token ID | 220 |
Feature activation | -2.79e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
Sorry | +0.002 |
Really | +0.002 |
Okay | +0.002 |
Neg logit contributions | |
us | -0.002 |
ge | -0.002 |
ores | -0.002 |
ck | -0.002 |
ching | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -6.63e-04 |
Pos logit contributions | |
product | +0.004 |
ge | +0.004 |
oing | +0.004 |
ores | +0.004 |
aster | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.003 |
cient | -0.003 |
Sorry | -0.003 |
asure | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.99e-03 |
Pos logit contributions | |
ores | +0.001 |
hovering | +0.001 |
ge | +0.001 |
anging | +0.001 |
product | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
Okay | -0.001 |
nam | -0.001 |
OK | -0.001 |
Please | -0.001 |
Token | stopped |
Token ID | 5025 |
Feature activation | -1.44e-02 |
Pos logit contributions | |
ores | +0.009 |
us | +0.009 |
om | +0.008 |
irs | +0.008 |
udge | +0.008 |
Neg logit contributions | |
Deal | -0.005 |
guys | -0.005 |
smartest | -0.004 |
nam | -0.004 |
strongest | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | -3.98e-03 |
Pos logit contributions | |
ores | +0.023 |
ork | +0.022 |
ata | +0.022 |
us | +0.021 |
old | +0.021 |
Neg logit contributions | |
nam | -0.020 |
Deal | -0.019 |
smartest | -0.018 |
guys | -0.017 |
strongest | -0.017 |
Token | looked |
Token ID | 3114 |
Feature activation | +1.24e-03 |
Pos logit contributions | |
ubs | +0.006 |
om | +0.006 |
us | +0.006 |
uts | +0.006 |
ores | +0.006 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
nic | -0.005 |
smartest | -0.005 |
Token | around |
Token ID | 1088 |
Feature activation | -2.92e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.002 |
smartest | +0.002 |
nic | +0.002 |
Neg logit contributions | |
us | -0.002 |
uts | -0.002 |
om | -0.002 |
Matt | -0.002 |
ores | -0.002 |
Token | in |
Token ID | 287 |
Feature activation | -3.15e-04 |
Pos logit contributions | |
uts | +0.005 |
us | +0.005 |
ubs | +0.005 |
ores | +0.005 |
om | +0.005 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.004 |
smartest | -0.003 |
wind | -0.003 |
Token | amaz |
Token ID | 40642 |
Feature activation | -2.52e-02 |
Pos logit contributions | |
uts | +0.001 |
us | +0.001 |
om | +0.000 |
ores | +0.000 |
oing | +0.000 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.000 |
smartest | -0.000 |
simplest | -0.000 |
matter | -0.000 |
Token | ement |
Token ID | 972 |
Feature activation | -8.87e-03 |
Pos logit contributions | |
ores | +0.037 |
om | +0.036 |
� | +0.035 |
us | +0.035 |
ine | +0.034 |
Neg logit contributions | |
Deal | -0.044 |
nam | -0.038 |
guys | -0.035 |
smartest | -0.031 |
nic | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | +3.12e-03 |
Pos logit contributions | |
ores | +0.014 |
irs | +0.013 |
us | +0.013 |
Jud | +0.013 |
Matt | +0.013 |
Neg logit contributions | |
nam | -0.012 |
Deal | -0.011 |
guys | -0.010 |
cheeks | -0.010 |
songs | -0.009 |
Token | He |
Token ID | 679 |
Feature activation | +5.52e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
Really | +0.004 |
Neg logit contributions | |
us | -0.004 |
ores | -0.004 |
ubs | -0.004 |
om | -0.004 |
itched | -0.004 |
Token | had |
Token ID | 550 |
Feature activation | -4.72e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.006 |
smartest | +0.006 |
nic | +0.006 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
ubs | -0.009 |
uts | -0.009 |
om | -0.009 |
Token | just |
Token ID | 655 |
Feature activation | -2.76e-03 |
Pos logit contributions | |
ores | +0.009 |
us | +0.009 |
oing | +0.008 |
om | +0.008 |
udge | +0.008 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
guys | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | -8.01e-03 |
Pos logit contributions | |
Deal | +0.018 |
nam | +0.017 |
guys | +0.016 |
smartest | +0.015 |
simplest | +0.015 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
Matt | -0.007 |
om | -0.007 |
int | -0.007 |
Token | not |
Token ID | 407 |
Feature activation | +4.39e-03 |
Pos logit contributions | |
ores | +0.012 |
us | +0.012 |
om | +0.012 |
ill | +0.011 |
ubs | +0.011 |
Neg logit contributions | |
Deal | -0.014 |
nam | -0.014 |
guys | -0.011 |
smartest | -0.011 |
simplest | -0.010 |
Token | touch |
Token ID | 3638 |
Feature activation | +1.17e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.006 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
om | -0.006 |
ill | -0.006 |
ubs | -0.006 |
Token | things |
Token ID | 1243 |
Feature activation | -7.23e-04 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
Matt | -0.002 |
om | -0.002 |
ill | -0.002 |
Token | that |
Token ID | 326 |
Feature activation | -8.51e-03 |
Pos logit contributions | |
Matt | +0.001 |
om | +0.001 |
ores | +0.001 |
us | +0.001 |
ill | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | aren |
Token ID | 3588 |
Feature activation | -2.51e-02 |
Pos logit contributions | |
ores | +0.015 |
us | +0.014 |
om | +0.014 |
ubs | +0.014 |
ill | +0.014 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
guys | -0.010 |
smartest | -0.009 |
strongest | -0.009 |
Token | 't |
Token ID | 470 |
Feature activation | +1.38e-03 |
Pos logit contributions | |
om | +0.045 |
ores | +0.044 |
us | +0.044 |
oing | +0.043 |
aid | +0.042 |
Neg logit contributions | |
Deal | -0.030 |
nam | -0.027 |
guys | -0.026 |
smartest | -0.024 |
strongest | -0.023 |
Token | hers |
Token ID | 25144 |
Feature activation | -2.70e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
Matt | -0.002 |
ill | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -3.16e-03 |
Pos logit contributions | |
ores | +0.004 |
Matt | +0.003 |
om | +0.003 |
izzle | +0.003 |
us | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
Token | From |
Token ID | 3574 |
Feature activation | -6.76e-04 |
Pos logit contributions | |
us | +0.004 |
ores | +0.004 |
om | +0.004 |
itched | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
Sorry | -0.005 |
Really | -0.005 |
simplest | -0.005 |
Token | that |
Token ID | 326 |
Feature activation | -4.10e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | shouldn |
Token ID | 6584 |
Feature activation | -7.48e-03 |
Pos logit contributions | |
ores | +0.017 |
ubs | +0.016 |
om | +0.016 |
us | +0.016 |
ill | +0.016 |
Neg logit contributions | |
Deal | -0.014 |
nam | -0.013 |
guys | -0.011 |
smartest | -0.010 |
strongest | -0.010 |
Token | 't |
Token ID | 470 |
Feature activation | +9.85e-04 |
Pos logit contributions | |
ores | +0.013 |
om | +0.012 |
int | +0.012 |
rou | +0.012 |
oing | +0.012 |
Neg logit contributions | |
Deal | -0.010 |
guys | -0.010 |
ha | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
Token | touch |
Token ID | 3638 |
Feature activation | +2.85e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
om | -0.002 |
us | -0.002 |
Matt | -0.001 |
int | -0.001 |
Token | things |
Token ID | 1243 |
Feature activation | -3.18e-04 |
Pos logit contributions | |
nam | +0.006 |
Deal | +0.006 |
guys | +0.005 |
strongest | +0.005 |
smartest | +0.005 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
anging | -0.003 |
ill | -0.003 |
Token | that |
Token ID | 326 |
Feature activation | -6.66e-03 |
Pos logit contributions | |
Matt | +0.000 |
om | +0.000 |
ores | +0.000 |
Jud | +0.000 |
itched | +0.000 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.000 |
strongest | -0.000 |
smartest | -0.000 |
Token | aren |
Token ID | 3588 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
ores | +0.010 |
us | +0.010 |
om | +0.010 |
ubs | +0.009 |
ill | +0.009 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | +9.73e-04 |
Pos logit contributions | |
ores | +0.047 |
om | +0.047 |
oing | +0.046 |
udge | +0.046 |
aid | +0.044 |
Neg logit contributions | |
Deal | -0.026 |
guys | -0.025 |
nam | -0.024 |
brav | -0.023 |
strongest | -0.023 |
Token | his |
Token ID | 465 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
strongest | +0.001 |
smartest | +0.001 |
Neg logit contributions | |
om | -0.002 |
ores | -0.002 |
Matt | -0.002 |
itched | -0.002 |
acks | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -4.97e-03 |
Pos logit contributions | |
ores | +0.021 |
us | +0.020 |
Matt | +0.019 |
ill | +0.019 |
izzle | +0.019 |
Neg logit contributions | |
Deal | -0.018 |
nam | -0.017 |
guys | -0.015 |
smartest | -0.014 |
strongest | -0.013 |
Token | His |
Token ID | 2399 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
ores | +0.007 |
us | +0.007 |
ubs | +0.007 |
itched | +0.007 |
om | +0.007 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.008 |
Sorry | -0.007 |
Really | -0.007 |
Okay | -0.006 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.003 |
ill | +0.003 |
ubs | +0.003 |
anging | +0.003 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
smartest | -0.002 |
simplest | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | -4.80e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.002 |
strongest | +0.002 |
smartest | +0.002 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
anging | -0.001 |
itched | -0.001 |
Token | ship |
Token ID | 4074 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
ores | +0.008 |
ill | +0.008 |
us | +0.008 |
ubs | +0.008 |
uts | +0.007 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
Token | had |
Token ID | 550 |
Feature activation | -2.28e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.003 |
ubs | +0.003 |
ill | +0.002 |
om | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
guys | -0.002 |
nam | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | wrecked |
Token ID | 44770 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
ill | +0.004 |
int | +0.004 |
acks | +0.003 |
Neg logit contributions | |
nam | -0.003 |
guys | -0.003 |
Deal | -0.003 |
strongest | -0.003 |
smartest | -0.003 |
Token | long |
Token ID | 890 |
Feature activation | -6.44e-03 |
Pos logit contributions | |
ores | +0.009 |
uts | +0.008 |
anging | +0.008 |
us | +0.008 |
ill | +0.008 |
Neg logit contributions | |
nam | -0.009 |
guys | -0.008 |
Deal | -0.007 |
strongest | -0.006 |
fart | -0.006 |
Token | ago |
Token ID | 2084 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
ores | +0.010 |
us | +0.009 |
ill | +0.009 |
Matt | +0.008 |
uts | +0.008 |
Neg logit contributions | |
nam | -0.011 |
guys | -0.010 |
Deal | -0.010 |
simplest | -0.009 |
strongest | -0.009 |
Token | , |
Token ID | 11 |
Feature activation | +4.09e-03 |
Pos logit contributions | |
ores | +0.034 |
us | +0.030 |
int | +0.028 |
irs | +0.028 |
acks | +0.027 |
Neg logit contributions | |
nam | -0.047 |
Deal | -0.046 |
guys | -0.041 |
smartest | -0.035 |
games | -0.035 |
Token | and |
Token ID | 290 |
Feature activation | -7.22e-04 |
Pos logit contributions | |
nam | +0.007 |
Deal | +0.007 |
guys | +0.006 |
strongest | +0.006 |
smartest | +0.006 |
Neg logit contributions | |
us | -0.006 |
ores | -0.006 |
om | -0.006 |
acks | -0.006 |
irs | -0.005 |
Token | now |
Token ID | 783 |
Feature activation | -2.90e-03 |
Pos logit contributions | |
ores | +0.001 |
om | +0.001 |
us | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
nam | -0.002 |
Deal | -0.002 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | -8.85e-03 |
Pos logit contributions | |
om | +0.003 |
ores | +0.003 |
us | +0.003 |
udge | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.006 |
guys | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
Token | was |
Token ID | 373 |
Feature activation | -3.34e-04 |
Pos logit contributions | |
ores | +0.015 |
ubs | +0.014 |
us | +0.014 |
om | +0.014 |
ill | +0.014 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
guys | -0.012 |
smartest | -0.011 |
strongest | -0.011 |
Token | not |
Token ID | 407 |
Feature activation | +3.06e-03 |
Pos logit contributions | |
om | +0.026 |
ores | +0.025 |
us | +0.025 |
anging | +0.024 |
oing | +0.024 |
Neg logit contributions | |
Deal | -0.017 |
nam | -0.013 |
guys | -0.012 |
simplest | -0.011 |
smartest | -0.010 |
Token | eat |
Token ID | 4483 |
Feature activation | -9.61e-04 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
ill | -0.005 |
ubs | -0.005 |
Token | too |
Token ID | 1165 |
Feature activation | +9.63e-04 |
Pos logit contributions | |
ores | +0.001 |
Matt | +0.001 |
anging | +0.001 |
om | +0.001 |
us | +0.001 |
Neg logit contributions | |
nam | -0.002 |
Deal | -0.002 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | many |
Token ID | 867 |
Feature activation | -2.82e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.001 |
simplest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
Matt | -0.001 |
ores | -0.001 |
ill | -0.001 |
Matt | -0.001 |
int | -0.001 |
Token | ch |
Token ID | 442 |
Feature activation | -7.06e-03 |
Pos logit contributions | |
ores | +0.005 |
us | +0.004 |
om | +0.004 |
ill | +0.004 |
ubs | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
Token | ocol |
Token ID | 4668 |
Feature activation | -2.50e-02 |
Pos logit contributions | |
� | +0.010 |
Matt | +0.010 |
ores | +0.010 |
Josh | +0.009 |
Matt | +0.009 |
Neg logit contributions | |
nam | -0.012 |
Deal | -0.012 |
guys | -0.010 |
smartest | -0.009 |
simplest | -0.009 |
Token | ates |
Token ID | 689 |
Feature activation | +7.23e-03 |
Pos logit contributions | |
ores | +0.044 |
om | +0.041 |
us | +0.040 |
ubs | +0.040 |
int | +0.040 |
Neg logit contributions | |
Deal | -0.038 |
nam | -0.035 |
guys | -0.028 |
smartest | -0.025 |
simplest | -0.024 |
Token | and |
Token ID | 290 |
Feature activation | -4.99e-03 |
Pos logit contributions | |
nam | +0.013 |
Deal | +0.013 |
guys | +0.011 |
strongest | +0.010 |
smartest | +0.010 |
Neg logit contributions | |
Matt | -0.010 |
ores | -0.009 |
Jud | -0.009 |
aid | -0.009 |
om | -0.009 |
Token | his |
Token ID | 465 |
Feature activation | -9.03e-03 |
Pos logit contributions | |
ores | +0.007 |
us | +0.007 |
om | +0.007 |
ill | +0.007 |
Matt | +0.007 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.009 |
guys | -0.007 |
smartest | -0.007 |
strongest | -0.007 |
Token | friend |
Token ID | 1545 |
Feature activation | -2.54e-03 |
Pos logit contributions | |
ores | +0.015 |
us | +0.014 |
om | +0.014 |
ubs | +0.014 |
ill | +0.014 |
Neg logit contributions | |
Deal | -0.014 |
nam | -0.013 |
guys | -0.011 |
smartest | -0.010 |
strongest | -0.010 |
Token | learned |
Token ID | 4499 |
Feature activation | -4.27e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
ubs | +0.004 |
om | +0.004 |
ill | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +7.58e-04 |
Pos logit contributions | |
us | +0.010 |
irs | +0.010 |
ubs | +0.010 |
ores | +0.010 |
om | +0.009 |
Neg logit contributions | |
Deal | -0.014 |
nam | -0.013 |
smartest | -0.011 |
guys | -0.011 |
strongest | -0.011 |
Token | Flowers |
Token ID | 30036 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
smartest | +0.001 |
guys | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
us | -0.001 |
ores | -0.001 |
om | -0.001 |
ill | -0.001 |
ubs | -0.001 |
Token | of |
Token ID | 286 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
guys | +0.006 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
us | -0.007 |
ores | -0.007 |
Matt | -0.006 |
om | -0.006 |
ubs | -0.006 |
Token | all |
Token ID | 477 |
Feature activation | +1.08e-03 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
uts | +0.002 |
anging | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
smartest | -0.002 |
simplest | -0.002 |
Token | colors |
Token ID | 7577 |
Feature activation | +2.20e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
smartest | +0.001 |
strongest | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
us | -0.002 |
ork | -0.002 |
ores | -0.002 |
aid | -0.002 |
Matt | -0.002 |
Token | filled |
Token ID | 5901 |
Feature activation | -2.49e-02 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
aid | -0.003 |
us | -0.003 |
ores | -0.003 |
Matt | -0.003 |
ork | -0.003 |
Token | the |
Token ID | 262 |
Feature activation | +2.10e-03 |
Pos logit contributions | |
om | +0.036 |
us | +0.036 |
ores | +0.036 |
orse | +0.035 |
uts | +0.035 |
Neg logit contributions | |
nam | -0.042 |
Deal | -0.041 |
guys | -0.035 |
songs | -0.031 |
games | -0.031 |
Token | space |
Token ID | 2272 |
Feature activation | -8.57e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.002 |
Sorry | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ubs | -0.003 |
� | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +3.05e-03 |
Pos logit contributions | |
us | +0.012 |
Matt | +0.011 |
ores | +0.011 |
Dan | +0.011 |
David | +0.010 |
Neg logit contributions | |
nam | -0.015 |
Deal | -0.015 |
guys | -0.013 |
strongest | -0.013 |
smartest | -0.013 |
Token | Suddenly |
Token ID | 24975 |
Feature activation | -2.99e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
simplest | +0.004 |
Neg logit contributions | |
us | -0.004 |
ores | -0.004 |
om | -0.004 |
ill | -0.004 |
ank | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | -2.44e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
ubs | +0.004 |
uts | +0.004 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.005 |
guys | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
Token | She |
Token ID | 1375 |
Feature activation | +4.90e-03 |
Pos logit contributions | |
us | +0.000 |
ores | +0.000 |
om | +0.000 |
ubs | +0.000 |
ine | +0.000 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.000 |
Token | says |
Token ID | 1139 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.006 |
guys | +0.006 |
nic | +0.005 |
smartest | +0.005 |
Neg logit contributions | |
ores | -0.009 |
us | -0.009 |
ubs | -0.008 |
ill | -0.008 |
uts | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | +2.70e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | " |
Token ID | 366 |
Feature activation | +5.81e-04 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
cient | +0.004 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
ubs | -0.003 |
om | -0.003 |
ill | -0.003 |
Token | Tom |
Token ID | 13787 |
Feature activation | -4.67e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.15e-02 |
Pos logit contributions | |
ores | +0.007 |
us | +0.006 |
int | +0.006 |
ubs | +0.006 |
Matt | +0.006 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.008 |
guys | -0.007 |
smartest | -0.007 |
strongest | -0.007 |
Token | stop |
Token ID | 2245 |
Feature activation | +4.22e-04 |
Pos logit contributions | |
Deal | +0.019 |
nam | +0.017 |
guys | +0.014 |
smartest | +0.013 |
simplest | +0.013 |
Neg logit contributions | |
ores | -0.019 |
om | -0.018 |
us | -0.018 |
ill | -0.017 |
� | -0.017 |
Token | it |
Token ID | 340 |
Feature activation | +3.15e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
Sorry | +0.001 |
smartest | +0.001 |
Neg logit contributions | |
ork | -0.001 |
us | -0.001 |
ores | -0.001 |
uts | -0.001 |
ill | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -6.22e-04 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
Matt | -0.003 |
om | -0.003 |
ubs | -0.003 |
Token | That |
Token ID | 1320 |
Feature activation | -9.19e-03 |
Pos logit contributions | |
ores | +0.001 |
om | +0.001 |
us | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | is |
Token ID | 318 |
Feature activation | +1.19e-03 |
Pos logit contributions | |
ores | +0.015 |
us | +0.015 |
ubs | +0.014 |
ill | +0.014 |
uts | +0.014 |
Neg logit contributions | |
Deal | -0.014 |
guys | -0.012 |
nam | -0.012 |
smartest | -0.011 |
strongest | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -5.39e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.000 |
strongest | +0.000 |
smartest | +0.000 |
Neg logit contributions | |
us | -0.001 |
om | -0.001 |
ork | -0.001 |
itched | -0.001 |
irs | -0.001 |
Token | they |
Token ID | 484 |
Feature activation | -5.37e-04 |
Pos logit contributions | |
us | +0.009 |
om | +0.009 |
ores | +0.008 |
ubs | +0.008 |
anging | +0.008 |
Neg logit contributions | |
nam | -0.009 |
Deal | -0.009 |
guys | -0.007 |
smartest | -0.007 |
strongest | -0.007 |
Token | had |
Token ID | 550 |
Feature activation | -5.54e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | -1.19e-04 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
ill | +0.006 |
om | +0.005 |
anging | +0.005 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.011 |
guys | -0.010 |
smartest | -0.009 |
simplest | -0.009 |
Token | stay |
Token ID | 2652 |
Feature activation | +1.13e-03 |
Pos logit contributions | |
us | +0.000 |
om | +0.000 |
ores | +0.000 |
anging | +0.000 |
uts | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
guys | -0.000 |
smartest | -0.000 |
strongest | -0.000 |
Token | close |
Token ID | 1969 |
Feature activation | +1.03e-02 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
nic | +0.001 |
Neg logit contributions | |
uts | -0.002 |
ill | -0.002 |
om | -0.002 |
ores | -0.002 |
Matt | -0.002 |
Token | to |
Token ID | 284 |
Feature activation | -1.58e-03 |
Pos logit contributions | |
Deal | +0.018 |
nam | +0.018 |
guys | +0.015 |
smartest | +0.014 |
strongest | +0.014 |
Neg logit contributions | |
ores | -0.013 |
ork | -0.013 |
Matt | -0.013 |
acks | -0.013 |
on | -0.012 |
Token | him |
Token ID | 683 |
Feature activation | +2.56e-03 |
Pos logit contributions | |
om | +0.002 |
uts | +0.002 |
us | +0.002 |
ores | +0.002 |
anging | +0.002 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.003 |
guys | -0.003 |
smartest | -0.002 |
strongest | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +3.74e-04 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.005 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.003 |
Matt | -0.003 |
us | -0.003 |
ubs | -0.003 |
om | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
Sorry | +0.001 |
Really | +0.001 |
guys | +0.001 |
Neg logit contributions | |
anging | -0.000 |
ge | -0.000 |
ake | -0.000 |
ores | -0.000 |
brewing | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +3.67e-04 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
OK | +0.005 |
Okay | +0.005 |
lived | +0.005 |
Neg logit contributions | |
anging | -0.006 |
uts | -0.005 |
ores | -0.005 |
ill | -0.005 |
hovering | -0.005 |
Token | them |
Token ID | 606 |
Feature activation | +1.05e-03 |
Pos logit contributions | |
ores | +0.012 |
ill | +0.011 |
us | +0.011 |
anging | +0.011 |
acks | +0.011 |
Neg logit contributions | |
nam | -0.010 |
Deal | -0.009 |
guys | -0.008 |
smartest | -0.007 |
nic | -0.007 |
Token | . |
Token ID | 13 |
Feature activation | +9.42e-04 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
nic | +0.002 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
Matt | -0.001 |
ubs | -0.001 |
acks | -0.001 |
Token | Lily |
Token ID | 20037 |
Feature activation | -7.25e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
simplest | +0.002 |
Neg logit contributions | |
us | -0.001 |
ores | -0.001 |
om | -0.001 |
ubs | -0.001 |
Matt | -0.001 |
Token | loved |
Token ID | 6151 |
Feature activation | -3.58e-03 |
Pos logit contributions | |
ores | +0.012 |
us | +0.011 |
om | +0.011 |
ill | +0.011 |
ubs | +0.011 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.011 |
guys | -0.010 |
smartest | -0.009 |
strongest | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -1.81e-04 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.003 |
ill | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.008 |
guys | -0.007 |
smartest | -0.006 |
strongest | -0.006 |
Token | count |
Token ID | 954 |
Feature activation | +9.97e-03 |
Pos logit contributions | |
ores | +0.000 |
om | +0.000 |
us | +0.000 |
ubs | +0.000 |
ill | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
guys | -0.000 |
smartest | -0.000 |
simplest | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | -8.74e-04 |
Pos logit contributions | |
nam | +0.018 |
Deal | +0.017 |
guys | +0.015 |
smartest | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.015 |
us | -0.013 |
ill | -0.013 |
acks | -0.013 |
anging | -0.013 |
Token | bags |
Token ID | 11668 |
Feature activation | +6.98e-03 |
Pos logit contributions | |
ores | +0.001 |
om | +0.001 |
us | +0.001 |
ubs | +0.001 |
s | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
Sorry | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -4.65e-03 |
Pos logit contributions | |
nam | +0.013 |
Deal | +0.013 |
guys | +0.010 |
smartest | +0.010 |
strongest | +0.010 |
Neg logit contributions | |
us | -0.010 |
ores | -0.009 |
Matt | -0.009 |
ez | -0.009 |
itched | -0.009 |
Token | " |
Token ID | 366 |
Feature activation | +5.50e-03 |
Pos logit contributions | |
us | +0.005 |
ores | +0.005 |
anging | +0.004 |
ge | +0.004 |
Matt | +0.004 |
Neg logit contributions | |
Deal | -0.010 |
nam | -0.009 |
guys | -0.008 |
nic | -0.008 |
smartest | -0.008 |
Token | One |
Token ID | 3198 |
Feature activation | +5.55e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.008 |
cient | +0.008 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.007 |
� | -0.007 |
om | -0.007 |
Matt | -0.007 |
us | -0.007 |
Token | asked |
Token ID | 1965 |
Feature activation | +2.94e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.007 |
guys | +0.006 |
nic | +0.005 |
smartest | +0.005 |
Neg logit contributions | |
ores | -0.009 |
us | -0.008 |
ubs | -0.008 |
om | -0.008 |
irs | -0.008 |
Token | : |
Token ID | 25 |
Feature activation | -2.61e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.004 |
simplest | +0.004 |
Neg logit contributions | |
ores | -0.004 |
om | -0.003 |
us | -0.003 |
ubs | -0.003 |
uts | -0.003 |
Token | " |
Token ID | 366 |
Feature activation | +6.65e-03 |
Pos logit contributions | |
ubs | +0.004 |
ores | +0.004 |
us | +0.004 |
acks | +0.004 |
old | +0.004 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
Really | -0.003 |
Sorry | -0.003 |
chard | -0.003 |
Token | What |
Token ID | 2061 |
Feature activation | +4.15e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.010 |
us | -0.010 |
om | -0.009 |
ill | -0.009 |
ubs | -0.009 |
Token | is |
Token ID | 318 |
Feature activation | -2.54e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.005 |
om | -0.005 |
� | -0.005 |
us | -0.005 |
ill | -0.004 |
Token | that |
Token ID | 326 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
ubs | +0.001 |
� | +0.001 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.005 |
simplest | -0.005 |
Token | big |
Token ID | 1263 |
Feature activation | +4.03e-03 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.015 |
guys | +0.013 |
smartest | +0.012 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.022 |
us | -0.022 |
om | -0.021 |
ill | -0.021 |
ubs | -0.021 |
Token | thing |
Token ID | 1517 |
Feature activation | +2.57e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.007 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
om | -0.006 |
ubs | -0.006 |
ill | -0.006 |
Token | ?". |
Token ID | 43634 |
Feature activation | -4.91e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.004 |
us | -0.004 |
om | -0.004 |
ubs | -0.004 |
ill | -0.004 |
Token | |
Token ID | 220 |
Feature activation | -5.96e-03 |
Pos logit contributions | |
ores | +0.004 |
us | +0.004 |
om | +0.004 |
ubs | +0.004 |
ill | +0.004 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.009 |
Sorry | -0.009 |
smartest | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -3.91e-03 |
Pos logit contributions | |
product | +0.008 |
bones | +0.008 |
ge | +0.008 |
oing | +0.008 |
ores | +0.008 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.006 |
cient | -0.006 |
Bug | -0.006 |
Sorry | -0.006 |
Token | who |
Token ID | 508 |
Feature activation | -7.92e-04 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
Matt | -0.003 |
itched | -0.003 |
om | -0.003 |
us | -0.003 |
Token | love |
Token ID | 1842 |
Feature activation | +4.30e-04 |
Pos logit contributions | |
ores | +0.002 |
ill | +0.001 |
Matt | +0.001 |
us | +0.001 |
int | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
cient | -0.001 |
Token | toys |
Token ID | 14958 |
Feature activation | +6.06e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
simplest | +0.001 |
smartest | +0.001 |
Neg logit contributions | |
ores | -0.000 |
itched | -0.000 |
anging | -0.000 |
Matt | -0.000 |
ill | -0.000 |
Token | like |
Token ID | 588 |
Feature activation | +5.37e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.010 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.008 |
Matt | -0.008 |
om | -0.008 |
itched | -0.008 |
int | -0.008 |
Token | you |
Token ID | 345 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.008 |
us | -0.007 |
ill | -0.007 |
Matt | -0.007 |
om | -0.007 |
Token | do |
Token ID | 466 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ill | -0.002 |
ubs | -0.002 |
Token | ." |
Token ID | 526 |
Feature activation | -1.07e-04 |
Pos logit contributions | |
Deal | +0.019 |
nam | +0.018 |
guys | +0.016 |
smartest | +0.013 |
simplest | +0.013 |
Neg logit contributions | |
ores | -0.018 |
ill | -0.017 |
Matt | -0.017 |
us | -0.017 |
om | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | +5.46e-04 |
Pos logit contributions | |
ores | +0.000 |
anging | +0.000 |
ine | +0.000 |
int | +0.000 |
iced | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
Really | -0.000 |
OK | -0.000 |
Please | -0.000 |
Token |
|
Token ID | 198 |
Feature activation | +7.15e-04 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
OK | +0.001 |
Really | +0.001 |
Okay | +0.001 |
Neg logit contributions | |
ores | -0.001 |
anging | -0.001 |
ine | -0.001 |
ill | -0.001 |
int | -0.001 |
Token | S |
Token ID | 50 |
Feature activation | +2.90e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
Okay | +0.001 |
Fine | +0.001 |
OK | +0.001 |
Neg logit contributions | |
ores | -0.001 |
int | -0.001 |
Matt | -0.001 |
anging | -0.001 |
Joe | -0.001 |
Token | ara |
Token ID | 3301 |
Feature activation | -2.22e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
simplest | +0.005 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ubs | -0.003 |
ill | -0.003 |
Token | Lily |
Token ID | 20037 |
Feature activation | -3.83e-04 |
Pos logit contributions | |
us | +0.006 |
om | +0.005 |
ores | +0.005 |
anging | +0.005 |
itched | +0.005 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.005 |
guys | -0.004 |
smartest | -0.003 |
Sorry | -0.003 |
Token | went |
Token ID | 1816 |
Feature activation | +6.65e-04 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
ubs | +0.001 |
om | +0.001 |
uts | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.000 |
smartest | -0.000 |
nic | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | +6.42e-04 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
seeker | +0.001 |
guys | +0.001 |
ha | +0.001 |
Neg logit contributions | |
Matt | -0.001 |
itched | -0.001 |
om | -0.001 |
uts | -0.001 |
ill | -0.001 |
Token | bed |
Token ID | 3996 |
Feature activation | -7.33e-04 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
smartest | +0.001 |
seeker | +0.001 |
Neg logit contributions | |
us | -0.001 |
om | -0.001 |
ores | -0.001 |
uts | -0.001 |
anging | -0.001 |
Token | with |
Token ID | 351 |
Feature activation | -5.48e-04 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
Matt | +0.001 |
irs | +0.001 |
� | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
nic | -0.001 |
smartest | -0.001 |
Token | Snow |
Token ID | 7967 |
Feature activation | +1.79e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | y |
Token ID | 88 |
Feature activation | +3.77e-03 |
Pos logit contributions | |
Deal | +0.003 |
guys | +0.003 |
nam | +0.003 |
cient | +0.002 |
smartest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
ubs | -0.003 |
int | -0.003 |
Matt | -0.003 |
alks | -0.003 |
Token | by |
Token ID | 416 |
Feature activation | -2.45e-05 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.005 |
us | -0.004 |
om | -0.004 |
ubs | -0.004 |
ill | -0.004 |
Token | her |
Token ID | 607 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
us | +0.000 |
ores | +0.000 |
om | +0.000 |
s | +0.000 |
uts | +0.000 |
Neg logit contributions | |
nam | -0.000 |
Deal | -0.000 |
guys | -0.000 |
smartest | -0.000 |
simplest | -0.000 |
Token | side |
Token ID | 1735 |
Feature activation | +4.29e-03 |
Pos logit contributions | |
ores | +0.007 |
us | +0.007 |
om | +0.007 |
ubs | +0.006 |
ill | +0.006 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.04e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
guys | +0.006 |
Neg logit contributions | |
ores | -0.006 |
us | -0.006 |
irs | -0.005 |
Matt | -0.005 |
int | -0.005 |
Token | it |
Token ID | 340 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
ill | +0.000 |
ores | +0.000 |
us | +0.000 |
om | +0.000 |
� | +0.000 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
simplest | -0.001 |
smartest | -0.001 |
Token | so |
Token ID | 523 |
Feature activation | -6.14e-03 |
Pos logit contributions | |
Deal | +0.023 |
nam | +0.021 |
guys | +0.018 |
Sorry | +0.018 |
Fine | +0.017 |
Neg logit contributions | |
ores | -0.013 |
� | -0.013 |
om | -0.013 |
us | -0.013 |
and | -0.012 |
Token | much |
Token ID | 881 |
Feature activation | +5.86e-04 |
Pos logit contributions | |
ores | +0.005 |
us | +0.004 |
om | +0.004 |
ill | +0.004 |
ubs | +0.004 |
Neg logit contributions | |
Deal | -0.015 |
nam | -0.015 |
guys | -0.013 |
smartest | -0.012 |
strongest | -0.012 |
Token | that |
Token ID | 326 |
Feature activation | -4.21e-03 |
Pos logit contributions | |
Deal | +0.001 |
guys | +0.001 |
nam | +0.001 |
strongest | +0.001 |
songs | +0.001 |
Neg logit contributions | |
om | -0.001 |
itched | -0.001 |
ill | -0.001 |
Matt | -0.001 |
ores | -0.001 |
Token | he |
Token ID | 339 |
Feature activation | +2.70e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.002 |
om | +0.002 |
ubs | +0.002 |
ill | +0.002 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.010 |
smartest | -0.009 |
strongest | -0.009 |
Token | would |
Token ID | 561 |
Feature activation | +2.20e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
smartest | +0.004 |
guys | +0.004 |
Sorry | +0.004 |
Neg logit contributions | |
us | -0.004 |
ores | -0.004 |
� | -0.004 |
om | -0.004 |
ine | -0.004 |
Token | always |
Token ID | 1464 |
Feature activation | +6.79e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
guys | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
us | -0.004 |
ores | -0.004 |
om | -0.004 |
Matt | -0.004 |
ill | -0.004 |
Token | try |
Token ID | 1949 |
Feature activation | +1.41e-02 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.011 |
guys | +0.009 |
smartest | +0.008 |
strongest | +0.008 |
Neg logit contributions | |
ores | -0.011 |
us | -0.010 |
om | -0.010 |
ill | -0.010 |
ubs | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | +6.27e-03 |
Pos logit contributions | |
nam | +0.022 |
guys | +0.022 |
songs | +0.018 |
Deal | +0.017 |
fart | +0.017 |
Neg logit contributions | |
ores | -0.022 |
old | -0.020 |
izz | -0.020 |
ill | -0.020 |
Matt | -0.020 |
Token | zip |
Token ID | 19974 |
Feature activation | +1.47e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.011 |
om | -0.011 |
us | -0.011 |
uts | -0.011 |
ill | -0.010 |
Token | into |
Token ID | 656 |
Feature activation | -2.54e-03 |
Pos logit contributions | |
guys | +0.003 |
nam | +0.003 |
Deal | +0.002 |
fart | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
old | -0.002 |
anging | -0.002 |
ucking | -0.002 |
oing | -0.002 |
Matt | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -3.15e-03 |
Pos logit contributions | |
ores | +0.001 |
anging | +0.001 |
int | +0.001 |
product | +0.001 |
hovering | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
cient | -0.002 |
Okay | -0.002 |
Token | The |
Token ID | 464 |
Feature activation | -3.86e-03 |
Pos logit contributions | |
ores | +0.005 |
us | +0.004 |
om | +0.004 |
ill | +0.004 |
ubs | +0.004 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.005 |
guys | -0.004 |
Okay | -0.004 |
Fine | -0.004 |
Token | father |
Token ID | 2988 |
Feature activation | +1.82e-03 |
Pos logit contributions | |
ores | +0.006 |
us | +0.005 |
om | +0.005 |
ubs | +0.005 |
ill | +0.005 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +3.03e-03 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
guys | +0.002 |
smartest | +0.002 |
nic | +0.002 |
Neg logit contributions | |
ores | -0.003 |
ubs | -0.003 |
acks | -0.003 |
uts | -0.003 |
us | -0.003 |
Token | son |
Token ID | 3367 |
Feature activation | -3.74e-03 |
Pos logit contributions | |
nam | +0.007 |
Deal | +0.006 |
guys | +0.006 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.003 |
uts | -0.003 |
us | -0.003 |
ork | -0.003 |
om | -0.003 |
Token | went |
Token ID | 1816 |
Feature activation | -9.87e-04 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
om | +0.006 |
ubs | +0.006 |
uts | +0.005 |
Neg logit contributions | |
Deal | -0.006 |
nam | -0.006 |
guys | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
Token | on |
Token ID | 319 |
Feature activation | -4.68e-03 |
Pos logit contributions | |
Matt | +0.002 |
itched | +0.001 |
ill | +0.001 |
uts | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
seeker | -0.001 |
nic | -0.001 |
Token | their |
Token ID | 511 |
Feature activation | +8.71e-04 |
Pos logit contributions | |
ubs | +0.007 |
us | +0.007 |
uts | +0.007 |
ill | +0.007 |
ores | +0.007 |
Neg logit contributions | |
nam | -0.008 |
Deal | -0.008 |
guys | -0.007 |
simplest | -0.006 |
games | -0.006 |
Token | trip |
Token ID | 5296 |
Feature activation | -1.78e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
Okay | +0.001 |
Fine | +0.001 |
Neg logit contributions | |
� | -0.001 |
s | -0.001 |
Josh | -0.001 |
aid | -0.001 |
om | -0.001 |
Token | and |
Token ID | 290 |
Feature activation | -5.24e-03 |
Pos logit contributions | |
ores | +0.002 |
irs | +0.002 |
itched | +0.002 |
ubs | +0.002 |
us | +0.002 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
Token | ended |
Token ID | 4444 |
Feature activation | -4.92e-03 |
Pos logit contributions | |
ores | +0.008 |
us | +0.008 |
ubs | +0.008 |
om | +0.008 |
uts | +0.008 |
Neg logit contributions | |
nam | -0.008 |
Deal | -0.008 |
guys | -0.007 |
smartest | -0.006 |
strongest | -0.006 |
Token | heart |
Token ID | 2612 |
Feature activation | +1.26e-02 |
Pos logit contributions | |
Deal | +0.003 |
nam | +0.003 |
guys | +0.002 |
smartest | +0.002 |
simplest | +0.002 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
ubs | -0.003 |
ill | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +2.49e-03 |
Pos logit contributions | |
nam | +0.026 |
Deal | +0.025 |
guys | +0.022 |
smartest | +0.021 |
strongest | +0.020 |
Neg logit contributions | |
ores | -0.015 |
us | -0.014 |
Matt | -0.013 |
om | -0.013 |
anging | -0.013 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +8.25e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
Sorry | +0.004 |
Really | +0.003 |
smartest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.003 |
itched | -0.003 |
ubs | -0.003 |
Token | S |
Token ID | 50 |
Feature activation | +6.79e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.013 |
guys | +0.012 |
smartest | +0.011 |
simplest | +0.011 |
Neg logit contributions | |
ores | -0.011 |
int | -0.010 |
ubs | -0.010 |
anging | -0.010 |
ine | -0.010 |
Token | ara |
Token ID | 3301 |
Feature activation | +5.08e-03 |
Pos logit contributions | |
Deal | +0.011 |
nam | +0.010 |
cient | +0.009 |
guys | +0.008 |
nic | +0.008 |
Neg logit contributions | |
ores | -0.010 |
uts | -0.010 |
ubs | -0.009 |
udge | -0.009 |
anging | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | +4.70e-03 |
Pos logit contributions | |
Deal | +0.010 |
liked | +0.008 |
lived | +0.008 |
guys | +0.008 |
nam | +0.008 |
Neg logit contributions | |
ores | -0.007 |
int | -0.006 |
irs | -0.006 |
ula | -0.006 |
uts | -0.006 |
Token | Ben |
Token ID | 3932 |
Feature activation | +2.57e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.009 |
Sorry | +0.008 |
smartest | +0.008 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
om | -0.005 |
ubs | -0.005 |
ill | -0.005 |
Token | like |
Token ID | 588 |
Feature activation | -5.99e-05 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.003 |
guys | +0.003 |
smartest | +0.002 |
simplest | +0.002 |
Neg logit contributions | |
ores | -0.005 |
us | -0.005 |
int | -0.004 |
ubs | -0.004 |
om | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | -9.76e-04 |
Pos logit contributions | |
ores | +0.000 |
us | +0.000 |
om | +0.000 |
ill | +0.000 |
ubs | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
guys | -0.000 |
smartest | -0.000 |
strongest | -0.000 |
Token | play |
Token ID | 711 |
Feature activation | +7.79e-03 |
Pos logit contributions | |
us | +0.002 |
ores | +0.002 |
om | +0.002 |
int | +0.002 |
ubs | +0.002 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | with |
Token ID | 351 |
Feature activation | -2.33e-03 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.016 |
smartest | +0.013 |
guys | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
ores | -0.009 |
us | -0.008 |
om | -0.008 |
ubs | -0.008 |
itched | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | +5.18e-03 |
Pos logit contributions | |
Matt | +0.003 |
ubs | +0.003 |
ores | +0.003 |
Dan | +0.003 |
Jud | +0.003 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.003 |
head | -0.003 |
guys | -0.003 |
forth | -0.003 |
Token | hugs |
Token ID | 40657 |
Feature activation | -2.94e-04 |
Pos logit contributions | |
nam | +0.008 |
Deal | +0.008 |
guys | +0.006 |
nic | +0.006 |
Sorry | +0.006 |
Neg logit contributions | |
us | -0.009 |
ill | -0.009 |
ores | -0.009 |
ubs | -0.008 |
ork | -0.008 |
Token | him |
Token ID | 683 |
Feature activation | +3.33e-03 |
Pos logit contributions | |
om | +0.000 |
ores | +0.000 |
anging | +0.000 |
uts | +0.000 |
ork | +0.000 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
songs | -0.000 |
Please | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | -1.02e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.007 |
strongest | +0.006 |
Neg logit contributions | |
ores | -0.003 |
us | -0.003 |
om | -0.002 |
ubs | -0.002 |
ill | -0.002 |
Token | She |
Token ID | 1375 |
Feature activation | +7.98e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ork | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
Sorry | -0.001 |
smartest | -0.001 |
Token | says |
Token ID | 1139 |
Feature activation | +1.49e-04 |
Pos logit contributions | |
Deal | +0.014 |
nam | +0.012 |
guys | +0.011 |
nic | +0.011 |
smartest | +0.010 |
Neg logit contributions | |
us | -0.012 |
ores | -0.012 |
ubs | -0.011 |
ill | -0.011 |
Matt | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | +6.53e-03 |
Pos logit contributions | |
Deal | +0.000 |
nam | +0.000 |
guys | +0.000 |
smartest | +0.000 |
strongest | +0.000 |
Neg logit contributions | |
ores | -0.000 |
us | -0.000 |
om | -0.000 |
ubs | -0.000 |
ill | -0.000 |
Token | " |
Token ID | 366 |
Feature activation | +2.78e-03 |
Pos logit contributions | |
Deal | +0.012 |
nam | +0.012 |
guys | +0.010 |
smartest | +0.009 |
cient | +0.009 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
ubs | -0.008 |
ill | -0.008 |
om | -0.008 |
Token | Thank |
Token ID | 10449 |
Feature activation | +2.48e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.005 |
us | -0.004 |
om | -0.004 |
ill | -0.004 |
� | -0.004 |
Token | you |
Token ID | 345 |
Feature activation | -1.50e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
us | -0.004 |
ores | -0.004 |
� | -0.004 |
s | -0.003 |
ut | -0.003 |
Token | , |
Token ID | 11 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
ores | +0.002 |
us | +0.001 |
om | +0.001 |
ill | +0.001 |
ubs | +0.001 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.003 |
strongest | -0.003 |
Token | very |
Token ID | 845 |
Feature activation | -6.80e-03 |
Pos logit contributions | |
Deal | +0.018 |
nam | +0.017 |
guys | +0.014 |
smartest | +0.013 |
Okay | +0.013 |
Neg logit contributions | |
ores | -0.014 |
us | -0.013 |
� | -0.013 |
om | -0.012 |
int | -0.012 |
Token | sorry |
Token ID | 7926 |
Feature activation | +7.66e-03 |
Pos logit contributions | |
ores | +0.010 |
us | +0.010 |
om | +0.010 |
ubs | +0.009 |
int | +0.009 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.011 |
guys | -0.009 |
smartest | -0.009 |
strongest | -0.008 |
Token | for |
Token ID | 329 |
Feature activation | +1.96e-03 |
Pos logit contributions | |
Deal | +0.015 |
nam | +0.014 |
guys | +0.012 |
smartest | +0.011 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.010 |
us | -0.010 |
Matt | -0.010 |
om | -0.010 |
ill | -0.009 |
Token | him |
Token ID | 683 |
Feature activation | -2.53e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.004 |
guys | +0.004 |
smartest | +0.004 |
strongest | +0.004 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ubs | -0.002 |
ill | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +2.89e-03 |
Pos logit contributions | |
ores | +0.003 |
Matt | +0.003 |
us | +0.003 |
irs | +0.003 |
Dan | +0.003 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.005 |
guys | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
Token | so |
Token ID | 523 |
Feature activation | -1.15e-02 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
us | -0.005 |
ores | -0.005 |
om | -0.005 |
ubs | -0.005 |
ork | -0.005 |
Token | she |
Token ID | 673 |
Feature activation | -6.57e-03 |
Pos logit contributions | |
acks | +0.016 |
ork | +0.016 |
om | +0.016 |
aid | +0.016 |
udge | +0.016 |
Neg logit contributions | |
nam | -0.020 |
Deal | -0.019 |
smartest | -0.015 |
guys | -0.014 |
Sorry | -0.014 |
Token | decided |
Token ID | 3066 |
Feature activation | -2.90e-03 |
Pos logit contributions | |
ores | +0.008 |
us | +0.008 |
om | +0.008 |
� | +0.008 |
ine | +0.008 |
Neg logit contributions | |
Deal | -0.013 |
nam | -0.012 |
guys | -0.010 |
smartest | -0.010 |
strongest | -0.010 |
Token | to |
Token ID | 284 |
Feature activation | -3.41e-03 |
Pos logit contributions | |
om | +0.005 |
ores | +0.004 |
us | +0.004 |
acks | +0.004 |
udge | +0.004 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.004 |
Please | -0.004 |
Okay | -0.004 |
Token | stop |
Token ID | 2245 |
Feature activation | +1.31e-03 |
Pos logit contributions | |
ores | +0.006 |
us | +0.006 |
om | +0.006 |
ubs | +0.005 |
ill | +0.005 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.004 |
smartest | -0.004 |
strongest | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | -6.27e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.002 |
forth | +0.001 |
Please | +0.001 |
Neg logit contributions | |
ork | -0.002 |
ushes | -0.002 |
om | -0.002 |
acks | -0.002 |
ata | -0.002 |
Token | knew |
Token ID | 2993 |
Feature activation | -6.52e-04 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
om | +0.002 |
Matt | +0.002 |
ubs | +0.002 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +8.01e-04 |
Pos logit contributions | |
om | +0.001 |
acks | +0.001 |
ores | +0.001 |
ubs | +0.001 |
oing | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
strongest | -0.001 |
Token | |
Token ID | 220 |
Feature activation | -2.42e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.001 |
guys | +0.001 |
Sorry | +0.001 |
cient | +0.001 |
Neg logit contributions | |
ores | -0.001 |
ubs | -0.001 |
us | -0.001 |
om | -0.001 |
ill | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +5.04e-04 |
Pos logit contributions | |
product | +0.003 |
ine | +0.003 |
ores | +0.003 |
oing | +0.003 |
anging | +0.003 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
cient | -0.003 |
smartest | -0.003 |
Sorry | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | -1.30e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
Fine | +0.001 |
Please | +0.001 |
Okay | +0.001 |
Neg logit contributions | |
ores | -0.001 |
ubs | -0.001 |
om | -0.000 |
ine | -0.000 |
anging | -0.000 |
Token | That |
Token ID | 2504 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
ores | +0.002 |
om | +0.002 |
ill | +0.002 |
ubs | +0.002 |
us | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
Fine | -0.002 |
Okay | -0.002 |
guys | -0.002 |
Token | night |
Token ID | 1755 |
Feature activation | -2.64e-03 |
Pos logit contributions | |
ores | +0.031 |
us | +0.030 |
uts | +0.030 |
ank | +0.030 |
ubs | +0.030 |
Neg logit contributions | |
Deal | -0.022 |
guys | -0.020 |
simplest | -0.019 |
smartest | -0.018 |
strongest | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | -6.05e-03 |
Pos logit contributions | |
ores | +0.004 |
ubs | +0.004 |
ill | +0.004 |
om | +0.003 |
us | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.004 |
guys | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
Token | George |
Token ID | 4502 |
Feature activation | +2.03e-03 |
Pos logit contributions | |
ores | +0.009 |
om | +0.009 |
us | +0.009 |
ubs | +0.009 |
ill | +0.009 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.010 |
guys | -0.009 |
smartest | -0.008 |
strongest | -0.008 |
Token | couldn |
Token ID | 3521 |
Feature activation | -9.44e-03 |
Pos logit contributions | |
Deal | +0.003 |
guys | +0.002 |
nam | +0.002 |
smartest | +0.002 |
strongest | +0.002 |
Neg logit contributions | |
ores | -0.004 |
ubs | -0.003 |
irs | -0.003 |
uts | -0.003 |
om | -0.003 |
Token | 't |
Token ID | 470 |
Feature activation | -4.04e-03 |
Pos logit contributions | |
ubs | +0.019 |
udge | +0.018 |
ores | +0.018 |
om | +0.018 |
ill | +0.017 |
Neg logit contributions | |
Deal | -0.010 |
guys | -0.009 |
Sorry | -0.008 |
brav | -0.007 |
ha | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -1.43e-03 |
Pos logit contributions | |
ores | +0.003 |
us | +0.003 |
om | +0.003 |
ubs | +0.003 |
ill | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.004 |
smartest | -0.004 |
strongest | -0.004 |
Token | " |
Token ID | 366 |
Feature activation | +7.20e-04 |
Pos logit contributions | |
ores | +0.002 |
us | +0.002 |
ubs | +0.002 |
ill | +0.002 |
om | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.003 |
guys | -0.002 |
cient | -0.002 |
smartest | -0.002 |
Token | Okay |
Token ID | 16454 |
Feature activation | +8.86e-03 |
Pos logit contributions | |
Deal | +0.001 |
nam | +0.001 |
guys | +0.001 |
smartest | +0.001 |
simplest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ill | -0.001 |
� | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | -2.00e-03 |
Pos logit contributions | |
Deal | +0.021 |
nam | +0.020 |
guys | +0.017 |
smartest | +0.017 |
simplest | +0.016 |
Neg logit contributions | |
ores | -0.008 |
om | -0.007 |
us | -0.007 |
ill | -0.007 |
� | -0.007 |
Token | but |
Token ID | 475 |
Feature activation | -5.87e-03 |
Pos logit contributions | |
ores | +0.003 |
om | +0.003 |
us | +0.003 |
ill | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.003 |
guys | -0.003 |
smartest | -0.003 |
simplest | -0.003 |
Token | don |
Token ID | 836 |
Feature activation | -1.62e-02 |
Pos logit contributions | |
it | +0.008 |
ores | +0.007 |
� | +0.007 |
Joe | +0.007 |
int | +0.007 |
Neg logit contributions | |
Deal | -0.011 |
nam | -0.011 |
guys | -0.009 |
smartest | -0.008 |
cient | -0.008 |
Token | 't |
Token ID | 470 |
Feature activation | -7.03e-04 |
Pos logit contributions | |
ores | +0.020 |
us | +0.019 |
om | +0.019 |
ill | +0.018 |
ubs | +0.017 |
Neg logit contributions | |
Deal | -0.032 |
nam | -0.030 |
guys | -0.027 |
smartest | -0.025 |
strongest | -0.024 |
Token | forget |
Token ID | 6044 |
Feature activation | +4.91e-03 |
Pos logit contributions | |
ores | +0.001 |
� | +0.001 |
ubs | +0.001 |
om | +0.001 |
us | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.001 |
simplest | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | +1.42e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.010 |
guys | +0.009 |
smartest | +0.008 |
cient | +0.008 |
Neg logit contributions | |
us | -0.005 |
ores | -0.005 |
om | -0.005 |
ill | -0.005 |
udge | -0.005 |
Token | put |
Token ID | 1234 |
Feature activation | -6.21e-03 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.002 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.002 |
us | -0.002 |
om | -0.002 |
ill | -0.002 |
ubs | -0.002 |
Token | your |
Token ID | 534 |
Feature activation | -2.15e-03 |
Pos logit contributions | |
ores | +0.008 |
us | +0.008 |
om | +0.008 |
ill | +0.007 |
ubs | +0.007 |
Neg logit contributions | |
Deal | -0.012 |
nam | -0.012 |
guys | -0.010 |
smartest | -0.009 |
strongest | -0.009 |
Token | cat |
Token ID | 3797 |
Feature activation | -4.60e-03 |
Pos logit contributions | |
ores | +0.006 |
om | +0.006 |
us | +0.006 |
� | +0.006 |
s | +0.006 |
Neg logit contributions | |
Deal | -0.007 |
nam | -0.007 |
guys | -0.006 |
smartest | -0.005 |
strongest | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | -1.22e-03 |
Pos logit contributions | |
Matt | +0.007 |
us | +0.006 |
ores | +0.006 |
Matt | +0.006 |
David | +0.006 |
Neg logit contributions | |
Deal | -0.008 |
nam | -0.008 |
guys | -0.007 |
fart | -0.006 |
games | -0.006 |
Token | their |
Token ID | 511 |
Feature activation | -8.27e-03 |
Pos logit contributions | |
us | +0.002 |
om | +0.001 |
uts | +0.001 |
ores | +0.001 |
anging | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
smartest | -0.002 |
strongest | -0.002 |
Token | home |
Token ID | 1363 |
Feature activation | +2.53e-03 |
Pos logit contributions | |
ores | +0.010 |
om | +0.010 |
us | +0.009 |
aid | +0.009 |
s | +0.009 |
Neg logit contributions | |
Deal | -0.016 |
nam | -0.015 |
guys | -0.013 |
smartest | -0.012 |
strongest | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | -5.44e-03 |
Pos logit contributions | |
Deal | +0.005 |
nam | +0.005 |
guys | +0.004 |
smartest | +0.004 |
chard | +0.004 |
Neg logit contributions | |
us | -0.003 |
Matt | -0.003 |
ores | -0.003 |
irs | -0.003 |
ubs | -0.002 |
Token | give |
Token ID | 1577 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
us | +0.009 |
ores | +0.009 |
om | +0.009 |
ubs | +0.009 |
ill | +0.009 |
Neg logit contributions | |
Deal | -0.009 |
nam | -0.008 |
guys | -0.006 |
smartest | -0.006 |
strongest | -0.006 |
Token | it |
Token ID | 340 |
Feature activation | +4.46e-03 |
Pos logit contributions | |
uts | +0.013 |
anging | +0.012 |
ill | +0.012 |
Matt | +0.012 |
ubs | +0.012 |
Neg logit contributions | |
Deal | -0.025 |
nam | -0.024 |
guys | -0.022 |
nic | -0.020 |
brav | -0.019 |
Token | some |
Token ID | 617 |
Feature activation | +5.07e-03 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
guys | +0.007 |
smartest | +0.006 |
nic | +0.006 |
Neg logit contributions | |
us | -0.006 |
om | -0.006 |
ores | -0.006 |
Matt | -0.006 |
ubs | -0.006 |
Token | milk |
Token ID | 7545 |
Feature activation | -1.39e-04 |
Pos logit contributions | |
Deal | +0.008 |
nam | +0.007 |
guys | +0.006 |
smartest | +0.006 |
simplest | +0.005 |
Neg logit contributions | |
ores | -0.008 |
us | -0.008 |
om | -0.008 |
ill | -0.008 |
ubs | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -2.94e-03 |
Pos logit contributions | |
Matt | +0.000 |
Josh | +0.000 |
Matt | +0.000 |
int | +0.000 |
anging | +0.000 |
Neg logit contributions | |
Deal | -0.000 |
nam | -0.000 |
guys | -0.000 |
fart | -0.000 |
nic | -0.000 |
Token | food |
Token ID | 2057 |
Feature activation | -3.91e-04 |
Pos logit contributions | |
ores | +0.005 |
us | +0.005 |
om | +0.005 |
ill | +0.005 |
ubs | +0.005 |
Neg logit contributions | |
Deal | -0.004 |
nam | -0.004 |
guys | -0.003 |
smartest | -0.003 |
simplest | -0.003 |
Token | The |
Token ID | 464 |
Feature activation | -3.80e-04 |
Pos logit contributions | |
ores | +0.004 |
om | +0.004 |
ays | +0.004 |
ill | +0.004 |
ubs | +0.004 |
Neg logit contributions | |
Deal | -0.003 |
Okay | -0.003 |
nam | -0.003 |
Fine | -0.003 |
Please | -0.003 |
Token | child |
Token ID | 1200 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
ores | +0.001 |
us | +0.001 |
om | +0.001 |
ubs | +0.001 |
ill | +0.001 |
Neg logit contributions | |
Deal | -0.001 |
nam | -0.001 |
guys | -0.001 |
smartest | -0.000 |
strongest | -0.000 |
Token | bent |
Token ID | 17157 |
Feature activation | -2.91e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
nic | +0.006 |
Neg logit contributions | |
ores | -0.011 |
ubs | -0.010 |
us | -0.010 |
irs | -0.009 |
uts | -0.009 |
Token | down |
Token ID | 866 |
Feature activation | -1.76e-03 |
Pos logit contributions | |
ores | +0.006 |
uts | +0.006 |
ubs | +0.006 |
us | +0.006 |
ork | +0.006 |
Neg logit contributions | |
nam | -0.003 |
Deal | -0.003 |
forth | -0.002 |
guys | -0.002 |
heads | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | +2.34e-03 |
Pos logit contributions | |
ubs | +0.003 |
irs | +0.003 |
ores | +0.003 |
orse | +0.003 |
us | +0.002 |
Neg logit contributions | |
Deal | -0.003 |
nam | -0.002 |
OK | -0.002 |
Please | -0.002 |
ha | -0.002 |
Token | grabbed |
Token ID | 13176 |
Feature activation | -1.12e-02 |
Pos logit contributions | |
nam | +0.004 |
Deal | +0.003 |
nic | +0.003 |
chard | +0.002 |
cient | +0.002 |
Neg logit contributions | |
ubs | -0.004 |
ores | -0.004 |
om | -0.004 |
us | -0.004 |
uts | -0.004 |
Token | hold |
Token ID | 1745 |
Feature activation | +3.79e-04 |
Pos logit contributions | |
uts | +0.019 |
us | +0.018 |
ubs | +0.018 |
oing | +0.017 |
ill | +0.017 |
Neg logit contributions | |
nam | -0.019 |
Deal | -0.017 |
guys | -0.014 |
nic | -0.014 |
brav | -0.013 |
Token | of |
Token ID | 286 |
Feature activation | -3.19e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
brav | +0.000 |
nic | +0.000 |
wind | +0.000 |
Neg logit contributions | |
ores | -0.001 |
uts | -0.001 |
oing | -0.001 |
Kat | -0.001 |
Matt | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +9.44e-04 |
Pos logit contributions | |
uts | +0.005 |
us | +0.005 |
oing | +0.005 |
ork | +0.005 |
om | +0.005 |
Neg logit contributions | |
nam | -0.005 |
Deal | -0.005 |
wind | -0.004 |
guys | -0.004 |
matter | -0.003 |
Token | toy |
Token ID | 13373 |
Feature activation | -9.59e-04 |
Pos logit contributions | |
Deal | +0.002 |
nam | +0.002 |
guys | +0.001 |
smartest | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
om | -0.001 |
ubs | -0.001 |
ill | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +4.79e-03 |
Pos logit contributions | |
ores | +0.001 |
ubs | +0.001 |
us | +0.001 |
Matt | +0.001 |
Jud | +0.001 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
guys | -0.002 |
strongest | -0.001 |
smartest | -0.001 |
Token | feels |
Token ID | 5300 |
Feature activation | +1.00e-02 |
Pos logit contributions | |
Deal | +0.004 |
guys | +0.004 |
nam | +0.004 |
nic | +0.003 |
simplest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
ubs | -0.003 |
us | -0.003 |
ork | -0.003 |
anging | -0.003 |
Token | even |
Token ID | 772 |
Feature activation | +4.70e-03 |
Pos logit contributions | |
nam | +0.016 |
Deal | +0.016 |
smartest | +0.013 |
guys | +0.013 |
strongest | +0.013 |
Neg logit contributions | |
om | -0.016 |
ill | -0.015 |
us | -0.015 |
Matt | -0.015 |
ork | -0.015 |
Token | happier |
Token ID | 23030 |
Feature activation | +3.74e-03 |
Pos logit contributions | |
Deal | +0.010 |
nam | +0.009 |
guys | +0.008 |
smartest | +0.007 |
simplest | +0.007 |
Neg logit contributions | |
ores | -0.006 |
us | -0.005 |
om | -0.005 |
ill | -0.005 |
ubs | -0.005 |
Token | and |
Token ID | 290 |
Feature activation | +1.95e-03 |
Pos logit contributions | |
Deal | +0.007 |
nam | +0.006 |
guys | +0.005 |
Please | +0.005 |
smartest | +0.005 |
Neg logit contributions | |
irs | -0.005 |
om | -0.005 |
ork | -0.005 |
ores | -0.005 |
Matt | -0.005 |
Token | p |
Token ID | 279 |
Feature activation | +5.07e-03 |
Pos logit contributions | |
Deal | +0.004 |
nam | +0.004 |
guys | +0.003 |
smartest | +0.003 |
strongest | +0.003 |
Neg logit contributions | |
ores | -0.003 |
om | -0.003 |
us | -0.003 |
ubs | -0.002 |
ill | -0.002 |
Token | rou |
Token ID | 472 |
Feature activation | -3.40e-02 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
cient | +0.007 |
nic | +0.007 |
Sorry | +0.006 |
Neg logit contributions | |
� | -0.008 |
aid | -0.007 |
Josh | -0.006 |
Kat | -0.006 |
Judy | -0.006 |
Token | der |
Token ID | 1082 |
Feature activation | -9.46e-03 |
Pos logit contributions | |
ores | +0.048 |
ill | +0.048 |
Matt | +0.047 |
aid | +0.046 |
ine | +0.046 |
Neg logit contributions | |
Deal | -0.061 |
nam | -0.051 |
guys | -0.049 |
Fine | -0.041 |
smartest | -0.041 |
Token | . |
Token ID | 13 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
Matt | +0.011 |
aid | +0.011 |
ork | +0.011 |
ores | +0.011 |
om | +0.011 |
Neg logit contributions | |
Deal | -0.019 |
nam | -0.017 |
strongest | -0.014 |
smartest | -0.014 |
simplest | -0.013 |
Token | He |
Token ID | 679 |
Feature activation | +5.67e-03 |
Pos logit contributions | |
ge | +0.002 |
anging | +0.002 |
itched | +0.002 |
contact | +0.002 |
ores | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
nam | -0.002 |
Sorry | -0.002 |
Really | -0.002 |
Okay | -0.002 |
Token | displays |
Token ID | 11298 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
Deal | +0.009 |
nam | +0.008 |
guys | +0.007 |
smartest | +0.006 |
simplest | +0.006 |
Neg logit contributions | |
ores | -0.010 |
us | -0.009 |
ubs | -0.009 |
ill | -0.009 |
om | -0.009 |
Token | his |
Token ID | 465 |
Feature activation | -3.12e-03 |
Pos logit contributions | |
nam | +0.002 |
Deal | +0.002 |
guys | +0.002 |
smartest | +0.002 |
brav | +0.002 |
Neg logit contributions | |
us | -0.001 |
ores | -0.001 |
anging | -0.001 |
uts | -0.001 |
ubs | -0.001 |
Token | sailed |
Token ID | 33835 |
Feature activation | +3.33e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.005 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.006 |
uts | -0.005 |
ubs | -0.005 |
ork | -0.005 |
us | -0.005 |
Token | for |
Token ID | 329 |
Feature activation | +8.92e-03 |
Pos logit contributions | |
Deal | +0.006 |
nam | +0.006 |
guys | +0.005 |
smartest | +0.005 |
strongest | +0.005 |
Neg logit contributions | |
ores | -0.005 |
uts | -0.004 |
us | -0.004 |
om | -0.004 |
ubs | -0.004 |
Token | days |
Token ID | 1528 |
Feature activation | -8.58e-04 |
Pos logit contributions | |
Deal | +0.016 |
nam | +0.015 |
guys | +0.013 |
smartest | +0.012 |
strongest | +0.011 |
Neg logit contributions | |
ores | -0.013 |
us | -0.013 |
om | -0.013 |
ill | -0.012 |
ubs | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | -5.18e-04 |
Pos logit contributions | |
ores | +0.001 |
Matt | +0.001 |
ork | +0.001 |
Jud | +0.001 |
ill | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
guys | -0.001 |
strongest | -0.001 |
fastest | -0.001 |
Token | exploring |
Token ID | 13504 |
Feature activation | -2.81e-03 |
Pos logit contributions | |
ores | +0.001 |
ork | +0.001 |
uts | +0.001 |
us | +0.001 |
irs | +0.001 |
Neg logit contributions | |
nam | -0.001 |
Deal | -0.001 |
strongest | -0.001 |
guys | -0.001 |
smartest | -0.001 |
Token | unch |
Token ID | 16258 |
Feature activation | -3.39e-02 |
Pos logit contributions | |
ores | +0.004 |
uts | +0.004 |
om | +0.004 |
us | +0.003 |
ubs | +0.003 |
Neg logit contributions | |
Deal | -0.005 |
nam | -0.005 |
guys | -0.005 |
smartest | -0.004 |
strongest | -0.004 |
Token | arted |
Token ID | 19112 |
Feature activation | -1.16e-03 |
Pos logit contributions | |
us | +0.049 |
ores | +0.049 |
ork | +0.048 |
� | +0.048 |
aid | +0.048 |
Neg logit contributions | |
nam | -0.051 |
Deal | -0.051 |
guys | -0.040 |
Fine | -0.038 |
smartest | -0.037 |
Token | waters |
Token ID | 10150 |
Feature activation | +5.65e-04 |
Pos logit contributions | |
ores | +0.002 |
ill | +0.002 |
us | +0.002 |
uts | +0.002 |
Matt | +0.002 |
Neg logit contributions | |
Deal | -0.002 |
guys | -0.002 |
nam | -0.002 |
smartest | -0.002 |
strongest | -0.001 |
Token | until |
Token ID | 1566 |
Feature activation | -9.27e-03 |
Pos logit contributions | |
nam | +0.001 |
Deal | +0.001 |
guys | +0.001 |
songs | +0.001 |
strongest | +0.001 |
Neg logit contributions | |
ores | -0.001 |
us | -0.001 |
Matt | -0.001 |
Kat | -0.001 |
Jud | -0.001 |
Token | he |
Token ID | 339 |
Feature activation | -3.27e-03 |
Pos logit contributions | |
us | +0.012 |
om | +0.012 |
uts | +0.012 |
udge | +0.012 |
oing | +0.012 |
Neg logit contributions | |
nam | -0.017 |
Deal | -0.016 |
guys | -0.015 |
strongest | -0.014 |
wind | -0.014 |
Token | came |
Token ID | 1625 |
Feature activation | -5.61e-03 |
Pos logit contributions | |
ores | +0.005 |
ubs | +0.005 |
om | +0.005 |
uts | +0.005 |
us | +0.005 |
Neg logit contributions | |
Deal | -0.005 |
guys | -0.004 |
nam | -0.004 |
smartest | -0.004 |
strongest | -0.004 |