Token | was |
Token ID | 373 |
Feature activation | +8.34e-03 |
Pos logit contributions | |
mmm | +0.008 |
mm | +0.008 |
on | +0.007 |
etti | +0.007 |
inations | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
attent | -0.004 |
err | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | amazed |
Token ID | 24562 |
Feature activation | +1.77e-02 |
Pos logit contributions | |
mmm | +0.015 |
mm | +0.015 |
inations | +0.014 |
opter | +0.014 |
etti | +0.013 |
Neg logit contributions | |
ranc | -0.010 |
out | -0.009 |
louder | -0.009 |
err | -0.009 |
attent | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | +7.40e-03 |
Pos logit contributions | |
mmm | +0.035 |
on | +0.035 |
orse | +0.034 |
inations | +0.034 |
mm | +0.033 |
Neg logit contributions | |
ranc | -0.016 |
err | -0.015 |
attent | -0.015 |
iet | -0.014 |
Please | -0.014 |
Token | see |
Token ID | 766 |
Feature activation | -4.49e-03 |
Pos logit contributions | |
etti | +0.012 |
mmm | +0.012 |
mm | +0.012 |
inations | +0.011 |
on | +0.011 |
Neg logit contributions | |
moral | -0.009 |
corner | -0.009 |
out | -0.009 |
ranc | -0.009 |
err | -0.009 |
Token | how |
Token ID | 703 |
Feature activation | -7.95e-03 |
Pos logit contributions | |
out | +0.004 |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
girl | +0.004 |
Neg logit contributions | |
mmm | -0.009 |
orse | -0.009 |
inations | -0.008 |
mm | -0.008 |
etti | -0.008 |
Token | wide |
Token ID | 3094 |
Feature activation | +5.29e-02 |
Pos logit contributions | |
ranc | +0.008 |
attent | +0.008 |
err | +0.008 |
louder | +0.007 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.015 |
mm | -0.015 |
etti | -0.015 |
inations | -0.014 |
on | -0.014 |
Token | it |
Token ID | 340 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
inations | +0.083 |
mmm | +0.081 |
on | +0.078 |
orse | +0.078 |
etti | +0.076 |
Neg logit contributions | |
ranc | -0.071 |
out | -0.065 |
girl | -0.064 |
Please | -0.064 |
for | -0.063 |
Token | was |
Token ID | 373 |
Feature activation | +1.83e-03 |
Pos logit contributions | |
mmm | +0.030 |
on | +0.028 |
orse | +0.028 |
inations | +0.028 |
mm | +0.028 |
Neg logit contributions | |
ranc | -0.020 |
err | -0.019 |
attent | -0.017 |
Please | -0.017 |
iet | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | -3.85e-04 |
Pos logit contributions | |
mmm | +0.004 |
mm | +0.004 |
on | +0.004 |
orse | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.001 |
out | -0.001 |
Please | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | -2.57e-03 |
Pos logit contributions | |
err | +0.001 |
ranc | +0.001 |
attent | +0.000 |
Please | +0.000 |
veterinarian | +0.000 |
Neg logit contributions | |
inations | -0.001 |
mmm | -0.001 |
orse | -0.001 |
on | -0.001 |
etti | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +2.85e-05 |
Pos logit contributions | |
err | +0.002 |
ranc | +0.002 |
attent | +0.002 |
Please | +0.002 |
iet | +0.002 |
Neg logit contributions | |
etti | -0.005 |
mmm | -0.005 |
mm | -0.005 |
inations | -0.005 |
orse | -0.005 |
Token | excitement |
Token ID | 14067 |
Feature activation | +1.74e-03 |
Pos logit contributions | |
her | +0.001 |
attent | +0.001 |
out | +0.001 |
tears | +0.001 |
ranc | +0.001 |
Neg logit contributions | |
orse | -0.002 |
mmm | -0.002 |
inations | -0.002 |
opter | -0.002 |
etti | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +4.78e-03 |
Pos logit contributions | |
mmm | +0.003 |
orse | +0.003 |
on | +0.003 |
inations | +0.003 |
mm | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
attent | -0.002 |
err | -0.001 |
iet | -0.001 |
out | -0.001 |
Token | She |
Token ID | 1375 |
Feature activation | -2.75e-03 |
Pos logit contributions | |
on | +0.009 |
orse | +0.009 |
inations | +0.009 |
mmm | +0.009 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.004 |
Please | -0.004 |
veterinarian | -0.004 |
Token | pictured |
Token ID | 17915 |
Feature activation | +7.59e-03 |
Pos logit contributions | |
ranc | +0.003 |
attent | +0.003 |
Please | +0.003 |
err | +0.003 |
iet | +0.003 |
Neg logit contributions | |
mmm | -0.005 |
mm | -0.005 |
on | -0.004 |
etti | -0.004 |
inations | -0.004 |
Token | how |
Token ID | 703 |
Feature activation | -2.19e-04 |
Pos logit contributions | |
mmm | +0.013 |
on | +0.013 |
orse | +0.012 |
inations | +0.012 |
mm | +0.012 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.008 |
attent | -0.008 |
iet | -0.008 |
Please | -0.008 |
Token | y |
Token ID | 331 |
Feature activation | +5.18e-02 |
Pos logit contributions | |
ranc | +0.000 |
attent | +0.000 |
err | +0.000 |
iet | +0.000 |
andel | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
orse | -0.000 |
inations | -0.000 |
on | -0.000 |
etti | -0.000 |
Token | ummy |
Token ID | 13513 |
Feature activation | -2.58e-03 |
Pos logit contributions | |
inations | +0.087 |
orse | +0.087 |
achieve | +0.078 |
voy | +0.078 |
Matt | +0.077 |
Neg logit contributions | |
andel | -0.065 |
attent | -0.061 |
ocked | -0.057 |
ling | -0.054 |
err | -0.053 |
Token | the |
Token ID | 262 |
Feature activation | +7.23e-03 |
Pos logit contributions | |
ranc | +0.003 |
attent | +0.002 |
out | +0.002 |
girl | +0.002 |
err | +0.002 |
Neg logit contributions | |
orse | -0.005 |
inations | -0.005 |
mmm | -0.005 |
on | -0.004 |
achieve | -0.004 |
Token | cake |
Token ID | 12187 |
Feature activation | +6.39e-03 |
Pos logit contributions | |
on | +0.010 |
mmm | +0.010 |
orse | +0.010 |
inations | +0.010 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.011 |
err | -0.010 |
iet | -0.009 |
attent | -0.009 |
Please | -0.009 |
Token | would |
Token ID | 561 |
Feature activation | +6.50e-03 |
Pos logit contributions | |
orse | +0.012 |
mmm | +0.012 |
inations | +0.011 |
on | +0.011 |
mm | +0.011 |
Neg logit contributions | |
ranc | -0.006 |
attent | -0.006 |
out | -0.006 |
girl | -0.006 |
for | -0.005 |
Token | be |
Token ID | 307 |
Feature activation | +4.58e-04 |
Pos logit contributions | |
on | +0.009 |
orse | +0.009 |
mmm | +0.009 |
inations | +0.009 |
etti | +0.009 |
Neg logit contributions | |
ranc | -0.009 |
attent | -0.008 |
Please | -0.008 |
err | -0.008 |
moral | -0.008 |
Token | egg |
Token ID | 5935 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
Please | +0.004 |
veterinarian | +0.004 |
Neg logit contributions | |
mmm | -0.007 |
inations | -0.006 |
mm | -0.006 |
on | -0.006 |
etti | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | -5.84e-03 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.012 |
attent | +0.011 |
iet | +0.011 |
Please | +0.011 |
Neg logit contributions | |
mmm | -0.020 |
inations | -0.020 |
on | -0.020 |
orse | -0.019 |
mm | -0.019 |
Token | He |
Token ID | 679 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
Please | +0.007 |
attent | +0.007 |
veterinarian | +0.007 |
Neg logit contributions | |
inations | -0.009 |
mmm | -0.009 |
orse | -0.008 |
mm | -0.008 |
on | -0.008 |
Token | watched |
Token ID | 7342 |
Feature activation | +6.99e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.005 |
Please | +0.005 |
iet | +0.005 |
Neg logit contributions | |
mmm | -0.007 |
mm | -0.007 |
inations | -0.007 |
etti | -0.007 |
on | -0.007 |
Token | in |
Token ID | 287 |
Feature activation | -2.21e-03 |
Pos logit contributions | |
mmm | +0.012 |
inations | +0.012 |
on | +0.011 |
orse | +0.011 |
mm | +0.011 |
Neg logit contributions | |
ranc | -0.008 |
attent | -0.008 |
err | -0.008 |
andel | -0.007 |
iet | -0.007 |
Token | amaz |
Token ID | 40642 |
Feature activation | +5.16e-02 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
Please | +0.003 |
iet | +0.003 |
Neg logit contributions | |
mmm | -0.003 |
orse | -0.003 |
on | -0.003 |
inations | -0.003 |
mm | -0.003 |
Token | ement |
Token ID | 972 |
Feature activation | +7.48e-04 |
Pos logit contributions | |
orse | +0.090 |
inations | +0.083 |
achieve | +0.082 |
mmm | +0.079 |
on | +0.078 |
Neg logit contributions | |
attent | -0.058 |
err | -0.056 |
at | -0.053 |
iet | -0.051 |
louder | -0.051 |
Token | as |
Token ID | 355 |
Feature activation | -4.34e-04 |
Pos logit contributions | |
on | +0.001 |
mmm | +0.001 |
inations | +0.001 |
mm | +0.001 |
orse | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
attent | -0.001 |
err | -0.001 |
louder | -0.001 |
out | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -1.97e-03 |
Pos logit contributions | |
out | +0.000 |
attent | +0.000 |
louder | +0.000 |
girl | +0.000 |
err | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
mm | -0.001 |
etti | -0.001 |
inations | -0.001 |
orse | -0.001 |
Token | egg |
Token ID | 5935 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
etti | -0.003 |
Token | began |
Token ID | 2540 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
ranc | +0.003 |
attent | +0.003 |
err | +0.002 |
out | +0.002 |
ther | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
inations | -0.004 |
mm | -0.004 |
on | -0.004 |
orse | -0.004 |
Token | were |
Token ID | 547 |
Feature activation | +2.00e-02 |
Pos logit contributions | |
mmm | +0.004 |
mm | +0.003 |
on | +0.003 |
etti | +0.003 |
inations | +0.003 |
Neg logit contributions | |
ranc | -0.003 |
attent | -0.003 |
err | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | filled |
Token ID | 5901 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
mmm | +0.037 |
mm | +0.036 |
on | +0.034 |
inations | +0.033 |
etti | +0.033 |
Neg logit contributions | |
ranc | -0.025 |
out | -0.021 |
louder | -0.021 |
attent | -0.020 |
veterinarian | -0.020 |
Token | with |
Token ID | 351 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
mmm | +0.033 |
inations | +0.032 |
orse | +0.032 |
mm | +0.031 |
on | +0.031 |
Neg logit contributions | |
ranc | -0.014 |
err | -0.014 |
attent | -0.013 |
iet | -0.012 |
out | -0.011 |
Token | wonder |
Token ID | 4240 |
Feature activation | -4.97e-03 |
Pos logit contributions | |
mmm | +0.005 |
mm | +0.005 |
orse | +0.005 |
on | +0.005 |
etti | +0.005 |
Neg logit contributions | |
ranc | -0.004 |
girl | -0.004 |
attent | -0.004 |
tears | -0.004 |
out | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
ranc | +0.005 |
attent | +0.004 |
err | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.009 |
orse | -0.009 |
mm | -0.009 |
etti | -0.009 |
Token | amaz |
Token ID | 40642 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
mm | +0.005 |
etti | +0.005 |
orse | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
attent | -0.004 |
louder | -0.003 |
out | -0.003 |
girl | -0.003 |
Token | ement |
Token ID | 972 |
Feature activation | +6.26e-03 |
Pos logit contributions | |
orse | +0.077 |
mmm | +0.074 |
on | +0.074 |
inations | +0.073 |
achieve | +0.068 |
Neg logit contributions | |
attent | -0.068 |
err | -0.067 |
ranc | -0.065 |
louder | -0.062 |
Please | -0.061 |
Token | . |
Token ID | 13 |
Feature activation | +3.42e-03 |
Pos logit contributions | |
mmm | +0.012 |
on | +0.012 |
inations | +0.012 |
mm | +0.012 |
orse | +0.011 |
Neg logit contributions | |
ranc | -0.006 |
attent | -0.006 |
err | -0.005 |
iet | -0.005 |
louder | -0.005 |
Token | They |
Token ID | 1119 |
Feature activation | +6.95e-03 |
Pos logit contributions | |
on | +0.006 |
inations | +0.006 |
mmm | +0.006 |
orse | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.004 |
veterinarian | -0.003 |
Please | -0.003 |
Token | thanked |
Token ID | 26280 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
mmm | +0.012 |
mm | +0.012 |
on | +0.011 |
etti | +0.011 |
inations | +0.011 |
Neg logit contributions | |
ranc | -0.009 |
attent | -0.008 |
iet | -0.008 |
err | -0.007 |
Please | -0.007 |
Token | the |
Token ID | 262 |
Feature activation | +3.64e-03 |
Pos logit contributions | |
mmm | +0.026 |
on | +0.026 |
inations | +0.025 |
orse | +0.025 |
mm | +0.024 |
Neg logit contributions | |
ranc | -0.019 |
err | -0.017 |
attent | -0.017 |
iet | -0.016 |
Please | -0.016 |
Token | air |
Token ID | 1633 |
Feature activation | -2.03e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
attent | +0.006 |
veterinarian | +0.006 |
Please | +0.006 |
Neg logit contributions | |
orse | -0.013 |
mmm | -0.013 |
inations | -0.013 |
on | -0.012 |
mm | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | -1.53e-02 |
Pos logit contributions | |
ranc | +0.023 |
err | +0.021 |
iet | +0.019 |
attent | +0.019 |
Please | +0.018 |
Neg logit contributions | |
on | -0.036 |
mmm | -0.036 |
orse | -0.035 |
inations | -0.035 |
Joe | -0.034 |
Token | He |
Token ID | 679 |
Feature activation | -5.81e-03 |
Pos logit contributions | |
ranc | +0.018 |
err | +0.016 |
Please | +0.016 |
attent | +0.015 |
veterinarian | +0.015 |
Neg logit contributions | |
inations | -0.026 |
mmm | -0.025 |
on | -0.025 |
orse | -0.025 |
etti | -0.024 |
Token | watched |
Token ID | 7342 |
Feature activation | +3.47e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.007 |
iet | +0.007 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.009 |
on | -0.009 |
orse | -0.009 |
inations | -0.009 |
mm | -0.008 |
Token | with |
Token ID | 351 |
Feature activation | -7.24e-03 |
Pos logit contributions | |
mmm | +0.006 |
on | +0.006 |
orse | +0.005 |
inations | +0.005 |
mm | +0.005 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | amaz |
Token ID | 40642 |
Feature activation | +5.11e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
out | +0.007 |
attent | +0.007 |
louder | +0.007 |
Neg logit contributions | |
mmm | -0.014 |
mm | -0.013 |
orse | -0.013 |
inations | -0.013 |
etti | -0.013 |
Token | ement |
Token ID | 972 |
Feature activation | -5.85e-04 |
Pos logit contributions | |
orse | +0.084 |
inations | +0.079 |
mmm | +0.078 |
achieve | +0.077 |
on | +0.077 |
Neg logit contributions | |
attent | -0.059 |
err | -0.058 |
louder | -0.055 |
iet | -0.054 |
Please | -0.053 |
Token | as |
Token ID | 355 |
Feature activation | -1.45e-03 |
Pos logit contributions | |
ranc | +0.001 |
attent | +0.000 |
err | +0.000 |
for | +0.000 |
out | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
inations | -0.001 |
orse | -0.001 |
mm | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -2.26e-03 |
Pos logit contributions | |
louder | +0.002 |
out | +0.002 |
attent | +0.002 |
ranc | +0.002 |
someone | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
mm | -0.002 |
orse | -0.002 |
etti | -0.002 |
inations | -0.002 |
Token | z |
Token ID | 1976 |
Feature activation | +5.39e-05 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
on | -0.004 |
orse | -0.004 |
inations | -0.004 |
mm | -0.003 |
Token | ig |
Token ID | 328 |
Feature activation | -7.71e-03 |
Pos logit contributions | |
mmm | +0.000 |
on | +0.000 |
orse | +0.000 |
inations | +0.000 |
Joe | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
andel | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | +5.42e-03 |
Pos logit contributions | |
inations | +0.071 |
mmm | +0.070 |
etti | +0.067 |
mm | +0.064 |
orse | +0.064 |
Neg logit contributions | |
ranc | -0.047 |
out | -0.042 |
Please | -0.041 |
attent | -0.040 |
for | -0.039 |
Token | river |
Token ID | 7850 |
Feature activation | +1.12e-02 |
Pos logit contributions | |
mmm | +0.009 |
on | +0.009 |
orse | +0.009 |
etti | +0.009 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
Please | -0.006 |
moral | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | +1.12e-03 |
Pos logit contributions | |
mmm | +0.022 |
orse | +0.020 |
inations | +0.020 |
mm | +0.020 |
etti | +0.020 |
Neg logit contributions | |
ranc | -0.011 |
attent | -0.010 |
err | -0.010 |
out | -0.010 |
Please | -0.010 |
Token | and |
Token ID | 290 |
Feature activation | +1.34e-03 |
Pos logit contributions | |
mmm | +0.002 |
mm | +0.002 |
orse | +0.002 |
etti | +0.002 |
on | +0.002 |
Neg logit contributions | |
ranc | -0.001 |
attent | -0.001 |
out | -0.001 |
err | -0.001 |
for | -0.001 |
Token | how |
Token ID | 703 |
Feature activation | +2.01e-03 |
Pos logit contributions | |
mm | +0.002 |
etti | +0.002 |
mmm | +0.002 |
inations | +0.002 |
opter | +0.002 |
Neg logit contributions | |
attent | -0.001 |
louder | -0.001 |
for | -0.001 |
one | -0.001 |
out | -0.001 |
Token | wide |
Token ID | 3094 |
Feature activation | +5.04e-02 |
Pos logit contributions | |
mmm | +0.004 |
mm | +0.004 |
etti | +0.003 |
orse | +0.003 |
on | +0.003 |
Neg logit contributions | |
attent | -0.002 |
ranc | -0.002 |
out | -0.002 |
louder | -0.002 |
err | -0.002 |
Token | the |
Token ID | 262 |
Feature activation | +6.76e-03 |
Pos logit contributions | |
inations | +0.083 |
mmm | +0.082 |
on | +0.077 |
orse | +0.077 |
etti | +0.076 |
Neg logit contributions | |
ranc | -0.064 |
out | -0.059 |
Please | -0.057 |
for | -0.056 |
girl | -0.056 |
Token | sky |
Token ID | 6766 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
mmm | +0.012 |
on | +0.012 |
orse | +0.011 |
etti | +0.011 |
mm | +0.011 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
attent | -0.007 |
veterinarian | -0.007 |
moral | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | +1.63e-03 |
Pos logit contributions | |
mmm | +0.021 |
orse | +0.019 |
inations | +0.019 |
mm | +0.019 |
etti | +0.018 |
Neg logit contributions | |
ranc | -0.011 |
attent | -0.010 |
err | -0.010 |
Please | -0.010 |
out | -0.010 |
Token | . |
Token ID | 13 |
Feature activation | +2.88e-03 |
Pos logit contributions | |
mmm | +0.003 |
mm | +0.003 |
orse | +0.003 |
on | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.001 |
attent | -0.001 |
err | -0.001 |
out | -0.001 |
louder | -0.001 |
Token | And |
Token ID | 843 |
Feature activation | +2.20e-02 |
Pos logit contributions | |
inations | +0.005 |
mmm | +0.005 |
etti | +0.005 |
orse | +0.005 |
on | +0.005 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
veterinarian | -0.003 |
moral | -0.003 |
Token | at |
Token ID | 379 |
Feature activation | +1.30e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
Please | +0.007 |
urse | +0.007 |
veterinarian | +0.007 |
Neg logit contributions | |
Joe | -0.016 |
on | -0.015 |
John | -0.015 |
mmm | -0.015 |
inations | -0.015 |
Token | the |
Token ID | 262 |
Feature activation | -1.19e-03 |
Pos logit contributions | |
mmm | +0.025 |
inations | +0.024 |
orse | +0.024 |
on | +0.023 |
etti | +0.023 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.013 |
iet | -0.012 |
attent | -0.012 |
girl | -0.011 |
Token | bright |
Token ID | 6016 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.001 |
iet | +0.001 |
attent | +0.001 |
Please | +0.001 |
Neg logit contributions | |
on | -0.002 |
mmm | -0.002 |
inations | -0.002 |
orse | -0.002 |
Joe | -0.002 |
Token | colours |
Token ID | 18915 |
Feature activation | -7.24e-04 |
Pos logit contributions | |
mmm | +0.016 |
on | +0.015 |
orse | +0.015 |
inations | +0.015 |
mm | +0.015 |
Neg logit contributions | |
ranc | -0.014 |
err | -0.013 |
attent | -0.012 |
iet | -0.012 |
andel | -0.012 |
Token | with |
Token ID | 351 |
Feature activation | +4.47e-03 |
Pos logit contributions | |
out | +0.001 |
attent | +0.001 |
for | +0.001 |
ranc | +0.001 |
at | +0.000 |
Neg logit contributions | |
mmm | -0.002 |
mm | -0.001 |
inations | -0.001 |
orse | -0.001 |
opter | -0.001 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.99e-02 |
Pos logit contributions | |
mmm | +0.008 |
mm | +0.008 |
orse | +0.008 |
inations | +0.008 |
on | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
attent | -0.005 |
louder | -0.005 |
tears | -0.005 |
out | -0.005 |
Token | ement |
Token ID | 972 |
Feature activation | +6.79e-03 |
Pos logit contributions | |
orse | +0.072 |
mmm | +0.071 |
inations | +0.069 |
on | +0.067 |
achieve | +0.064 |
Neg logit contributions | |
err | -0.069 |
ranc | -0.068 |
attent | -0.066 |
iet | -0.064 |
andel | -0.063 |
Token | and |
Token ID | 290 |
Feature activation | +2.87e-03 |
Pos logit contributions | |
mmm | +0.013 |
inations | +0.013 |
on | +0.013 |
orse | +0.012 |
mm | +0.012 |
Neg logit contributions | |
ranc | -0.006 |
attent | -0.006 |
err | -0.006 |
iet | -0.005 |
out | -0.005 |
Token | awe |
Token ID | 25030 |
Feature activation | +1.54e-02 |
Pos logit contributions | |
mmm | +0.005 |
mm | +0.005 |
on | +0.005 |
etti | +0.004 |
inations | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
attent | -0.004 |
louder | -0.003 |
girl | -0.003 |
err | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | +4.04e-03 |
Pos logit contributions | |
mmm | +0.028 |
on | +0.028 |
orse | +0.027 |
inations | +0.027 |
Joe | +0.026 |
Neg logit contributions | |
ranc | -0.017 |
err | -0.015 |
attent | -0.014 |
iet | -0.014 |
Please | -0.014 |
Token | He |
Token ID | 679 |
Feature activation | +7.73e-03 |
Pos logit contributions | |
inations | +0.007 |
mmm | +0.007 |
on | +0.007 |
orse | +0.007 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.004 |
veterinarian | -0.004 |
Please | -0.004 |
Token | wanted |
Token ID | 2227 |
Feature activation | +5.93e-03 |
Pos logit contributions | |
mmm | +0.013 |
on | +0.013 |
mm | +0.013 |
inations | +0.013 |
etti | +0.013 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.008 |
attent | -0.008 |
Please | -0.008 |
veterinarian | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | +5.82e-03 |
Pos logit contributions | |
mmm | +0.013 |
inations | +0.013 |
etti | +0.013 |
orse | +0.013 |
on | +0.013 |
Neg logit contributions | |
ranc | -0.005 |
attent | -0.004 |
veterinarian | -0.003 |
err | -0.003 |
Please | -0.003 |
Token | show |
Token ID | 905 |
Feature activation | +7.60e-03 |
Pos logit contributions | |
mmm | +0.009 |
inations | +0.009 |
etti | +0.009 |
on | +0.009 |
opter | +0.009 |
Neg logit contributions | |
ranc | -0.007 |
veterinarian | -0.007 |
Please | -0.006 |
moral | -0.006 |
date | -0.006 |
Token | them |
Token ID | 606 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
mmm | +0.012 |
on | +0.012 |
orse | +0.012 |
inations | +0.012 |
mm | +0.012 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
attent | -0.008 |
iet | -0.008 |
Please | -0.008 |
Token | how |
Token ID | 703 |
Feature activation | -1.66e-03 |
Pos logit contributions | |
mmm | +0.005 |
orse | +0.005 |
on | +0.005 |
mm | +0.005 |
inations | +0.004 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
iet | -0.002 |
out | -0.002 |
Token | y |
Token ID | 331 |
Feature activation | +4.96e-02 |
Pos logit contributions | |
ranc | +0.002 |
attent | +0.002 |
Please | +0.002 |
err | +0.002 |
err | +0.001 |
Neg logit contributions | |
mmm | -0.003 |
etti | -0.003 |
mm | -0.003 |
on | -0.003 |
inations | -0.003 |
Token | ummy |
Token ID | 13513 |
Feature activation | +4.55e-05 |
Pos logit contributions | |
inations | +0.078 |
orse | +0.072 |
on | +0.070 |
Matt | +0.070 |
Matt | +0.068 |
Neg logit contributions | |
err | -0.063 |
ranc | -0.063 |
ling | -0.063 |
attent | -0.062 |
andel | -0.062 |
Token | the |
Token ID | 262 |
Feature activation | +4.57e-03 |
Pos logit contributions | |
mmm | +0.000 |
inations | +0.000 |
orse | +0.000 |
etti | +0.000 |
on | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
out | -0.000 |
for | -0.000 |
girl | -0.000 |
err | -0.000 |
Token | carrots |
Token ID | 34397 |
Feature activation | +5.99e-03 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.008 |
orse | +0.007 |
inations | +0.007 |
etti | +0.007 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
Please | -0.005 |
Token | were |
Token ID | 547 |
Feature activation | +1.45e-02 |
Pos logit contributions | |
mmm | +0.010 |
inations | +0.009 |
etti | +0.009 |
mm | +0.009 |
orse | +0.009 |
Neg logit contributions | |
ranc | -0.007 |
out | -0.007 |
for | -0.007 |
Please | -0.006 |
ther | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +6.72e-04 |
Pos logit contributions | |
mmm | +0.029 |
etti | +0.028 |
mm | +0.028 |
orse | +0.028 |
on | +0.028 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.011 |
attent | -0.010 |
for | -0.010 |
out | -0.010 |
Token | She |
Token ID | 1375 |
Feature activation | -2.87e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
Joe | +0.001 |
orse | +0.001 |
John | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
iet | -0.001 |
andel | -0.001 |
ther | -0.001 |
Token | explored |
Token ID | 18782 |
Feature activation | +1.20e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
andel | +0.004 |
attent | +0.004 |
tant | +0.003 |
Neg logit contributions | |
orse | -0.004 |
on | -0.004 |
inations | -0.004 |
mmm | -0.004 |
Joe | -0.004 |
Token | everything |
Token ID | 2279 |
Feature activation | +9.55e-03 |
Pos logit contributions | |
Joe | +0.016 |
on | +0.015 |
mmm | +0.014 |
inations | +0.014 |
John | +0.014 |
Neg logit contributions | |
ranc | -0.019 |
err | -0.018 |
Please | -0.017 |
urse | -0.017 |
pharm | -0.016 |
Token | outside |
Token ID | 2354 |
Feature activation | +2.19e-04 |
Pos logit contributions | |
mmm | +0.022 |
orse | +0.022 |
mm | +0.021 |
on | +0.021 |
inations | +0.021 |
Neg logit contributions | |
ranc | -0.005 |
attent | -0.005 |
out | -0.005 |
err | -0.005 |
for | -0.005 |
Token | with |
Token ID | 351 |
Feature activation | -2.94e-03 |
Pos logit contributions | |
mmm | +0.000 |
orse | +0.000 |
on | +0.000 |
inations | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
Please | -0.000 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.94e-02 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
out | +0.001 |
Neg logit contributions | |
mmm | -0.007 |
orse | -0.007 |
mm | -0.007 |
on | -0.007 |
inations | -0.007 |
Token | ement |
Token ID | 972 |
Feature activation | +8.56e-03 |
Pos logit contributions | |
mmm | +0.061 |
on | +0.061 |
orse | +0.060 |
inations | +0.058 |
etti | +0.055 |
Neg logit contributions | |
ranc | -0.081 |
err | -0.077 |
attent | -0.074 |
iet | -0.073 |
Please | -0.071 |
Token | . |
Token ID | 13 |
Feature activation | -1.92e-04 |
Pos logit contributions | |
mmm | +0.015 |
on | +0.015 |
orse | +0.015 |
inations | +0.014 |
Joe | +0.014 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
attent | -0.008 |
Please | -0.008 |
iet | -0.008 |
Token | She |
Token ID | 1375 |
Feature activation | -1.86e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
iet | +0.000 |
attent | +0.000 |
andel | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
on | -0.000 |
Joe | -0.000 |
orse | -0.000 |
inations | -0.000 |
Token | saw |
Token ID | 2497 |
Feature activation | +5.47e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
mm | -0.003 |
inations | -0.003 |
Token | bright |
Token ID | 6016 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
orse | +0.010 |
inations | +0.010 |
etti | +0.010 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
Please | -0.005 |
Token | animals |
Token ID | 4695 |
Feature activation | -1.03e-02 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
girl | +0.001 |
attent | +0.001 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
etti | -0.003 |
inations | -0.003 |
Token | were |
Token ID | 547 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
ranc | +0.011 |
out | +0.010 |
attent | +0.010 |
iet | +0.009 |
at | +0.009 |
Neg logit contributions | |
mmm | -0.020 |
mm | -0.019 |
etti | -0.019 |
on | -0.018 |
orse | -0.017 |
Token | watching |
Token ID | 4964 |
Feature activation | +3.92e-03 |
Pos logit contributions | |
mmm | +0.028 |
mm | +0.027 |
on | +0.026 |
etti | +0.026 |
orse | +0.025 |
Neg logit contributions | |
ranc | -0.018 |
out | -0.015 |
louder | -0.015 |
err | -0.015 |
veterinarian | -0.015 |
Token | him |
Token ID | 683 |
Feature activation | +3.66e-03 |
Pos logit contributions | |
mmm | +0.007 |
on | +0.007 |
orse | +0.007 |
inations | +0.007 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | with |
Token ID | 351 |
Feature activation | -2.01e-03 |
Pos logit contributions | |
mmm | +0.007 |
mm | +0.007 |
on | +0.007 |
etti | +0.007 |
inations | +0.006 |
Neg logit contributions | |
ranc | -0.004 |
out | -0.003 |
attent | -0.003 |
err | -0.003 |
for | -0.003 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.89e-02 |
Pos logit contributions | |
ranc | +0.002 |
out | +0.002 |
attent | +0.002 |
err | +0.002 |
louder | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
mm | -0.004 |
orse | -0.004 |
inations | -0.004 |
etti | -0.004 |
Token | ement |
Token ID | 972 |
Feature activation | +3.55e-04 |
Pos logit contributions | |
orse | +0.071 |
mmm | +0.069 |
inations | +0.067 |
on | +0.067 |
achieve | +0.064 |
Neg logit contributions | |
err | -0.066 |
attent | -0.064 |
ranc | -0.063 |
iet | -0.061 |
Please | -0.059 |
Token | . |
Token ID | 13 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
mm | +0.001 |
inations | +0.001 |
orse | +0.001 |
Neg logit contributions | |
ranc | -0.000 |
attent | -0.000 |
err | -0.000 |
out | -0.000 |
for | -0.000 |
Token | |
Token ID | 220 |
Feature activation | -4.52e-03 |
Pos logit contributions | |
inations | +0.004 |
mmm | +0.004 |
on | +0.004 |
orse | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.002 |
attent | -0.002 |
veterinarian | -0.002 |
Please | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | -3.31e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
ther | +0.004 |
iet | +0.004 |
Neg logit contributions | |
mmm | -0.008 |
inations | -0.008 |
orse | -0.008 |
on | -0.008 |
mm | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | +2.06e-04 |
Pos logit contributions | |
err | +0.003 |
ranc | +0.003 |
Please | +0.002 |
attent | +0.002 |
moral | +0.002 |
Neg logit contributions | |
etti | -0.007 |
mmm | -0.006 |
mm | -0.006 |
inations | -0.006 |
on | -0.006 |
Token | go |
Token ID | 467 |
Feature activation | -6.00e-03 |
Pos logit contributions | |
ranc | +0.029 |
veterinarian | +0.026 |
err | +0.025 |
Please | +0.025 |
attent | +0.025 |
Neg logit contributions | |
mmm | -0.034 |
mm | -0.033 |
on | -0.033 |
inations | -0.032 |
etti | -0.032 |
Token | ! |
Token ID | 0 |
Feature activation | -4.76e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
attent | +0.005 |
iet | +0.005 |
Please | +0.004 |
Neg logit contributions | |
on | -0.012 |
mmm | -0.012 |
orse | -0.011 |
inations | -0.011 |
Joe | -0.011 |
Token | Everyone |
Token ID | 11075 |
Feature activation | -7.45e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
Please | +0.005 |
veterinarian | +0.005 |
attent | +0.005 |
Neg logit contributions | |
inations | -0.007 |
mmm | -0.007 |
on | -0.007 |
orse | -0.007 |
etti | -0.007 |
Token | watched |
Token ID | 7342 |
Feature activation | +2.46e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.008 |
attent | +0.008 |
Please | +0.007 |
iet | +0.007 |
Neg logit contributions | |
mmm | -0.014 |
mm | -0.013 |
etti | -0.013 |
orse | -0.012 |
on | -0.012 |
Token | in |
Token ID | 287 |
Feature activation | -1.44e-03 |
Pos logit contributions | |
mmm | +0.004 |
on | +0.004 |
orse | +0.004 |
inations | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.003 |
attent | -0.002 |
err | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.89e-02 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
orse | -0.002 |
on | -0.002 |
inations | -0.002 |
mm | -0.002 |
Token | ement |
Token ID | 972 |
Feature activation | -1.31e-03 |
Pos logit contributions | |
orse | +0.074 |
on | +0.070 |
mmm | +0.069 |
inations | +0.068 |
achieve | +0.065 |
Neg logit contributions | |
err | -0.064 |
attent | -0.064 |
iet | -0.060 |
ranc | -0.060 |
louder | -0.057 |
Token | as |
Token ID | 355 |
Feature activation | -2.59e-03 |
Pos logit contributions | |
ranc | +0.001 |
attent | +0.001 |
err | +0.001 |
louder | +0.001 |
for | +0.001 |
Neg logit contributions | |
on | -0.003 |
mmm | -0.003 |
orse | -0.002 |
mm | -0.002 |
inations | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | +5.87e-03 |
Pos logit contributions | |
attent | +0.003 |
louder | +0.003 |
ranc | +0.003 |
girl | +0.003 |
err | +0.003 |
Neg logit contributions | |
mmm | -0.005 |
mm | -0.004 |
orse | -0.004 |
on | -0.004 |
etti | -0.004 |
Token | took |
Token ID | 1718 |
Feature activation | -2.88e-03 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.009 |
orse | +0.009 |
inations | +0.009 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
attent | -0.007 |
iet | -0.006 |
Please | -0.006 |
Token | off |
Token ID | 572 |
Feature activation | -6.52e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
out | +0.002 |
attent | +0.002 |
iet | +0.002 |
Neg logit contributions | |
orse | -0.006 |
mmm | -0.006 |
on | -0.005 |
inations | -0.005 |
mm | -0.005 |
Token | hand |
Token ID | 1021 |
Feature activation | +1.03e-03 |
Pos logit contributions | |
ranc | +0.005 |
attent | +0.005 |
andel | +0.004 |
out | +0.004 |
corner | +0.004 |
Neg logit contributions | |
mmm | -0.009 |
mm | -0.009 |
on | -0.009 |
inations | -0.008 |
etti | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | +4.43e-03 |
Pos logit contributions | |
mmm | +0.002 |
inations | +0.002 |
orse | +0.002 |
on | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.001 |
attent | -0.001 |
err | -0.001 |
Please | -0.001 |
veterinarian | -0.001 |
Token | but |
Token ID | 475 |
Feature activation | +4.66e-03 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.007 |
orse | +0.007 |
inations | +0.007 |
mm | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.005 |
Please | -0.005 |
iet | -0.004 |
Token | also |
Token ID | 635 |
Feature activation | -3.73e-04 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.008 |
orse | +0.008 |
inations | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.005 |
Please | -0.005 |
iet | -0.005 |
Token | how |
Token ID | 703 |
Feature activation | -7.55e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
attent | +0.000 |
iet | +0.000 |
Please | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
inations | -0.001 |
etti | -0.001 |
Token | sturdy |
Token ID | 28055 |
Feature activation | +4.88e-02 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.010 |
attent | +0.009 |
iet | +0.009 |
Please | +0.009 |
Neg logit contributions | |
mmm | -0.012 |
on | -0.012 |
orse | -0.011 |
inations | -0.011 |
mm | -0.011 |
Token | and |
Token ID | 290 |
Feature activation | -6.42e-04 |
Pos logit contributions | |
mmm | +0.082 |
orse | +0.082 |
inations | +0.081 |
on | +0.081 |
etti | +0.078 |
Neg logit contributions | |
ranc | -0.057 |
err | -0.052 |
Please | -0.050 |
attent | -0.050 |
iet | -0.048 |
Token | strong |
Token ID | 1913 |
Feature activation | +3.09e-02 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
Please | +0.001 |
louder | +0.001 |
Neg logit contributions | |
orse | -0.001 |
mmm | -0.001 |
on | -0.001 |
etti | -0.001 |
inations | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.13e-03 |
Pos logit contributions | |
mmm | +0.053 |
on | +0.052 |
orse | +0.052 |
inations | +0.051 |
etti | +0.049 |
Neg logit contributions | |
ranc | -0.037 |
err | -0.033 |
attent | -0.032 |
Please | -0.031 |
iet | -0.031 |
Token | She |
Token ID | 1375 |
Feature activation | -6.49e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
attent | +0.001 |
andel | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
on | -0.002 |
Joe | -0.002 |
orse | -0.002 |
mm | -0.002 |
Token | wanted |
Token ID | 2227 |
Feature activation | -1.06e-03 |
Pos logit contributions | |
attent | +0.006 |
ranc | +0.006 |
err | +0.005 |
moral | +0.005 |
iet | +0.005 |
Neg logit contributions | |
mmm | -0.013 |
etti | -0.013 |
mm | -0.013 |
on | -0.012 |
opter | -0.012 |
Token | magical |
Token ID | 10883 |
Feature activation | +6.66e-03 |
Pos logit contributions | |
mmm | +0.022 |
on | +0.021 |
inations | +0.021 |
mm | +0.021 |
orse | +0.021 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.011 |
attent | -0.010 |
Please | -0.010 |
iet | -0.010 |
Token | noise |
Token ID | 7838 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
inations | +0.010 |
orse | +0.010 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.009 |
attent | -0.008 |
iet | -0.008 |
Please | -0.008 |
Token | ! |
Token ID | 0 |
Feature activation | -6.45e-03 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.015 |
attent | +0.014 |
iet | +0.014 |
Please | +0.013 |
Neg logit contributions | |
on | -0.019 |
mmm | -0.019 |
orse | -0.018 |
inations | -0.018 |
Joe | -0.018 |
Token | To |
Token ID | 1675 |
Feature activation | +1.38e-02 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.008 |
attent | +0.007 |
Please | +0.007 |
ther | +0.007 |
Neg logit contributions | |
inations | -0.011 |
mmm | -0.010 |
orse | -0.010 |
mm | -0.010 |
etti | -0.010 |
Token | his |
Token ID | 465 |
Feature activation | +7.46e-03 |
Pos logit contributions | |
inations | +0.026 |
mmm | +0.026 |
orse | +0.024 |
mm | +0.024 |
on | +0.024 |
Neg logit contributions | |
ranc | -0.013 |
attent | -0.012 |
out | -0.012 |
err | -0.012 |
iet | -0.012 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.86e-02 |
Pos logit contributions | |
mmm | +0.013 |
inations | +0.012 |
on | +0.012 |
mm | +0.012 |
orse | +0.012 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.009 |
iet | -0.009 |
attent | -0.008 |
veterinarian | -0.008 |
Token | ement |
Token ID | 972 |
Feature activation | +4.57e-03 |
Pos logit contributions | |
orse | +0.070 |
inations | +0.070 |
mmm | +0.069 |
on | +0.067 |
achieve | +0.064 |
Neg logit contributions | |
ranc | -0.066 |
err | -0.066 |
iet | -0.063 |
attent | -0.062 |
Please | -0.059 |
Token | he |
Token ID | 339 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
mmm | +0.006 |
inations | +0.006 |
on | +0.006 |
mm | +0.006 |
achieve | +0.006 |
Neg logit contributions | |
ranc | -0.007 |
attent | -0.006 |
err | -0.006 |
iet | -0.006 |
out | -0.006 |
Token | had |
Token ID | 550 |
Feature activation | -4.88e-03 |
Pos logit contributions | |
mmm | +0.025 |
mm | +0.024 |
on | +0.024 |
inations | +0.024 |
etti | +0.024 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
iet | -0.009 |
Please | -0.009 |
attent | -0.008 |
Token | revealed |
Token ID | 4602 |
Feature activation | +1.99e-02 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.008 |
on | -0.008 |
mm | -0.008 |
orse | -0.008 |
inations | -0.007 |
Token | a |
Token ID | 257 |
Feature activation | -5.20e-03 |
Pos logit contributions | |
inations | +0.039 |
mmm | +0.039 |
mm | +0.038 |
orse | +0.037 |
etti | +0.036 |
Neg logit contributions | |
ranc | -0.019 |
out | -0.019 |
err | -0.017 |
attent | -0.017 |
louder | -0.016 |
Token | she |
Token ID | 673 |
Feature activation | -3.43e-03 |
Pos logit contributions | |
on | +0.005 |
John | +0.005 |
Joe | +0.004 |
Jack | +0.004 |
mmm | +0.004 |
Neg logit contributions | |
err | -0.007 |
ranc | -0.007 |
andel | -0.007 |
iet | -0.007 |
arl | -0.006 |
Token | wanted |
Token ID | 2227 |
Feature activation | +4.52e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
andel | +0.004 |
iet | +0.004 |
Neg logit contributions | |
on | -0.005 |
orse | -0.005 |
mmm | -0.005 |
inations | -0.005 |
Joe | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | +4.59e-03 |
Pos logit contributions | |
mmm | +0.009 |
orse | +0.009 |
inations | +0.009 |
on | +0.009 |
etti | +0.009 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
Please | -0.003 |
veterinarian | -0.003 |
Token | remember |
Token ID | 3505 |
Feature activation | +5.02e-03 |
Pos logit contributions | |
inations | +0.008 |
opter | +0.008 |
orse | +0.008 |
etti | +0.008 |
Mike | +0.008 |
Neg logit contributions | |
veterinarian | -0.004 |
Please | -0.004 |
date | -0.004 |
moral | -0.004 |
out | -0.004 |
Token | how |
Token ID | 703 |
Feature activation | -7.45e-03 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.008 |
orse | +0.008 |
inations | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.006 |
attent | -0.005 |
iet | -0.005 |
Please | -0.005 |
Token | y |
Token ID | 331 |
Feature activation | +4.81e-02 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
attent | +0.009 |
Please | +0.009 |
iet | +0.008 |
Neg logit contributions | |
mmm | -0.012 |
on | -0.011 |
orse | -0.011 |
inations | -0.011 |
etti | -0.011 |
Token | ummy |
Token ID | 13513 |
Feature activation | -3.70e-03 |
Pos logit contributions | |
inations | +0.072 |
orse | +0.069 |
achieve | +0.063 |
Matt | +0.062 |
Matt | +0.062 |
Neg logit contributions | |
err | -0.065 |
andel | -0.064 |
attent | -0.062 |
Please | -0.061 |
ocked | -0.060 |
Token | it |
Token ID | 340 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
ranc | +0.004 |
girl | +0.003 |
err | +0.003 |
Please | +0.003 |
attent | +0.003 |
Neg logit contributions | |
orse | -0.007 |
inations | -0.007 |
mmm | -0.006 |
etti | -0.006 |
on | -0.006 |
Token | was |
Token ID | 373 |
Feature activation | -3.21e-03 |
Pos logit contributions | |
mmm | +0.025 |
on | +0.025 |
orse | +0.024 |
inations | +0.024 |
mm | +0.023 |
Neg logit contributions | |
ranc | -0.024 |
err | -0.022 |
attent | -0.021 |
iet | -0.020 |
Please | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | -1.82e-04 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.006 |
inations | -0.006 |
etti | -0.006 |
Token | So |
Token ID | 1406 |
Feature activation | -2.37e-03 |
Pos logit contributions | |
ranc | +0.000 |
iet | +0.000 |
err | +0.000 |
andel | +0.000 |
eh | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
Joe | -0.000 |
on | -0.000 |
John | -0.000 |
mm | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.011 |
orse | -0.011 |
on | -0.011 |
inations | -0.011 |
mm | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | -3.40e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
Please | +0.006 |
attent | +0.006 |
veterinarian | +0.006 |
Neg logit contributions | |
inations | -0.010 |
mmm | -0.010 |
on | -0.010 |
orse | -0.010 |
etti | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +1.55e-04 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
iet | +0.003 |
Please | +0.003 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.006 |
inations | -0.006 |
etti | -0.005 |
Token | To |
Token ID | 2514 |
Feature activation | +1.62e-02 |
Pos logit contributions | |
mmm | +0.000 |
on | +0.000 |
orse | +0.000 |
inations | +0.000 |
etti | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
Please | -0.000 |
Token | her |
Token ID | 607 |
Feature activation | -6.09e-03 |
Pos logit contributions | |
mmm | +0.026 |
orse | +0.026 |
on | +0.026 |
inations | +0.026 |
mm | +0.025 |
Neg logit contributions | |
ranc | -0.020 |
err | -0.019 |
attent | -0.018 |
iet | -0.018 |
Please | -0.017 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.78e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
attent | +0.007 |
veterinarian | +0.007 |
moral | +0.007 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
mm | -0.010 |
orse | -0.010 |
inations | -0.010 |
Token | ement |
Token ID | 972 |
Feature activation | -5.86e-04 |
Pos logit contributions | |
mmm | +0.062 |
orse | +0.061 |
on | +0.060 |
inations | +0.059 |
Joe | +0.056 |
Neg logit contributions | |
ranc | -0.074 |
err | -0.072 |
attent | -0.069 |
iet | -0.068 |
Please | -0.066 |
Token | , |
Token ID | 11 |
Feature activation | -1.27e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
andel | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
inations | -0.001 |
orse | -0.001 |
mm | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -2.05e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
on | -0.002 |
orse | -0.002 |
Joe | -0.002 |
inations | -0.002 |
Token | clothes |
Token ID | 8242 |
Feature activation | +1.30e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
on | -0.004 |
mmm | -0.004 |
orse | -0.003 |
inations | -0.003 |
Joe | -0.003 |
Token | came |
Token ID | 1625 |
Feature activation | -7.19e-03 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.002 |
orse | +0.002 |
inations | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -1.17e-03 |
Pos logit contributions | |
mmm | +0.014 |
on | +0.014 |
mm | +0.013 |
inations | +0.013 |
orse | +0.013 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
out | -0.004 |
for | -0.003 |
Token | He |
Token ID | 679 |
Feature activation | +3.41e-04 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.001 |
attent | +0.001 |
Please | +0.001 |
veterinarian | +0.001 |
Neg logit contributions | |
on | -0.002 |
mmm | -0.002 |
inations | -0.002 |
orse | -0.002 |
mm | -0.002 |
Token | watched |
Token ID | 7342 |
Feature activation | +7.91e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
inations | +0.001 |
orse | +0.001 |
mm | +0.001 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
Please | -0.000 |
Token | them |
Token ID | 606 |
Feature activation | +2.35e-04 |
Pos logit contributions | |
on | +0.013 |
mmm | +0.013 |
orse | +0.013 |
Joe | +0.012 |
inations | +0.012 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
iet | -0.009 |
attent | -0.008 |
Please | -0.008 |
Token | in |
Token ID | 287 |
Feature activation | -1.74e-03 |
Pos logit contributions | |
mmm | +0.000 |
mm | +0.000 |
on | +0.000 |
inations | +0.000 |
orse | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
attent | -0.000 |
err | -0.000 |
out | -0.000 |
louder | -0.000 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.78e-02 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.002 |
mm | -0.002 |
Token | ement |
Token ID | 972 |
Feature activation | +4.32e-03 |
Pos logit contributions | |
orse | +0.072 |
mmm | +0.069 |
on | +0.068 |
inations | +0.068 |
achieve | +0.065 |
Neg logit contributions | |
err | -0.063 |
attent | -0.062 |
iet | -0.061 |
ranc | -0.061 |
Please | -0.057 |
Token | and |
Token ID | 290 |
Feature activation | +2.63e-03 |
Pos logit contributions | |
on | +0.009 |
mmm | +0.009 |
inations | +0.008 |
mm | +0.008 |
orse | +0.008 |
Neg logit contributions | |
ranc | -0.004 |
attent | -0.003 |
err | -0.003 |
iet | -0.003 |
louder | -0.003 |
Token | even |
Token ID | 772 |
Feature activation | +9.06e-04 |
Pos logit contributions | |
mmm | +0.004 |
on | +0.004 |
mm | +0.004 |
inations | +0.004 |
etti | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
attent | -0.003 |
louder | -0.003 |
Please | -0.003 |
err | -0.003 |
Token | laughed |
Token ID | 13818 |
Feature activation | -3.35e-04 |
Pos logit contributions | |
on | +0.001 |
orse | +0.001 |
inations | +0.001 |
mmm | +0.001 |
Joe | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
andel | -0.001 |
veterinarian | -0.001 |
attent | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
iet | +0.000 |
andel | +0.000 |
Please | +0.000 |
Neg logit contributions | |
on | -0.001 |
mmm | -0.001 |
Joe | -0.001 |
orse | -0.001 |
etti | -0.001 |
Token | seen |
Token ID | 1775 |
Feature activation | +6.21e-03 |
Pos logit contributions | |
mmm | +0.004 |
on | +0.004 |
mm | +0.003 |
orse | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.003 |
Please | -0.003 |
iet | -0.003 |
Token | ! |
Token ID | 0 |
Feature activation | +2.70e-04 |
Pos logit contributions | |
on | +0.011 |
mmm | +0.011 |
orse | +0.011 |
inations | +0.010 |
Joe | +0.010 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
iet | -0.006 |
Please | -0.006 |
Token | She |
Token ID | 1375 |
Feature activation | -3.10e-03 |
Pos logit contributions | |
inations | +0.000 |
mmm | +0.000 |
orse | +0.000 |
on | +0.000 |
etti | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
veterinarian | -0.000 |
Please | -0.000 |
Token | gasped |
Token ID | 45236 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
attent | +0.002 |
moral | +0.002 |
ranc | +0.002 |
girl | +0.002 |
err | +0.002 |
Neg logit contributions | |
mmm | -0.007 |
mm | -0.006 |
etti | -0.006 |
ourselves | -0.006 |
pleasure | -0.006 |
Token | in |
Token ID | 287 |
Feature activation | +1.10e-02 |
Pos logit contributions | |
mmm | +0.021 |
on | +0.021 |
orse | +0.020 |
inations | +0.020 |
etti | +0.019 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.011 |
attent | -0.010 |
iet | -0.010 |
Please | -0.010 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.77e-02 |
Pos logit contributions | |
mmm | +0.013 |
orse | +0.013 |
inations | +0.013 |
on | +0.013 |
mm | +0.012 |
Neg logit contributions | |
ranc | -0.019 |
err | -0.018 |
attent | -0.017 |
Please | -0.017 |
iet | -0.017 |
Token | ement |
Token ID | 972 |
Feature activation | +3.26e-03 |
Pos logit contributions | |
orse | +0.061 |
mmm | +0.061 |
on | +0.060 |
inations | +0.059 |
etti | +0.055 |
Neg logit contributions | |
ranc | -0.074 |
err | -0.072 |
attent | -0.070 |
iet | -0.068 |
Please | -0.066 |
Token | , |
Token ID | 11 |
Feature activation | +2.96e-03 |
Pos logit contributions | |
mmm | +0.006 |
on | +0.006 |
orse | +0.006 |
inations | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | -8.05e-03 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
orse | +0.005 |
inations | +0.005 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | her |
Token ID | 607 |
Feature activation | -8.76e-03 |
Pos logit contributions | |
ranc | +0.010 |
attent | +0.010 |
err | +0.009 |
Please | +0.009 |
girl | +0.009 |
Neg logit contributions | |
mmm | -0.013 |
inations | -0.013 |
on | -0.013 |
orse | -0.012 |
mm | -0.012 |
Token | tears |
Token ID | 10953 |
Feature activation | -1.42e-02 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.010 |
attent | +0.010 |
moral | +0.009 |
girl | +0.009 |
Neg logit contributions | |
mmm | -0.016 |
on | -0.014 |
orse | -0.014 |
inations | -0.014 |
mm | -0.014 |
Token | awe |
Token ID | 25030 |
Feature activation | +1.21e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
iet | +0.007 |
attent | +0.007 |
Please | +0.006 |
Neg logit contributions | |
on | -0.006 |
mmm | -0.006 |
Joe | -0.006 |
orse | -0.006 |
inations | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +3.24e-03 |
Pos logit contributions | |
mmm | +0.021 |
on | +0.021 |
orse | +0.021 |
inations | +0.021 |
Joe | +0.020 |
Neg logit contributions | |
ranc | -0.014 |
err | -0.013 |
attent | -0.011 |
iet | -0.011 |
Please | -0.011 |
Token | She |
Token ID | 1375 |
Feature activation | -1.12e-03 |
Pos logit contributions | |
inations | +0.006 |
on | +0.006 |
orse | +0.006 |
mmm | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
Please | -0.003 |
veterinarian | -0.003 |
Token | noticed |
Token ID | 6810 |
Feature activation | +8.86e-03 |
Pos logit contributions | |
ranc | +0.001 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
err | +0.001 |
Neg logit contributions | |
mm | -0.002 |
mmm | -0.002 |
etti | -0.002 |
on | -0.002 |
ourselves | -0.002 |
Token | how |
Token ID | 703 |
Feature activation | -7.66e-03 |
Pos logit contributions | |
mmm | +0.017 |
inations | +0.016 |
orse | +0.016 |
mm | +0.016 |
etti | +0.016 |
Neg logit contributions | |
ranc | -0.009 |
attent | -0.008 |
err | -0.008 |
out | -0.008 |
louder | -0.008 |
Token | colorful |
Token ID | 20239 |
Feature activation | +4.76e-02 |
Pos logit contributions | |
ranc | +0.009 |
attent | +0.008 |
err | +0.008 |
iet | +0.008 |
Please | +0.008 |
Neg logit contributions | |
mmm | -0.014 |
mm | -0.013 |
etti | -0.013 |
orse | -0.013 |
on | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | +1.35e-02 |
Pos logit contributions | |
inations | +0.083 |
orse | +0.081 |
mmm | +0.080 |
etti | +0.075 |
on | +0.074 |
Neg logit contributions | |
out | -0.054 |
ranc | -0.051 |
attent | -0.049 |
for | -0.049 |
girl | -0.048 |
Token | was |
Token ID | 373 |
Feature activation | -3.43e-04 |
Pos logit contributions | |
mmm | +0.022 |
on | +0.021 |
orse | +0.021 |
inations | +0.021 |
mm | +0.021 |
Neg logit contributions | |
ranc | -0.017 |
err | -0.016 |
attent | -0.015 |
iet | -0.015 |
Please | -0.015 |
Token | and |
Token ID | 290 |
Feature activation | +1.58e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
attent | +0.000 |
iet | +0.000 |
Please | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
mm | -0.001 |
inations | -0.001 |
Token | how |
Token ID | 703 |
Feature activation | -1.99e-04 |
Pos logit contributions | |
mmm | +0.003 |
mm | +0.003 |
on | +0.003 |
inations | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
attent | -0.002 |
louder | -0.002 |
err | -0.002 |
Please | -0.002 |
Token | tall |
Token ID | 7331 |
Feature activation | +4.70e-02 |
Pos logit contributions | |
ranc | +0.000 |
attent | +0.000 |
err | +0.000 |
iet | +0.000 |
girl | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
mm | -0.000 |
on | -0.000 |
orse | -0.000 |
etti | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +9.05e-03 |
Pos logit contributions | |
mmm | +0.006 |
on | +0.006 |
inations | +0.006 |
mm | +0.006 |
etti | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
veterinarian | -0.003 |
iet | -0.003 |
Token | He |
Token ID | 679 |
Feature activation | +8.63e-03 |
Pos logit contributions | |
inations | +0.018 |
mmm | +0.016 |
orse | +0.016 |
on | +0.016 |
etti | +0.016 |
Neg logit contributions | |
err | -0.009 |
ranc | -0.009 |
attent | -0.008 |
Please | -0.008 |
veterinarian | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
mmm | +0.015 |
on | +0.014 |
mm | +0.014 |
etti | +0.014 |
inations | +0.014 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
attent | -0.009 |
Please | -0.009 |
moral | -0.009 |
Token | filled |
Token ID | 5901 |
Feature activation | +1.34e-02 |
Pos logit contributions | |
mmm | +0.019 |
mm | +0.019 |
inations | +0.018 |
on | +0.018 |
etti | +0.018 |
Neg logit contributions | |
ranc | -0.015 |
err | -0.014 |
out | -0.014 |
louder | -0.014 |
attent | -0.013 |
Token | with |
Token ID | 351 |
Feature activation | +1.91e-03 |
Pos logit contributions | |
mmm | +0.028 |
inations | +0.027 |
mm | +0.027 |
orse | +0.027 |
on | +0.026 |
Neg logit contributions | |
err | -0.010 |
ranc | -0.010 |
attent | -0.010 |
Please | -0.009 |
out | -0.009 |
Token | amaz |
Token ID | 40642 |
Feature activation | +4.75e-02 |
Pos logit contributions | |
mmm | +0.003 |
etti | +0.003 |
mm | +0.003 |
orse | +0.003 |
inations | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
out | -0.002 |
girl | -0.002 |
louder | -0.002 |
tears | -0.002 |
Token | ement |
Token ID | 972 |
Feature activation | +3.19e-03 |
Pos logit contributions | |
orse | +0.071 |
mmm | +0.068 |
inations | +0.068 |
on | +0.066 |
etti | +0.063 |
Neg logit contributions | |
attent | -0.062 |
err | -0.061 |
ranc | -0.060 |
Please | -0.057 |
iet | -0.057 |
Token | and |
Token ID | 290 |
Feature activation | +4.56e-03 |
Pos logit contributions | |
mmm | +0.006 |
on | +0.006 |
inations | +0.006 |
mm | +0.006 |
orse | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
attent | -0.002 |
err | -0.002 |
louder | -0.002 |
iet | -0.002 |
Token | surprise |
Token ID | 5975 |
Feature activation | +7.61e-03 |
Pos logit contributions | |
mmm | +0.008 |
mm | +0.008 |
etti | +0.008 |
on | +0.007 |
inations | +0.007 |
Neg logit contributions | |
louder | -0.005 |
ranc | -0.005 |
girl | -0.005 |
attent | -0.005 |
out | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +5.54e-03 |
Pos logit contributions | |
mmm | +0.014 |
inations | +0.014 |
orse | +0.013 |
on | +0.013 |
mm | +0.013 |
Neg logit contributions | |
ranc | -0.008 |
attent | -0.007 |
err | -0.007 |
louder | -0.007 |
out | -0.007 |
Token | He |
Token ID | 679 |
Feature activation | +6.40e-03 |
Pos logit contributions | |
inations | +0.011 |
mmm | +0.010 |
etti | +0.010 |
orse | +0.010 |
on | +0.010 |
Neg logit contributions | |
err | -0.005 |
ranc | -0.005 |
attent | -0.005 |
Please | -0.004 |
Terr | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | +3.08e-03 |
Pos logit contributions | |
mmm | +0.006 |
inations | +0.006 |
orse | +0.006 |
achieve | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.002 |
out | -0.002 |
attent | -0.002 |
for | -0.002 |
err | -0.001 |
Token | They |
Token ID | 1119 |
Feature activation | +4.57e-03 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.004 |
Joe | +0.004 |
orse | +0.004 |
etti | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
iet | -0.004 |
andel | -0.004 |
Please | -0.004 |
Token | talked |
Token ID | 6619 |
Feature activation | -7.86e-03 |
Pos logit contributions | |
mmm | +0.008 |
mm | +0.007 |
inations | +0.007 |
etti | +0.007 |
on | +0.007 |
Neg logit contributions | |
ranc | -0.006 |
attent | -0.005 |
Please | -0.005 |
iet | -0.005 |
girl | -0.005 |
Token | about |
Token ID | 546 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.007 |
iet | +0.006 |
Please | +0.006 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.015 |
orse | -0.015 |
inations | -0.014 |
mm | -0.014 |
Token | how |
Token ID | 703 |
Feature activation | -2.18e-03 |
Pos logit contributions | |
inations | +0.022 |
mmm | +0.022 |
orse | +0.022 |
etti | +0.021 |
on | +0.021 |
Neg logit contributions | |
ranc | -0.013 |
attent | -0.010 |
err | -0.010 |
veterinarian | -0.010 |
for | -0.010 |
Token | y |
Token ID | 331 |
Feature activation | +4.74e-02 |
Pos logit contributions | |
ranc | +0.003 |
attent | +0.002 |
Please | +0.002 |
err | +0.002 |
girl | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
etti | -0.004 |
inations | -0.004 |
on | -0.004 |
orse | -0.003 |
Token | ummy |
Token ID | 13513 |
Feature activation | -4.00e-03 |
Pos logit contributions | |
inations | +0.087 |
orse | +0.080 |
achieve | +0.079 |
believe | +0.078 |
Matt | +0.076 |
Neg logit contributions | |
ocked | -0.050 |
ling | -0.049 |
andel | -0.049 |
at | -0.049 |
attent | -0.047 |
Token | the |
Token ID | 262 |
Feature activation | +6.49e-03 |
Pos logit contributions | |
ranc | +0.004 |
girl | +0.004 |
for | +0.003 |
Please | +0.003 |
at | +0.003 |
Neg logit contributions | |
inations | -0.008 |
orse | -0.007 |
etti | -0.007 |
achieve | -0.007 |
mmm | -0.007 |
Token | ice |
Token ID | 4771 |
Feature activation | -1.95e-02 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
orse | +0.009 |
inations | +0.009 |
etti | +0.009 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.009 |
attent | -0.008 |
Please | -0.008 |
iet | -0.008 |
Token | cream |
Token ID | 8566 |
Feature activation | -2.30e-03 |
Pos logit contributions | |
ranc | +0.023 |
err | +0.022 |
girl | +0.021 |
ther | +0.020 |
for | +0.020 |
Neg logit contributions | |
inations | -0.032 |
mmm | -0.032 |
etti | -0.031 |
orse | -0.031 |
on | -0.030 |
Token | was |
Token ID | 373 |
Feature activation | +1.01e-03 |
Pos logit contributions | |
ranc | +0.003 |
Please | +0.002 |
girl | +0.002 |
attent | +0.002 |
err | +0.002 |
Neg logit contributions | |
inations | -0.004 |
mmm | -0.004 |
orse | -0.004 |
etti | -0.004 |
achieve | -0.004 |
Token | accidentally |
Token ID | 14716 |
Feature activation | +1.30e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
attent | +0.009 |
iet | +0.009 |
andel | +0.009 |
Neg logit contributions | |
on | -0.011 |
mmm | -0.011 |
orse | -0.010 |
inations | -0.010 |
Joe | -0.010 |
Token | used |
Token ID | 973 |
Feature activation | -1.51e-03 |
Pos logit contributions | |
on | +0.002 |
mmm | +0.002 |
orse | +0.002 |
inations | +0.002 |
Joe | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.001 |
iet | -0.001 |
andel | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
mm | -0.002 |
Token | sour |
Token ID | 11348 |
Feature activation | -1.64e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
attent | +0.006 |
iet | +0.006 |
Please | +0.006 |
Neg logit contributions | |
on | -0.007 |
mmm | -0.007 |
orse | -0.007 |
inations | -0.007 |
mm | -0.006 |
Token | - |
Token ID | 12 |
Feature activation | -4.79e-02 |
Pos logit contributions | |
ranc | +0.026 |
err | +0.024 |
iet | +0.023 |
attent | +0.022 |
Please | +0.022 |
Neg logit contributions | |
on | -0.023 |
mmm | -0.023 |
orse | -0.021 |
mm | -0.021 |
Joe | -0.020 |
Token | fl |
Token ID | 2704 |
Feature activation | -7.09e-02 |
Pos logit contributions | |
ranc | +0.068 |
err | +0.061 |
iet | +0.057 |
attent | +0.057 |
Please | +0.055 |
Neg logit contributions | |
on | -0.075 |
mmm | -0.073 |
orse | -0.070 |
inations | -0.068 |
Joe | -0.067 |
Token | avored |
Token ID | 48275 |
Feature activation | -1.79e-02 |
Pos logit contributions | |
ranc | +0.130 |
err | +0.121 |
attent | +0.116 |
iet | +0.115 |
Please | +0.113 |
Neg logit contributions | |
mmm | -0.078 |
on | -0.078 |
orse | -0.074 |
inations | -0.072 |
mm | -0.070 |
Token | cr |
Token ID | 1067 |
Feature activation | -2.39e-02 |
Pos logit contributions | |
ranc | +0.028 |
err | +0.026 |
attent | +0.024 |
iet | +0.024 |
Please | +0.024 |
Neg logit contributions | |
mmm | -0.024 |
on | -0.024 |
orse | -0.023 |
inations | -0.023 |
mm | -0.022 |
Token | ay |
Token ID | 323 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ranc | +0.036 |
err | +0.036 |
iet | +0.034 |
andel | +0.034 |
attent | +0.033 |
Neg logit contributions | |
orse | -0.031 |
mmm | -0.030 |
inations | -0.030 |
on | -0.029 |
Joe | -0.029 |
Token | on |
Token ID | 261 |
Feature activation | -1.04e-02 |
Pos logit contributions | |
mmm | +0.001 |
inations | +0.001 |
orse | +0.001 |
etti | +0.001 |
achieve | +0.001 |
Neg logit contributions | |
ranc | -0.027 |
err | -0.027 |
attent | -0.027 |
iet | -0.026 |
andel | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | +8.67e-04 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.010 |
attent | +0.009 |
iet | +0.009 |
Please | +0.008 |
Neg logit contributions | |
mmm | -0.020 |
orse | -0.019 |
inations | -0.019 |
on | -0.019 |
mm | -0.018 |
Token | a |
Token ID | 257 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.008 |
on | -0.008 |
inations | -0.008 |
orse | -0.008 |
etti | -0.008 |
Token | field |
Token ID | 2214 |
Feature activation | +3.16e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
veterinarian | +0.002 |
girl | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
on | -0.004 |
inations | -0.004 |
mm | -0.004 |
orse | -0.004 |
Token | full |
Token ID | 1336 |
Feature activation | +1.59e-02 |
Pos logit contributions | |
on | +0.005 |
orse | +0.005 |
mmm | +0.004 |
Joe | +0.004 |
etti | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
iet | -0.004 |
attent | -0.004 |
Please | -0.004 |
Token | of |
Token ID | 286 |
Feature activation | -7.83e-04 |
Pos logit contributions | |
on | +0.024 |
mmm | +0.024 |
orse | +0.023 |
Joe | +0.023 |
inations | +0.022 |
Neg logit contributions | |
ranc | -0.022 |
err | -0.021 |
attent | -0.019 |
iet | -0.019 |
Please | -0.019 |
Token | wild |
Token ID | 4295 |
Feature activation | -5.37e-04 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
girl | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
etti | -0.001 |
inations | -0.001 |
Token | fl |
Token ID | 2704 |
Feature activation | -6.79e-02 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.000 |
attent | +0.000 |
iet | +0.000 |
Please | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
inations | -0.001 |
etti | -0.001 |
Token | owers |
Token ID | 3618 |
Feature activation | -1.81e-02 |
Pos logit contributions | |
ranc | +0.087 |
err | +0.080 |
attent | +0.075 |
iet | +0.074 |
andel | +0.072 |
Neg logit contributions | |
mmm | -0.109 |
on | -0.108 |
orse | -0.107 |
inations | -0.105 |
Joe | -0.101 |
Token | . |
Token ID | 13 |
Feature activation | -3.10e-03 |
Pos logit contributions | |
ranc | +0.013 |
attent | +0.010 |
err | +0.009 |
out | +0.009 |
for | +0.009 |
Neg logit contributions | |
mmm | -0.041 |
mm | -0.039 |
inations | -0.038 |
on | -0.038 |
orse | -0.038 |
Token | They |
Token ID | 1119 |
Feature activation | -5.14e-04 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
inations | -0.004 |
Joe | -0.004 |
Token | offered |
Token ID | 4438 |
Feature activation | -2.55e-03 |
Pos logit contributions | |
ranc | +0.001 |
attent | +0.001 |
iet | +0.001 |
err | +0.001 |
moral | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
mm | -0.001 |
on | -0.001 |
etti | -0.001 |
inations | -0.001 |
Token | them |
Token ID | 606 |
Feature activation | -1.50e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
iet | +0.002 |
attent | +0.002 |
Please | +0.002 |
Neg logit contributions | |
on | -0.005 |
mmm | -0.005 |
orse | -0.004 |
inations | -0.004 |
Joe | -0.004 |
Token | , |
Token ID | 11 |
Feature activation | +2.36e-04 |
Pos logit contributions | |
on | +0.016 |
mmm | +0.014 |
Joe | +0.014 |
mm | +0.013 |
orse | +0.013 |
Neg logit contributions | |
ranc | -0.031 |
err | -0.030 |
attent | -0.029 |
iet | -0.028 |
andel | -0.028 |
Token | she |
Token ID | 673 |
Feature activation | -4.09e-03 |
Pos logit contributions | |
on | +0.000 |
Joe | +0.000 |
John | +0.000 |
orse | +0.000 |
Jack | +0.000 |
Neg logit contributions | |
err | -0.000 |
ranc | -0.000 |
iet | -0.000 |
attent | -0.000 |
andel | -0.000 |
Token | accidentally |
Token ID | 14716 |
Feature activation | +2.79e-04 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.007 |
on | -0.007 |
orse | -0.007 |
inations | -0.007 |
mm | -0.007 |
Token | threw |
Token ID | 9617 |
Feature activation | +1.68e-03 |
Pos logit contributions | |
on | +0.000 |
orse | +0.000 |
Joe | +0.000 |
etti | +0.000 |
Matt | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
andel | -0.000 |
iet | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | -9.42e-03 |
Pos logit contributions | |
on | +0.002 |
Joe | +0.002 |
John | +0.002 |
Mike | +0.002 |
e | +0.002 |
Neg logit contributions | |
ranc | -0.003 |
attent | -0.002 |
err | -0.002 |
iet | -0.002 |
urse | -0.002 |
Token | pe |
Token ID | 613 |
Feature activation | -6.47e-02 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.014 |
attent | +0.014 |
iet | +0.013 |
Please | +0.013 |
Neg logit contributions | |
on | -0.013 |
orse | -0.012 |
mmm | -0.011 |
cube | -0.011 |
inations | -0.011 |
Token | b |
Token ID | 65 |
Feature activation | -5.34e-02 |
Pos logit contributions | |
ranc | +0.148 |
err | +0.132 |
veterinarian | +0.130 |
attent | +0.129 |
Please | +0.127 |
Neg logit contributions | |
on | -0.056 |
orse | -0.048 |
mmm | -0.046 |
inations | -0.045 |
mm | -0.038 |
Token | ble |
Token ID | 903 |
Feature activation | -2.99e-02 |
Pos logit contributions | |
ranc | +0.118 |
attent | +0.106 |
err | +0.106 |
veterinarian | +0.103 |
Please | +0.103 |
Neg logit contributions | |
on | -0.050 |
mmm | -0.042 |
orse | -0.041 |
mm | -0.037 |
Joe | -0.036 |
Token | at |
Token ID | 379 |
Feature activation | +2.15e-03 |
Pos logit contributions | |
ranc | +0.045 |
err | +0.035 |
iet | +0.034 |
nurses | +0.033 |
attent | +0.033 |
Neg logit contributions | |
on | -0.055 |
cube | -0.047 |
Joe | -0.043 |
orse | -0.043 |
mmm | -0.043 |
Token | her |
Token ID | 607 |
Feature activation | -1.06e-02 |
Pos logit contributions | |
on | +0.004 |
mmm | +0.004 |
orse | +0.004 |
inations | +0.004 |
Joe | +0.004 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | friend |
Token ID | 1545 |
Feature activation | +3.26e-03 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
veterinarian | +0.008 |
girl | +0.008 |
attent | +0.008 |
Neg logit contributions | |
mmm | -0.021 |
inations | -0.021 |
on | -0.020 |
orse | -0.020 |
etti | -0.020 |
Token | , |
Token ID | 11 |
Feature activation | +1.02e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.008 |
iet | +0.007 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.015 |
inations | -0.015 |
orse | -0.015 |
mm | -0.015 |
Token | then |
Token ID | 788 |
Feature activation | -6.70e-03 |
Pos logit contributions | |
mmm | +0.017 |
on | +0.017 |
orse | +0.017 |
inations | +0.016 |
mm | +0.016 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.012 |
attent | -0.011 |
iet | -0.011 |
Please | -0.011 |
Token | she |
Token ID | 673 |
Feature activation | -5.69e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.007 |
iet | +0.007 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.012 |
on | -0.011 |
orse | -0.011 |
inations | -0.011 |
mm | -0.011 |
Token | grabbed |
Token ID | 13176 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
mm | -0.010 |
inations | -0.010 |
orse | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | -5.96e-03 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.014 |
iet | +0.013 |
attent | +0.012 |
Please | +0.012 |
Neg logit contributions | |
on | -0.023 |
mmm | -0.022 |
Joe | -0.021 |
orse | -0.021 |
inations | -0.020 |
Token | pe |
Token ID | 613 |
Feature activation | -6.41e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.007 |
iet | +0.007 |
ther | +0.007 |
Neg logit contributions | |
mmm | -0.009 |
on | -0.009 |
orse | -0.008 |
mm | -0.008 |
inations | -0.008 |
Token | b |
Token ID | 65 |
Feature activation | -5.33e-02 |
Pos logit contributions | |
ranc | +0.134 |
err | +0.124 |
veterinarian | +0.121 |
Please | +0.119 |
attent | +0.117 |
Neg logit contributions | |
on | -0.060 |
orse | -0.058 |
inations | -0.055 |
mmm | -0.054 |
Joe | -0.047 |
Token | ble |
Token ID | 903 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
ranc | +0.105 |
err | +0.098 |
attent | +0.095 |
Please | +0.093 |
veterinarian | +0.092 |
Neg logit contributions | |
on | -0.053 |
mmm | -0.051 |
orse | -0.050 |
inations | -0.046 |
Joe | -0.046 |
Token | . |
Token ID | 13 |
Feature activation | -4.73e-03 |
Pos logit contributions | |
ranc | +0.029 |
err | +0.026 |
attent | +0.024 |
iet | +0.023 |
Please | +0.023 |
Neg logit contributions | |
on | -0.040 |
mmm | -0.038 |
orse | -0.038 |
Joe | -0.037 |
inations | -0.036 |
Token | She |
Token ID | 1375 |
Feature activation | -4.83e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
iet | +0.005 |
attent | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.008 |
on | -0.008 |
orse | -0.008 |
inations | -0.008 |
Joe | -0.007 |
Token | looked |
Token ID | 3114 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
ranc | +0.005 |
attent | +0.005 |
err | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.009 |
mm | -0.009 |
on | -0.008 |
etti | -0.008 |
inations | -0.008 |
Token | from |
Token ID | 422 |
Feature activation | -3.02e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
orse | -0.009 |
inations | -0.009 |
mm | -0.009 |
Token | a |
Token ID | 257 |
Feature activation | +2.47e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.003 |
iet | +0.003 |
Please | +0.003 |
Neg logit contributions | |
on | -0.005 |
mmm | -0.005 |
orse | -0.005 |
Joe | -0.005 |
inations | -0.005 |
Token | field |
Token ID | 2214 |
Feature activation | -1.39e-03 |
Pos logit contributions | |
mmm | +0.005 |
mm | +0.005 |
inations | +0.004 |
orse | +0.004 |
on | +0.004 |
Neg logit contributions | |
ranc | -0.003 |
corner | -0.002 |
veterinarian | -0.002 |
girl | -0.002 |
attent | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | -1.36e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
on | -0.002 |
orse | -0.002 |
inations | -0.002 |
mm | -0.002 |
Token | wild |
Token ID | 4295 |
Feature activation | +2.41e-04 |
Pos logit contributions | |
ranc | +0.002 |
girl | +0.001 |
Please | +0.001 |
attent | +0.001 |
err | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
orse | -0.002 |
inations | -0.002 |
mm | -0.002 |
etti | -0.002 |
Token | fl |
Token ID | 2704 |
Feature activation | -6.39e-02 |
Pos logit contributions | |
mmm | +0.000 |
orse | +0.000 |
on | +0.000 |
inations | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
girl | -0.000 |
Please | -0.000 |
Token | owers |
Token ID | 3618 |
Feature activation | -1.68e-02 |
Pos logit contributions | |
ranc | +0.092 |
err | +0.086 |
andel | +0.082 |
attent | +0.081 |
iet | +0.080 |
Neg logit contributions | |
orse | -0.091 |
mmm | -0.088 |
inations | -0.087 |
on | -0.082 |
Joe | -0.082 |
Token | . |
Token ID | 13 |
Feature activation | -4.31e-03 |
Pos logit contributions | |
ranc | +0.011 |
out | +0.010 |
for | +0.009 |
at | +0.009 |
attent | +0.008 |
Neg logit contributions | |
mmm | -0.039 |
mm | -0.038 |
inations | -0.036 |
orse | -0.036 |
on | -0.035 |
Token |
|
Token ID | 198 |
Feature activation | -5.79e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
attent | +0.006 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.006 |
inations | -0.006 |
Joe | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -2.83e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.003 |
ther | +0.003 |
L | +0.003 |
Neg logit contributions | |
mmm | -0.012 |
mm | -0.012 |
inations | -0.012 |
etti | -0.012 |
orse | -0.012 |
Token | Mom |
Token ID | 29252 |
Feature activation | +2.76e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.003 |
attent | +0.003 |
iet | +0.003 |
andel | +0.003 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
inations | -0.005 |
etti | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | -1.01e-02 |
Pos logit contributions | |
on | +0.010 |
mmm | +0.010 |
orse | +0.010 |
inations | +0.010 |
Joe | +0.010 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
iet | -0.006 |
Please | -0.005 |
Token | send |
Token ID | 3758 |
Feature activation | -5.02e-04 |
Pos logit contributions | |
ranc | +0.015 |
err | +0.013 |
attent | +0.013 |
Please | +0.013 |
iet | +0.013 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.014 |
mm | -0.014 |
orse | -0.014 |
inations | -0.014 |
Token | soft |
Token ID | 2705 |
Feature activation | +5.11e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
attent | +0.000 |
andel | +0.000 |
Neg logit contributions | |
on | -0.001 |
mmm | -0.001 |
Joe | -0.001 |
inations | -0.001 |
John | -0.001 |
Token | white |
Token ID | 2330 |
Feature activation | -5.85e-03 |
Pos logit contributions | |
mmm | +0.009 |
on | +0.009 |
orse | +0.008 |
inations | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.006 |
attent | -0.005 |
iet | -0.005 |
Please | -0.005 |
Token | snow |
Token ID | 6729 |
Feature activation | -2.46e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
attent | +0.006 |
iet | +0.006 |
Please | +0.006 |
Neg logit contributions | |
on | -0.010 |
mmm | -0.009 |
orse | -0.009 |
inations | -0.009 |
etti | -0.009 |
Token | fl |
Token ID | 2704 |
Feature activation | -6.37e-02 |
Pos logit contributions | |
ranc | +0.029 |
err | +0.027 |
attent | +0.025 |
iet | +0.024 |
Please | +0.024 |
Neg logit contributions | |
on | -0.043 |
mmm | -0.042 |
orse | -0.041 |
etti | -0.040 |
inations | -0.040 |
Token | akes |
Token ID | 1124 |
Feature activation | -1.25e-02 |
Pos logit contributions | |
ranc | +0.098 |
err | +0.092 |
attent | +0.087 |
andel | +0.086 |
ther | +0.086 |
Neg logit contributions | |
orse | -0.084 |
mmm | -0.084 |
inations | -0.081 |
on | -0.078 |
achieve | -0.077 |
Token | into |
Token ID | 656 |
Feature activation | -2.33e-02 |
Pos logit contributions | |
ranc | +0.012 |
err | +0.010 |
attent | +0.009 |
iet | +0.009 |
Please | +0.009 |
Neg logit contributions | |
mmm | -0.025 |
on | -0.025 |
orse | -0.024 |
inations | -0.024 |
mm | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
ranc | +0.026 |
err | +0.023 |
attent | +0.022 |
iet | +0.021 |
andel | +0.021 |
Neg logit contributions | |
mmm | -0.042 |
orse | -0.041 |
on | -0.041 |
inations | -0.041 |
mm | -0.040 |
Token | sky |
Token ID | 6766 |
Feature activation | -2.44e-03 |
Pos logit contributions | |
ranc | +0.014 |
err | +0.013 |
attent | +0.012 |
iet | +0.012 |
andel | +0.011 |
Neg logit contributions | |
on | -0.019 |
mmm | -0.018 |
orse | -0.018 |
inations | -0.018 |
Joe | -0.018 |
Token | . |
Token ID | 13 |
Feature activation | -6.90e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
inations | -0.005 |
orse | -0.005 |
mm | -0.005 |
Token | huge |
Token ID | 3236 |
Feature activation | +1.86e-02 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
mm | +0.004 |
orse | +0.004 |
inations | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
veterinarian | -0.003 |
girl | -0.003 |
Token | garden |
Token ID | 11376 |
Feature activation | -1.32e-02 |
Pos logit contributions | |
mmm | +0.029 |
inations | +0.028 |
mm | +0.027 |
on | +0.027 |
orse | +0.027 |
Neg logit contributions | |
ranc | -0.026 |
girl | -0.024 |
veterinarian | -0.023 |
err | -0.022 |
attent | -0.022 |
Token | filled |
Token ID | 5901 |
Feature activation | +6.15e-03 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.014 |
attent | +0.014 |
iet | +0.014 |
Please | +0.013 |
Neg logit contributions | |
mmm | -0.022 |
on | -0.021 |
inations | -0.021 |
orse | -0.021 |
mm | -0.021 |
Token | with |
Token ID | 351 |
Feature activation | -8.62e-03 |
Pos logit contributions | |
mmm | +0.011 |
on | +0.011 |
orse | +0.010 |
inations | +0.010 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
iet | -0.006 |
Please | -0.006 |
Token | wild |
Token ID | 4295 |
Feature activation | +2.60e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.009 |
attent | +0.009 |
girl | +0.009 |
iet | +0.009 |
Neg logit contributions | |
mmm | -0.015 |
orse | -0.015 |
on | -0.015 |
mm | -0.014 |
inations | -0.014 |
Token | fl |
Token ID | 2704 |
Feature activation | -6.34e-02 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
orse | +0.005 |
inations | +0.005 |
mm | +0.005 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
girl | -0.002 |
Token | owers |
Token ID | 3618 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
ranc | +0.068 |
err | +0.065 |
attent | +0.058 |
iet | +0.058 |
andel | +0.057 |
Neg logit contributions | |
orse | -0.113 |
mmm | -0.112 |
inations | -0.109 |
on | -0.107 |
achieve | -0.103 |
Token | and |
Token ID | 290 |
Feature activation | +4.37e-03 |
Pos logit contributions | |
ranc | +0.010 |
out | +0.008 |
attent | +0.008 |
for | +0.008 |
err | +0.008 |
Neg logit contributions | |
mmm | -0.027 |
mm | -0.027 |
inations | -0.026 |
orse | -0.025 |
opter | -0.025 |
Token | trees |
Token ID | 7150 |
Feature activation | +1.11e-02 |
Pos logit contributions | |
mmm | +0.007 |
on | +0.007 |
orse | +0.007 |
mm | +0.007 |
inations | +0.007 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
Please | -0.005 |
girl | -0.005 |
Token | ! |
Token ID | 0 |
Feature activation | -3.10e-03 |
Pos logit contributions | |
mmm | +0.024 |
mm | +0.023 |
inations | +0.022 |
orse | +0.022 |
on | +0.022 |
Neg logit contributions | |
ranc | -0.009 |
attent | -0.008 |
err | -0.007 |
out | -0.007 |
veterinarian | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -1.33e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
Please | +0.003 |
veterinarian | +0.003 |
Neg logit contributions | |
inations | -0.005 |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
mm | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +3.10e-03 |
Pos logit contributions | |
mmm | +0.007 |
inations | +0.007 |
orse | +0.007 |
on | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
ther | -0.007 |
girl | -0.007 |
out | -0.007 |
Token | she |
Token ID | 673 |
Feature activation | -5.00e-03 |
Pos logit contributions | |
on | +0.005 |
mmm | +0.005 |
mm | +0.005 |
orse | +0.005 |
Joe | +0.005 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
andel | -0.004 |
Token | found |
Token ID | 1043 |
Feature activation | +1.41e-03 |
Pos logit contributions | |
err | +0.006 |
ranc | +0.006 |
andel | +0.006 |
attent | +0.006 |
iet | +0.005 |
Neg logit contributions | |
on | -0.008 |
orse | -0.008 |
mmm | -0.008 |
inations | -0.008 |
Joe | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | -3.77e-03 |
Pos logit contributions | |
on | +0.002 |
Joe | +0.002 |
John | +0.002 |
mmm | +0.002 |
Mike | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
andel | -0.002 |
Token | shiny |
Token ID | 22441 |
Feature activation | -8.86e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.006 |
inations | -0.006 |
etti | -0.006 |
Token | pe |
Token ID | 613 |
Feature activation | -6.33e-02 |
Pos logit contributions | |
ranc | +0.014 |
err | +0.013 |
attent | +0.013 |
iet | +0.012 |
Please | +0.012 |
Neg logit contributions | |
on | -0.012 |
mmm | -0.012 |
orse | -0.011 |
etti | -0.011 |
mm | -0.011 |
Token | b |
Token ID | 65 |
Feature activation | -5.34e-02 |
Pos logit contributions | |
ranc | +0.122 |
err | +0.114 |
attent | +0.109 |
iet | +0.108 |
Please | +0.107 |
Neg logit contributions | |
on | -0.065 |
mmm | -0.064 |
orse | -0.061 |
inations | -0.059 |
mm | -0.056 |
Token | ble |
Token ID | 903 |
Feature activation | -2.78e-02 |
Pos logit contributions | |
ranc | +0.099 |
err | +0.093 |
attent | +0.089 |
iet | +0.088 |
Please | +0.087 |
Neg logit contributions | |
on | -0.057 |
mmm | -0.057 |
orse | -0.054 |
inations | -0.052 |
etti | -0.051 |
Token | and |
Token ID | 290 |
Feature activation | +1.88e-03 |
Pos logit contributions | |
ranc | +0.031 |
err | +0.028 |
attent | +0.026 |
iet | +0.026 |
Please | +0.024 |
Neg logit contributions | |
on | -0.052 |
mmm | -0.050 |
orse | -0.050 |
inations | -0.047 |
etti | -0.047 |
Token | picked |
Token ID | 6497 |
Feature activation | -1.57e-02 |
Pos logit contributions | |
mmm | +0.003 |
on | +0.003 |
orse | +0.003 |
inations | +0.003 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | +6.96e-03 |
Pos logit contributions | |
ranc | +0.031 |
err | +0.028 |
iet | +0.027 |
attent | +0.027 |
Please | +0.027 |
Neg logit contributions | |
on | -0.016 |
mmm | -0.015 |
orse | -0.014 |
Joe | -0.014 |
inations | -0.014 |
Token | was |
Token ID | 373 |
Feature activation | -2.31e-02 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.019 |
andel | +0.018 |
attent | +0.018 |
veterinarian | +0.018 |
Neg logit contributions | |
on | -0.018 |
orse | -0.017 |
Joe | -0.016 |
mmm | -0.016 |
etti | -0.015 |
Token | as |
Token ID | 355 |
Feature activation | -7.01e-03 |
Pos logit contributions | |
ranc | +0.035 |
err | +0.032 |
iet | +0.030 |
attent | +0.029 |
veterinarian | +0.029 |
Neg logit contributions | |
on | -0.033 |
mmm | -0.033 |
orse | -0.032 |
Joe | -0.032 |
inations | -0.031 |
Token | tiny |
Token ID | 7009 |
Feature activation | +4.51e-03 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.008 |
Please | +0.007 |
iet | +0.007 |
Neg logit contributions | |
mmm | -0.012 |
on | -0.011 |
orse | -0.011 |
inations | -0.011 |
etti | -0.011 |
Token | as |
Token ID | 355 |
Feature activation | -4.45e-03 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.008 |
orse | +0.008 |
inations | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | -6.52e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.005 |
Please | +0.005 |
louder | +0.005 |
Neg logit contributions | |
mmm | -0.007 |
orse | -0.007 |
inations | -0.007 |
on | -0.007 |
etti | -0.007 |
Token | pe |
Token ID | 613 |
Feature activation | -6.26e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
iet | +0.008 |
attent | +0.008 |
Please | +0.007 |
Neg logit contributions | |
on | -0.010 |
mmm | -0.010 |
orse | -0.010 |
inations | -0.010 |
Joe | -0.009 |
Token | a |
Token ID | 64 |
Feature activation | -1.70e-02 |
Pos logit contributions | |
ranc | +0.121 |
err | +0.103 |
nurses | +0.099 |
veterinarian | +0.098 |
attent | +0.098 |
Neg logit contributions | |
on | -0.079 |
orse | -0.073 |
mmm | -0.072 |
inations | -0.067 |
achieve | -0.062 |
Token | . |
Token ID | 13 |
Feature activation | -4.84e-03 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.020 |
iet | +0.019 |
attent | +0.019 |
andel | +0.018 |
Neg logit contributions | |
on | -0.029 |
orse | -0.028 |
mmm | -0.027 |
Joe | -0.026 |
inations | -0.026 |
Token | The |
Token ID | 383 |
Feature activation | +1.69e-03 |
Pos logit contributions | |
ranc | +0.007 |
iet | +0.007 |
err | +0.007 |
andel | +0.006 |
ther | +0.006 |
Neg logit contributions | |
mmm | -0.007 |
Joe | -0.006 |
on | -0.006 |
John | -0.006 |
etti | -0.006 |
Token | little |
Token ID | 1310 |
Feature activation | -6.21e-03 |
Pos logit contributions | |
on | +0.003 |
mmm | +0.003 |
mm | +0.003 |
cube | +0.002 |
orse | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
attent | -0.002 |
iet | -0.002 |
err | -0.002 |
andel | -0.002 |
Token | girl |
Token ID | 2576 |
Feature activation | -6.60e-03 |
Pos logit contributions | |
ranc | +0.006 |
attent | +0.005 |
iet | +0.005 |
err | +0.005 |
andel | +0.004 |
Neg logit contributions | |
on | -0.012 |
Joe | -0.012 |
mmm | -0.012 |
cube | -0.012 |
mm | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +6.78e-03 |
Pos logit contributions | |
on | +0.003 |
mmm | +0.003 |
orse | +0.003 |
inations | +0.003 |
Joe | +0.003 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | trying |
Token ID | 2111 |
Feature activation | -1.36e-04 |
Pos logit contributions | |
on | +0.009 |
orse | +0.009 |
mmm | +0.009 |
Joe | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.011 |
err | -0.010 |
iet | -0.010 |
andel | -0.009 |
attent | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -2.08e-03 |
Pos logit contributions | |
ranc | +0.000 |
andel | +0.000 |
iet | +0.000 |
err | +0.000 |
masse | +0.000 |
Neg logit contributions | |
on | -0.000 |
Joe | -0.000 |
orse | -0.000 |
mmm | -0.000 |
John | -0.000 |
Token | grab |
Token ID | 5552 |
Feature activation | -9.66e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.002 |
Please | +0.002 |
iet | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
etti | -0.003 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.012 |
attent | +0.011 |
iet | +0.011 |
Please | +0.011 |
Neg logit contributions | |
on | -0.016 |
Joe | -0.015 |
mmm | -0.015 |
orse | -0.014 |
etti | -0.014 |
Token | pr |
Token ID | 778 |
Feature activation | -6.26e-02 |
Pos logit contributions | |
ranc | +0.017 |
err | +0.015 |
iet | +0.015 |
Please | +0.014 |
attent | +0.014 |
Neg logit contributions | |
on | -0.014 |
orse | -0.012 |
mmm | -0.012 |
cube | -0.012 |
Joe | -0.011 |
Token | une |
Token ID | 1726 |
Feature activation | -3.00e-02 |
Pos logit contributions | |
ranc | +0.101 |
err | +0.093 |
attent | +0.090 |
Please | +0.089 |
iet | +0.088 |
Neg logit contributions | |
mmm | -0.085 |
on | -0.083 |
mm | -0.078 |
orse | -0.075 |
Joe | -0.074 |
Token | . |
Token ID | 13 |
Feature activation | -4.95e-03 |
Pos logit contributions | |
ranc | +0.041 |
err | +0.037 |
iet | +0.036 |
attent | +0.033 |
Please | +0.033 |
Neg logit contributions | |
on | -0.051 |
mmm | -0.047 |
orse | -0.045 |
Joe | -0.045 |
cube | -0.043 |
Token |
|
Token ID | 198 |
Feature activation | -4.29e-03 |
Pos logit contributions | |
ranc | +0.008 |
iet | +0.007 |
err | +0.007 |
andel | +0.007 |
attent | +0.007 |
Neg logit contributions | |
Joe | -0.006 |
on | -0.006 |
mmm | -0.006 |
orse | -0.006 |
Mike | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | -1.22e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.007 |
on | -0.007 |
inations | -0.007 |
orse | -0.007 |
etti | -0.007 |
Token | " |
Token ID | 1 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.002 |
on | -0.002 |
orse | -0.002 |
inations | -0.002 |
etti | -0.002 |
Token | my |
Token ID | 1820 |
Feature activation | -2.82e-03 |
Pos logit contributions | |
mmm | +0.006 |
inations | +0.006 |
mm | +0.006 |
orse | +0.006 |
etti | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
girl | -0.003 |
Please | -0.003 |
veterinarian | -0.003 |
iet | -0.003 |
Token | took |
Token ID | 1718 |
Feature activation | -1.69e-02 |
Pos logit contributions | |
ranc | +0.003 |
veterinarian | +0.002 |
girl | +0.002 |
attent | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.005 |
mm | -0.005 |
inations | -0.005 |
orse | -0.005 |
etti | -0.005 |
Token | out |
Token ID | 503 |
Feature activation | -1.20e-02 |
Pos logit contributions | |
ranc | +0.026 |
err | +0.024 |
attent | +0.024 |
out | +0.024 |
Please | +0.023 |
Neg logit contributions | |
mmm | -0.023 |
orse | -0.023 |
inations | -0.022 |
mm | -0.022 |
etti | -0.021 |
Token | a |
Token ID | 257 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
ranc | +0.015 |
err | +0.013 |
attent | +0.012 |
iet | +0.012 |
Please | +0.012 |
Neg logit contributions | |
on | -0.020 |
mmm | -0.020 |
orse | -0.020 |
inations | -0.019 |
Joe | -0.019 |
Token | bright |
Token ID | 6016 |
Feature activation | -6.63e-03 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.012 |
attent | +0.011 |
iet | +0.011 |
ther | +0.011 |
Neg logit contributions | |
mmm | -0.018 |
orse | -0.018 |
on | -0.018 |
mm | -0.017 |
inations | -0.017 |
Token | therm |
Token ID | 21969 |
Feature activation | -6.20e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.009 |
attent | +0.008 |
iet | +0.008 |
Please | +0.008 |
Neg logit contributions | |
on | -0.010 |
mmm | -0.010 |
orse | -0.009 |
inations | -0.009 |
etti | -0.009 |
Token | ometer |
Token ID | 15635 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
ranc | +0.065 |
err | +0.058 |
attent | +0.057 |
iet | +0.051 |
andel | +0.049 |
Neg logit contributions | |
inations | -0.117 |
mmm | -0.115 |
orse | -0.115 |
on | -0.113 |
achieve | -0.109 |
Token | and |
Token ID | 290 |
Feature activation | -5.84e-03 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.019 |
attent | +0.018 |
iet | +0.017 |
Please | +0.017 |
Neg logit contributions | |
mmm | -0.040 |
on | -0.039 |
orse | -0.038 |
inations | -0.038 |
mm | -0.037 |
Token | checked |
Token ID | 10667 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
ranc | +0.007 |
attent | +0.006 |
out | +0.006 |
nurses | +0.006 |
Please | +0.006 |
Neg logit contributions | |
mmm | -0.010 |
mm | -0.010 |
orse | -0.010 |
etti | -0.010 |
inations | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | -1.02e-02 |
Pos logit contributions | |
orse | +0.002 |
mmm | +0.002 |
inations | +0.002 |
mm | +0.002 |
etti | +0.002 |
Neg logit contributions | |
out | -0.001 |
ranc | -0.001 |
attent | -0.001 |
err | -0.001 |
for | -0.001 |
Token | Joey |
Token ID | 26154 |
Feature activation | -3.94e-03 |
Pos logit contributions | |
ranc | +0.016 |
attent | +0.015 |
err | +0.015 |
Please | +0.014 |
out | +0.014 |
Neg logit contributions | |
inations | -0.015 |
orse | -0.013 |
on | -0.013 |
mm | -0.013 |
mmm | -0.013 |
Token | safely |
Token ID | 11512 |
Feature activation | +6.47e-03 |
Pos logit contributions | |
on | +0.009 |
mmm | +0.009 |
orse | +0.009 |
inations | +0.009 |
Joe | +0.009 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | away |
Token ID | 1497 |
Feature activation | +9.20e-03 |
Pos logit contributions | |
on | +0.013 |
mmm | +0.013 |
inations | +0.013 |
orse | +0.012 |
etti | +0.012 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
Please | -0.004 |
Token | in |
Token ID | 287 |
Feature activation | -6.48e-03 |
Pos logit contributions | |
mmm | +0.017 |
on | +0.017 |
orse | +0.017 |
inations | +0.016 |
Joe | +0.016 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
iet | -0.008 |
attent | -0.008 |
Please | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | -5.59e-04 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
attent | +0.006 |
corner | +0.005 |
moral | +0.005 |
Neg logit contributions | |
mmm | -0.012 |
orse | -0.012 |
mm | -0.012 |
inations | -0.012 |
etti | -0.012 |
Token | small |
Token ID | 1402 |
Feature activation | +8.16e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
veterinarian | +0.001 |
attent | +0.001 |
girl | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
mm | -0.001 |
on | -0.001 |
etti | -0.001 |
inations | -0.001 |
Token | pe |
Token ID | 613 |
Feature activation | -6.14e-02 |
Pos logit contributions | |
mmm | +0.016 |
mm | +0.016 |
inations | +0.016 |
on | +0.015 |
orse | +0.015 |
Neg logit contributions | |
ranc | -0.009 |
girl | -0.008 |
corner | -0.008 |
veterinarian | -0.007 |
ther | -0.007 |
Token | b |
Token ID | 65 |
Feature activation | -4.88e-02 |
Pos logit contributions | |
ranc | +0.117 |
err | +0.110 |
attent | +0.104 |
Please | +0.104 |
iet | +0.102 |
Neg logit contributions | |
on | -0.065 |
orse | -0.063 |
mmm | -0.062 |
inations | -0.061 |
mm | -0.054 |
Token | ble |
Token ID | 903 |
Feature activation | -2.39e-02 |
Pos logit contributions | |
ranc | +0.084 |
err | +0.079 |
attent | +0.075 |
iet | +0.075 |
Please | +0.073 |
Neg logit contributions | |
mmm | -0.058 |
on | -0.056 |
orse | -0.055 |
inations | -0.054 |
mm | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | -7.41e-03 |
Pos logit contributions | |
ranc | +0.025 |
err | +0.022 |
attent | +0.020 |
iet | +0.020 |
Please | +0.019 |
Neg logit contributions | |
mmm | -0.045 |
on | -0.044 |
orse | -0.043 |
inations | -0.043 |
mm | -0.042 |
Token | |
Token ID | 220 |
Feature activation | -1.41e-02 |
Pos logit contributions | |
ranc | +0.007 |
Please | +0.005 |
err | +0.005 |
veterinarian | +0.005 |
attent | +0.005 |
Neg logit contributions | |
inations | -0.015 |
mmm | -0.015 |
orse | -0.015 |
on | -0.014 |
mm | -0.014 |
Token |
|
Token ID | 198 |
Feature activation | -1.46e-02 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.015 |
attent | +0.014 |
iet | +0.014 |
Please | +0.014 |
Neg logit contributions | |
mmm | -0.024 |
on | -0.023 |
orse | -0.023 |
inations | -0.023 |
etti | -0.023 |
Token | with |
Token ID | 351 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
mmm | +0.006 |
inations | +0.006 |
mm | +0.006 |
orse | +0.006 |
on | +0.006 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
Please | -0.003 |
iet | -0.003 |
Token | lots |
Token ID | 6041 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.009 |
out | +0.008 |
girl | +0.008 |
louder | +0.008 |
Neg logit contributions | |
mmm | -0.025 |
orse | -0.024 |
inations | -0.023 |
mm | -0.023 |
on | -0.023 |
Token | of |
Token ID | 286 |
Feature activation | -7.76e-03 |
Pos logit contributions | |
mmm | +0.024 |
orse | +0.023 |
mm | +0.023 |
inations | +0.023 |
achieve | +0.023 |
Neg logit contributions | |
ranc | -0.006 |
andel | -0.006 |
attent | -0.005 |
at | -0.005 |
corner | -0.005 |
Token | lovely |
Token ID | 14081 |
Feature activation | +1.49e-02 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
girl | +0.007 |
ther | +0.006 |
attent | +0.006 |
Neg logit contributions | |
mmm | -0.015 |
orse | -0.015 |
on | -0.015 |
etti | -0.015 |
inations | -0.014 |
Token | wild |
Token ID | 4295 |
Feature activation | +3.32e-03 |
Pos logit contributions | |
mmm | +0.031 |
on | +0.031 |
orse | +0.031 |
mm | +0.030 |
inations | +0.030 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.011 |
girl | -0.010 |
attent | -0.010 |
andel | -0.010 |
Token | fl |
Token ID | 2704 |
Feature activation | -6.13e-02 |
Pos logit contributions | |
mmm | +0.007 |
on | +0.007 |
orse | +0.006 |
inations | +0.006 |
mm | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
andel | -0.002 |
iet | -0.002 |
Token | owers |
Token ID | 3618 |
Feature activation | -1.21e-02 |
Pos logit contributions | |
ranc | +0.074 |
err | +0.070 |
andel | +0.064 |
iet | +0.063 |
attent | +0.063 |
Neg logit contributions | |
mmm | -0.101 |
orse | -0.101 |
inations | -0.098 |
on | -0.098 |
Joe | -0.092 |
Token | growing |
Token ID | 3957 |
Feature activation | -7.58e-03 |
Pos logit contributions | |
ranc | +0.008 |
out | +0.007 |
for | +0.007 |
attent | +0.007 |
at | +0.007 |
Neg logit contributions | |
mmm | -0.027 |
mm | -0.026 |
inations | -0.025 |
orse | -0.024 |
on | -0.024 |
Token | on |
Token ID | 319 |
Feature activation | -8.74e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.006 |
iet | +0.006 |
Please | +0.006 |
Neg logit contributions | |
on | -0.015 |
mmm | -0.014 |
orse | -0.014 |
inations | -0.014 |
Joe | -0.014 |
Token | it |
Token ID | 340 |
Feature activation | +1.14e-02 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
attent | +0.009 |
out | +0.009 |
Please | +0.009 |
Neg logit contributions | |
inations | -0.016 |
mmm | -0.015 |
orse | -0.015 |
on | -0.014 |
mm | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -1.09e-03 |
Pos logit contributions | |
mmm | +0.025 |
orse | +0.024 |
inations | +0.024 |
mm | +0.024 |
on | +0.024 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
attent | -0.007 |
out | -0.006 |
Please | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -3.07e-04 |
Pos logit contributions | |
ranc | +0.051 |
err | +0.049 |
attent | +0.047 |
iet | +0.046 |
Please | +0.045 |
Neg logit contributions | |
on | -0.021 |
mmm | -0.019 |
orse | -0.018 |
mm | -0.017 |
Joe | -0.017 |
Token | she |
Token ID | 673 |
Feature activation | -8.25e-03 |
Pos logit contributions | |
err | +0.001 |
ranc | +0.001 |
iet | +0.001 |
andel | +0.001 |
inct | +0.001 |
Neg logit contributions | |
on | -0.000 |
John | -0.000 |
Jack | -0.000 |
Joe | -0.000 |
mmm | -0.000 |
Token | saw |
Token ID | 2497 |
Feature activation | -4.38e-03 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.010 |
attent | +0.009 |
andel | +0.009 |
iet | +0.009 |
Neg logit contributions | |
on | -0.014 |
orse | -0.013 |
mmm | -0.013 |
inations | -0.013 |
Joe | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | -2.41e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
attent | +0.005 |
iet | +0.005 |
andel | +0.005 |
Neg logit contributions | |
on | -0.007 |
Joe | -0.007 |
mmm | -0.006 |
orse | -0.006 |
mm | -0.006 |
Token | shiny |
Token ID | 22441 |
Feature activation | -6.63e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
on | -0.004 |
orse | -0.004 |
inations | -0.004 |
mm | -0.004 |
Token | pe |
Token ID | 613 |
Feature activation | -6.10e-02 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
attent | +0.010 |
iet | +0.009 |
Please | +0.009 |
Neg logit contributions | |
on | -0.009 |
mmm | -0.008 |
orse | -0.008 |
etti | -0.008 |
mm | -0.008 |
Token | b |
Token ID | 65 |
Feature activation | -4.97e-02 |
Pos logit contributions | |
ranc | +0.121 |
err | +0.114 |
attent | +0.109 |
iet | +0.107 |
Please | +0.107 |
Neg logit contributions | |
on | -0.061 |
mmm | -0.058 |
orse | -0.056 |
inations | -0.054 |
mm | -0.051 |
Token | ble |
Token ID | 903 |
Feature activation | -2.32e-02 |
Pos logit contributions | |
ranc | +0.099 |
err | +0.092 |
attent | +0.090 |
iet | +0.088 |
Please | +0.087 |
Neg logit contributions | |
on | -0.049 |
mmm | -0.047 |
orse | -0.045 |
mm | -0.042 |
inations | -0.042 |
Token | on |
Token ID | 319 |
Feature activation | -1.10e-02 |
Pos logit contributions | |
ranc | +0.029 |
err | +0.027 |
attent | +0.024 |
iet | +0.024 |
urse | +0.023 |
Neg logit contributions | |
on | -0.044 |
orse | -0.039 |
mmm | -0.037 |
cube | -0.037 |
Joe | -0.036 |
Token | the |
Token ID | 262 |
Feature activation | -9.62e-03 |
Pos logit contributions | |
ranc | +0.016 |
err | +0.015 |
attent | +0.014 |
iet | +0.014 |
Please | +0.013 |
Neg logit contributions | |
on | -0.016 |
mmm | -0.016 |
orse | -0.015 |
Joe | -0.015 |
etti | -0.015 |
Token | ground |
Token ID | 2323 |
Feature activation | -7.72e-03 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.008 |
attent | +0.008 |
Please | +0.007 |
iet | +0.007 |
Neg logit contributions | |
mmm | -0.019 |
on | -0.018 |
inations | -0.018 |
orse | -0.018 |
etti | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | +8.36e-03 |
Pos logit contributions | |
inations | +0.008 |
mmm | +0.007 |
orse | +0.007 |
etti | +0.007 |
on | +0.007 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.007 |
ther | -0.007 |
upon | -0.007 |
out | -0.007 |
Token | there |
Token ID | 612 |
Feature activation | +1.07e-02 |
Pos logit contributions | |
mmm | +0.016 |
inations | +0.015 |
on | +0.015 |
orse | +0.015 |
etti | +0.015 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.008 |
iet | -0.007 |
attent | -0.007 |
Please | -0.007 |
Token | was |
Token ID | 373 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
inations | +0.027 |
mmm | +0.026 |
orse | +0.024 |
etti | +0.024 |
achieve | +0.023 |
Neg logit contributions | |
ther | -0.005 |
err | -0.005 |
upon | -0.004 |
out | -0.004 |
girl | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +4.11e-04 |
Pos logit contributions | |
ranc | +0.014 |
err | +0.013 |
attent | +0.012 |
iet | +0.011 |
Please | +0.011 |
Neg logit contributions | |
mmm | -0.029 |
inations | -0.028 |
orse | -0.028 |
on | -0.028 |
etti | -0.027 |
Token | small |
Token ID | 1402 |
Feature activation | +4.89e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
inations | +0.001 |
orse | +0.001 |
etti | +0.001 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
veterinarian | -0.000 |
Token | pe |
Token ID | 613 |
Feature activation | -6.05e-02 |
Pos logit contributions | |
mmm | +0.011 |
inations | +0.011 |
on | +0.011 |
orse | +0.010 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.004 |
girl | -0.003 |
veterinarian | -0.003 |
err | -0.003 |
iet | -0.003 |
Token | b |
Token ID | 65 |
Feature activation | -4.85e-02 |
Pos logit contributions | |
ranc | +0.109 |
err | +0.102 |
attent | +0.097 |
iet | +0.095 |
Please | +0.095 |
Neg logit contributions | |
on | -0.069 |
mmm | -0.068 |
orse | -0.066 |
inations | -0.064 |
mm | -0.061 |
Token | ble |
Token ID | 903 |
Feature activation | -2.42e-02 |
Pos logit contributions | |
ranc | +0.086 |
err | +0.081 |
attent | +0.077 |
iet | +0.076 |
Please | +0.075 |
Neg logit contributions | |
mmm | -0.055 |
on | -0.052 |
inations | -0.052 |
orse | -0.052 |
mm | -0.049 |
Token | that |
Token ID | 326 |
Feature activation | +9.76e-03 |
Pos logit contributions | |
ranc | +0.033 |
err | +0.032 |
attent | +0.030 |
iet | +0.029 |
andel | +0.028 |
Neg logit contributions | |
on | -0.040 |
orse | -0.038 |
cube | -0.035 |
mmm | -0.034 |
Joe | -0.033 |
Token | was |
Token ID | 373 |
Feature activation | -1.56e-02 |
Pos logit contributions | |
mmm | +0.016 |
inations | +0.015 |
etti | +0.015 |
on | +0.015 |
orse | +0.015 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.012 |
Please | -0.011 |
attent | -0.011 |
ther | -0.011 |
Token | very |
Token ID | 845 |
Feature activation | -3.82e-03 |
Pos logit contributions | |
ranc | +0.021 |
err | +0.019 |
attent | +0.018 |
iet | +0.018 |
Please | +0.017 |
Neg logit contributions | |
on | -0.025 |
mmm | -0.025 |
orse | -0.024 |
inations | -0.024 |
Joe | -0.023 |
Token | day |
Token ID | 1110 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.003 |
iet | +0.003 |
attent | +0.003 |
Please | +0.003 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
inations | -0.005 |
etti | -0.005 |
orse | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | -2.56e-03 |
Pos logit contributions | |
ranc | +0.056 |
err | +0.055 |
attent | +0.052 |
iet | +0.051 |
Please | +0.050 |
Neg logit contributions | |
on | -0.019 |
mmm | -0.017 |
orse | -0.016 |
Joe | -0.015 |
mm | -0.014 |
Token | she |
Token ID | 673 |
Feature activation | -8.32e-03 |
Pos logit contributions | |
err | +0.005 |
ranc | +0.005 |
iet | +0.004 |
andel | +0.004 |
oral | +0.004 |
Neg logit contributions | |
on | -0.003 |
Joe | -0.003 |
John | -0.003 |
Jack | -0.003 |
Mike | -0.002 |
Token | found |
Token ID | 1043 |
Feature activation | +1.02e-03 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.008 |
iet | +0.008 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.015 |
orse | -0.015 |
inations | -0.014 |
mm | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | -3.63e-03 |
Pos logit contributions | |
on | +0.002 |
Joe | +0.001 |
orse | +0.001 |
mmm | +0.001 |
Matt | +0.001 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.001 |
attent | -0.001 |
iet | -0.001 |
andel | -0.001 |
Token | pe |
Token ID | 613 |
Feature activation | -6.04e-02 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
ther | +0.004 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
inations | -0.006 |
mm | -0.006 |
orse | -0.006 |
Token | b |
Token ID | 65 |
Feature activation | -4.93e-02 |
Pos logit contributions | |
ranc | +0.124 |
err | +0.115 |
attent | +0.110 |
Please | +0.109 |
veterinarian | +0.109 |
Neg logit contributions | |
on | -0.056 |
mmm | -0.053 |
orse | -0.053 |
inations | -0.051 |
mm | -0.046 |
Token | ble |
Token ID | 903 |
Feature activation | -2.27e-02 |
Pos logit contributions | |
ranc | +0.095 |
err | +0.089 |
attent | +0.086 |
iet | +0.084 |
Please | +0.084 |
Neg logit contributions | |
on | -0.050 |
mmm | -0.049 |
orse | -0.047 |
inations | -0.045 |
etti | -0.044 |
Token | that |
Token ID | 326 |
Feature activation | +8.19e-03 |
Pos logit contributions | |
ranc | +0.029 |
err | +0.027 |
attent | +0.025 |
iet | +0.024 |
andel | +0.023 |
Neg logit contributions | |
on | -0.040 |
orse | -0.037 |
mmm | -0.036 |
Joe | -0.035 |
etti | -0.034 |
Token | was |
Token ID | 373 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
mmm | +0.012 |
on | +0.012 |
orse | +0.012 |
inations | +0.012 |
mm | +0.011 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.011 |
attent | -0.010 |
iet | -0.010 |
Please | -0.010 |
Token | very |
Token ID | 845 |
Feature activation | +7.00e-04 |
Pos logit contributions | |
ranc | +0.025 |
err | +0.024 |
attent | +0.022 |
iet | +0.022 |
Please | +0.021 |
Neg logit contributions | |
on | -0.028 |
mmm | -0.027 |
orse | -0.027 |
inations | -0.026 |
Joe | -0.026 |
Token | a |
Token ID | 257 |
Feature activation | -1.96e-03 |
Pos logit contributions | |
mmm | +0.004 |
orse | +0.004 |
inations | +0.004 |
on | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
Please | -0.002 |
out | -0.002 |
Token | bou |
Token ID | 35833 |
Feature activation | -1.23e-02 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
veterinarian | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
mm | -0.003 |
inations | -0.003 |
Token | quet |
Token ID | 21108 |
Feature activation | -8.13e-03 |
Pos logit contributions | |
ranc | +0.021 |
err | +0.020 |
attent | +0.019 |
iet | +0.018 |
Please | +0.018 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.015 |
orse | -0.014 |
inations | -0.014 |
etti | -0.014 |
Token | of |
Token ID | 286 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
ranc | +0.007 |
out | +0.006 |
attent | +0.006 |
for | +0.006 |
err | +0.006 |
Neg logit contributions | |
mmm | -0.017 |
inations | -0.016 |
mm | -0.016 |
orse | -0.016 |
achieve | -0.015 |
Token | wild |
Token ID | 4295 |
Feature activation | +4.95e-03 |
Pos logit contributions | |
mmm | +0.009 |
orse | +0.009 |
on | +0.008 |
inations | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
Please | -0.005 |
Token | fl |
Token ID | 2704 |
Feature activation | -5.98e-02 |
Pos logit contributions | |
mmm | +0.009 |
on | +0.009 |
orse | +0.009 |
inations | +0.009 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | owers |
Token ID | 3618 |
Feature activation | -1.14e-02 |
Pos logit contributions | |
ranc | +0.071 |
err | +0.070 |
ther | +0.065 |
andel | +0.063 |
iet | +0.063 |
Neg logit contributions | |
orse | -0.101 |
mmm | -0.095 |
inations | -0.094 |
achieve | -0.093 |
on | -0.089 |
Token | he |
Token ID | 339 |
Feature activation | +1.01e-03 |
Pos logit contributions | |
for | +0.008 |
out | +0.008 |
ranc | +0.008 |
at | +0.008 |
attent | +0.006 |
Neg logit contributions | |
mmm | -0.025 |
mm | -0.025 |
orse | -0.023 |
inations | -0.023 |
opter | -0.023 |
Token | had |
Token ID | 550 |
Feature activation | -1.27e-02 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.001 |
orse | +0.001 |
etti | +0.001 |
mm | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
Please | -0.001 |
attent | -0.001 |
iet | -0.001 |
Token | picked |
Token ID | 6497 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.021 |
attent | +0.020 |
iet | +0.020 |
Please | +0.020 |
Neg logit contributions | |
mmm | -0.015 |
on | -0.014 |
orse | -0.014 |
inations | -0.013 |
mm | -0.013 |
Token | for |
Token ID | 329 |
Feature activation | -1.91e-02 |
Pos logit contributions | |
ranc | +0.014 |
err | +0.012 |
attent | +0.011 |
iet | +0.011 |
Please | +0.011 |
Neg logit contributions | |
mmm | -0.024 |
on | -0.024 |
orse | -0.023 |
inations | -0.023 |
Joe | -0.023 |
Token | nodded |
Token ID | 14464 |
Feature activation | +1.45e-03 |
Pos logit contributions | |
mmm | +0.021 |
inations | +0.020 |
on | +0.019 |
mm | +0.019 |
orse | +0.019 |
Neg logit contributions | |
ranc | -0.018 |
err | -0.018 |
attent | -0.017 |
iet | -0.016 |
Please | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -7.31e-03 |
Pos logit contributions | |
Joe | +0.002 |
on | +0.002 |
orse | +0.002 |
John | +0.002 |
mmm | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
andel | -0.002 |
masse | -0.002 |
veterinarian | -0.002 |
Token | picked |
Token ID | 6497 |
Feature activation | -3.08e-03 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.009 |
attent | +0.008 |
girl | +0.008 |
louder | +0.008 |
Neg logit contributions | |
mmm | -0.012 |
inations | -0.011 |
on | -0.011 |
mm | -0.011 |
etti | -0.011 |
Token | up |
Token ID | 510 |
Feature activation | -1.43e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
on | -0.006 |
mmm | -0.006 |
orse | -0.006 |
Joe | -0.006 |
inations | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | -7.85e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
on | -0.002 |
mmm | -0.002 |
orse | -0.002 |
Joe | -0.002 |
inations | -0.002 |
Token | pe |
Token ID | 613 |
Feature activation | -5.98e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
girl | +0.008 |
ther | +0.008 |
attent | +0.008 |
Neg logit contributions | |
mmm | -0.014 |
mm | -0.013 |
inations | -0.013 |
etti | -0.013 |
on | -0.013 |
Token | b |
Token ID | 65 |
Feature activation | -5.05e-02 |
Pos logit contributions | |
ranc | +0.116 |
err | +0.109 |
attent | +0.104 |
iet | +0.103 |
Please | +0.103 |
Neg logit contributions | |
on | -0.059 |
mmm | -0.059 |
orse | -0.057 |
inations | -0.055 |
mm | -0.052 |
Token | ble |
Token ID | 903 |
Feature activation | -1.90e-02 |
Pos logit contributions | |
ranc | +0.095 |
err | +0.089 |
attent | +0.085 |
iet | +0.084 |
Please | +0.083 |
Neg logit contributions | |
mmm | -0.053 |
on | -0.053 |
orse | -0.050 |
inations | -0.049 |
mm | -0.047 |
Token | too |
Token ID | 1165 |
Feature activation | -4.55e-03 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.020 |
iet | +0.018 |
attent | +0.018 |
Please | +0.017 |
Neg logit contributions | |
on | -0.034 |
mmm | -0.033 |
orse | -0.033 |
Joe | -0.032 |
inations | -0.031 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e-04 |
Pos logit contributions | |
attent | +0.001 |
for | +0.001 |
louder | +0.001 |
at | +0.001 |
out | +0.001 |
Neg logit contributions | |
inations | -0.012 |
mm | -0.011 |
on | -0.011 |
etti | -0.011 |
mmm | -0.011 |
Token | He |
Token ID | 679 |
Feature activation | +7.31e-04 |
Pos logit contributions | |
on | +0.000 |
mmm | +0.000 |
orse | +0.000 |
Joe | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
iet | -0.000 |
attent | -0.000 |
andel | -0.000 |
Token | Mom |
Token ID | 11254 |
Feature activation | +2.76e-03 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
attent | +0.008 |
iet | +0.008 |
Please | +0.008 |
Neg logit contributions | |
mmm | -0.016 |
on | -0.016 |
orse | -0.016 |
inations | -0.016 |
mm | -0.015 |
Token | my |
Token ID | 1820 |
Feature activation | -7.53e-03 |
Pos logit contributions | |
mmm | +0.005 |
orse | +0.004 |
inations | +0.004 |
on | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.003 |
attent | -0.003 |
Please | -0.003 |
iet | -0.003 |
Token | gave |
Token ID | 2921 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.008 |
Please | +0.008 |
veterinarian | +0.008 |
Neg logit contributions | |
mmm | -0.013 |
on | -0.012 |
inations | -0.012 |
mm | -0.012 |
etti | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -1.82e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
iet | +0.007 |
andel | +0.007 |
attent | +0.007 |
Neg logit contributions | |
on | -0.013 |
John | -0.012 |
Joe | -0.012 |
mmm | -0.012 |
Mike | -0.012 |
Token | a |
Token ID | 257 |
Feature activation | -7.75e-03 |
Pos logit contributions | |
ranc | +0.028 |
err | +0.027 |
attent | +0.025 |
iet | +0.025 |
andel | +0.025 |
Neg logit contributions | |
on | -0.025 |
Joe | -0.023 |
mmm | -0.022 |
John | -0.021 |
orse | -0.021 |
Token | therm |
Token ID | 21969 |
Feature activation | -5.97e-02 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.011 |
iet | +0.010 |
Please | +0.010 |
attent | +0.010 |
Neg logit contributions | |
on | -0.011 |
mmm | -0.011 |
orse | -0.011 |
inations | -0.010 |
cube | -0.010 |
Token | ometer |
Token ID | 15635 |
Feature activation | -1.48e-02 |
Pos logit contributions | |
ranc | +0.074 |
err | +0.067 |
attent | +0.062 |
iet | +0.060 |
Please | +0.059 |
Neg logit contributions | |
mmm | -0.101 |
on | -0.100 |
inations | -0.099 |
orse | -0.097 |
achieve | -0.094 |
Token | to |
Token ID | 284 |
Feature activation | -6.02e-03 |
Pos logit contributions | |
ranc | +0.017 |
err | +0.016 |
iet | +0.015 |
attent | +0.014 |
Please | +0.014 |
Neg logit contributions | |
on | -0.026 |
mmm | -0.025 |
orse | -0.025 |
etti | -0.024 |
Joe | -0.024 |
Token | see |
Token ID | 766 |
Feature activation | -1.17e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.008 |
attent | +0.008 |
iet | +0.008 |
Please | +0.008 |
Neg logit contributions | |
mmm | -0.009 |
on | -0.009 |
orse | -0.008 |
inations | -0.008 |
etti | -0.008 |
Token | how |
Token ID | 703 |
Feature activation | -5.76e-03 |
Pos logit contributions | |
ranc | +0.012 |
err | +0.011 |
attent | +0.010 |
iet | +0.010 |
andel | +0.010 |
Neg logit contributions | |
on | -0.022 |
mmm | -0.022 |
orse | -0.021 |
inations | -0.021 |
Joe | -0.021 |
Token | sick |
Token ID | 6639 |
Feature activation | +2.17e-02 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.007 |
iet | +0.007 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.009 |
on | -0.009 |
orse | -0.009 |
inations | -0.008 |
mm | -0.008 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -1.76e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
inations | -0.005 |
mm | -0.005 |
Token | Once |
Token ID | 7454 |
Feature activation | -4.54e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
mm | -0.003 |
Token | there |
Token ID | 612 |
Feature activation | +8.85e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.011 |
on | -0.011 |
orse | -0.011 |
inations | -0.011 |
etti | -0.011 |
Token | was |
Token ID | 373 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
inations | +0.022 |
mmm | +0.021 |
orse | +0.020 |
etti | +0.020 |
achieve | +0.019 |
Neg logit contributions | |
upon | -0.005 |
girl | -0.005 |
ther | -0.004 |
out | -0.004 |
err | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.008 |
out | +0.007 |
girl | +0.007 |
ther | +0.007 |
Neg logit contributions | |
inations | -0.027 |
mmm | -0.027 |
orse | -0.026 |
achieve | -0.026 |
etti | -0.026 |
Token | pe |
Token ID | 613 |
Feature activation | -5.96e-02 |
Pos logit contributions | |
mmm | +0.003 |
on | +0.003 |
inations | +0.003 |
orse | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
iet | -0.001 |
veterinarian | -0.001 |
Token | b |
Token ID | 65 |
Feature activation | -4.69e-02 |
Pos logit contributions | |
ranc | +0.105 |
err | +0.099 |
attent | +0.094 |
iet | +0.093 |
Please | +0.092 |
Neg logit contributions | |
on | -0.068 |
mmm | -0.068 |
orse | -0.066 |
inations | -0.064 |
mm | -0.061 |
Token | ble |
Token ID | 903 |
Feature activation | -2.25e-02 |
Pos logit contributions | |
ranc | +0.079 |
err | +0.075 |
iet | +0.071 |
attent | +0.070 |
Please | +0.068 |
Neg logit contributions | |
mmm | -0.056 |
inations | -0.055 |
orse | -0.053 |
on | -0.052 |
mm | -0.051 |
Token | . |
Token ID | 13 |
Feature activation | -2.89e-03 |
Pos logit contributions | |
ranc | +0.032 |
err | +0.031 |
attent | +0.028 |
iet | +0.027 |
911 | +0.027 |
Neg logit contributions | |
on | -0.036 |
orse | -0.035 |
cube | -0.031 |
mmm | -0.031 |
Joe | -0.030 |
Token | The |
Token ID | 383 |
Feature activation | +4.30e-03 |
Pos logit contributions | |
Please | +0.002 |
ranc | +0.002 |
err | +0.002 |
Across | +0.001 |
On | +0.001 |
Neg logit contributions | |
inations | -0.007 |
ll | -0.007 |
orse | -0.006 |
achieve | -0.006 |
opter | -0.006 |
Token | pe |
Token ID | 613 |
Feature activation | -3.22e-02 |
Pos logit contributions | |
mmm | +0.007 |
inations | +0.007 |
etti | +0.007 |
orse | +0.007 |
on | +0.007 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
girl | -0.005 |
Please | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +5.97e-03 |
Pos logit contributions | |
orse | +0.009 |
mmm | +0.009 |
inations | +0.009 |
mm | +0.008 |
icated | +0.008 |
Neg logit contributions | |
out | -0.007 |
ranc | -0.007 |
corner | -0.007 |
for | -0.007 |
attent | -0.007 |
Token | he |
Token ID | 339 |
Feature activation | +4.31e-03 |
Pos logit contributions | |
mmm | +0.007 |
inations | +0.007 |
orse | +0.007 |
etti | +0.007 |
mm | +0.007 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
attent | -0.009 |
Please | -0.009 |
out | -0.009 |
Token | found |
Token ID | 1043 |
Feature activation | +9.95e-03 |
Pos logit contributions | |
mmm | +0.009 |
mm | +0.008 |
inations | +0.008 |
orse | +0.008 |
on | +0.008 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.004 |
Please | -0.004 |
iet | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | +4.40e-03 |
Pos logit contributions | |
mmm | +0.021 |
inations | +0.020 |
orse | +0.020 |
mm | +0.020 |
achieve | +0.019 |
Neg logit contributions | |
ranc | -0.008 |
out | -0.008 |
err | -0.008 |
attent | -0.007 |
louder | -0.007 |
Token | room |
Token ID | 2119 |
Feature activation | -7.47e-03 |
Pos logit contributions | |
mmm | +0.008 |
mm | +0.008 |
orse | +0.008 |
on | +0.008 |
inations | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
veterinarian | -0.004 |
attent | -0.004 |
girl | -0.004 |
Token | full |
Token ID | 1336 |
Feature activation | +2.60e-02 |
Pos logit contributions | |
ranc | +0.009 |
err | +0.009 |
attent | +0.008 |
iet | +0.008 |
Please | +0.008 |
Neg logit contributions | |
on | -0.012 |
mmm | -0.012 |
orse | -0.012 |
inations | -0.012 |
etti | -0.012 |
Token | of |
Token ID | 286 |
Feature activation | +4.21e-03 |
Pos logit contributions | |
mmm | +0.047 |
orse | +0.046 |
inations | +0.045 |
on | +0.044 |
mm | +0.044 |
Neg logit contributions | |
ranc | -0.029 |
err | -0.026 |
attent | -0.024 |
veterinarian | -0.023 |
Please | -0.023 |
Token | games |
Token ID | 1830 |
Feature activation | -1.67e-03 |
Pos logit contributions | |
mmm | +0.007 |
orse | +0.007 |
etti | +0.007 |
mm | +0.007 |
on | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.004 |
girl | -0.004 |
nurses | -0.004 |
Token | and |
Token ID | 290 |
Feature activation | -2.46e-04 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
out | +0.001 |
for | +0.001 |
Neg logit contributions | |
mmm | -0.004 |
mm | -0.003 |
orse | -0.003 |
inations | -0.003 |
on | -0.003 |
Token | toys |
Token ID | 14958 |
Feature activation | +1.93e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
girl | +0.000 |
attent | +0.000 |
nurses | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
mm | -0.000 |
orse | -0.000 |
on | -0.000 |
etti | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +9.41e-04 |
Pos logit contributions | |
mmm | +0.004 |
orse | +0.004 |
mm | +0.004 |
on | +0.004 |
inations | +0.004 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.001 |
attent | -0.001 |
out | -0.001 |
Please | -0.001 |
Token | became |
Token ID | 2627 |
Feature activation | +6.82e-04 |
Pos logit contributions | |
mmm | +0.019 |
etti | +0.019 |
on | +0.018 |
mm | +0.018 |
inations | +0.018 |
Neg logit contributions | |
ranc | -0.013 |
moral | -0.013 |
for | -0.013 |
attent | -0.013 |
Please | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | +3.12e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
orse | +0.001 |
inations | +0.001 |
etti | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
veterinarian | -0.001 |
girl | -0.001 |
moral | -0.001 |
Token | good |
Token ID | 922 |
Feature activation | +1.91e-03 |
Pos logit contributions | |
mmm | +0.006 |
mm | +0.006 |
on | +0.006 |
inations | +0.006 |
orse | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
girl | -0.003 |
veterinarian | -0.003 |
err | -0.003 |
moral | -0.003 |
Token | friend |
Token ID | 1545 |
Feature activation | +1.61e-03 |
Pos logit contributions | |
mmm | +0.004 |
on | +0.003 |
inations | +0.003 |
mm | +0.003 |
orse | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
veterinarian | -0.002 |
girl | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | +7.42e-03 |
Pos logit contributions | |
mmm | +0.003 |
inations | +0.003 |
on | +0.003 |
orse | +0.003 |
mm | +0.003 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
Please | -0.001 |
attent | -0.001 |
veterinarian | -0.001 |
Token | From |
Token ID | 3574 |
Feature activation | +2.95e-02 |
Pos logit contributions | |
inations | +0.015 |
mmm | +0.014 |
etti | +0.014 |
opter | +0.013 |
achieve | +0.013 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.007 |
veterinarian | -0.006 |
attent | -0.006 |
moral | -0.005 |
Token | that |
Token ID | 326 |
Feature activation | -4.40e-03 |
Pos logit contributions | |
inations | +0.044 |
on | +0.043 |
mmm | +0.043 |
orse | +0.042 |
etti | +0.042 |
Neg logit contributions | |
ranc | -0.043 |
Please | -0.038 |
iet | -0.037 |
err | -0.037 |
attent | -0.037 |
Token | day |
Token ID | 1110 |
Feature activation | -1.94e-02 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.004 |
attent | +0.004 |
moral | +0.004 |
iet | +0.004 |
Neg logit contributions | |
mmm | -0.008 |
etti | -0.008 |
inations | -0.008 |
orse | -0.008 |
on | -0.008 |
Token | on |
Token ID | 319 |
Feature activation | +1.72e-02 |
Pos logit contributions | |
ranc | +0.015 |
err | +0.014 |
attent | +0.012 |
iet | +0.011 |
andel | +0.011 |
Neg logit contributions | |
on | -0.042 |
mmm | -0.041 |
orse | -0.040 |
inations | -0.039 |
mm | -0.039 |
Token | , |
Token ID | 11 |
Feature activation | +4.24e-03 |
Pos logit contributions | |
inations | +0.033 |
etti | +0.032 |
mmm | +0.031 |
orse | +0.030 |
icated | +0.028 |
Neg logit contributions | |
for | -0.017 |
ranc | -0.016 |
at | -0.016 |
ther | -0.016 |
out | -0.016 |
Token | Lucy |
Token ID | 22162 |
Feature activation | -6.99e-04 |
Pos logit contributions | |
inations | +0.008 |
mmm | +0.008 |
etti | +0.008 |
opter | +0.008 |
orse | +0.008 |
Neg logit contributions | |
ranc | -0.004 |
for | -0.004 |
girl | -0.003 |
attent | -0.003 |
at | -0.003 |
Token | sang |
Token ID | 25889 |
Feature activation | -4.92e-03 |
Pos logit contributions | |
mmm | +0.010 |
mm | +0.009 |
inations | +0.009 |
achieve | +0.008 |
orse | +0.008 |
Neg logit contributions | |
ranc | -0.006 |
out | -0.005 |
attent | -0.005 |
girl | -0.005 |
for | -0.005 |
Token | songs |
Token ID | 7259 |
Feature activation | -5.59e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.009 |
on | -0.008 |
orse | -0.008 |
inations | -0.008 |
mm | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +8.43e-04 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
attent | +0.005 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.011 |
on | -0.010 |
orse | -0.010 |
inations | -0.010 |
mm | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +3.52e-03 |
Pos logit contributions | |
inations | +0.001 |
mmm | +0.001 |
orse | +0.001 |
on | +0.001 |
mm | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
Please | -0.001 |
veterinarian | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +5.96e-03 |
Pos logit contributions | |
etti | +0.007 |
mmm | +0.007 |
inations | +0.007 |
mm | +0.007 |
orse | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
moral | -0.002 |
iet | -0.002 |
Token | At |
Token ID | 2953 |
Feature activation | +2.38e-02 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
orse | +0.009 |
inations | +0.009 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
attent | -0.007 |
iet | -0.007 |
Please | -0.006 |
Token | the |
Token ID | 262 |
Feature activation | +2.40e-03 |
Pos logit contributions | |
mmm | +0.045 |
inations | +0.044 |
orse | +0.044 |
on | +0.044 |
etti | +0.043 |
Neg logit contributions | |
ranc | -0.023 |
moral | -0.020 |
attent | -0.020 |
for | -0.020 |
out | -0.020 |
Token | end |
Token ID | 886 |
Feature activation | -2.30e-03 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
mm | +0.004 |
orse | +0.004 |
Joe | +0.004 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
andel | -0.002 |
Token | of |
Token ID | 286 |
Feature activation | +5.09e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
girl | +0.002 |
veterinarian | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
inations | -0.004 |
orse | -0.004 |
on | -0.004 |
mm | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | -3.80e-03 |
Pos logit contributions | |
on | +0.007 |
mmm | +0.007 |
Joe | +0.007 |
orse | +0.007 |
John | +0.006 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.008 |
attent | -0.007 |
iet | -0.007 |
Please | -0.007 |
Token | day |
Token ID | 1110 |
Feature activation | -1.13e-02 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.006 |
inations | -0.006 |
etti | -0.006 |
Token | , |
Token ID | 11 |
Feature activation | -5.52e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
inations | -0.001 |
etti | -0.001 |
Token | " |
Token ID | 366 |
Feature activation | -4.90e-03 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.006 |
iet | +0.005 |
andel | +0.005 |
attent | +0.005 |
Neg logit contributions | |
on | -0.010 |
mmm | -0.010 |
Joe | -0.010 |
orse | -0.010 |
John | -0.010 |
Token | Why |
Token ID | 5195 |
Feature activation | -2.52e-03 |
Pos logit contributions | |
ranc | +0.006 |
andel | +0.005 |
attent | +0.005 |
err | +0.005 |
err | +0.004 |
Neg logit contributions | |
on | -0.009 |
mmm | -0.009 |
Joe | -0.008 |
orse | -0.008 |
Mike | -0.008 |
Token | is |
Token ID | 318 |
Feature activation | +1.76e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
iet | +0.004 |
urse | +0.003 |
moral | +0.003 |
Neg logit contributions | |
mmm | -0.003 |
orse | -0.003 |
inations | -0.003 |
etti | -0.003 |
on | -0.003 |
Token | my |
Token ID | 616 |
Feature activation | -3.13e-03 |
Pos logit contributions | |
mmm | +0.026 |
inations | +0.026 |
orse | +0.025 |
on | +0.025 |
etti | +0.025 |
Neg logit contributions | |
ranc | -0.026 |
Please | -0.022 |
err | -0.022 |
attent | -0.021 |
veterinarian | -0.021 |
Token | towel |
Token ID | 24808 |
Feature activation | +3.07e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.003 |
attent | +0.003 |
Please | +0.003 |
iet | +0.003 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
inations | -0.005 |
Joe | -0.005 |
Token | so |
Token ID | 523 |
Feature activation | +1.28e-02 |
Pos logit contributions | |
mmm | +0.046 |
on | +0.045 |
orse | +0.045 |
inations | +0.044 |
mm | +0.043 |
Neg logit contributions | |
ranc | -0.043 |
err | -0.039 |
iet | -0.037 |
attent | -0.037 |
Please | -0.036 |
Token | bad |
Token ID | 2089 |
Feature activation | -3.99e-03 |
Pos logit contributions | |
mmm | +0.021 |
on | +0.021 |
orse | +0.021 |
inations | +0.020 |
etti | +0.020 |
Neg logit contributions | |
ranc | -0.016 |
err | -0.014 |
attent | -0.014 |
iet | -0.013 |
Please | -0.013 |
Token | ?" |
Token ID | 1701 |
Feature activation | +2.25e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
attent | +0.006 |
iet | +0.006 |
andel | +0.006 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
Joe | -0.004 |
orse | -0.004 |
mm | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | -4.11e-03 |
Pos logit contributions | |
on | +0.003 |
mmm | +0.003 |
orse | +0.003 |
Joe | +0.003 |
inations | +0.003 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
iet | -0.003 |
attent | -0.003 |
andel | -0.003 |
Token |
|
Token ID | 198 |
Feature activation | +1.48e-04 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
on | -0.006 |
mmm | -0.006 |
orse | -0.006 |
inations | -0.006 |
Joe | -0.006 |
Token | a |
Token ID | 257 |
Feature activation | +2.68e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.007 |
on | -0.007 |
orse | -0.007 |
inations | -0.007 |
mm | -0.007 |
Token | play |
Token ID | 711 |
Feature activation | -1.47e-02 |
Pos logit contributions | |
on | +0.004 |
mmm | +0.004 |
orse | +0.004 |
inations | +0.004 |
etti | +0.004 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | about |
Token ID | 546 |
Feature activation | +3.90e-03 |
Pos logit contributions | |
ranc | +0.027 |
err | +0.025 |
attent | +0.025 |
andel | +0.024 |
iet | +0.024 |
Neg logit contributions | |
on | -0.018 |
orse | -0.014 |
e | -0.014 |
cube | -0.014 |
etti | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | +6.42e-03 |
Pos logit contributions | |
mmm | +0.007 |
on | +0.007 |
orse | +0.007 |
inations | +0.007 |
mm | +0.007 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | princess |
Token ID | 21752 |
Feature activation | -7.59e-04 |
Pos logit contributions | |
mmm | +0.011 |
on | +0.010 |
orse | +0.010 |
inations | +0.010 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.008 |
err | -0.007 |
attent | -0.007 |
iet | -0.007 |
veterinarian | -0.007 |
Token | who |
Token ID | 508 |
Feature activation | +2.78e-02 |
Pos logit contributions | |
err | +0.001 |
ranc | +0.001 |
attent | +0.001 |
andel | +0.001 |
iet | +0.001 |
Neg logit contributions | |
on | -0.001 |
orse | -0.001 |
inations | -0.001 |
etti | -0.001 |
mmm | -0.001 |
Token | lost |
Token ID | 2626 |
Feature activation | +6.70e-03 |
Pos logit contributions | |
mmm | +0.050 |
inations | +0.047 |
mm | +0.046 |
orse | +0.045 |
etti | +0.044 |
Neg logit contributions | |
ranc | -0.034 |
attent | -0.029 |
Please | -0.029 |
err | -0.029 |
iet | -0.028 |
Token | her |
Token ID | 607 |
Feature activation | -2.93e-03 |
Pos logit contributions | |
on | +0.011 |
Joe | +0.010 |
e | +0.010 |
Mike | +0.010 |
John | +0.010 |
Neg logit contributions | |
err | -0.008 |
attent | -0.008 |
ranc | -0.008 |
Please | -0.007 |
oral | -0.007 |
Token | crown |
Token ID | 12389 |
Feature activation | +1.72e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.003 |
attent | +0.003 |
iet | +0.003 |
Please | +0.003 |
Neg logit contributions | |
on | -0.005 |
mmm | -0.005 |
orse | -0.005 |
inations | -0.005 |
mm | -0.004 |
Token | . |
Token ID | 13 |
Feature activation | -6.18e-04 |
Pos logit contributions | |
on | +0.003 |
mmm | +0.003 |
orse | +0.003 |
inations | +0.003 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | During |
Token ID | 5856 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
err | +0.001 |
iet | +0.001 |
ranc | +0.001 |
eh | +0.001 |
andel | +0.001 |
Neg logit contributions | |
John | -0.001 |
Joe | -0.001 |
Jack | -0.001 |
Mike | -0.001 |
etti | -0.001 |
Token | little |
Token ID | 1310 |
Feature activation | -6.61e-03 |
Pos logit contributions | |
on | +0.008 |
cube | +0.008 |
orse | +0.007 |
mm | +0.007 |
inations | +0.007 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.005 |
andel | -0.005 |
iet | -0.005 |
Token | girl |
Token ID | 2576 |
Feature activation | -5.10e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.003 |
attent | +0.003 |
iet | +0.003 |
andel | +0.002 |
Neg logit contributions | |
on | -0.015 |
Joe | -0.015 |
mmm | -0.015 |
etti | -0.014 |
mm | -0.014 |
Token | couldn |
Token ID | 3521 |
Feature activation | +8.11e-03 |
Pos logit contributions | |
ranc | +0.006 |
attent | +0.005 |
err | +0.005 |
girl | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.010 |
inations | -0.009 |
on | -0.009 |
mm | -0.009 |
etti | -0.009 |
Token | 't |
Token ID | 470 |
Feature activation | -1.18e-02 |
Pos logit contributions | |
mmm | +0.011 |
inations | +0.011 |
orse | +0.011 |
on | +0.011 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.011 |
attent | -0.011 |
Please | -0.011 |
veterinarian | -0.011 |
Token | believe |
Token ID | 1975 |
Feature activation | -1.33e-02 |
Pos logit contributions | |
ranc | +0.021 |
err | +0.019 |
attent | +0.019 |
Please | +0.018 |
veterinarian | +0.018 |
Neg logit contributions | |
mmm | -0.014 |
on | -0.014 |
mm | -0.013 |
inations | -0.013 |
orse | -0.013 |
Token | it |
Token ID | 340 |
Feature activation | +8.23e-04 |
Pos logit contributions | |
ranc | +0.018 |
err | +0.016 |
attent | +0.016 |
iet | +0.015 |
Please | +0.015 |
Neg logit contributions | |
mmm | -0.021 |
on | -0.021 |
orse | -0.020 |
inations | -0.020 |
mm | -0.019 |
Token | ! |
Token ID | 0 |
Feature activation | +1.62e-03 |
Pos logit contributions | |
mmm | +0.001 |
on | +0.001 |
orse | +0.001 |
inations | +0.001 |
etti | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
iet | -0.001 |
Please | -0.001 |
Token | She |
Token ID | 1375 |
Feature activation | -1.26e-02 |
Pos logit contributions | |
orse | +0.003 |
inations | +0.003 |
on | +0.003 |
mmm | +0.003 |
mm | +0.003 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
Please | -0.001 |
veterinarian | -0.001 |
Token | waved |
Token ID | 26834 |
Feature activation | -5.45e-03 |
Pos logit contributions | |
ranc | +0.016 |
attent | +0.014 |
err | +0.013 |
Please | +0.013 |
iet | +0.013 |
Neg logit contributions | |
mmm | -0.022 |
on | -0.022 |
mm | -0.021 |
inations | -0.021 |
etti | -0.020 |
Token | goodbye |
Token ID | 24829 |
Feature activation | +2.26e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
eh | +0.006 |
iet | +0.006 |
urse | +0.005 |
Neg logit contributions | |
Joe | -0.009 |
John | -0.009 |
Mike | -0.009 |
on | -0.009 |
Matt | -0.009 |
Token | and |
Token ID | 290 |
Feature activation | -5.84e-03 |
Pos logit contributions | |
orse | +0.004 |
mmm | +0.004 |
on | +0.004 |
Joe | +0.004 |
etti | +0.003 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
iet | -0.002 |
andel | -0.002 |
ther | -0.002 |
Token | playing |
Token ID | 2712 |
Feature activation | -9.12e-03 |
Pos logit contributions | |
on | +0.020 |
orse | +0.019 |
mmm | +0.019 |
inations | +0.018 |
Joe | +0.018 |
Neg logit contributions | |
ranc | -0.026 |
err | -0.025 |
attent | -0.024 |
andel | -0.023 |
Please | -0.023 |
Token | in |
Token ID | 287 |
Feature activation | +2.97e-03 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.011 |
andel | +0.011 |
iet | +0.010 |
attent | +0.010 |
Neg logit contributions | |
on | -0.015 |
e | -0.014 |
orse | -0.013 |
achieve | -0.013 |
Joe | -0.013 |
Token | the |
Token ID | 262 |
Feature activation | -3.56e-04 |
Pos logit contributions | |
mmm | +0.007 |
inations | +0.007 |
mm | +0.007 |
orse | +0.007 |
opter | +0.006 |
Neg logit contributions | |
her | -0.002 |
corner | -0.002 |
ranc | -0.002 |
girl | -0.002 |
ther | -0.002 |
Token | park |
Token ID | 3952 |
Feature activation | -5.31e-03 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
iet | +0.000 |
girl | +0.000 |
ther | +0.000 |
Neg logit contributions | |
mmm | -0.001 |
inations | -0.001 |
orse | -0.001 |
mm | -0.001 |
on | -0.001 |
Token | with |
Token ID | 351 |
Feature activation | -7.67e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
iet | +0.006 |
andel | +0.006 |
attent | +0.006 |
Neg logit contributions | |
on | -0.009 |
orse | -0.008 |
mmm | -0.008 |
Joe | -0.008 |
etti | -0.008 |
Token | their |
Token ID | 511 |
Feature activation | +7.52e-03 |
Pos logit contributions | |
ranc | +0.007 |
iet | +0.006 |
err | +0.006 |
girl | +0.005 |
ther | +0.005 |
Neg logit contributions | |
mmm | -0.016 |
inations | -0.016 |
orse | -0.016 |
mm | -0.015 |
on | -0.015 |
Token | toys |
Token ID | 14958 |
Feature activation | -6.76e-03 |
Pos logit contributions | |
mmm | +0.017 |
inations | +0.016 |
orse | +0.015 |
on | +0.015 |
etti | +0.015 |
Neg logit contributions | |
ranc | -0.007 |
girl | -0.007 |
err | -0.006 |
moral | -0.005 |
ther | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.50e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.008 |
iet | +0.007 |
attent | +0.007 |
andel | +0.007 |
Neg logit contributions | |
on | -0.011 |
orse | -0.011 |
mmm | -0.011 |
inations | -0.010 |
Joe | -0.010 |
Token | They |
Token ID | 1119 |
Feature activation | +6.03e-03 |
Pos logit contributions | |
Joe | +0.002 |
orse | +0.002 |
mmm | +0.002 |
on | +0.002 |
etti | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
iet | -0.002 |
attent | -0.002 |
andel | -0.002 |
Token | liked |
Token ID | 8288 |
Feature activation | +4.69e-03 |
Pos logit contributions | |
mmm | +0.014 |
mm | +0.013 |
inations | +0.012 |
etti | +0.012 |
on | +0.012 |
Neg logit contributions | |
ranc | -0.006 |
Please | -0.005 |
girl | -0.005 |
out | -0.004 |
iet | -0.004 |
Token | to |
Token ID | 284 |
Feature activation | +5.18e-03 |
Pos logit contributions | |
mmm | +0.012 |
mm | +0.011 |
on | +0.011 |
orse | +0.011 |
inations | +0.011 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.002 |
attent | -0.002 |
Please | -0.002 |
veterinarian | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
mmm | +0.017 |
on | +0.016 |
inations | +0.016 |
orse | +0.016 |
mm | +0.016 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
attent | -0.008 |
Please | -0.008 |
iet | -0.008 |
Token | let |
Token ID | 1309 |
Feature activation | -5.12e-03 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
attent | +0.009 |
Please | +0.008 |
iet | +0.008 |
Neg logit contributions | |
mmm | -0.012 |
on | -0.011 |
inations | -0.011 |
orse | -0.011 |
mm | -0.011 |
Token | go |
Token ID | 467 |
Feature activation | +7.87e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
attent | +0.006 |
iet | +0.006 |
Please | +0.006 |
Neg logit contributions | |
on | -0.008 |
mmm | -0.008 |
orse | -0.007 |
Joe | -0.007 |
inations | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | -6.11e-03 |
Pos logit contributions | |
mmm | +0.017 |
mm | +0.016 |
inations | +0.016 |
orse | +0.016 |
etti | +0.016 |
Neg logit contributions | |
ranc | -0.006 |
out | -0.006 |
err | -0.005 |
for | -0.005 |
corner | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -5.30e-03 |
Pos logit contributions | |
out | +0.005 |
her | +0.005 |
louder | +0.005 |
ranc | +0.005 |
911 | +0.004 |
Neg logit contributions | |
mmm | -0.013 |
inations | -0.013 |
mm | -0.012 |
orse | -0.012 |
opter | -0.012 |
Token | string |
Token ID | 4731 |
Feature activation | -3.99e-03 |
Pos logit contributions | |
ranc | +0.007 |
girl | +0.006 |
err | +0.006 |
veterinarian | +0.006 |
Please | +0.006 |
Neg logit contributions | |
mmm | -0.009 |
inations | -0.008 |
orse | -0.008 |
Joe | -0.008 |
on | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | +1.18e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
out | +0.002 |
louder | +0.002 |
Neg logit contributions | |
mmm | -0.009 |
mm | -0.008 |
inations | -0.008 |
on | -0.008 |
orse | -0.008 |
Token | The |
Token ID | 383 |
Feature activation | +1.17e-02 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.002 |
orse | +0.002 |
inations | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.001 |
iet | -0.001 |
Please | -0.001 |
Token | arrow |
Token ID | 15452 |
Feature activation | +1.71e-02 |
Pos logit contributions | |
mmm | +0.015 |
on | +0.015 |
orse | +0.015 |
inations | +0.014 |
Joe | +0.014 |
Neg logit contributions | |
ranc | -0.019 |
err | -0.018 |
attent | -0.017 |
Please | -0.017 |
iet | -0.017 |
Token | flew |
Token ID | 13112 |
Feature activation | +9.39e-04 |
Pos logit contributions | |
mmm | +0.029 |
on | +0.027 |
inations | +0.027 |
orse | +0.027 |
mm | +0.026 |
Neg logit contributions | |
ranc | -0.021 |
err | -0.019 |
attent | -0.019 |
Please | -0.018 |
moral | -0.017 |
Token | in |
Token ID | 287 |
Feature activation | -6.59e-03 |
Pos logit contributions | |
on | +0.002 |
Joe | +0.002 |
mmm | +0.002 |
John | +0.002 |
etti | +0.002 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
iet | -0.001 |
attent | -0.001 |
andel | -0.001 |
Token | see |
Token ID | 766 |
Feature activation | -4.20e-03 |
Pos logit contributions | |
mmm | +0.040 |
inations | +0.038 |
mm | +0.037 |
etti | +0.036 |
orse | +0.036 |
Neg logit contributions | |
out | -0.028 |
ranc | -0.027 |
veterinarian | -0.027 |
Please | -0.025 |
girl | -0.025 |
Token | your |
Token ID | 534 |
Feature activation | -4.67e-04 |
Pos logit contributions | |
ranc | +0.005 |
out | +0.005 |
Please | +0.005 |
louder | +0.005 |
veterinarian | +0.005 |
Neg logit contributions | |
inations | -0.006 |
mmm | -0.006 |
orse | -0.006 |
etti | -0.006 |
achieve | -0.006 |
Token | car |
Token ID | 1097 |
Feature activation | +1.67e-02 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.000 |
iet | +0.000 |
Please | +0.000 |
Neg logit contributions | |
on | -0.001 |
mmm | -0.001 |
orse | -0.001 |
inations | -0.001 |
etti | -0.001 |
Token | ?" |
Token ID | 1701 |
Feature activation | -3.46e-03 |
Pos logit contributions | |
mmm | +0.026 |
orse | +0.026 |
inations | +0.025 |
on | +0.025 |
mm | +0.024 |
Neg logit contributions | |
ranc | -0.022 |
err | -0.020 |
iet | -0.019 |
Please | -0.019 |
attent | -0.019 |
Token | Ben |
Token ID | 3932 |
Feature activation | +2.15e-02 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
iet | +0.005 |
attent | +0.005 |
andel | +0.005 |
Neg logit contributions | |
on | -0.004 |
mmm | -0.004 |
orse | -0.004 |
Joe | -0.004 |
inations | -0.004 |
Token | asks |
Token ID | 7893 |
Feature activation | +5.47e-03 |
Pos logit contributions | |
on | +0.030 |
mmm | +0.030 |
orse | +0.029 |
Joe | +0.028 |
inations | +0.028 |
Neg logit contributions | |
ranc | -0.032 |
err | -0.030 |
attent | -0.028 |
andel | -0.028 |
iet | -0.028 |
Token | the |
Token ID | 262 |
Feature activation | -7.61e-04 |
Pos logit contributions | |
on | +0.008 |
Joe | +0.007 |
Mike | +0.007 |
John | +0.007 |
orse | +0.007 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.008 |
iet | -0.008 |
attent | -0.008 |
andel | -0.008 |
Token | man |
Token ID | 582 |
Feature activation | +1.23e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
andel | +0.001 |
Neg logit contributions | |
on | -0.001 |
cube | -0.001 |
orse | -0.001 |
etti | -0.001 |
John | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +3.79e-03 |
Pos logit contributions | |
on | +0.002 |
mmm | +0.002 |
orse | +0.002 |
inations | +0.002 |
etti | +0.002 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
iet | -0.001 |
Please | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +1.80e-03 |
Pos logit contributions | |
on | +0.005 |
Joe | +0.004 |
orse | +0.004 |
mmm | +0.004 |
John | +0.004 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
iet | -0.006 |
andel | -0.006 |
err | -0.006 |
Token |
|
Token ID | 198 |
Feature activation | +4.63e-03 |
Pos logit contributions | |
mmm | +0.003 |
inations | +0.003 |
on | +0.003 |
etti | +0.003 |
orse | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
Please | -0.002 |
iet | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -4.98e-04 |
Pos logit contributions | |
mmm | +0.023 |
on | +0.023 |
Joe | +0.022 |
orse | +0.022 |
inations | +0.022 |
Neg logit contributions | |
ranc | -0.018 |
err | -0.016 |
attent | -0.015 |
iet | -0.015 |
Please | -0.015 |
Token | Daisy |
Token ID | 40355 |
Feature activation | -5.13e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
attent | +0.001 |
andel | +0.001 |
Neg logit contributions | |
mmm | -0.001 |
on | -0.001 |
orse | -0.001 |
Joe | -0.001 |
inations | -0.001 |
Token | almost |
Token ID | 2048 |
Feature activation | +9.14e-04 |
Pos logit contributions | |
ranc | +0.006 |
attent | +0.005 |
err | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.010 |
mm | -0.009 |
on | -0.009 |
inations | -0.009 |
etti | -0.009 |
Token | forgot |
Token ID | 16453 |
Feature activation | +1.07e-04 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.001 |
mm | +0.001 |
inations | +0.001 |
orse | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
attent | -0.001 |
err | -0.001 |
iet | -0.001 |
Please | -0.001 |
Token | about |
Token ID | 546 |
Feature activation | +6.24e-03 |
Pos logit contributions | |
mmm | +0.000 |
on | +0.000 |
orse | +0.000 |
inations | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
Please | -0.000 |
Token | her |
Token ID | 607 |
Feature activation | -2.23e-03 |
Pos logit contributions | |
mmm | +0.011 |
on | +0.011 |
orse | +0.011 |
inations | +0.010 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.007 |
attent | -0.006 |
iet | -0.006 |
Please | -0.006 |
Token | letter |
Token ID | 3850 |
Feature activation | +1.19e-02 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
iet | +0.002 |
moral | +0.002 |
Neg logit contributions | |
mmm | -0.004 |
on | -0.004 |
etti | -0.003 |
orse | -0.003 |
mm | -0.003 |
Token | but |
Token ID | 475 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
mmm | +0.022 |
orse | +0.021 |
on | +0.021 |
inations | +0.021 |
mm | +0.021 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.011 |
attent | -0.011 |
iet | -0.010 |
Please | -0.010 |
Token | then |
Token ID | 788 |
Feature activation | -9.87e-03 |
Pos logit contributions | |
mmm | +0.022 |
inations | +0.021 |
orse | +0.021 |
on | +0.021 |
etti | +0.021 |
Neg logit contributions | |
ranc | -0.014 |
err | -0.013 |
attent | -0.013 |
Please | -0.012 |
girl | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | -7.68e-04 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.012 |
attent | +0.011 |
iet | +0.011 |
andel | +0.010 |
Neg logit contributions | |
on | -0.016 |
mmm | -0.016 |
orse | -0.016 |
inations | -0.015 |
Joe | -0.015 |
Token | one |
Token ID | 530 |
Feature activation | -3.84e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
andel | +0.001 |
attent | +0.001 |
Neg logit contributions | |
Joe | -0.001 |
on | -0.001 |
John | -0.001 |
mmm | -0.001 |
Andy | -0.001 |
Token | sleep |
Token ID | 3993 |
Feature activation | -8.78e-03 |
Pos logit contributions | |
ranc | +0.008 |
attent | +0.007 |
err | +0.007 |
out | +0.007 |
veterinarian | +0.007 |
Neg logit contributions | |
mmm | -0.013 |
mm | -0.013 |
inations | -0.013 |
on | -0.012 |
orse | -0.012 |
Token | . |
Token ID | 13 |
Feature activation | +4.99e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.011 |
iet | +0.010 |
andel | +0.009 |
attent | +0.009 |
Neg logit contributions | |
on | -0.015 |
orse | -0.014 |
mmm | -0.014 |
inations | -0.013 |
Joe | -0.013 |
Token | But |
Token ID | 887 |
Feature activation | +7.75e-03 |
Pos logit contributions | |
inations | +0.009 |
orse | +0.009 |
on | +0.009 |
mmm | +0.009 |
etti | +0.008 |
Neg logit contributions | |
err | -0.006 |
ranc | -0.005 |
attent | -0.005 |
Please | -0.005 |
veterinarian | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +1.62e-03 |
Pos logit contributions | |
inations | +0.013 |
mmm | +0.013 |
etti | +0.012 |
orse | +0.012 |
on | +0.012 |
Neg logit contributions | |
ranc | -0.009 |
attent | -0.009 |
err | -0.009 |
out | -0.008 |
Please | -0.008 |
Token | next |
Token ID | 1306 |
Feature activation | +4.88e-03 |
Pos logit contributions | |
on | +0.003 |
mmm | +0.003 |
orse | +0.003 |
inations | +0.003 |
mm | +0.003 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | day |
Token ID | 1110 |
Feature activation | -1.24e-02 |
Pos logit contributions | |
on | +0.008 |
mmm | +0.008 |
orse | +0.008 |
inations | +0.007 |
Joe | +0.007 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
iet | -0.005 |
Please | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +6.46e-03 |
Pos logit contributions | |
ranc | +0.017 |
out | +0.016 |
Please | +0.016 |
girl | +0.016 |
err | +0.016 |
Neg logit contributions | |
inations | -0.019 |
mmm | -0.018 |
orse | -0.017 |
etti | -0.017 |
mm | -0.017 |
Token | when |
Token ID | 618 |
Feature activation | -1.89e-03 |
Pos logit contributions | |
orse | +0.009 |
mmm | +0.009 |
inations | +0.009 |
on | +0.009 |
etti | +0.009 |
Neg logit contributions | |
ranc | -0.009 |
err | -0.009 |
attent | -0.009 |
Please | -0.009 |
out | -0.008 |
Token | he |
Token ID | 339 |
Feature activation | +5.26e-03 |
Pos logit contributions | |
someone | +0.002 |
out | +0.002 |
Please | +0.002 |
ranc | +0.002 |
louder | +0.002 |
Neg logit contributions | |
orse | -0.003 |
inations | -0.003 |
on | -0.003 |
etti | -0.003 |
mmm | -0.003 |
Token | woke |
Token ID | 19092 |
Feature activation | +3.85e-03 |
Pos logit contributions | |
on | +0.010 |
mmm | +0.009 |
orse | +0.009 |
inations | +0.009 |
Joe | +0.009 |
Neg logit contributions | |
ranc | -0.006 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
andel | -0.005 |
Token | up |
Token ID | 510 |
Feature activation | -3.97e-04 |
Pos logit contributions | |
mmm | +0.008 |
on | +0.008 |
orse | +0.008 |
Joe | +0.008 |
etti | +0.008 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
iet | -0.003 |
attent | -0.003 |
Please | -0.002 |
Token | it |
Token ID | 340 |
Feature activation | +9.40e-04 |
Pos logit contributions | |
moral | +0.009 |
for | +0.009 |
louder | +0.009 |
ranc | +0.009 |
out | +0.008 |
Neg logit contributions | |
etti | -0.014 |
mmm | -0.014 |
on | -0.014 |
mm | -0.014 |
inations | -0.013 |
Token | â |
Token ID | 22940 |
Feature activation | -9.44e-03 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.002 |
orse | +0.002 |
etti | +0.002 |
mm | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
moral | -0.001 |
iet | -0.001 |
Token | € |
Token ID | 26391 |
Feature activation | -9.38e-03 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.012 |
attent | +0.011 |
Please | +0.011 |
iet | +0.011 |
Neg logit contributions | |
on | -0.014 |
mmm | -0.014 |
orse | -0.014 |
inations | -0.014 |
etti | -0.013 |
Token | â„¢ |
Token ID | 8151 |
Feature activation | +1.04e-02 |
Pos logit contributions | |
ranc | +0.012 |
err | +0.010 |
urse | +0.010 |
iet | +0.010 |
veterinarian | +0.009 |
Neg logit contributions | |
mmm | -0.014 |
on | -0.014 |
cube | -0.014 |
inations | -0.013 |
mm | -0.013 |
Token | s |
Token ID | 82 |
Feature activation | +1.01e-02 |
Pos logit contributions | |
inations | +0.017 |
mmm | +0.017 |
orse | +0.017 |
etti | +0.016 |
achieve | +0.016 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.012 |
ther | -0.011 |
upon | -0.011 |
urse | -0.011 |
Token | important |
Token ID | 1593 |
Feature activation | -1.08e-02 |
Pos logit contributions | |
mmm | +0.016 |
on | +0.015 |
orse | +0.015 |
inations | +0.015 |
Joe | +0.014 |
Neg logit contributions | |
ranc | -0.014 |
err | -0.013 |
attent | -0.012 |
iet | -0.012 |
Please | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | +7.57e-03 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.006 |
Please | +0.006 |
veterinarian | +0.005 |
Neg logit contributions | |
mmm | -0.024 |
on | -0.024 |
orse | -0.023 |
etti | -0.023 |
inations | -0.023 |
Token | listen |
Token ID | 6004 |
Feature activation | -1.65e-02 |
Pos logit contributions | |
on | +0.013 |
etti | +0.013 |
orse | +0.012 |
inations | +0.012 |
mmm | +0.012 |
Neg logit contributions | |
ranc | -0.010 |
moral | -0.009 |
veterinarian | -0.008 |
iet | -0.008 |
strangers | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | +2.40e-04 |
Pos logit contributions | |
ranc | +0.015 |
err | +0.013 |
attent | +0.013 |
iet | +0.012 |
Please | +0.012 |
Neg logit contributions | |
mmm | -0.033 |
on | -0.033 |
orse | -0.032 |
inations | -0.032 |
mm | -0.031 |
Token | your |
Token ID | 534 |
Feature activation | -4.66e-03 |
Pos logit contributions | |
on | +0.000 |
etti | +0.000 |
mmm | +0.000 |
mm | +0.000 |
orse | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
attent | -0.000 |
err | -0.000 |
iet | -0.000 |
moral | -0.000 |
Token | elders |
Token ID | 27495 |
Feature activation | -8.32e-04 |
Pos logit contributions | |
ranc | +0.006 |
err | +0.005 |
attent | +0.005 |
iet | +0.005 |
veterinarian | +0.004 |
Neg logit contributions | |
mmm | -0.008 |
on | -0.008 |
orse | -0.008 |
inations | -0.008 |
etti | -0.008 |
Token | machine |
Token ID | 4572 |
Feature activation | -6.66e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
Please | +0.003 |
iet | +0.003 |
attent | +0.003 |
Neg logit contributions | |
on | -0.002 |
inations | -0.002 |
orse | -0.002 |
mmm | -0.002 |
achieve | -0.002 |
Token | for |
Token ID | 329 |
Feature activation | -1.93e-02 |
Pos logit contributions | |
ranc | +0.006 |
attent | +0.005 |
out | +0.005 |
err | +0.005 |
louder | +0.005 |
Neg logit contributions | |
mmm | -0.014 |
mm | -0.013 |
orse | -0.013 |
inations | -0.013 |
on | -0.013 |
Token | a |
Token ID | 257 |
Feature activation | +2.21e-03 |
Pos logit contributions | |
ranc | +0.015 |
doctors | +0.012 |
louder | +0.012 |
attent | +0.012 |
nurses | +0.011 |
Neg logit contributions | |
mmm | -0.041 |
etti | -0.041 |
mm | -0.040 |
orse | -0.040 |
inations | -0.040 |
Token | few |
Token ID | 1178 |
Feature activation | +8.87e-03 |
Pos logit contributions | |
mmm | +0.004 |
on | +0.004 |
orse | +0.004 |
inations | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.002 |
iet | -0.002 |
Please | -0.002 |
Token | seconds |
Token ID | 4201 |
Feature activation | +3.76e-03 |
Pos logit contributions | |
on | +0.015 |
inations | +0.015 |
orse | +0.015 |
mmm | +0.015 |
Joe | +0.014 |
Neg logit contributions | |
ranc | -0.011 |
err | -0.010 |
attent | -0.009 |
iet | -0.009 |
Please | -0.008 |
Token | and |
Token ID | 290 |
Feature activation | -1.63e-02 |
Pos logit contributions | |
inations | +0.008 |
opter | +0.008 |
disl | +0.008 |
pleasure | +0.008 |
mmm | +0.008 |
Neg logit contributions | |
for | -0.003 |
at | -0.002 |
out | -0.002 |
ranc | -0.002 |
attent | -0.002 |
Token | said |
Token ID | 531 |
Feature activation | +3.12e-04 |
Pos logit contributions | |
ranc | +0.024 |
attent | +0.022 |
err | +0.022 |
Please | +0.021 |
iet | +0.020 |
Neg logit contributions | |
mmm | -0.024 |
on | -0.023 |
inations | -0.023 |
orse | -0.023 |
mm | -0.022 |
Token | , |
Token ID | 11 |
Feature activation | -3.48e-03 |
Pos logit contributions | |
inations | +0.000 |
mmm | +0.000 |
orse | +0.000 |
on | +0.000 |
etti | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
attent | -0.000 |
err | -0.000 |
louder | -0.000 |
out | -0.000 |
Token | " |
Token ID | 366 |
Feature activation | -7.35e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
iet | +0.003 |
andel | +0.002 |
attent | +0.002 |
Neg logit contributions | |
mmm | -0.007 |
on | -0.007 |
orse | -0.007 |
Joe | -0.007 |
etti | -0.007 |
Token | That |
Token ID | 2504 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
ranc | +0.008 |
err | +0.007 |
attent | +0.006 |
Please | +0.006 |
iet | +0.006 |
Neg logit contributions | |
mmm | -0.014 |
on | -0.014 |
orse | -0.014 |
inations | -0.013 |
etti | -0.013 |
Token | looks |
Token ID | 3073 |
Feature activation | -7.36e-03 |
Pos logit contributions | |
ranc | +0.012 |
err | +0.010 |
attent | +0.010 |
out | +0.010 |
girl | +0.010 |
Neg logit contributions | |
mmm | -0.018 |
orse | -0.017 |
inations | -0.017 |
mm | -0.017 |
on | -0.017 |
Token |
|
Token ID | 198 |
Feature activation | -5.97e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
attent | +0.009 |
iet | +0.009 |
Please | +0.009 |
Neg logit contributions | |
mmm | -0.013 |
on | -0.013 |
orse | -0.013 |
inations | -0.013 |
mm | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -1.54e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
attent | +0.006 |
Please | +0.006 |
iet | +0.006 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
inations | -0.010 |
orse | -0.010 |
etti | -0.010 |
Token | As |
Token ID | 1722 |
Feature activation | +8.50e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
etti | -0.002 |
Token | she |
Token ID | 673 |
Feature activation | -5.65e-03 |
Pos logit contributions | |
inations | +0.014 |
mmm | +0.013 |
on | +0.013 |
etti | +0.013 |
orse | +0.013 |
Neg logit contributions | |
ranc | -0.011 |
attent | -0.010 |
err | -0.009 |
girl | -0.009 |
ther | -0.009 |
Token | w |
Token ID | 266 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
attent | +0.005 |
iet | +0.005 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
inations | -0.010 |
orse | -0.010 |
etti | -0.010 |
Token | add |
Token ID | 2860 |
Feature activation | -1.30e-02 |
Pos logit contributions | |
mmm | +0.019 |
on | +0.019 |
orse | +0.018 |
inations | +0.018 |
mm | +0.018 |
Neg logit contributions | |
ranc | -0.013 |
err | -0.012 |
attent | -0.011 |
iet | -0.011 |
Please | -0.010 |
Token | led |
Token ID | 992 |
Feature activation | +2.43e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.009 |
attent | +0.008 |
iet | +0.008 |
Please | +0.007 |
Neg logit contributions | |
mmm | -0.027 |
on | -0.027 |
orse | -0.027 |
inations | -0.026 |
mm | -0.026 |
Token | along |
Token ID | 1863 |
Feature activation | +1.13e-02 |
Pos logit contributions | |
Joe | +0.004 |
on | +0.004 |
John | +0.004 |
orse | +0.004 |
Andy | +0.004 |
Neg logit contributions | |
err | -0.003 |
ranc | -0.003 |
iet | -0.002 |
urse | -0.002 |
Please | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | -5.06e-04 |
Pos logit contributions | |
mmm | +0.013 |
on | +0.013 |
orse | +0.012 |
inations | +0.012 |
mm | +0.012 |
Neg logit contributions | |
ranc | -0.020 |
err | -0.019 |
attent | -0.018 |
iet | -0.018 |
Please | -0.017 |
Token | she |
Token ID | 673 |
Feature activation | -1.47e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
iet | +0.001 |
attent | +0.001 |
Please | +0.001 |
Neg logit contributions | |
Joe | -0.001 |
on | -0.001 |
mmm | -0.001 |
John | -0.001 |
Mike | -0.001 |
Token | saw |
Token ID | 2497 |
Feature activation | +2.64e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.001 |
attent | +0.001 |
iet | +0.001 |
Please | +0.001 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
mm | -0.003 |
inations | -0.003 |
orse | -0.003 |
Token | Ben |
Token ID | 11696 |
Feature activation | +7.26e-03 |
Pos logit contributions | |
ranc | +0.002 |
err | +0.002 |
attent | +0.002 |
iet | +0.002 |
andel | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.002 |
orse | -0.002 |
inations | -0.002 |
mm | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -1.99e-02 |
Pos logit contributions | |
mmm | +0.014 |
inations | +0.014 |
on | +0.013 |
orse | +0.013 |
mm | +0.013 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.007 |
attent | -0.006 |
Please | -0.006 |
iet | -0.006 |
Token | Lily |
Token ID | 20037 |
Feature activation | -6.90e-03 |
Pos logit contributions | |
ranc | +0.035 |
iet | +0.034 |
andel | +0.034 |
attent | +0.034 |
err | +0.033 |
Neg logit contributions | |
Joe | -0.024 |
John | -0.024 |
Mike | -0.022 |
Bobby | -0.022 |
Jack | -0.021 |
Token | decided |
Token ID | 3066 |
Feature activation | -1.61e-04 |
Pos logit contributions | |
ranc | +0.009 |
Please | +0.008 |
attent | +0.007 |
err | +0.007 |
iet | +0.007 |
Neg logit contributions | |
mmm | -0.012 |
inations | -0.011 |
orse | -0.011 |
on | -0.011 |
mm | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | +9.27e-04 |
Pos logit contributions | |
ranc | +0.000 |
err | +0.000 |
attent | +0.000 |
iet | +0.000 |
Please | +0.000 |
Neg logit contributions | |
mmm | -0.000 |
on | -0.000 |
orse | -0.000 |
inations | -0.000 |
mm | -0.000 |
Token | listen |
Token ID | 6004 |
Feature activation | -1.66e-02 |
Pos logit contributions | |
inations | +0.002 |
orse | +0.002 |
mmm | +0.002 |
on | +0.001 |
odic | +0.001 |
Neg logit contributions | |
veterinarian | -0.001 |
Please | -0.001 |
moral | -0.001 |
ranc | -0.001 |
date | -0.001 |
Token | to |
Token ID | 284 |
Feature activation | +7.69e-04 |
Pos logit contributions | |
ranc | +0.022 |
err | +0.020 |
andel | +0.019 |
iet | +0.019 |
ther | +0.018 |
Neg logit contributions | |
on | -0.027 |
mmm | -0.026 |
orse | -0.025 |
inations | -0.025 |
Joe | -0.025 |
Token | Mom |
Token ID | 11254 |
Feature activation | -4.62e-03 |
Pos logit contributions | |
mmm | +0.001 |
inations | +0.001 |
on | +0.001 |
orse | +0.001 |
etti | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
Please | -0.001 |
iet | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +4.98e-03 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
iet | +0.003 |
Please | +0.003 |
Neg logit contributions | |
mmm | -0.009 |
orse | -0.009 |
on | -0.009 |
inations | -0.009 |
mm | -0.009 |
Token | They |
Token ID | 1119 |
Feature activation | +1.28e-03 |
Pos logit contributions | |
mmm | +0.007 |
on | +0.007 |
orse | +0.007 |
inations | +0.007 |
Joe | +0.007 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.007 |
attent | -0.006 |
iet | -0.006 |
Please | -0.006 |
Token | said |
Token ID | 531 |
Feature activation | +8.01e-04 |
Pos logit contributions | |
mmm | +0.002 |
inations | +0.002 |
mm | +0.002 |
orse | +0.002 |
on | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
Please | -0.001 |
attent | -0.001 |
iet | -0.001 |
veterinarian | -0.001 |
Token | a |
Token ID | 257 |
Feature activation | +6.22e-03 |
Pos logit contributions | |
ranc | +0.007 |
out | +0.006 |
attent | +0.006 |
err | +0.006 |
doctors | +0.006 |
Neg logit contributions | |
mmm | -0.016 |
orse | -0.015 |
mm | -0.015 |
achieve | -0.014 |
inations | -0.014 |
Token | garden |
Token ID | 11376 |
Feature activation | -4.50e-03 |
Pos logit contributions | |
mmm | +0.011 |
mm | +0.011 |
on | +0.011 |
orse | +0.011 |
inations | +0.010 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
veterinarian | -0.006 |
attent | -0.006 |
ther | -0.006 |
Token | full |
Token ID | 1336 |
Feature activation | +1.70e-02 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
on | -0.008 |
mmm | -0.008 |
orse | -0.008 |
inations | -0.007 |
etti | -0.007 |
Token | of |
Token ID | 286 |
Feature activation | +3.75e-03 |
Pos logit contributions | |
mmm | +0.027 |
on | +0.027 |
orse | +0.026 |
inations | +0.026 |
mm | +0.025 |
Neg logit contributions | |
ranc | -0.022 |
err | -0.020 |
attent | -0.019 |
iet | -0.019 |
Please | -0.018 |
Token | wild |
Token ID | 4295 |
Feature activation | +5.43e-03 |
Pos logit contributions | |
mmm | +0.007 |
orse | +0.007 |
on | +0.007 |
etti | +0.007 |
mm | +0.007 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.003 |
veterinarian | -0.003 |
girl | -0.003 |
Token | fl |
Token ID | 2704 |
Feature activation | -5.62e-02 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
orse | +0.010 |
inations | +0.010 |
mm | +0.010 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.005 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | owers |
Token ID | 3618 |
Feature activation | -6.66e-03 |
Pos logit contributions | |
ranc | +0.070 |
err | +0.064 |
iet | +0.059 |
attent | +0.059 |
andel | +0.057 |
Neg logit contributions | |
mmm | -0.093 |
orse | -0.091 |
on | -0.089 |
inations | -0.088 |
Joe | -0.085 |
Token | . |
Token ID | 13 |
Feature activation | +3.06e-03 |
Pos logit contributions | |
ranc | +0.005 |
out | +0.003 |
attent | +0.003 |
err | +0.003 |
for | +0.003 |
Neg logit contributions | |
mmm | -0.015 |
mm | -0.015 |
etti | -0.014 |
inations | -0.014 |
orse | -0.014 |
Token | He |
Token ID | 679 |
Feature activation | +5.14e-03 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
inations | +0.005 |
orse | +0.004 |
etti | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.004 |
Please | -0.004 |
veterinarian | -0.004 |
Token | decided |
Token ID | 3066 |
Feature activation | +4.86e-03 |
Pos logit contributions | |
mmm | +0.009 |
on | +0.009 |
mm | +0.008 |
etti | +0.008 |
inations | +0.008 |
Neg logit contributions | |
ranc | -0.007 |
err | -0.006 |
attent | -0.006 |
iet | -0.005 |
Please | -0.005 |
Token | to |
Token ID | 284 |
Feature activation | +1.37e-03 |
Pos logit contributions | |
mmm | +0.010 |
on | +0.010 |
orse | +0.009 |
inations | +0.009 |
mm | +0.009 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
Please | -0.004 |
Token | tears |
Token ID | 10953 |
Feature activation | -1.61e-02 |
Pos logit contributions | |
ranc | +0.013 |
attent | +0.012 |
andel | +0.011 |
err | +0.011 |
iet | +0.010 |
Neg logit contributions | |
on | -0.016 |
orse | -0.015 |
cube | -0.015 |
mm | -0.014 |
e | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -1.55e-03 |
Pos logit contributions | |
ranc | +0.019 |
err | +0.016 |
attent | +0.015 |
iet | +0.015 |
Please | +0.014 |
Neg logit contributions | |
on | -0.029 |
mmm | -0.028 |
orse | -0.028 |
inations | -0.027 |
etti | -0.027 |
Token | He |
Token ID | 679 |
Feature activation | +3.42e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.002 |
iet | +0.002 |
attent | +0.002 |
andel | +0.002 |
Neg logit contributions | |
on | -0.002 |
mmm | -0.002 |
orse | -0.002 |
Joe | -0.002 |
mm | -0.002 |
Token | takes |
Token ID | 2753 |
Feature activation | -1.88e-02 |
Pos logit contributions | |
on | +0.004 |
mmm | +0.004 |
orse | +0.004 |
mm | +0.004 |
inations | +0.004 |
Neg logit contributions | |
ranc | -0.006 |
andel | -0.005 |
err | -0.005 |
attent | -0.005 |
iet | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | -6.83e-03 |
Pos logit contributions | |
ranc | +0.030 |
err | +0.024 |
iet | +0.024 |
attent | +0.023 |
Please | +0.021 |
Neg logit contributions | |
on | -0.032 |
Joe | -0.028 |
e | -0.027 |
John | -0.027 |
Mike | -0.026 |
Token | band |
Token ID | 4097 |
Feature activation | -4.08e-02 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
attent | +0.010 |
Please | +0.010 |
iet | +0.009 |
Neg logit contributions | |
on | -0.010 |
orse | -0.009 |
cube | -0.008 |
inations | -0.008 |
mmm | -0.008 |
Token | - |
Token ID | 12 |
Feature activation | -4.54e-02 |
Pos logit contributions | |
ranc | +0.055 |
err | +0.049 |
attent | +0.046 |
Please | +0.045 |
iet | +0.045 |
Neg logit contributions | |
on | -0.073 |
orse | -0.067 |
e | -0.064 |
mmm | -0.060 |
inations | -0.058 |
Token | aid |
Token ID | 1698 |
Feature activation | -4.63e-02 |
Pos logit contributions | |
ranc | +0.089 |
err | +0.080 |
attent | +0.078 |
iet | +0.076 |
andel | +0.075 |
Neg logit contributions | |
on | -0.050 |
mmm | -0.044 |
orse | -0.043 |
inations | -0.040 |
mm | -0.040 |
Token | from |
Token ID | 422 |
Feature activation | -5.11e-03 |
Pos logit contributions | |
ranc | +0.068 |
err | +0.063 |
Ps | +0.060 |
iet | +0.059 |
Please | +0.056 |
Neg logit contributions | |
on | -0.077 |
orse | -0.062 |
mmm | -0.061 |
cube | -0.059 |
Joe | -0.058 |
Token | his |
Token ID | 465 |
Feature activation | -2.61e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
iet | +0.006 |
attent | +0.006 |
andel | +0.005 |
Neg logit contributions | |
on | -0.009 |
Joe | -0.008 |
orse | -0.008 |
John | -0.008 |
mmm | -0.008 |
Token | pocket |
Token ID | 10000 |
Feature activation | +5.12e-04 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
iet | +0.003 |
Please | +0.003 |
Neg logit contributions | |
on | -0.004 |
mmm | -0.004 |
orse | -0.004 |
inations | -0.004 |
mm | -0.004 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.49e-03 |
Pos logit contributions | |
mmm | +0.000 |
on | +0.000 |
inations | +0.000 |
orse | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.000 |
err | -0.000 |
attent | -0.000 |
iet | -0.000 |
Please | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | +6.43e-04 |
Pos logit contributions | |
mmm | +0.003 |
inations | +0.003 |
orse | +0.003 |
etti | +0.003 |
mm | +0.003 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
out | -0.001 |
nurses | -0.001 |
iet | -0.001 |
Token | big |
Token ID | 1263 |
Feature activation | +2.03e-02 |
Pos logit contributions | |
mmm | +0.001 |
inations | +0.001 |
on | +0.001 |
orse | +0.001 |
mm | +0.001 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
girl | -0.001 |
veterinarian | -0.001 |
iet | -0.001 |
Token | , |
Token ID | 11 |
Feature activation | +1.40e-02 |
Pos logit contributions | |
inations | +0.038 |
mmm | +0.035 |
orse | +0.035 |
mm | +0.034 |
etti | +0.032 |
Neg logit contributions | |
ranc | -0.026 |
girl | -0.024 |
ambulance | -0.022 |
veterinarian | -0.022 |
woman | -0.022 |
Token | strange |
Token ID | 6283 |
Feature activation | -3.07e-03 |
Pos logit contributions | |
mmm | +0.023 |
on | +0.023 |
orse | +0.022 |
inations | +0.022 |
mm | +0.021 |
Neg logit contributions | |
ranc | -0.018 |
err | -0.017 |
attent | -0.016 |
iet | -0.015 |
Please | -0.015 |
Token | - |
Token ID | 12 |
Feature activation | -4.20e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
attent | +0.004 |
iet | +0.004 |
Please | +0.004 |
Neg logit contributions | |
mmm | -0.005 |
on | -0.005 |
orse | -0.005 |
inations | -0.004 |
Joe | -0.004 |
Token | looking |
Token ID | 11534 |
Feature activation | +3.52e-03 |
Pos logit contributions | |
ranc | +0.052 |
err | +0.048 |
attent | +0.045 |
iet | +0.044 |
Please | +0.043 |
Neg logit contributions | |
mmm | -0.071 |
inations | -0.068 |
orse | -0.067 |
mm | -0.067 |
on | -0.066 |
Token | box |
Token ID | 3091 |
Feature activation | +1.52e-02 |
Pos logit contributions | |
mmm | +0.006 |
inations | +0.006 |
on | +0.006 |
orse | +0.006 |
mm | +0.005 |
Neg logit contributions | |
ranc | -0.005 |
err | -0.004 |
attent | -0.004 |
iet | -0.004 |
veterinarian | -0.004 |
Token | nearby |
Token ID | 6716 |
Feature activation | +1.22e-02 |
Pos logit contributions | |
on | +0.028 |
mmm | +0.027 |
orse | +0.026 |
etti | +0.026 |
inations | +0.025 |
Neg logit contributions | |
ranc | -0.017 |
err | -0.016 |
attent | -0.014 |
iet | -0.014 |
andel | -0.014 |
Token | a |
Token ID | 257 |
Feature activation | +1.29e-03 |
Pos logit contributions | |
mmm | +0.024 |
on | +0.023 |
orse | +0.023 |
inations | +0.023 |
mm | +0.022 |
Neg logit contributions | |
ranc | -0.012 |
err | -0.011 |
attent | -0.010 |
Please | -0.010 |
iet | -0.009 |
Token | mailbox |
Token ID | 37282 |
Feature activation | +2.98e-03 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.002 |
inations | +0.002 |
orse | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
err | -0.002 |
attent | -0.001 |
veterinarian | -0.001 |
Please | -0.001 |
Token | picked |
Token ID | 6497 |
Feature activation | -1.40e-02 |
Pos logit contributions | |
ranc | +0.004 |
err | +0.004 |
iet | +0.003 |
attent | +0.003 |
andel | +0.003 |
Neg logit contributions | |
on | -0.003 |
mmm | -0.003 |
orse | -0.003 |
inations | -0.003 |
Joe | -0.003 |
Token | and |
Token ID | 290 |
Feature activation | +1.21e-03 |
Pos logit contributions | |
ranc | +0.021 |
err | +0.019 |
attent | +0.018 |
iet | +0.018 |
Please | +0.018 |
Neg logit contributions | |
mmm | -0.020 |
on | -0.020 |
orse | -0.019 |
inations | -0.019 |
etti | -0.018 |
Token | put |
Token ID | 1234 |
Feature activation | -3.39e-03 |
Pos logit contributions | |
mmm | +0.002 |
on | +0.002 |
orse | +0.002 |
inations | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.002 |
Please | -0.002 |
attent | -0.001 |
veterinarian | -0.001 |
out | -0.001 |
Token | in |
Token ID | 287 |
Feature activation | -6.17e-03 |
Pos logit contributions | |
ranc | +0.005 |
err | +0.005 |
attent | +0.005 |
Please | +0.005 |
iet | +0.005 |
Neg logit contributions | |
mmm | -0.004 |
orse | -0.004 |
on | -0.004 |
inations | -0.004 |
etti | -0.004 |
Token | a |
Token ID | 257 |
Feature activation | -1.00e-02 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.007 |
out | +0.007 |
Please | +0.007 |
ther | +0.007 |
Neg logit contributions | |
orse | -0.010 |
mmm | -0.010 |
inations | -0.009 |
opter | -0.009 |
etti | -0.009 |
Token | v |
Token ID | 410 |
Feature activation | -4.41e-02 |
Pos logit contributions | |
ranc | +0.013 |
err | +0.013 |
attent | +0.012 |
iet | +0.011 |
Please | +0.011 |
Neg logit contributions | |
on | -0.016 |
mmm | -0.016 |
orse | -0.015 |
inations | -0.015 |
etti | -0.014 |
Token | ase |
Token ID | 589 |
Feature activation | -8.18e-03 |
Pos logit contributions | |
ranc | +0.067 |
attent | +0.060 |
err | +0.058 |
louder | +0.058 |
ther | +0.056 |
Neg logit contributions | |
on | -0.066 |
mmm | -0.062 |
mm | -0.060 |
orse | -0.060 |
etti | -0.059 |
Token | like |
Token ID | 588 |
Feature activation | +3.61e-04 |
Pos logit contributions | |
ranc | +0.010 |
err | +0.009 |
attent | +0.009 |
iet | +0.009 |
Please | +0.008 |
Neg logit contributions | |
mmm | -0.013 |
on | -0.013 |
orse | -0.013 |
inations | -0.013 |
mm | -0.013 |
Token | you |
Token ID | 345 |
Feature activation | +7.57e-03 |
Pos logit contributions | |
on | +0.000 |
mmm | +0.000 |
orse | +0.000 |
inations | +0.000 |
mm | +0.000 |
Neg logit contributions | |
ranc | -0.001 |
err | -0.001 |
attent | -0.001 |
iet | -0.001 |
Please | -0.000 |
Token | ." |
Token ID | 526 |
Feature activation | +2.94e-03 |
Pos logit contributions | |
mmm | +0.012 |
on | +0.012 |
etti | +0.012 |
mm | +0.012 |
orse | +0.011 |
Neg logit contributions | |
ranc | -0.010 |
err | -0.009 |
Please | -0.008 |
attent | -0.008 |
out | -0.008 |
Token |
|
Token ID | 198 |
Feature activation | -4.39e-03 |
Pos logit contributions | |
mmm | +0.005 |
on | +0.005 |
orse | +0.004 |
inations | +0.004 |
mm | +0.004 |
Neg logit contributions | |
ranc | -0.004 |
err | -0.004 |
attent | -0.003 |
iet | -0.003 |
Please | -0.003 |
Token | she |
Token ID | 673 |
Feature activation | -1.99e-03 |
Pos logit contributions | |
ranc | +0.001 |
err | +0.001 |
attent | +0.001 |
Please | +0.001 |
girl | +0.001 |
Neg logit contributions | |
orse | -0.002 |
mmm | -0.002 |
inations | -0.002 |
on | -0.002 |
etti | -0.002 |
Token | forgot |
Token ID | 16453 |
Feature activation | -9.00e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.002 |
iet | +0.002 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.003 |
on | -0.003 |
orse | -0.003 |
inations | -0.003 |
mm | -0.003 |
Token | all |
Token ID | 477 |
Feature activation | -2.98e-03 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
andel | +0.009 |
iet | +0.009 |
attent | +0.009 |
Neg logit contributions | |
on | -0.015 |
mmm | -0.015 |
Joe | -0.015 |
inations | -0.014 |
John | -0.014 |
Token | about |
Token ID | 546 |
Feature activation | +3.48e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
iet | +0.003 |
Please | +0.002 |
Neg logit contributions | |
mmm | -0.006 |
on | -0.006 |
orse | -0.005 |
inations | -0.005 |
mm | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | -7.13e-03 |
Pos logit contributions | |
orse | +0.007 |
inations | +0.006 |
mmm | +0.006 |
on | +0.006 |
etti | +0.006 |
Neg logit contributions | |
ranc | -0.003 |
attent | -0.003 |
err | -0.003 |
Please | -0.003 |
moral | -0.003 |
Token | muff |
Token ID | 27563 |
Feature activation | -4.11e-02 |
Pos logit contributions | |
ranc | +0.011 |
err | +0.010 |
attent | +0.010 |
Please | +0.009 |
andel | +0.009 |
Neg logit contributions | |
mmm | -0.010 |
on | -0.010 |
orse | -0.010 |
inations | -0.009 |
etti | -0.009 |
Token | in |
Token ID | 259 |
Feature activation | -3.87e-03 |
Pos logit contributions | |
ranc | +0.044 |
err | +0.044 |
attent | +0.043 |
iet | +0.042 |
ther | +0.041 |
Neg logit contributions | |
mmm | -0.067 |
Joe | -0.066 |
orse | -0.065 |
etti | -0.065 |
John | -0.064 |
Token | . |
Token ID | 13 |
Feature activation | -4.94e-03 |
Pos logit contributions | |
ranc | +0.003 |
err | +0.003 |
attent | +0.003 |
girl | +0.003 |
Please | +0.003 |
Neg logit contributions | |
mmm | -0.008 |
orse | -0.007 |
inations | -0.007 |
mm | -0.007 |
etti | -0.007 |
Token | Later |
Token ID | 11450 |
Feature activation | +1.73e-03 |
Pos logit contributions | |
ranc | +0.007 |
err | +0.006 |
iet | +0.006 |
attent | +0.006 |
Please | +0.005 |
Neg logit contributions | |
mmm | -0.008 |
on | -0.008 |
orse | -0.008 |
Joe | -0.007 |
inations | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -2.27e-03 |
Pos logit contributions | |
on | +0.002 |
mmm | +0.002 |
orse | +0.002 |
Joe | +0.002 |
mm | +0.002 |
Neg logit contributions | |
ranc | -0.003 |
err | -0.003 |
attent | -0.003 |
iet | -0.003 |
andel | -0.003 |
Token | when |
Token ID | 618 |
Feature activation | -1.16e-02 |
Pos logit contributions | |
ranc | +0.004 |
andel | +0.004 |
err | +0.004 |
iet | +0.004 |
veterinarian | +0.004 |
Neg logit contributions | |
Joe | -0.003 |
John | -0.003 |
mmm | -0.003 |
on | -0.003 |
Mike | -0.003 |