Token | crab |
Token ID | 32202 |
Feature activation | -2.98e-01 |
Pos logit contributions | |
endant | +0.018 |
av | +0.018 |
arrest | +0.018 |
jewels | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.007 |
Good | -0.006 |
Time | -0.006 |
Why | -0.006 |
ash | -0.006 |
Token | named |
Token ID | 3706 |
Feature activation | +6.53e-01 |
Pos logit contributions | |
Which | +0.009 |
Good | +0.009 |
Time | +0.009 |
Where | +0.009 |
idget | +0.009 |
Neg logit contributions | |
endant | -0.008 |
av | -0.007 |
arrest | -0.007 |
jewels | -0.007 |
brace | -0.007 |
Token | Cr |
Token ID | 3864 |
Feature activation | -9.38e-01 |
Pos logit contributions | |
endant | +0.021 |
jewels | +0.020 |
arrest | +0.020 |
brace | +0.019 |
av | +0.019 |
Neg logit contributions | |
Good | -0.016 |
Which | -0.016 |
Time | -0.015 |
Why | -0.015 |
Where | -0.015 |
Token | ust |
Token ID | 436 |
Feature activation | -5.47e-01 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.023 |
Time | +0.022 |
Why | +0.022 |
Where | +0.022 |
Neg logit contributions | |
endant | -0.030 |
av | -0.029 |
arrest | -0.028 |
jewels | -0.028 |
brace | -0.028 |
Token | y |
Token ID | 88 |
Feature activation | +5.97e-02 |
Pos logit contributions | |
Which | +0.009 |
Good | +0.008 |
Time | +0.008 |
idget | +0.008 |
Why | +0.008 |
Neg logit contributions | |
endant | -0.023 |
jewels | -0.022 |
av | -0.022 |
arrest | -0.021 |
coins | -0.021 |
Token | . |
Token ID | 13 |
Feature activation | +4.07e+00 |
Pos logit contributions | |
endant | +0.002 |
av | +0.002 |
jewels | +0.002 |
arrest | +0.002 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.001 |
Good | -0.001 |
Time | -0.001 |
Why | -0.001 |
Where | -0.001 |
Token | Cr |
Token ID | 3864 |
Feature activation | +2.06e-01 |
Pos logit contributions | |
endant | +0.111 |
arrest | +0.110 |
aches | +0.105 |
vern | +0.102 |
kins | +0.098 |
Neg logit contributions | |
Which | -0.122 |
Which | -0.117 |
Where | -0.115 |
Why | -0.114 |
Why | -0.112 |
Token | ust |
Token ID | 436 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
endant | +0.007 |
jewels | +0.007 |
arrest | +0.007 |
av | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.004 |
ash | -0.004 |
Time | -0.004 |
idget | -0.004 |
Good | -0.004 |
Token | y |
Token ID | 88 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
endant | +0.007 |
jewels | +0.007 |
av | +0.007 |
arrest | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
Why | -0.002 |
Where | -0.002 |
Token | lived |
Token ID | 5615 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
av | +0.068 |
arrest | +0.067 |
endant | +0.066 |
jewels | +0.064 |
brace | +0.063 |
Neg logit contributions | |
Clean | -0.028 |
when | -0.027 |
Which | -0.027 |
Why | -0.027 |
Time | -0.026 |
Token | in |
Token ID | 287 |
Feature activation | +1.79e+00 |
Pos logit contributions | |
endant | +0.061 |
arrest | +0.061 |
hy | +0.058 |
brace | +0.054 |
� | +0.054 |
Neg logit contributions | |
over | -0.025 |
when | -0.023 |
Why | -0.022 |
Where | -0.021 |
What | -0.021 |
Token | finding |
Token ID | 4917 |
Feature activation | +6.10e-01 |
Pos logit contributions | |
agged | +0.034 |
aches | +0.033 |
hy | +0.032 |
endant | +0.032 |
arrest | +0.032 |
Neg logit contributions | |
Clean | -0.021 |
Time | -0.021 |
when | -0.021 |
activity | -0.020 |
Which | -0.020 |
Token | ! |
Token ID | 0 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
endant | +0.021 |
hy | +0.020 |
arrest | +0.020 |
pe | +0.020 |
aches | +0.019 |
Neg logit contributions | |
Which | -0.014 |
over | -0.014 |
Where | -0.013 |
What | -0.012 |
Good | -0.012 |
Token | He |
Token ID | 679 |
Feature activation | +6.13e-01 |
Pos logit contributions | |
endant | +0.008 |
av | +0.008 |
jewels | +0.008 |
arrest | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.010 |
Time | -0.010 |
Good | -0.010 |
ash | -0.010 |
Where | -0.010 |
Token | showed |
Token ID | 3751 |
Feature activation | +4.39e-01 |
Pos logit contributions | |
endant | +0.021 |
av | +0.021 |
agged | +0.021 |
arrest | +0.021 |
hy | +0.020 |
Neg logit contributions | |
over | -0.012 |
Which | -0.012 |
Where | -0.012 |
Time | -0.012 |
Clean | -0.011 |
Token | the |
Token ID | 262 |
Feature activation | +1.89e+00 |
Pos logit contributions | |
endant | +0.014 |
av | +0.013 |
arrest | +0.013 |
jewels | +0.012 |
hy | +0.012 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.010 |
over | -0.010 |
Where | -0.010 |
idget | -0.010 |
Token | three |
Token ID | 1115 |
Feature activation | +3.87e+00 |
Pos logit contributions | |
agged | +0.050 |
itched | +0.046 |
aches | +0.046 |
endant | +0.046 |
itching | +0.045 |
Neg logit contributions | |
Where | -0.058 |
Which | -0.056 |
What | -0.055 |
Ready | -0.054 |
end | -0.053 |
Token | gems |
Token ID | 23685 |
Feature activation | +7.55e-01 |
Pos logit contributions | |
endant | +0.114 |
� | +0.113 |
arrest | +0.112 |
agged | +0.110 |
hy | +0.105 |
Neg logit contributions | |
Which | -0.092 |
over | -0.088 |
Where | -0.088 |
ing | -0.087 |
What | -0.085 |
Token | to |
Token ID | 284 |
Feature activation | -1.82e-01 |
Pos logit contributions | |
arrest | +0.027 |
agged | +0.027 |
endant | +0.026 |
� | +0.025 |
hy | +0.025 |
Neg logit contributions | |
over | -0.016 |
when | -0.015 |
ing | -0.015 |
Which | -0.014 |
Where | -0.013 |
Token | his |
Token ID | 465 |
Feature activation | +1.12e-01 |
Pos logit contributions | |
over | +0.005 |
What | +0.004 |
Why | +0.004 |
Which | +0.004 |
Where | +0.004 |
Neg logit contributions | |
endant | -0.006 |
hy | -0.005 |
arrest | -0.005 |
av | -0.005 |
jewels | -0.005 |
Token | friends |
Token ID | 2460 |
Feature activation | -4.69e-01 |
Pos logit contributions | |
endant | +0.004 |
agged | +0.004 |
aches | +0.004 |
arrest | +0.003 |
pe | +0.003 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Where | -0.002 |
Clean | -0.002 |
Time | -0.002 |
Token | , |
Token ID | 11 |
Feature activation | +2.12e-01 |
Pos logit contributions | |
Which | +0.013 |
Good | +0.013 |
Time | +0.013 |
Where | +0.012 |
ash | +0.012 |
Neg logit contributions | |
endant | -0.013 |
av | -0.013 |
jewels | -0.013 |
arrest | -0.013 |
brace | -0.012 |
Token | happy |
Token ID | 3772 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
endant | +0.031 |
arrest | +0.030 |
jewels | +0.030 |
av | +0.029 |
brace | +0.028 |
Neg logit contributions | |
Time | -0.019 |
Good | -0.018 |
over | -0.018 |
Time | -0.018 |
Why | -0.018 |
Token | and |
Token ID | 290 |
Feature activation | -4.54e-02 |
Pos logit contributions | |
endant | +0.038 |
av | +0.035 |
jewels | +0.035 |
arrest | +0.035 |
brace | +0.034 |
Neg logit contributions | |
Which | -0.029 |
Why | -0.028 |
Good | -0.028 |
Time | -0.028 |
Where | -0.027 |
Token | brought |
Token ID | 3181 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
when | +0.001 |
over | +0.001 |
Clean | +0.001 |
Good | +0.001 |
Where | +0.001 |
Neg logit contributions | |
endant | -0.002 |
agged | -0.001 |
ir | -0.001 |
pe | -0.001 |
arrest | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +2.46e+00 |
Pos logit contributions | |
endant | +0.030 |
hy | +0.029 |
arrest | +0.028 |
pe | +0.027 |
vern | +0.025 |
Neg logit contributions | |
over | -0.017 |
Which | -0.016 |
Where | -0.015 |
What | -0.014 |
when | -0.014 |
Token | av |
Token ID | 1196 |
Feature activation | +9.82e-01 |
Pos logit contributions | |
endant | +0.066 |
itched | +0.061 |
ink | +0.059 |
hy | +0.058 |
agged | +0.057 |
Neg logit contributions | |
Which | -0.080 |
Why | -0.076 |
Where | -0.076 |
Which | -0.075 |
What | -0.075 |
Token | oc |
Token ID | 420 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
endant | +0.036 |
arrest | +0.034 |
jewels | +0.034 |
hy | +0.034 |
agged | +0.033 |
Neg logit contributions | |
Which | -0.019 |
ash | -0.017 |
Good | -0.017 |
Where | -0.017 |
Time | -0.016 |
Token | ados |
Token ID | 22484 |
Feature activation | +3.76e-02 |
Pos logit contributions | |
endant | +0.090 |
hy | +0.082 |
jewels | +0.074 |
curly | +0.073 |
vern | +0.073 |
Neg logit contributions | |
ting | -0.122 |
ing | -0.120 |
Which | -0.110 |
fl | -0.109 |
Which | -0.109 |
Token | home |
Token ID | 1363 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
arrest | +0.002 |
endant | +0.002 |
hy | +0.001 |
agged | +0.001 |
brace | +0.001 |
Neg logit contributions | |
over | -0.001 |
when | -0.001 |
Which | -0.001 |
ash | -0.001 |
Where | -0.000 |
Token | to |
Token ID | 284 |
Feature activation | +3.32e-01 |
Pos logit contributions | |
arrest | +0.052 |
endant | +0.051 |
agged | +0.049 |
brace | +0.047 |
jewels | +0.046 |
Neg logit contributions | |
over | -0.013 |
when | -0.012 |
ing | -0.007 |
Where | -0.007 |
across | -0.006 |
Token | share |
Token ID | 2648 |
Feature activation | +1.07e+00 |
Pos logit contributions | |
endant | +0.015 |
agged | +0.012 |
aces | +0.012 |
hy | +0.012 |
ls | +0.012 |
Neg logit contributions | |
Why | -0.006 |
over | -0.006 |
Good | -0.006 |
What | -0.006 |
end | -0.006 |
Token | with |
Token ID | 351 |
Feature activation | +2.10e-01 |
Pos logit contributions | |
endant | +0.047 |
arrest | +0.044 |
hy | +0.044 |
agged | +0.043 |
jewels | +0.041 |
Neg logit contributions | |
Why | -0.016 |
Which | -0.015 |
over | -0.015 |
What | -0.015 |
Where | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +1.56e+00 |
Pos logit contributions | |
Which | +0.002 |
Where | +0.002 |
Why | +0.002 |
Good | +0.002 |
ash | +0.001 |
Neg logit contributions | |
endant | -0.004 |
arrest | -0.004 |
av | -0.004 |
jewels | -0.004 |
brace | -0.004 |
Token | It |
Token ID | 632 |
Feature activation | +9.39e-01 |
Pos logit contributions | |
endant | +0.050 |
arrest | +0.049 |
jewels | +0.048 |
av | +0.047 |
aches | +0.046 |
Neg logit contributions | |
Which | -0.039 |
Good | -0.037 |
Why | -0.036 |
Time | -0.036 |
Time | -0.036 |
Token | was |
Token ID | 373 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
arrest | +0.043 |
agged | +0.041 |
av | +0.041 |
endant | +0.040 |
ir | +0.039 |
Neg logit contributions | |
Which | -0.012 |
Why | -0.011 |
Where | -0.011 |
over | -0.011 |
Good | -0.010 |
Token | a |
Token ID | 257 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
arrest | +0.043 |
� | +0.040 |
pe | +0.038 |
endant | +0.038 |
agged | +0.037 |
Neg logit contributions | |
Which | -0.022 |
over | -0.021 |
when | -0.021 |
Where | -0.020 |
Why | -0.019 |
Token | big |
Token ID | 1263 |
Feature activation | +2.09e+00 |
Pos logit contributions | |
agged | +0.059 |
arrest | +0.059 |
endant | +0.057 |
aches | +0.055 |
av | +0.055 |
Neg logit contributions | |
Which | -0.045 |
Where | -0.043 |
Good | -0.043 |
Time | -0.042 |
Why | -0.041 |
Token | , |
Token ID | 11 |
Feature activation | +3.77e+00 |
Pos logit contributions | |
agged | +0.075 |
aches | +0.071 |
endant | +0.068 |
arrest | +0.068 |
vern | +0.066 |
Neg logit contributions | |
Good | -0.046 |
end | -0.045 |
morning | -0.044 |
when | -0.044 |
Which | -0.044 |
Token | purple |
Token ID | 14032 |
Feature activation | +1.97e+00 |
Pos logit contributions | |
arrest | +0.142 |
agged | +0.135 |
� | +0.129 |
ir | +0.123 |
alks | +0.122 |
Neg logit contributions | |
Which | -0.089 |
Where | -0.082 |
Why | -0.082 |
over | -0.082 |
What | -0.081 |
Token | jewel |
Token ID | 16927 |
Feature activation | -2.10e-02 |
Pos logit contributions | |
endant | +0.040 |
agged | +0.038 |
arrest | +0.038 |
aches | +0.036 |
vern | +0.035 |
Neg logit contributions | |
Which | -0.070 |
Good | -0.067 |
Where | -0.066 |
Why | -0.065 |
Time | -0.064 |
Token | and |
Token ID | 290 |
Feature activation | +8.89e-01 |
Pos logit contributions | |
Which | +0.000 |
Good | +0.000 |
Why | +0.000 |
Where | +0.000 |
Time | +0.000 |
Neg logit contributions | |
endant | -0.001 |
arrest | -0.001 |
av | -0.001 |
jewels | -0.001 |
brace | -0.001 |
Token | it |
Token ID | 340 |
Feature activation | +6.22e-01 |
Pos logit contributions | |
arrest | +0.035 |
agged | +0.033 |
endant | +0.032 |
ir | +0.031 |
vern | +0.031 |
Neg logit contributions | |
Which | -0.021 |
Where | -0.018 |
Why | -0.018 |
when | -0.018 |
Good | -0.018 |
Token | was |
Token ID | 373 |
Feature activation | +2.43e-01 |
Pos logit contributions | |
arrest | +0.027 |
agged | +0.026 |
endant | +0.025 |
av | +0.025 |
ir | +0.025 |
Neg logit contributions | |
Why | -0.009 |
over | -0.009 |
when | -0.009 |
Which | -0.009 |
Where | -0.008 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.00e+00 |
Pos logit contributions | |
endant | +0.038 |
av | +0.036 |
jewels | +0.036 |
brace | +0.035 |
hy | +0.034 |
Neg logit contributions | |
Which | -0.050 |
ash | -0.048 |
Time | -0.048 |
Good | -0.047 |
Where | -0.047 |
Token | loved |
Token ID | 6151 |
Feature activation | +8.20e-01 |
Pos logit contributions | |
endant | +0.031 |
jewels | +0.030 |
av | +0.029 |
arrest | +0.029 |
brace | +0.029 |
Neg logit contributions | |
Which | -0.026 |
Good | -0.025 |
Time | -0.025 |
ash | -0.025 |
idget | -0.024 |
Token | to |
Token ID | 284 |
Feature activation | +5.66e-01 |
Pos logit contributions | |
endant | +0.027 |
arrest | +0.025 |
jewels | +0.025 |
av | +0.025 |
pe | +0.024 |
Neg logit contributions | |
Which | -0.020 |
Good | -0.019 |
Why | -0.019 |
Time | -0.019 |
Where | -0.018 |
Token | eat |
Token ID | 4483 |
Feature activation | +7.24e-01 |
Pos logit contributions | |
endant | +0.023 |
jewels | +0.021 |
agged | +0.021 |
av | +0.021 |
arrest | +0.021 |
Neg logit contributions | |
Which | -0.009 |
Clean | -0.009 |
Why | -0.008 |
Time | -0.008 |
Time | -0.008 |
Token | av |
Token ID | 1196 |
Feature activation | +4.40e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
jewels | +0.017 |
av | +0.016 |
hy | +0.016 |
Neg logit contributions | |
Which | -0.023 |
Good | -0.022 |
Time | -0.022 |
Why | -0.022 |
Where | -0.021 |
Token | oc |
Token ID | 420 |
Feature activation | +3.75e+00 |
Pos logit contributions | |
endant | +0.015 |
arrest | +0.014 |
jewels | +0.014 |
hy | +0.013 |
av | +0.013 |
Neg logit contributions | |
Which | -0.010 |
Good | -0.009 |
Why | -0.009 |
ash | -0.009 |
Where | -0.009 |
Token | ados |
Token ID | 22484 |
Feature activation | -6.90e-01 |
Pos logit contributions | |
endant | +0.085 |
acle | +0.080 |
hy | +0.079 |
kins | +0.076 |
pe | +0.071 |
Neg logit contributions | |
ting | -0.123 |
ing | -0.118 |
Good | -0.112 |
Which | -0.111 |
Why | -0.110 |
Token | , |
Token ID | 11 |
Feature activation | +3.04e-01 |
Pos logit contributions | |
when | +0.011 |
Which | +0.011 |
Why | +0.011 |
over | +0.010 |
ash | +0.010 |
Neg logit contributions | |
endant | -0.028 |
arrest | -0.028 |
hy | -0.026 |
agged | -0.026 |
jewels | -0.026 |
Token | they |
Token ID | 484 |
Feature activation | +5.96e-01 |
Pos logit contributions | |
endant | +0.015 |
agged | +0.015 |
ink | +0.014 |
arrest | +0.014 |
vern | +0.014 |
Neg logit contributions | |
Why | -0.004 |
Which | -0.004 |
when | -0.004 |
What | -0.003 |
Where | -0.003 |
Token | were |
Token ID | 547 |
Feature activation | +4.27e-01 |
Pos logit contributions | |
endant | +0.022 |
arrest | +0.021 |
agged | +0.020 |
vern | +0.020 |
jewels | +0.020 |
Neg logit contributions | |
Which | -0.013 |
Why | -0.013 |
Where | -0.012 |
What | -0.011 |
over | -0.011 |
Token | her |
Token ID | 607 |
Feature activation | +8.34e-01 |
Pos logit contributions | |
endant | +0.014 |
arrest | +0.014 |
hy | +0.013 |
pe | +0.012 |
agged | +0.012 |
Neg logit contributions | |
Which | -0.011 |
Why | -0.010 |
Where | -0.010 |
over | -0.010 |
Time | -0.009 |
Token | could |
Token ID | 714 |
Feature activation | +2.41e+00 |
Pos logit contributions | |
arrest | +0.014 |
endant | +0.013 |
agged | +0.013 |
vern | +0.013 |
jewels | +0.012 |
Neg logit contributions | |
over | -0.007 |
when | -0.006 |
Where | -0.006 |
ing | -0.006 |
Why | -0.006 |
Token | see |
Token ID | 766 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
agged | +0.094 |
endant | +0.093 |
jewels | +0.088 |
hy | +0.086 |
arrest | +0.084 |
Neg logit contributions | |
over | -0.044 |
Why | -0.041 |
end | -0.041 |
when | -0.039 |
why | -0.036 |
Token | lots |
Token ID | 6041 |
Feature activation | +5.90e-01 |
Pos logit contributions | |
Which | +0.024 |
Where | +0.022 |
Why | +0.022 |
Good | +0.022 |
What | +0.021 |
Neg logit contributions | |
endant | -0.035 |
arrest | -0.033 |
jewels | -0.032 |
hy | -0.032 |
av | -0.031 |
Token | of |
Token ID | 286 |
Feature activation | +1.41e+00 |
Pos logit contributions | |
endant | +0.020 |
arrest | +0.020 |
jewels | +0.019 |
av | +0.019 |
brace | +0.018 |
Neg logit contributions | |
Which | -0.013 |
Time | -0.012 |
Good | -0.012 |
Why | -0.012 |
Where | -0.012 |
Token | av |
Token ID | 1196 |
Feature activation | +7.10e-01 |
Pos logit contributions | |
endant | +0.038 |
arrest | +0.037 |
hy | +0.036 |
agged | +0.035 |
acle | +0.034 |
Neg logit contributions | |
Which | -0.042 |
Where | -0.041 |
Why | -0.041 |
What | -0.040 |
Time | -0.039 |
Token | oc |
Token ID | 420 |
Feature activation | +3.70e+00 |
Pos logit contributions | |
endant | +0.025 |
hy | +0.024 |
agged | +0.024 |
jewels | +0.024 |
acle | +0.023 |
Neg logit contributions | |
Which | -0.013 |
Good | -0.012 |
ash | -0.012 |
Where | -0.012 |
Time | -0.012 |
Token | ados |
Token ID | 22484 |
Feature activation | -8.38e-01 |
Pos logit contributions | |
endant | +0.082 |
acle | +0.076 |
hy | +0.075 |
kin | +0.072 |
kins | +0.070 |
Neg logit contributions | |
ing | -0.121 |
ting | -0.121 |
ash | -0.112 |
Good | -0.108 |
Which | -0.103 |
Token | that |
Token ID | 326 |
Feature activation | -7.96e-02 |
Pos logit contributions | |
Why | +0.013 |
Which | +0.013 |
Where | +0.013 |
over | +0.013 |
when | +0.012 |
Neg logit contributions | |
endant | -0.033 |
agged | -0.032 |
arrest | -0.032 |
hy | -0.031 |
jewels | -0.030 |
Token | the |
Token ID | 262 |
Feature activation | +2.16e-01 |
Pos logit contributions | |
Why | +0.002 |
Which | +0.002 |
over | +0.002 |
Where | +0.002 |
Good | +0.002 |
Neg logit contributions | |
endant | -0.003 |
arrest | -0.003 |
agged | -0.003 |
brace | -0.003 |
vern | -0.003 |
Token | supplier |
Token ID | 22693 |
Feature activation | +3.00e-01 |
Pos logit contributions | |
endant | +0.007 |
agged | +0.007 |
vern | +0.006 |
brace | +0.006 |
arrest | +0.006 |
Neg logit contributions | |
Where | -0.005 |
Why | -0.005 |
Which | -0.005 |
What | -0.005 |
Ready | -0.005 |
Token | had |
Token ID | 550 |
Feature activation | -1.37e-01 |
Pos logit contributions | |
arrest | +0.011 |
endant | +0.010 |
brace | +0.010 |
agged | +0.010 |
jewels | +0.010 |
Neg logit contributions | |
over | -0.006 |
Why | -0.005 |
ash | -0.005 |
Which | -0.005 |
Where | -0.005 |
Token | , |
Token ID | 11 |
Feature activation | +3.82e-01 |
Pos logit contributions | |
endant | +0.032 |
arrest | +0.030 |
jewels | +0.028 |
agged | +0.028 |
brace | +0.027 |
Neg logit contributions | |
when | -0.020 |
Why | -0.020 |
Which | -0.020 |
Why | -0.020 |
louder | -0.020 |
Token | " |
Token ID | 366 |
Feature activation | +1.51e-01 |
Pos logit contributions | |
endant | +0.016 |
arrest | +0.015 |
jewels | +0.015 |
av | +0.015 |
brace | +0.014 |
Neg logit contributions | |
Which | -0.007 |
Good | -0.006 |
Why | -0.006 |
Time | -0.006 |
Where | -0.006 |
Token | I |
Token ID | 40 |
Feature activation | +6.67e-01 |
Pos logit contributions | |
endant | +0.006 |
av | +0.005 |
arrest | +0.005 |
jewels | +0.005 |
brace | +0.005 |
Neg logit contributions | |
Which | -0.003 |
Good | -0.003 |
ash | -0.003 |
idget | -0.003 |
Time | -0.003 |
Token | love |
Token ID | 1842 |
Feature activation | +1.91e+00 |
Pos logit contributions | |
endant | +0.022 |
jewels | +0.022 |
av | +0.022 |
arrest | +0.021 |
brace | +0.021 |
Neg logit contributions | |
Which | -0.016 |
Good | -0.015 |
Time | -0.015 |
Why | -0.014 |
ash | -0.014 |
Token | av |
Token ID | 1196 |
Feature activation | +4.56e-01 |
Pos logit contributions | |
agged | +0.063 |
endant | +0.062 |
acle | +0.060 |
hy | +0.060 |
pe | +0.055 |
Neg logit contributions | |
Why | -0.050 |
Which | -0.048 |
Good | -0.046 |
when | -0.045 |
What | -0.045 |
Token | oc |
Token ID | 420 |
Feature activation | +3.65e+00 |
Pos logit contributions | |
endant | +0.017 |
jewels | +0.016 |
arrest | +0.016 |
hy | +0.015 |
acle | +0.015 |
Neg logit contributions | |
Which | -0.009 |
ash | -0.008 |
Good | -0.008 |
Why | -0.008 |
Time | -0.008 |
Token | ados |
Token ID | 22484 |
Feature activation | -7.13e-01 |
Pos logit contributions | |
endant | +0.085 |
acle | +0.075 |
hy | +0.073 |
jewels | +0.070 |
spe | +0.067 |
Neg logit contributions | |
ing | -0.122 |
ting | -0.121 |
ash | -0.113 |
Good | -0.113 |
Which | -0.111 |
Token | ! |
Token ID | 0 |
Feature activation | +2.73e-01 |
Pos logit contributions | |
Which | +0.014 |
ash | +0.014 |
when | +0.014 |
Why | +0.013 |
Good | +0.013 |
Neg logit contributions | |
endant | -0.026 |
arrest | -0.025 |
agged | -0.024 |
jewels | -0.024 |
brace | -0.024 |
Token | They |
Token ID | 1119 |
Feature activation | +1.55e+00 |
Pos logit contributions | |
endant | +0.009 |
av | +0.008 |
jewels | +0.008 |
arrest | +0.008 |
brace | +0.008 |
Neg logit contributions | |
Which | -0.007 |
Time | -0.007 |
ash | -0.006 |
idget | -0.006 |
Good | -0.006 |
Token | are |
Token ID | 389 |
Feature activation | +1.09e+00 |
Pos logit contributions | |
agged | +0.057 |
endant | +0.056 |
arrest | +0.055 |
alo | +0.054 |
hy | +0.052 |
Neg logit contributions | |
over | -0.029 |
Which | -0.029 |
when | -0.029 |
Why | -0.029 |
Good | -0.028 |
Token | so |
Token ID | 523 |
Feature activation | +2.65e+00 |
Pos logit contributions | |
arrest | +0.041 |
agged | +0.040 |
endant | +0.040 |
� | +0.038 |
hy | +0.038 |
Neg logit contributions | |
over | -0.022 |
when | -0.021 |
Which | -0.021 |
why | -0.020 |
Why | -0.020 |
Token | made |
Token ID | 925 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
endant | +0.013 |
agged | +0.012 |
arrest | +0.012 |
av | +0.012 |
pe | +0.012 |
Neg logit contributions | |
Good | -0.011 |
Clean | -0.010 |
over | -0.010 |
Time | -0.010 |
when | -0.010 |
Token | up |
Token ID | 510 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
Which | +0.030 |
Time | +0.027 |
Why | +0.027 |
Where | +0.027 |
ash | +0.027 |
Neg logit contributions | |
av | -0.032 |
endant | -0.031 |
jewels | -0.031 |
arrest | -0.030 |
brace | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | -7.36e-01 |
Pos logit contributions | |
endant | +0.072 |
arrest | +0.065 |
agged | +0.065 |
pe | +0.065 |
aches | +0.064 |
Neg logit contributions | |
over | -0.029 |
Good | -0.029 |
when | -0.027 |
Clean | -0.025 |
Time | -0.025 |
Token | They |
Token ID | 1119 |
Feature activation | +7.49e-01 |
Pos logit contributions | |
Which | +0.020 |
Time | +0.018 |
ash | +0.018 |
Where | +0.018 |
idget | +0.018 |
Neg logit contributions | |
endant | -0.022 |
av | -0.021 |
arrest | -0.021 |
jewels | -0.021 |
brace | -0.020 |
Token | shared |
Token ID | 4888 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
endant | +0.026 |
arrest | +0.026 |
av | +0.025 |
agged | +0.024 |
jewels | +0.024 |
Neg logit contributions | |
over | -0.016 |
idget | -0.015 |
Clean | -0.014 |
Which | -0.014 |
Good | -0.014 |
Token | the |
Token ID | 262 |
Feature activation | +3.65e+00 |
Pos logit contributions | |
endant | +0.069 |
agged | +0.066 |
hy | +0.065 |
pe | +0.065 |
arrest | +0.064 |
Neg logit contributions | |
over | -0.034 |
Which | -0.033 |
when | -0.031 |
What | -0.031 |
Good | -0.030 |
Token | jewel |
Token ID | 16927 |
Feature activation | +1.69e+00 |
Pos logit contributions | |
arrest | +0.098 |
alks | +0.096 |
� | +0.095 |
ir | +0.093 |
agged | +0.090 |
Neg logit contributions | |
Which | -0.107 |
end | -0.104 |
What | -0.104 |
Good | -0.101 |
Where | -0.101 |
Token | and |
Token ID | 290 |
Feature activation | +3.77e-01 |
Pos logit contributions | |
agged | +0.073 |
endant | +0.070 |
hy | +0.067 |
arrest | +0.067 |
alo | +0.065 |
Neg logit contributions | |
when | -0.028 |
over | -0.028 |
's | -0.024 |
ing | -0.022 |
out | -0.021 |
Token | had |
Token ID | 550 |
Feature activation | -1.64e-01 |
Pos logit contributions | |
endant | +0.013 |
agged | +0.012 |
vern | +0.012 |
pe | +0.012 |
av | +0.012 |
Neg logit contributions | |
Good | -0.009 |
over | -0.008 |
Which | -0.008 |
Clean | -0.008 |
when | -0.008 |
Token | lots |
Token ID | 6041 |
Feature activation | +1.61e+00 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.004 |
Time | +0.004 |
Where | +0.004 |
Time | +0.004 |
Neg logit contributions | |
endant | -0.005 |
arrest | -0.005 |
jewels | -0.005 |
av | -0.005 |
pe | -0.005 |
Token | of |
Token ID | 286 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
endant | +0.068 |
pe | +0.066 |
arrest | +0.065 |
jewels | +0.064 |
aches | +0.063 |
Neg logit contributions | |
Time | -0.021 |
Good | -0.020 |
ash | -0.019 |
when | -0.019 |
over | -0.018 |
Token | little |
Token ID | 1310 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
Which | +0.001 |
ash | +0.001 |
idget | +0.001 |
Good | +0.001 |
Time | +0.001 |
Neg logit contributions | |
av | -0.001 |
endant | -0.001 |
jewels | -0.001 |
arrest | -0.001 |
brace | -0.001 |
Token | girl |
Token ID | 2576 |
Feature activation | +6.07e-01 |
Pos logit contributions | |
endant | +0.020 |
av | +0.020 |
jewels | +0.020 |
arrest | +0.020 |
brace | +0.019 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.007 |
Time | -0.007 |
ash | -0.007 |
Where | -0.007 |
Token | called |
Token ID | 1444 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
endant | +0.011 |
arrest | +0.011 |
av | +0.010 |
jewels | +0.010 |
hy | +0.010 |
Neg logit contributions | |
Which | -0.023 |
Ready | -0.023 |
Good | -0.023 |
Time | -0.023 |
ash | -0.022 |
Token | Lib |
Token ID | 7980 |
Feature activation | -5.40e-01 |
Pos logit contributions | |
endant | +0.038 |
jewels | +0.036 |
av | +0.036 |
arrest | +0.035 |
brace | +0.034 |
Neg logit contributions | |
Which | -0.028 |
Good | -0.027 |
Time | -0.027 |
Time | -0.026 |
Why | -0.026 |
Token | by |
Token ID | 1525 |
Feature activation | -8.70e-01 |
Pos logit contributions | |
Which | +0.012 |
Good | +0.011 |
Time | +0.011 |
ash | +0.011 |
Where | +0.011 |
Neg logit contributions | |
endant | -0.019 |
av | -0.018 |
arrest | -0.018 |
jewels | -0.018 |
brace | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +3.63e+00 |
Pos logit contributions | |
Which | +0.022 |
Time | +0.022 |
Ready | +0.021 |
Good | +0.021 |
idget | +0.020 |
Neg logit contributions | |
endant | -0.028 |
jewels | -0.027 |
av | -0.027 |
arrest | -0.026 |
brace | -0.025 |
Token | Lib |
Token ID | 7980 |
Feature activation | +5.60e-01 |
Pos logit contributions | |
arrest | +0.097 |
endant | +0.096 |
kins | +0.091 |
av | +0.088 |
swords | +0.087 |
Neg logit contributions | |
Which | -0.111 |
Where | -0.105 |
Why | -0.104 |
Which | -0.104 |
Good | -0.104 |
Token | by |
Token ID | 1525 |
Feature activation | +5.31e-01 |
Pos logit contributions | |
arrest | +0.022 |
endant | +0.021 |
av | +0.021 |
� | +0.021 |
jewels | +0.021 |
Neg logit contributions | |
Which | -0.010 |
ash | -0.008 |
Good | -0.008 |
Where | -0.008 |
idget | -0.008 |
Token | was |
Token ID | 373 |
Feature activation | -3.01e-01 |
Pos logit contributions | |
endant | +0.018 |
arrest | +0.018 |
av | +0.018 |
jewels | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.012 |
Good | -0.011 |
Time | -0.011 |
Why | -0.011 |
Clean | -0.011 |
Token | a |
Token ID | 257 |
Feature activation | +6.09e-02 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.007 |
Time | +0.007 |
Why | +0.007 |
Where | +0.007 |
Neg logit contributions | |
endant | -0.010 |
arrest | -0.009 |
jewels | -0.009 |
av | -0.009 |
brace | -0.009 |
Token | j |
Token ID | 474 |
Feature activation | +1.78e+00 |
Pos logit contributions | |
endant | +0.002 |
av | +0.002 |
jewels | +0.002 |
arrest | +0.002 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
ash | -0.002 |
Where | -0.002 |
Token | black |
Token ID | 2042 |
Feature activation | +8.42e-03 |
Pos logit contributions | |
Which | +0.012 |
ash | +0.012 |
idget | +0.012 |
Good | +0.011 |
Time | +0.011 |
Neg logit contributions | |
av | -0.012 |
endant | -0.012 |
jewels | -0.012 |
arrest | -0.011 |
brace | -0.011 |
Token | je |
Token ID | 11223 |
Feature activation | +2.57e+00 |
Pos logit contributions | |
endant | +0.000 |
av | +0.000 |
jewels | +0.000 |
arrest | +0.000 |
brace | +0.000 |
Neg logit contributions | |
Which | -0.000 |
Good | -0.000 |
Time | -0.000 |
Where | -0.000 |
ash | -0.000 |
Token | ep |
Token ID | 538 |
Feature activation | -5.89e-01 |
Pos logit contributions | |
endant | +0.082 |
jewels | +0.081 |
arrest | +0.077 |
av | +0.076 |
brace | +0.074 |
Neg logit contributions | |
Which | -0.059 |
Why | -0.059 |
Time | -0.058 |
Where | -0.058 |
ing | -0.057 |
Token | . |
Token ID | 13 |
Feature activation | +1.58e+00 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.014 |
Time | +0.014 |
ash | +0.013 |
Which | +0.013 |
Neg logit contributions | |
arrest | -0.019 |
endant | -0.018 |
hy | -0.018 |
av | -0.018 |
jewels | -0.018 |
Token | The |
Token ID | 383 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
endant | +0.053 |
aches | +0.049 |
av | +0.049 |
jewels | +0.049 |
brace | +0.049 |
Neg logit contributions | |
Which | -0.038 |
Good | -0.038 |
Time | -0.037 |
Why | -0.037 |
Time | -0.036 |
Token | je |
Token ID | 11223 |
Feature activation | +3.61e+00 |
Pos logit contributions | |
endant | +0.029 |
av | +0.028 |
arrest | +0.027 |
brace | +0.026 |
jewels | +0.026 |
Neg logit contributions | |
Which | -0.035 |
Good | -0.033 |
Where | -0.033 |
Time | -0.033 |
Why | -0.032 |
Token | ep |
Token ID | 538 |
Feature activation | +1.04e+00 |
Pos logit contributions | |
arrest | +0.126 |
endant | +0.125 |
onna | +0.124 |
jewels | +0.123 |
av | +0.122 |
Neg logit contributions | |
Which | -0.068 |
ing | -0.067 |
What | -0.066 |
Where | -0.066 |
ch | -0.064 |
Token | loved |
Token ID | 6151 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
av | +0.041 |
endant | +0.040 |
arrest | +0.040 |
brace | +0.039 |
jewels | +0.039 |
Neg logit contributions | |
Which | -0.017 |
Why | -0.016 |
Where | -0.016 |
Good | -0.016 |
Time | -0.016 |
Token | going |
Token ID | 1016 |
Feature activation | +7.11e-01 |
Pos logit contributions | |
endant | +0.045 |
agged | +0.043 |
arrest | +0.041 |
kins | +0.041 |
aches | +0.040 |
Neg logit contributions | |
Which | -0.022 |
Why | -0.020 |
Where | -0.020 |
Clean | -0.020 |
Time | -0.020 |
Token | on |
Token ID | 319 |
Feature activation | +1.15e+00 |
Pos logit contributions | |
endant | +0.027 |
arrest | +0.025 |
av | +0.025 |
brace | +0.025 |
jewels | +0.024 |
Neg logit contributions | |
Which | -0.015 |
over | -0.014 |
Good | -0.014 |
Time | -0.013 |
Why | -0.013 |
Token | new |
Token ID | 649 |
Feature activation | +1.26e+00 |
Pos logit contributions | |
endant | +0.042 |
agged | +0.040 |
kins | +0.037 |
ocket | +0.036 |
acle | +0.035 |
Neg logit contributions | |
Which | -0.027 |
Time | -0.025 |
Why | -0.025 |
Where | -0.024 |
Good | -0.024 |
Token | Lucy |
Token ID | 22162 |
Feature activation | +2.48e-01 |
Pos logit contributions | |
Which | +0.035 |
ash | +0.035 |
idget | +0.034 |
Time | +0.033 |
Where | +0.033 |
Neg logit contributions | |
endant | -0.034 |
arrest | -0.034 |
av | -0.033 |
jewels | -0.033 |
hy | -0.033 |
Token | was |
Token ID | 373 |
Feature activation | -6.52e-01 |
Pos logit contributions | |
endant | +0.009 |
av | +0.009 |
jewels | +0.009 |
agged | +0.009 |
arrest | +0.009 |
Neg logit contributions | |
Good | -0.004 |
over | -0.004 |
Clean | -0.004 |
Which | -0.004 |
Why | -0.004 |
Token | happy |
Token ID | 3772 |
Feature activation | +9.69e-01 |
Pos logit contributions | |
over | +0.017 |
Good | +0.017 |
Which | +0.016 |
Time | +0.016 |
Why | +0.016 |
Neg logit contributions | |
endant | -0.021 |
av | -0.020 |
jewels | -0.020 |
arrest | -0.019 |
brace | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | -2.22e-01 |
Pos logit contributions | |
endant | +0.028 |
jewels | +0.027 |
av | +0.027 |
arrest | +0.027 |
brace | +0.026 |
Neg logit contributions | |
Which | -0.027 |
Good | -0.026 |
Time | -0.026 |
ash | -0.025 |
idget | -0.025 |
Token | share |
Token ID | 2648 |
Feature activation | +1.12e+00 |
Pos logit contributions | |
Which | +0.005 |
Why | +0.005 |
Where | +0.005 |
Good | +0.005 |
Time | +0.005 |
Neg logit contributions | |
endant | -0.008 |
av | -0.008 |
jewels | -0.007 |
coins | -0.007 |
brace | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | +3.59e+00 |
Pos logit contributions | |
endant | +0.041 |
arrest | +0.037 |
pe | +0.036 |
agged | +0.036 |
hy | +0.036 |
Neg logit contributions | |
Why | -0.025 |
Which | -0.025 |
What | -0.024 |
Where | -0.024 |
over | -0.024 |
Token | jewel |
Token ID | 16927 |
Feature activation | +1.73e+00 |
Pos logit contributions | |
hy | +0.110 |
arrest | +0.108 |
ir | +0.106 |
� | +0.105 |
ink | +0.104 |
Neg logit contributions | |
Which | -0.093 |
Where | -0.088 |
What | -0.087 |
end | -0.087 |
when | -0.086 |
Token | with |
Token ID | 351 |
Feature activation | -1.13e-01 |
Pos logit contributions | |
agged | +0.074 |
endant | +0.072 |
arrest | +0.070 |
hy | +0.068 |
ir | +0.066 |
Neg logit contributions | |
when | -0.030 |
over | -0.026 |
's | -0.020 |
after | -0.019 |
end | -0.018 |
Token | her |
Token ID | 607 |
Feature activation | +2.05e-01 |
Pos logit contributions | |
Which | +0.003 |
Why | +0.003 |
Good | +0.003 |
Where | +0.003 |
Time | +0.003 |
Neg logit contributions | |
endant | -0.004 |
jewels | -0.004 |
arrest | -0.004 |
av | -0.003 |
brace | -0.003 |
Token | friend |
Token ID | 1545 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
endant | +0.008 |
arrest | +0.007 |
agged | +0.007 |
aches | +0.007 |
pe | +0.007 |
Neg logit contributions | |
when | -0.004 |
Which | -0.004 |
Where | -0.004 |
Why | -0.003 |
over | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -1.03e+00 |
Pos logit contributions | |
Which | +0.028 |
Time | +0.027 |
Good | +0.027 |
Where | +0.026 |
ash | +0.026 |
Neg logit contributions | |
endant | -0.031 |
av | -0.030 |
jewels | -0.030 |
arrest | -0.029 |
brace | -0.029 |
Token | said |
Token ID | 531 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
endant | +0.044 |
arrest | +0.042 |
agged | +0.042 |
vern | +0.042 |
av | +0.041 |
Neg logit contributions | |
when | -0.020 |
over | -0.020 |
Why | -0.019 |
Clean | -0.019 |
Good | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | +5.74e-01 |
Pos logit contributions | |
endant | +0.050 |
arrest | +0.047 |
jewels | +0.043 |
agged | +0.042 |
brace | +0.042 |
Neg logit contributions | |
Which | -0.034 |
Good | -0.033 |
over | -0.032 |
Why | -0.032 |
Where | -0.031 |
Token | " |
Token ID | 366 |
Feature activation | +3.85e-01 |
Pos logit contributions | |
endant | +0.022 |
jewels | +0.021 |
av | +0.021 |
arrest | +0.021 |
brace | +0.021 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.010 |
Time | -0.010 |
Why | -0.010 |
Where | -0.010 |
Token | Hello |
Token ID | 15496 |
Feature activation | +1.97e-01 |
Pos logit contributions | |
endant | +0.015 |
av | +0.015 |
arrest | +0.015 |
jewels | +0.015 |
brace | +0.014 |
Neg logit contributions | |
Which | -0.006 |
ash | -0.006 |
idget | -0.006 |
Good | -0.006 |
Time | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | +7.70e-01 |
Pos logit contributions | |
av | +0.004 |
endant | +0.004 |
jewels | +0.004 |
arrest | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.007 |
Time | -0.006 |
ash | -0.006 |
idget | -0.006 |
Good | -0.006 |
Token | Can |
Token ID | 1680 |
Feature activation | +3.58e+00 |
Pos logit contributions | |
endant | +0.027 |
av | +0.026 |
arrest | +0.026 |
jewels | +0.026 |
hy | +0.025 |
Neg logit contributions | |
Which | -0.016 |
ash | -0.015 |
Time | -0.015 |
idget | -0.015 |
Where | -0.014 |
Token | I |
Token ID | 314 |
Feature activation | +1.36e+00 |
Pos logit contributions | |
endant | +0.145 |
jewels | +0.133 |
brace | +0.133 |
agged | +0.132 |
kins | +0.132 |
Neg logit contributions | |
Why | -0.076 |
Which | -0.073 |
Good | -0.072 |
Why | -0.071 |
What | -0.067 |
Token | come |
Token ID | 1282 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
endant | +0.053 |
jewels | +0.051 |
av | +0.051 |
agged | +0.050 |
brace | +0.050 |
Neg logit contributions | |
Which | -0.024 |
over | -0.024 |
Good | -0.024 |
Why | -0.024 |
Time | -0.023 |
Token | in |
Token ID | 287 |
Feature activation | +1.08e+00 |
Pos logit contributions | |
endant | +0.061 |
av | +0.058 |
arrest | +0.058 |
jewels | +0.057 |
brace | +0.056 |
Neg logit contributions | |
Which | -0.038 |
Why | -0.036 |
Good | -0.036 |
over | -0.035 |
Where | -0.034 |
Token | and |
Token ID | 290 |
Feature activation | +3.86e-01 |
Pos logit contributions | |
endant | +0.040 |
brace | +0.037 |
aches | +0.037 |
jewels | +0.037 |
av | +0.036 |
Neg logit contributions | |
Which | -0.025 |
Good | -0.024 |
Why | -0.024 |
over | -0.023 |
Time | -0.022 |
Token | play |
Token ID | 711 |
Feature activation | -5.59e-02 |
Pos logit contributions | |
endant | +0.015 |
agged | +0.014 |
av | +0.014 |
jewels | +0.014 |
brace | +0.014 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.007 |
Why | -0.007 |
Where | -0.007 |
Time | -0.007 |
Token | She |
Token ID | 1375 |
Feature activation | +3.10e-01 |
Pos logit contributions | |
av | +0.035 |
endant | +0.035 |
jewels | +0.033 |
brace | +0.033 |
hy | +0.033 |
Neg logit contributions | |
Which | -0.056 |
ash | -0.054 |
Time | -0.053 |
Good | -0.052 |
Where | -0.052 |
Token | loved |
Token ID | 6151 |
Feature activation | +5.51e-01 |
Pos logit contributions | |
endant | +0.009 |
jewels | +0.009 |
av | +0.009 |
arrest | +0.009 |
brace | +0.009 |
Neg logit contributions | |
Which | -0.008 |
ash | -0.008 |
Good | -0.008 |
Time | -0.008 |
idget | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | +3.11e-01 |
Pos logit contributions | |
endant | +0.018 |
jewels | +0.017 |
arrest | +0.017 |
av | +0.016 |
brace | +0.016 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.013 |
Time | -0.013 |
Why | -0.013 |
Where | -0.013 |
Token | eat |
Token ID | 4483 |
Feature activation | +5.88e-01 |
Pos logit contributions | |
endant | +0.012 |
jewels | +0.011 |
arrest | +0.011 |
av | +0.011 |
agged | +0.011 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.005 |
Time | -0.005 |
Why | -0.005 |
Clean | -0.005 |
Token | av |
Token ID | 1196 |
Feature activation | +1.91e-01 |
Pos logit contributions | |
endant | +0.016 |
arrest | +0.015 |
hy | +0.014 |
jewels | +0.014 |
agged | +0.014 |
Neg logit contributions | |
Which | -0.018 |
Good | -0.017 |
Why | -0.017 |
Time | -0.017 |
ash | -0.016 |
Token | oc |
Token ID | 420 |
Feature activation | +3.58e+00 |
Pos logit contributions | |
endant | +0.006 |
jewels | +0.006 |
arrest | +0.006 |
hy | +0.006 |
av | +0.006 |
Neg logit contributions | |
Which | -0.004 |
Good | -0.004 |
ash | -0.004 |
Time | -0.004 |
Why | -0.004 |
Token | ados |
Token ID | 22484 |
Feature activation | -1.01e+00 |
Pos logit contributions | |
endant | +0.084 |
acle | +0.076 |
kins | +0.073 |
hy | +0.073 |
kin | +0.068 |
Neg logit contributions | |
ting | -0.116 |
ing | -0.111 |
Good | -0.109 |
Which | -0.105 |
ning | -0.102 |
Token | because |
Token ID | 780 |
Feature activation | +1.18e+00 |
Pos logit contributions | |
when | +0.018 |
over | +0.017 |
Why | +0.017 |
Which | +0.016 |
ash | +0.016 |
Neg logit contributions | |
endant | -0.041 |
arrest | -0.040 |
agged | -0.038 |
hy | -0.037 |
jewels | -0.037 |
Token | they |
Token ID | 484 |
Feature activation | +6.61e-01 |
Pos logit contributions | |
endant | +0.040 |
arrest | +0.038 |
hy | +0.036 |
agged | +0.035 |
brace | +0.034 |
Neg logit contributions | |
Which | -0.033 |
Why | -0.030 |
Where | -0.029 |
Which | -0.028 |
What | -0.028 |
Token | were |
Token ID | 547 |
Feature activation | +1.78e-01 |
Pos logit contributions | |
endant | +0.023 |
arrest | +0.022 |
agged | +0.021 |
hy | +0.021 |
brace | +0.020 |
Neg logit contributions | |
Why | -0.016 |
Which | -0.015 |
Where | -0.014 |
What | -0.014 |
over | -0.013 |
Token | green |
Token ID | 4077 |
Feature activation | +4.87e-01 |
Pos logit contributions | |
endant | +0.007 |
arrest | +0.006 |
hy | +0.006 |
agged | +0.006 |
acle | +0.006 |
Neg logit contributions | |
Which | -0.004 |
Why | -0.004 |
Where | -0.004 |
over | -0.004 |
when | -0.004 |
Token | thin |
Token ID | 7888 |
Feature activation | +1.06e-01 |
Pos logit contributions | |
Which | +0.006 |
ash | +0.006 |
Good | +0.005 |
idget | +0.005 |
Time | +0.005 |
Neg logit contributions | |
endant | -0.006 |
av | -0.006 |
jewels | -0.006 |
arrest | -0.006 |
brace | -0.006 |
Token | par |
Token ID | 1582 |
Feature activation | +2.17e+00 |
Pos logit contributions | |
endant | +0.004 |
arrest | +0.003 |
jewels | +0.003 |
av | +0.003 |
brace | +0.003 |
Neg logit contributions | |
Which | -0.003 |
Good | -0.002 |
Time | -0.002 |
Why | -0.002 |
ash | -0.002 |
Token | rot |
Token ID | 10599 |
Feature activation | -5.45e-01 |
Pos logit contributions | |
jewels | +0.062 |
av | +0.058 |
endant | +0.058 |
arrest | +0.057 |
coins | +0.057 |
Neg logit contributions | |
ing | -0.056 |
ch | -0.054 |
idget | -0.054 |
Time | -0.053 |
ash | -0.053 |
Token | . |
Token ID | 13 |
Feature activation | +2.72e+00 |
Pos logit contributions | |
Which | +0.018 |
Time | +0.017 |
Good | +0.017 |
Ready | +0.017 |
idget | +0.017 |
Neg logit contributions | |
endant | -0.013 |
arrest | -0.013 |
av | -0.013 |
jewels | -0.013 |
brace | -0.012 |
Token | The |
Token ID | 383 |
Feature activation | +1.70e+00 |
Pos logit contributions | |
endant | +0.107 |
aches | +0.105 |
vern | +0.103 |
coins | +0.100 |
arrest | +0.100 |
Neg logit contributions | |
Where | -0.052 |
Time | -0.051 |
Good | -0.051 |
Why | -0.050 |
Why | -0.049 |
Token | par |
Token ID | 1582 |
Feature activation | +3.56e+00 |
Pos logit contributions | |
av | +0.050 |
agged | +0.049 |
endant | +0.049 |
arrest | +0.047 |
aches | +0.047 |
Neg logit contributions | |
Which | -0.044 |
Where | -0.043 |
Time | -0.041 |
What | -0.041 |
Why | -0.041 |
Token | rot |
Token ID | 10599 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
breath | +0.123 |
hips | +0.119 |
jewels | +0.115 |
av | +0.114 |
arrest | +0.113 |
Neg logit contributions | |
ing | -0.067 |
ch | -0.065 |
Where | -0.064 |
Which | -0.062 |
V | -0.062 |
Token | liked |
Token ID | 8288 |
Feature activation | +1.60e+00 |
Pos logit contributions | |
arrest | +0.043 |
endant | +0.042 |
av | +0.041 |
jewels | +0.040 |
agged | +0.039 |
Neg logit contributions | |
Which | -0.022 |
Why | -0.021 |
Good | -0.020 |
Clean | -0.020 |
Where | -0.019 |
Token | to |
Token ID | 284 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
endant | +0.071 |
kins | +0.067 |
� | +0.067 |
agged | +0.066 |
ink | +0.066 |
Neg logit contributions | |
Which | -0.023 |
Why | -0.023 |
when | -0.022 |
over | -0.021 |
Where | -0.020 |
Token | fly |
Token ID | 6129 |
Feature activation | +1.01e+00 |
Pos logit contributions | |
endant | +0.059 |
agged | +0.053 |
ls | +0.052 |
� | +0.052 |
av | +0.051 |
Neg logit contributions | |
Why | -0.020 |
jazz | -0.019 |
rhythm | -0.019 |
end | -0.019 |
over | -0.019 |
Token | around |
Token ID | 1088 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
arrest | +0.040 |
endant | +0.040 |
� | +0.038 |
av | +0.036 |
mm | +0.035 |
Neg logit contributions | |
over | -0.024 |
when | -0.022 |
across | -0.020 |
Why | -0.019 |
Which | -0.018 |
Token | to |
Token ID | 284 |
Feature activation | +8.90e-01 |
Pos logit contributions | |
endant | +0.010 |
jewels | +0.010 |
av | +0.009 |
arrest | +0.009 |
brace | +0.009 |
Neg logit contributions | |
Which | -0.007 |
Good | -0.007 |
Time | -0.006 |
Why | -0.006 |
Clean | -0.006 |
Token | enjoy |
Token ID | 2883 |
Feature activation | +6.68e-01 |
Pos logit contributions | |
endant | +0.035 |
jewels | +0.032 |
av | +0.032 |
agged | +0.031 |
arrest | +0.030 |
Neg logit contributions | |
Which | -0.017 |
Why | -0.017 |
Good | -0.017 |
Time | -0.016 |
Time | -0.016 |
Token | eating |
Token ID | 6600 |
Feature activation | +1.27e+00 |
Pos logit contributions | |
endant | +0.024 |
hy | +0.021 |
agged | +0.021 |
arrest | +0.021 |
jewels | +0.020 |
Neg logit contributions | |
Which | -0.016 |
Why | -0.016 |
Good | -0.015 |
What | -0.015 |
Time | -0.015 |
Token | her |
Token ID | 607 |
Feature activation | +8.08e-01 |
Pos logit contributions | |
endant | +0.043 |
arrest | +0.040 |
hy | +0.038 |
agged | +0.038 |
jewels | +0.035 |
Neg logit contributions | |
Which | -0.030 |
Why | -0.029 |
Good | -0.029 |
when | -0.028 |
Time | -0.028 |
Token | av |
Token ID | 1196 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
endant | +0.025 |
arrest | +0.024 |
hy | +0.023 |
av | +0.023 |
agged | +0.023 |
Neg logit contributions | |
Which | -0.019 |
Good | -0.018 |
ash | -0.018 |
when | -0.017 |
Time | -0.017 |
Token | oc |
Token ID | 420 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
endant | +0.019 |
jewels | +0.018 |
arrest | +0.018 |
alo | +0.018 |
hy | +0.018 |
Neg logit contributions | |
ash | -0.008 |
Which | -0.008 |
Good | -0.007 |
ch | -0.007 |
ing | -0.007 |
Token | ados |
Token ID | 22484 |
Feature activation | -4.81e-01 |
Pos logit contributions | |
endant | +0.079 |
jewels | +0.069 |
acle | +0.067 |
hy | +0.065 |
onna | +0.065 |
Neg logit contributions | |
ting | -0.110 |
ing | -0.110 |
ning | -0.105 |
ash | -0.105 |
fl | -0.102 |
Token | with |
Token ID | 351 |
Feature activation | +1.23e-01 |
Pos logit contributions | |
when | +0.009 |
over | +0.008 |
Why | +0.007 |
ing | +0.007 |
ash | +0.006 |
Neg logit contributions | |
endant | -0.020 |
arrest | -0.019 |
agged | -0.019 |
hy | -0.018 |
jewels | -0.017 |
Token | a |
Token ID | 257 |
Feature activation | +3.17e-01 |
Pos logit contributions | |
endant | +0.005 |
arrest | +0.004 |
agged | +0.004 |
jewels | +0.004 |
hy | +0.004 |
Neg logit contributions | |
Why | -0.003 |
Which | -0.003 |
Where | -0.003 |
Time | -0.003 |
Good | -0.003 |
Token | smile |
Token ID | 8212 |
Feature activation | -6.86e-01 |
Pos logit contributions | |
endant | +0.008 |
agged | +0.007 |
arrest | +0.007 |
av | +0.007 |
jewels | +0.007 |
Neg logit contributions | |
Which | -0.010 |
Time | -0.010 |
Where | -0.010 |
Good | -0.010 |
Why | -0.009 |
Token | on |
Token ID | 319 |
Feature activation | +7.90e-02 |
Pos logit contributions | |
Which | +0.019 |
Good | +0.018 |
Time | +0.018 |
Where | +0.017 |
ash | +0.017 |
Neg logit contributions | |
endant | -0.020 |
av | -0.020 |
jewels | -0.020 |
arrest | -0.019 |
brace | -0.019 |
Token | and |
Token ID | 290 |
Feature activation | -2.53e-01 |
Pos logit contributions | |
Which | +0.024 |
Time | +0.024 |
Good | +0.023 |
Where | +0.023 |
idget | +0.023 |
Neg logit contributions | |
av | -0.014 |
jewels | -0.014 |
brace | -0.013 |
endant | -0.013 |
coins | -0.013 |
Token | decided |
Token ID | 3066 |
Feature activation | +3.35e-02 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.006 |
ash | +0.006 |
Time | +0.006 |
idget | +0.006 |
Neg logit contributions | |
endant | -0.008 |
jewels | -0.008 |
av | -0.008 |
arrest | -0.007 |
brace | -0.007 |
Token | to |
Token ID | 284 |
Feature activation | +9.16e-02 |
Pos logit contributions | |
endant | +0.001 |
av | +0.001 |
arrest | +0.001 |
jewels | +0.001 |
brace | +0.001 |
Neg logit contributions | |
Which | -0.001 |
Good | -0.001 |
Why | -0.001 |
Where | -0.001 |
Time | -0.001 |
Token | share |
Token ID | 2648 |
Feature activation | +9.45e-01 |
Pos logit contributions | |
endant | +0.004 |
av | +0.003 |
jewels | +0.003 |
agged | +0.003 |
brace | +0.003 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
Time | -0.002 |
Why | -0.002 |
Token | her |
Token ID | 607 |
Feature activation | +2.14e+00 |
Pos logit contributions | |
endant | +0.031 |
arrest | +0.030 |
hy | +0.029 |
agged | +0.028 |
av | +0.028 |
Neg logit contributions | |
Which | -0.024 |
What | -0.023 |
Why | -0.023 |
Where | -0.023 |
Good | -0.022 |
Token | je |
Token ID | 11223 |
Feature activation | +3.52e+00 |
Pos logit contributions | |
arrest | +0.061 |
av | +0.060 |
agged | +0.060 |
endant | +0.058 |
acle | +0.058 |
Neg logit contributions | |
Which | -0.055 |
Where | -0.050 |
Good | -0.050 |
Which | -0.049 |
What | -0.049 |
Token | ep |
Token ID | 538 |
Feature activation | +1.28e+00 |
Pos logit contributions | |
endant | +0.120 |
av | +0.120 |
� | +0.118 |
jewels | +0.118 |
arrest | +0.118 |
Neg logit contributions | |
Which | -0.070 |
V | -0.066 |
ch | -0.064 |
Where | -0.064 |
ash | -0.064 |
Token | with |
Token ID | 351 |
Feature activation | -5.14e-02 |
Pos logit contributions | |
endant | +0.043 |
av | +0.041 |
arrest | +0.040 |
jewels | +0.040 |
brace | +0.037 |
Neg logit contributions | |
Which | -0.030 |
ash | -0.029 |
Why | -0.029 |
Where | -0.028 |
over | -0.028 |
Token | Max |
Token ID | 5436 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Why | +0.001 |
Where | +0.001 |
Neg logit contributions | |
endant | -0.002 |
av | -0.002 |
jewels | -0.002 |
arrest | -0.002 |
brace | -0.002 |
Token | . |
Token ID | 13 |
Feature activation | -6.15e-01 |
Pos logit contributions | |
Which | +0.015 |
Time | +0.014 |
Good | +0.014 |
Ready | +0.013 |
Where | +0.013 |
Neg logit contributions | |
av | -0.017 |
jewels | -0.017 |
endant | -0.017 |
brace | -0.016 |
coins | -0.016 |
Token | They |
Token ID | 1119 |
Feature activation | +9.66e-01 |
Pos logit contributions | |
Which | +0.019 |
ash | +0.018 |
Time | +0.018 |
Where | +0.017 |
Good | +0.017 |
Neg logit contributions | |
arrest | -0.016 |
endant | -0.015 |
brace | -0.015 |
av | -0.015 |
jewels | -0.015 |
Token | she |
Token ID | 673 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
endant | +0.005 |
arrest | +0.005 |
av | +0.005 |
agged | +0.005 |
jewels | +0.005 |
Neg logit contributions | |
when | -0.003 |
Why | -0.003 |
over | -0.002 |
Where | -0.002 |
Which | -0.002 |
Token | wanted |
Token ID | 2227 |
Feature activation | -5.29e-02 |
Pos logit contributions | |
Which | +0.004 |
Why | +0.004 |
over | +0.004 |
Where | +0.004 |
Good | +0.003 |
Neg logit contributions | |
endant | -0.007 |
av | -0.007 |
arrest | -0.007 |
jewels | -0.006 |
agged | -0.006 |
Token | to |
Token ID | 284 |
Feature activation | -3.98e-02 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Where | +0.001 |
Why | +0.001 |
Neg logit contributions | |
endant | -0.002 |
arrest | -0.002 |
jewels | -0.002 |
av | -0.002 |
brace | -0.002 |
Token | keep |
Token ID | 1394 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
Which | +0.001 |
Why | +0.001 |
Good | +0.001 |
Time | +0.001 |
Time | +0.001 |
Neg logit contributions | |
endant | -0.001 |
jewels | -0.001 |
av | -0.001 |
agged | -0.001 |
coins | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
endant | +0.038 |
arrest | +0.035 |
jewels | +0.035 |
av | +0.035 |
hy | +0.034 |
Neg logit contributions | |
Which | -0.031 |
Good | -0.030 |
Why | -0.029 |
Where | -0.029 |
Time | -0.029 |
Token | par |
Token ID | 1582 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
av | +0.032 |
agged | +0.031 |
endant | +0.030 |
kins | +0.029 |
arrest | +0.029 |
Neg logit contributions | |
Which | -0.029 |
Where | -0.028 |
Good | -0.028 |
Time | -0.028 |
Why | -0.028 |
Token | rot |
Token ID | 10599 |
Feature activation | +5.56e-01 |
Pos logit contributions | |
jewels | +0.111 |
av | +0.105 |
coins | +0.103 |
arrest | +0.099 |
endant | +0.095 |
Neg logit contributions | |
ing | -0.082 |
ch | -0.080 |
tap | -0.075 |
Where | -0.074 |
Which | -0.072 |
Token | all |
Token ID | 477 |
Feature activation | -5.85e-01 |
Pos logit contributions | |
endant | +0.021 |
arrest | +0.020 |
av | +0.020 |
jewels | +0.019 |
agged | +0.019 |
Neg logit contributions | |
Which | -0.011 |
ash | -0.010 |
Good | -0.010 |
over | -0.010 |
Where | -0.010 |
Token | for |
Token ID | 329 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
Which | +0.014 |
Good | +0.014 |
Time | +0.013 |
Where | +0.013 |
Why | +0.013 |
Neg logit contributions | |
endant | -0.019 |
av | -0.019 |
jewels | -0.019 |
arrest | -0.018 |
brace | -0.018 |
Token | herself |
Token ID | 5223 |
Feature activation | -4.01e-01 |
Pos logit contributions | |
endant | +0.037 |
hy | +0.032 |
agged | +0.032 |
av | +0.031 |
jewels | +0.031 |
Neg logit contributions | |
Where | -0.024 |
Why | -0.023 |
Time | -0.023 |
What | -0.023 |
Which | -0.023 |
Token | , |
Token ID | 11 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.007 |
ash | +0.006 |
Why | +0.006 |
Time | +0.006 |
Neg logit contributions | |
endant | -0.016 |
arrest | -0.015 |
av | -0.015 |
jewels | -0.015 |
brace | -0.014 |
Token | Yes |
Token ID | 5297 |
Feature activation | +5.01e-01 |
Pos logit contributions | |
Which | +0.023 |
idget | +0.023 |
ash | +0.023 |
Good | +0.022 |
Clean | +0.021 |
Neg logit contributions | |
endant | -0.033 |
arrest | -0.033 |
hy | -0.033 |
pe | -0.032 |
jewels | -0.032 |
Token | ! |
Token ID | 0 |
Feature activation | +8.91e-01 |
Pos logit contributions | |
endant | +0.014 |
av | +0.013 |
jewels | +0.013 |
arrest | +0.013 |
brace | +0.013 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.014 |
Time | -0.014 |
ash | -0.014 |
Why | -0.014 |
Token | I |
Token ID | 314 |
Feature activation | +4.03e-01 |
Pos logit contributions | |
endant | +0.030 |
av | +0.029 |
jewels | +0.029 |
arrest | +0.029 |
brace | +0.028 |
Neg logit contributions | |
Which | -0.020 |
Time | -0.019 |
ash | -0.018 |
idget | -0.018 |
Where | -0.018 |
Token | am |
Token ID | 716 |
Feature activation | -1.21e-01 |
Pos logit contributions | |
endant | +0.014 |
av | +0.014 |
jewels | +0.014 |
arrest | +0.014 |
brace | +0.013 |
Neg logit contributions | |
Which | -0.009 |
Good | -0.008 |
Time | -0.008 |
ash | -0.008 |
Why | -0.008 |
Token | the |
Token ID | 262 |
Feature activation | +1.05e+00 |
Pos logit contributions | |
Good | +0.003 |
Which | +0.003 |
Time | +0.003 |
Time | +0.003 |
Why | +0.003 |
Neg logit contributions | |
endant | -0.004 |
arrest | -0.004 |
av | -0.004 |
jewels | -0.004 |
brace | -0.004 |
Token | cle |
Token ID | 1190 |
Feature activation | +3.51e+00 |
Pos logit contributions | |
endant | +0.031 |
arrest | +0.031 |
agged | +0.029 |
av | +0.028 |
hy | +0.028 |
Neg logit contributions | |
Which | -0.029 |
Good | -0.028 |
Why | -0.027 |
Where | -0.027 |
Time | -0.027 |
Token | ve |
Token ID | 303 |
Feature activation | +6.77e-01 |
Pos logit contributions | |
arrest | +0.089 |
jewels | +0.083 |
brace | +0.082 |
endant | +0.081 |
av | +0.080 |
Neg logit contributions | |
ash | -0.100 |
ing | -0.098 |
ray | -0.097 |
Not | -0.095 |
Time | -0.095 |
Token | rest |
Token ID | 2118 |
Feature activation | +3.76e-01 |
Pos logit contributions | |
endant | +0.024 |
av | +0.022 |
arrest | +0.022 |
brace | +0.022 |
� | +0.022 |
Neg logit contributions | |
ash | -0.015 |
over | -0.015 |
Good | -0.014 |
Which | -0.014 |
Time | -0.014 |
Token | crystal |
Token ID | 15121 |
Feature activation | +5.29e-02 |
Pos logit contributions | |
endant | +0.011 |
av | +0.010 |
arrest | +0.010 |
jewels | +0.010 |
brace | +0.010 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.010 |
Time | -0.010 |
ash | -0.010 |
Where | -0.010 |
Token | ever |
Token ID | 1683 |
Feature activation | -5.93e-01 |
Pos logit contributions | |
endant | +0.002 |
arrest | +0.002 |
av | +0.002 |
agged | +0.002 |
jewels | +0.002 |
Neg logit contributions | |
Which | -0.001 |
Good | -0.001 |
ash | -0.001 |
Why | -0.001 |
Time | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | +6.88e-02 |
Pos logit contributions | |
Which | +0.019 |
idget | +0.017 |
Good | +0.017 |
Time | +0.017 |
Where | +0.017 |
Neg logit contributions | |
endant | -0.015 |
jewels | -0.015 |
av | -0.015 |
arrest | -0.014 |
brace | -0.014 |
Token | . |
Token ID | 13 |
Feature activation | -2.48e-02 |
Pos logit contributions | |
endant | +0.029 |
av | +0.028 |
jewels | +0.028 |
arrest | +0.027 |
brace | +0.026 |
Neg logit contributions | |
Which | -0.019 |
ash | -0.019 |
Good | -0.018 |
Why | -0.018 |
Time | -0.018 |
Token | They |
Token ID | 1119 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Which | +0.001 |
Time | +0.001 |
Good | +0.001 |
ash | +0.001 |
idget | +0.001 |
Neg logit contributions | |
endant | -0.001 |
av | -0.001 |
jewels | -0.001 |
arrest | -0.001 |
brace | -0.001 |
Token | look |
Token ID | 804 |
Feature activation | -4.09e-01 |
Pos logit contributions | |
endant | +0.010 |
agged | +0.010 |
av | +0.010 |
vern | +0.009 |
jewels | +0.009 |
Neg logit contributions | |
Why | -0.005 |
over | -0.005 |
What | -0.004 |
Ready | -0.004 |
Which | -0.004 |
Token | inside |
Token ID | 2641 |
Feature activation | -5.03e-01 |
Pos logit contributions | |
Which | +0.011 |
Time | +0.011 |
Good | +0.010 |
Where | +0.010 |
Why | +0.010 |
Neg logit contributions | |
endant | -0.013 |
jewels | -0.013 |
av | -0.012 |
brace | -0.012 |
coins | -0.012 |
Token | the |
Token ID | 262 |
Feature activation | +1.82e+00 |
Pos logit contributions | |
Which | +0.012 |
Good | +0.011 |
Time | +0.011 |
Why | +0.011 |
Where | +0.011 |
Neg logit contributions | |
endant | -0.017 |
arrest | -0.016 |
av | -0.016 |
jewels | -0.016 |
brace | -0.016 |
Token | je |
Token ID | 11223 |
Feature activation | +3.50e+00 |
Pos logit contributions | |
agged | +0.051 |
endant | +0.050 |
arrest | +0.050 |
aches | +0.049 |
av | +0.048 |
Neg logit contributions | |
Which | -0.050 |
Where | -0.048 |
Good | -0.047 |
Time | -0.046 |
Why | -0.046 |
Token | ep |
Token ID | 538 |
Feature activation | +7.32e-01 |
Pos logit contributions | |
onna | +0.125 |
arrest | +0.123 |
� | +0.123 |
av | +0.123 |
jewels | +0.122 |
Neg logit contributions | |
ing | -0.058 |
Which | -0.057 |
ash | -0.054 |
ch | -0.053 |
stations | -0.052 |
Token | . |
Token ID | 13 |
Feature activation | +1.74e-01 |
Pos logit contributions | |
endant | +0.027 |
av | +0.026 |
jewels | +0.026 |
arrest | +0.026 |
brace | +0.025 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.014 |
Time | -0.014 |
ash | -0.013 |
Where | -0.013 |
Token | They |
Token ID | 1119 |
Feature activation | +4.15e-01 |
Pos logit contributions | |
endant | +0.006 |
jewels | +0.006 |
av | +0.006 |
arrest | +0.005 |
brace | +0.005 |
Neg logit contributions | |
Which | -0.004 |
ash | -0.004 |
Time | -0.004 |
Good | -0.004 |
idget | -0.004 |
Token | see |
Token ID | 766 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
agged | +0.018 |
endant | +0.017 |
av | +0.017 |
vern | +0.016 |
mm | +0.015 |
Neg logit contributions | |
over | -0.006 |
Why | -0.006 |
Ready | -0.006 |
What | -0.005 |
why | -0.005 |
Token | a |
Token ID | 257 |
Feature activation | +1.17e+00 |
Pos logit contributions | |
Which | +0.014 |
Where | +0.013 |
Good | +0.013 |
Why | +0.013 |
Time | +0.012 |
Neg logit contributions | |
endant | -0.017 |
arrest | -0.017 |
av | -0.017 |
agged | -0.016 |
jewels | -0.016 |
Token | he |
Token ID | 339 |
Feature activation | +7.73e-01 |
Pos logit contributions | |
endant | +0.017 |
arrest | +0.016 |
agged | +0.016 |
av | +0.015 |
brace | +0.014 |
Neg logit contributions | |
Good | -0.015 |
Which | -0.015 |
over | -0.014 |
Where | -0.014 |
Time | -0.014 |
Token | had |
Token ID | 550 |
Feature activation | +2.30e-01 |
Pos logit contributions | |
endant | +0.029 |
av | +0.028 |
arrest | +0.027 |
brace | +0.026 |
agged | +0.026 |
Neg logit contributions | |
Where | -0.016 |
Why | -0.015 |
Which | -0.015 |
Good | -0.015 |
over | -0.015 |
Token | made |
Token ID | 925 |
Feature activation | +2.83e-01 |
Pos logit contributions | |
endant | +0.008 |
av | +0.008 |
arrest | +0.007 |
jewels | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Where | -0.005 |
Time | -0.005 |
Which | -0.005 |
over | -0.005 |
when | -0.005 |
Token | the |
Token ID | 262 |
Feature activation | +1.24e+00 |
Pos logit contributions | |
endant | +0.010 |
arrest | +0.009 |
av | +0.009 |
jewels | +0.009 |
agged | +0.009 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.006 |
Time | -0.006 |
Where | -0.006 |
over | -0.006 |
Token | reliable |
Token ID | 9314 |
Feature activation | +1.83e+00 |
Pos logit contributions | |
endant | +0.038 |
agged | +0.037 |
arrest | +0.036 |
av | +0.036 |
aches | +0.034 |
Neg logit contributions | |
Which | -0.030 |
Where | -0.030 |
Why | -0.029 |
Good | -0.029 |
Ready | -0.028 |
Token | par |
Token ID | 1582 |
Feature activation | +3.49e+00 |
Pos logit contributions | |
agged | +0.057 |
endant | +0.054 |
� | +0.053 |
av | +0.052 |
arrest | +0.052 |
Neg logit contributions | |
Which | -0.042 |
Time | -0.041 |
Good | -0.041 |
end | -0.041 |
Where | -0.040 |
Token | rot |
Token ID | 10599 |
Feature activation | +8.47e-01 |
Pos logit contributions | |
jewels | +0.110 |
av | +0.108 |
arrest | +0.105 |
endant | +0.101 |
coins | +0.101 |
Neg logit contributions | |
ing | -0.076 |
ch | -0.074 |
Where | -0.070 |
Which | -0.068 |
who | -0.066 |
Token | so |
Token ID | 523 |
Feature activation | +1.44e+00 |
Pos logit contributions | |
endant | +0.032 |
arrest | +0.031 |
agged | +0.031 |
av | +0.031 |
jewels | +0.030 |
Neg logit contributions | |
Which | -0.015 |
over | -0.014 |
Good | -0.014 |
when | -0.014 |
ash | -0.013 |
Token | happy |
Token ID | 3772 |
Feature activation | +5.02e-01 |
Pos logit contributions | |
arrest | +0.048 |
endant | +0.048 |
agged | +0.046 |
av | +0.045 |
pe | +0.045 |
Neg logit contributions | |
when | -0.031 |
Good | -0.030 |
Which | -0.029 |
ing | -0.029 |
Where | -0.028 |
Token | . |
Token ID | 13 |
Feature activation | +3.11e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
av | +0.018 |
jewels | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.010 |
Good | -0.009 |
Why | -0.009 |
Time | -0.009 |
Where | -0.009 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -8.44e-02 |
Pos logit contributions | |
endant | +0.011 |
jewels | +0.011 |
av | +0.011 |
brace | +0.011 |
arrest | +0.011 |
Neg logit contributions | |
Good | -0.007 |
Which | -0.007 |
Time | -0.006 |
Time | -0.006 |
Where | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | -2.18e+00 |
Pos logit contributions | |
Which | +0.033 |
Good | +0.031 |
Time | +0.030 |
Where | +0.029 |
ash | +0.029 |
Neg logit contributions | |
endant | -0.047 |
av | -0.046 |
jewels | -0.046 |
arrest | -0.045 |
brace | -0.044 |
Token |
|
Token ID | 198 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
rated | +0.079 |
ksh | +0.074 |
louder | +0.072 |
Where | +0.072 |
ash | +0.072 |
Neg logit contributions | |
� | -0.037 |
endant | -0.036 |
hy | -0.033 |
brace | -0.031 |
ir | -0.031 |
Token |
|
Token ID | 198 |
Feature activation | -1.83e+00 |
Pos logit contributions | |
ksh | +0.048 |
Which | +0.048 |
rated | +0.047 |
ash | +0.047 |
Good | +0.047 |
Neg logit contributions | |
endant | -0.035 |
pe | -0.034 |
arrest | -0.034 |
av | -0.033 |
ir | -0.032 |
Token | One |
Token ID | 3198 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
ksh | +0.061 |
rated | +0.060 |
Good | +0.056 |
idget | +0.056 |
ash | +0.055 |
Neg logit contributions | |
pe | -0.035 |
ink | -0.035 |
ir | -0.035 |
high | -0.032 |
brace | -0.031 |
Token | day |
Token ID | 1110 |
Feature activation | -2.23e+00 |
Pos logit contributions | |
Which | +0.043 |
Ready | +0.042 |
idget | +0.042 |
stations | +0.041 |
Where | +0.040 |
Neg logit contributions | |
hy | -0.041 |
high | -0.040 |
av | -0.040 |
jewels | -0.040 |
endant | -0.039 |
Token | , |
Token ID | 11 |
Feature activation | -3.67e+00 |
Pos logit contributions | |
ksh | +0.106 |
rated | +0.101 |
ash | +0.101 |
Which | +0.100 |
Ready | +0.100 |
Neg logit contributions | |
itched | -0.015 |
jewels | -0.015 |
ink | -0.014 |
brace | -0.013 |
arrest | -0.013 |
Token | Angela |
Token ID | 17799 |
Feature activation | -1.66e+00 |
Pos logit contributions | |
ash | +0.099 |
Good | +0.097 |
ksh | +0.096 |
Which | +0.092 |
Ready | +0.092 |
Neg logit contributions | |
jewels | -0.093 |
brace | -0.091 |
breath | -0.091 |
arrest | -0.091 |
kins | -0.088 |
Token | stayed |
Token ID | 9658 |
Feature activation | +4.94e-01 |
Pos logit contributions | |
Which | +0.036 |
Good | +0.034 |
Time | +0.033 |
Where | +0.032 |
Why | +0.032 |
Neg logit contributions | |
endant | -0.059 |
av | -0.057 |
jewels | -0.057 |
arrest | -0.057 |
brace | -0.055 |
Token | up |
Token ID | 510 |
Feature activation | +8.38e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
av | +0.017 |
jewels | +0.017 |
hy | +0.017 |
Neg logit contributions | |
Which | -0.010 |
Why | -0.009 |
Time | -0.009 |
Where | -0.009 |
over | -0.009 |
Token | past |
Token ID | 1613 |
Feature activation | -3.48e-01 |
Pos logit contributions | |
endant | +0.034 |
jewels | +0.031 |
brace | +0.031 |
arrest | +0.030 |
hy | +0.030 |
Neg logit contributions | |
when | -0.017 |
over | -0.016 |
Why | -0.016 |
Which | -0.015 |
Time | -0.015 |
Token | her |
Token ID | 607 |
Feature activation | -1.26e+00 |
Pos logit contributions | |
Which | +0.009 |
Why | +0.009 |
idget | +0.009 |
ash | +0.009 |
Good | +0.009 |
Neg logit contributions | |
endant | -0.011 |
arrest | -0.010 |
jewels | -0.010 |
av | -0.010 |
hy | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | -3.52e-01 |
Pos logit contributions | |
Which | +0.013 |
ash | +0.012 |
Good | +0.012 |
idget | +0.012 |
Why | +0.012 |
Neg logit contributions | |
endant | -0.013 |
arrest | -0.013 |
jewels | -0.012 |
av | -0.012 |
pe | -0.012 |
Token | " |
Token ID | 1 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
idget | +0.012 |
ash | +0.011 |
Good | +0.011 |
Which | +0.011 |
ksh | +0.011 |
Neg logit contributions | |
hy | -0.007 |
arrest | -0.007 |
pe | -0.007 |
aches | -0.007 |
coins | -0.007 |
Token | Let |
Token ID | 5756 |
Feature activation | -3.50e-01 |
Pos logit contributions | |
exception | +0.044 |
ash | +0.044 |
idget | +0.043 |
rated | +0.041 |
rhythms | +0.038 |
Neg logit contributions | |
Jerry | -0.045 |
pe | -0.043 |
Chuck | -0.043 |
brace | -0.040 |
cores | -0.040 |
Token | 's |
Token ID | 338 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
Which | +0.008 |
idget | +0.008 |
ash | +0.008 |
Where | +0.008 |
stations | +0.007 |
Neg logit contributions | |
arrest | -0.011 |
av | -0.011 |
brace | -0.011 |
aches | -0.010 |
coins | -0.010 |
Token | pretend |
Token ID | 16614 |
Feature activation | +2.38e-01 |
Pos logit contributions | |
Which | +0.036 |
Time | +0.034 |
Good | +0.034 |
ash | +0.033 |
Where | +0.033 |
Neg logit contributions | |
arrest | -0.041 |
endant | -0.040 |
av | -0.040 |
jewels | -0.039 |
aches | -0.038 |
Token | the |
Token ID | 262 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
endant | +0.007 |
av | +0.006 |
jewels | +0.006 |
arrest | +0.006 |
brace | +0.006 |
Neg logit contributions | |
Which | -0.007 |
Good | -0.007 |
Time | -0.007 |
Where | -0.006 |
ash | -0.006 |
Token | m |
Token ID | 285 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
idget | +0.123 |
rated | +0.118 |
Kids | +0.115 |
ashing | +0.115 |
ash | +0.115 |
Neg logit contributions | |
pe | -0.072 |
coins | -0.070 |
ladder | -0.064 |
spe | -0.062 |
cones | -0.061 |
Token | op |
Token ID | 404 |
Feature activation | -7.79e-01 |
Pos logit contributions | |
Which | +0.057 |
Ready | +0.054 |
Where | +0.053 |
Time | +0.053 |
Good | +0.051 |
Neg logit contributions | |
endant | -0.037 |
pe | -0.036 |
ink | -0.035 |
� | -0.035 |
arrest | -0.034 |
Token | is |
Token ID | 318 |
Feature activation | -1.78e+00 |
Pos logit contributions | |
Which | +0.016 |
Good | +0.016 |
ash | +0.016 |
Why | +0.015 |
Time | +0.015 |
Neg logit contributions | |
endant | -0.028 |
arrest | -0.027 |
av | -0.026 |
jewels | -0.026 |
brace | -0.026 |
Token | a |
Token ID | 257 |
Feature activation | -2.50e+00 |
Pos logit contributions | |
Which | +0.054 |
Good | +0.051 |
Time | +0.051 |
idget | +0.050 |
ash | +0.050 |
Neg logit contributions | |
jewels | -0.047 |
endant | -0.047 |
av | -0.047 |
arrest | -0.045 |
brace | -0.043 |
Token | horse |
Token ID | 8223 |
Feature activation | +6.66e-01 |
Pos logit contributions | |
idget | +0.086 |
ash | +0.082 |
Which | +0.079 |
ting | +0.078 |
rated | +0.078 |
Neg logit contributions | |
jewels | -0.056 |
coins | -0.054 |
crown | -0.054 |
av | -0.054 |
nut | -0.053 |
Token |
|
Token ID | 198 |
Feature activation | +4.19e-01 |
Pos logit contributions | |
ash | +0.018 |
Which | +0.018 |
stations | +0.017 |
idget | +0.017 |
rated | +0.017 |
Neg logit contributions | |
endant | -0.014 |
av | -0.014 |
jewels | -0.013 |
� | -0.012 |
brace | -0.011 |
Token |
|
Token ID | 198 |
Feature activation | +5.29e-01 |
Pos logit contributions | |
endant | +0.011 |
av | +0.011 |
jewels | +0.010 |
arrest | +0.010 |
pe | +0.010 |
Neg logit contributions | |
ash | -0.012 |
Which | -0.012 |
stations | -0.011 |
ksh | -0.011 |
idget | -0.011 |
Token | â |
Token ID | 22940 |
Feature activation | -1.13e+00 |
Pos logit contributions | |
endant | +0.013 |
av | +0.012 |
jewels | +0.012 |
arrest | +0.011 |
pe | +0.011 |
Neg logit contributions | |
ash | -0.016 |
idget | -0.016 |
stations | -0.016 |
Which | -0.015 |
ksh | -0.015 |
Token | € |
Token ID | 26391 |
Feature activation | -1.89e-01 |
Pos logit contributions | |
Which | +0.031 |
Where | +0.028 |
Time | +0.026 |
Good | +0.026 |
Which | +0.026 |
Neg logit contributions | |
endant | -0.035 |
pe | -0.034 |
hy | -0.034 |
agged | -0.032 |
arrest | -0.032 |
Token | � |
Token ID | 129 |
Feature activation | -2.00e+00 |
Pos logit contributions | |
Which | +0.005 |
Good | +0.005 |
Time | +0.005 |
Why | +0.005 |
Where | +0.005 |
Neg logit contributions | |
endant | -0.006 |
av | -0.005 |
jewels | -0.005 |
arrest | -0.005 |
brace | -0.005 |
Token | � |
Token ID | 241 |
Feature activation | -3.64e+00 |
Pos logit contributions | |
Which | +0.060 |
Time | +0.054 |
Good | +0.052 |
Where | +0.052 |
Which | +0.052 |
Neg logit contributions | |
arrest | -0.057 |
endant | -0.056 |
pe | -0.055 |
brace | -0.053 |
aches | -0.053 |
Token | M |
Token ID | 44 |
Feature activation | -4.62e-01 |
Pos logit contributions | |
ash | +0.089 |
idget | +0.087 |
stations | +0.079 |
ting | +0.078 |
DJ | +0.078 |
Neg logit contributions | |
pe | -0.096 |
hy | -0.094 |
endant | -0.091 |
arrest | -0.091 |
ve | -0.089 |
Token | ama |
Token ID | 1689 |
Feature activation | -1.20e+00 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.014 |
Where | +0.014 |
Time | +0.014 |
Why | +0.014 |
Neg logit contributions | |
endant | -0.012 |
av | -0.011 |
jewels | -0.011 |
arrest | -0.011 |
brace | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Which | +0.032 |
Good | +0.031 |
Time | +0.031 |
Why | +0.030 |
ash | +0.030 |
Neg logit contributions | |
endant | -0.036 |
arrest | -0.034 |
jewels | -0.034 |
av | -0.034 |
brace | -0.033 |
Token | what |
Token ID | 644 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Which | +0.057 |
ash | +0.055 |
idget | +0.053 |
Time | +0.052 |
Where | +0.052 |
Neg logit contributions | |
endant | -0.061 |
av | -0.061 |
jewels | -0.061 |
arrest | -0.057 |
coins | -0.056 |
Token | are |
Token ID | 389 |
Feature activation | -6.21e-01 |
Pos logit contributions | |
Which | +0.062 |
Where | +0.060 |
idget | +0.060 |
ash | +0.059 |
Time | +0.059 |
Neg logit contributions | |
av | -0.051 |
endant | -0.049 |
jewels | -0.048 |
arrest | -0.045 |
brace | -0.045 |
Token | Tom |
Token ID | 4186 |
Feature activation | +5.79e-01 |
Pos logit contributions | |
endant | +0.029 |
jewels | +0.028 |
arrest | +0.028 |
av | +0.027 |
brace | +0.027 |
Neg logit contributions | |
Which | -0.028 |
Good | -0.026 |
Time | -0.026 |
Why | -0.025 |
ash | -0.025 |
Token | says |
Token ID | 1139 |
Feature activation | +1.25e+00 |
Pos logit contributions | |
endant | +0.020 |
arrest | +0.020 |
av | +0.019 |
jewels | +0.019 |
agged | +0.018 |
Neg logit contributions | |
Which | -0.013 |
Good | -0.012 |
Why | -0.012 |
Clean | -0.012 |
ash | -0.012 |
Token | it |
Token ID | 340 |
Feature activation | -6.74e-01 |
Pos logit contributions | |
arrest | +0.044 |
endant | +0.043 |
agged | +0.043 |
� | +0.039 |
av | +0.039 |
Neg logit contributions | |
Which | -0.029 |
Why | -0.027 |
Which | -0.027 |
Where | -0.026 |
Good | -0.026 |
Token | is |
Token ID | 318 |
Feature activation | -9.47e-01 |
Pos logit contributions | |
Which | +0.016 |
Good | +0.015 |
Time | +0.015 |
Why | +0.014 |
ash | +0.014 |
Neg logit contributions | |
endant | -0.023 |
arrest | -0.022 |
av | -0.022 |
jewels | -0.022 |
brace | -0.021 |
Token | a |
Token ID | 257 |
Feature activation | -1.87e+00 |
Pos logit contributions | |
Which | +0.029 |
Good | +0.028 |
Time | +0.028 |
ash | +0.027 |
Where | +0.027 |
Neg logit contributions | |
endant | -0.025 |
jewels | -0.024 |
av | -0.024 |
arrest | -0.024 |
brace | -0.023 |
Token | magic |
Token ID | 5536 |
Feature activation | -3.62e+00 |
Pos logit contributions | |
idget | +0.062 |
ash | +0.061 |
ting | +0.060 |
Which | +0.059 |
Kids | +0.058 |
Neg logit contributions | |
jewels | -0.043 |
endant | -0.043 |
coins | -0.041 |
av | -0.040 |
brace | -0.040 |
Token | m |
Token ID | 285 |
Feature activation | -8.46e-01 |
Pos logit contributions | |
Which | +0.115 |
idget | +0.113 |
Where | +0.112 |
Kids | +0.111 |
Good | +0.110 |
Neg logit contributions | |
pe | -0.089 |
coins | -0.087 |
endant | -0.081 |
jewels | -0.079 |
crown | -0.079 |
Token | op |
Token ID | 404 |
Feature activation | -6.75e-01 |
Pos logit contributions | |
Which | +0.028 |
Where | +0.026 |
Time | +0.025 |
Good | +0.025 |
Ready | +0.025 |
Neg logit contributions | |
endant | -0.022 |
pe | -0.020 |
aches | -0.020 |
hy | -0.020 |
arrest | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | +6.76e-01 |
Pos logit contributions | |
Which | +0.014 |
Good | +0.013 |
Time | +0.013 |
Where | +0.013 |
Why | +0.013 |
Neg logit contributions | |
endant | -0.024 |
av | -0.024 |
jewels | -0.024 |
arrest | -0.023 |
brace | -0.023 |
Token | He |
Token ID | 679 |
Feature activation | +1.84e-01 |
Pos logit contributions | |
endant | +0.019 |
av | +0.018 |
jewels | +0.018 |
arrest | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.020 |
Good | -0.019 |
Time | -0.019 |
Where | -0.019 |
ash | -0.019 |
Token | can |
Token ID | 460 |
Feature activation | +7.97e-01 |
Pos logit contributions | |
endant | +0.006 |
arrest | +0.006 |
av | +0.006 |
jewels | +0.006 |
hy | +0.006 |
Neg logit contributions | |
Which | -0.004 |
Good | -0.004 |
Why | -0.004 |
Time | -0.004 |
ash | -0.004 |
Token | with |
Token ID | 351 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
Which | +0.038 |
Time | +0.037 |
idget | +0.035 |
Where | +0.035 |
Kids | +0.035 |
Neg logit contributions | |
jewels | -0.026 |
av | -0.025 |
brace | -0.025 |
endant | -0.024 |
coins | -0.023 |
Token | joy |
Token ID | 8716 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
endant | +0.017 |
av | +0.015 |
arrest | +0.015 |
jewels | +0.015 |
pe | +0.015 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.015 |
Time | -0.015 |
Where | -0.014 |
Why | -0.014 |
Token | ! |
Token ID | 0 |
Feature activation | -3.26e-01 |
Pos logit contributions | |
Which | +0.034 |
Time | +0.032 |
Good | +0.031 |
Ready | +0.031 |
Where | +0.030 |
Neg logit contributions | |
jewels | -0.036 |
endant | -0.035 |
av | -0.035 |
brace | -0.033 |
coins | -0.032 |
Token |
|
Token ID | 198 |
Feature activation | -7.18e-01 |
Pos logit contributions | |
Which | +0.009 |
Time | +0.009 |
ash | +0.009 |
idget | +0.009 |
Where | +0.008 |
Neg logit contributions | |
endant | -0.009 |
av | -0.009 |
arrest | -0.009 |
jewels | -0.009 |
brace | -0.009 |
Token |
|
Token ID | 198 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Which | +0.019 |
Good | +0.019 |
ash | +0.018 |
idget | +0.018 |
Time | +0.018 |
Neg logit contributions | |
endant | -0.020 |
arrest | -0.019 |
av | -0.019 |
pe | -0.019 |
jewels | -0.019 |
Token | The |
Token ID | 464 |
Feature activation | -3.61e+00 |
Pos logit contributions | |
pe | +0.011 |
arrest | +0.011 |
hy | +0.010 |
av | +0.010 |
endant | +0.010 |
Neg logit contributions | |
idget | -0.011 |
ash | -0.011 |
Good | -0.011 |
Which | -0.010 |
ksh | -0.010 |
Token | m |
Token ID | 285 |
Feature activation | -1.94e+00 |
Pos logit contributions | |
idget | +0.129 |
ash | +0.126 |
Good | +0.123 |
rated | +0.122 |
Would | +0.121 |
Neg logit contributions | |
coins | -0.056 |
breath | -0.054 |
bul | -0.054 |
swollen | -0.052 |
pe | -0.051 |
Token | op |
Token ID | 404 |
Feature activation | -1.67e+00 |
Pos logit contributions | |
Which | +0.067 |
Ready | +0.064 |
Good | +0.063 |
Where | +0.062 |
Time | +0.062 |
Neg logit contributions | |
endant | -0.042 |
ink | -0.040 |
arrest | -0.040 |
pe | -0.039 |
itt | -0.039 |
Token | danced |
Token ID | 39480 |
Feature activation | -1.88e-01 |
Pos logit contributions | |
Which | +0.040 |
Good | +0.038 |
Time | +0.037 |
ash | +0.036 |
Why | +0.036 |
Neg logit contributions | |
endant | -0.056 |
av | -0.054 |
jewels | -0.054 |
arrest | -0.053 |
brace | -0.052 |
Token | all |
Token ID | 477 |
Feature activation | -1.39e+00 |
Pos logit contributions | |
Which | +0.005 |
Good | +0.005 |
Time | +0.005 |
ash | +0.005 |
Why | +0.005 |
Neg logit contributions | |
endant | -0.006 |
av | -0.005 |
jewels | -0.005 |
arrest | -0.005 |
brace | -0.005 |
Token | over |
Token ID | 625 |
Feature activation | +4.85e-02 |
Pos logit contributions | |
Which | +0.032 |
Where | +0.028 |
Good | +0.027 |
Which | +0.027 |
Ready | +0.026 |
Neg logit contributions | |
jewels | -0.046 |
endant | -0.046 |
arrest | -0.045 |
hy | -0.045 |
brace | -0.045 |
Token | the |
Token ID | 262 |
Feature activation | -1.11e-01 |
Pos logit contributions | |
endant | +0.002 |
arrest | +0.002 |
av | +0.002 |
jewels | +0.002 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
Why | -0.002 |
Where | -0.002 |
Token | world |
Token ID | 995 |
Feature activation | -4.45e-02 |
Pos logit contributions | |
Which | +0.003 |
Good | +0.003 |
Time | +0.003 |
ash | +0.002 |
idget | +0.002 |
Neg logit contributions | |
endant | -0.004 |
av | -0.004 |
jewels | -0.004 |
arrest | -0.003 |
brace | -0.003 |
Token | . |
Token ID | 13 |
Feature activation | -2.55e+00 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Where | +0.001 |
ash | +0.001 |
Neg logit contributions | |
endant | -0.002 |
jewels | -0.002 |
av | -0.002 |
arrest | -0.002 |
brace | -0.001 |
Token | One |
Token ID | 1881 |
Feature activation | -6.85e-01 |
Pos logit contributions | |
Which | +0.085 |
Time | +0.085 |
ting | +0.084 |
Where | +0.084 |
stations | +0.084 |
Neg logit contributions | |
pe | -0.046 |
endant | -0.045 |
hy | -0.043 |
jewels | -0.041 |
coins | -0.040 |
Token | day |
Token ID | 1110 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Which | +0.017 |
idget | +0.016 |
Ready | +0.016 |
stations | +0.016 |
Where | +0.016 |
Neg logit contributions | |
hy | -0.020 |
endant | -0.020 |
jewels | -0.020 |
av | -0.020 |
nut | -0.019 |
Token | , |
Token ID | 11 |
Feature activation | -3.59e+00 |
Pos logit contributions | |
Which | +0.072 |
idget | +0.070 |
Time | +0.070 |
Where | +0.069 |
ash | +0.069 |
Neg logit contributions | |
jewels | -0.023 |
arrest | -0.021 |
coins | -0.021 |
endant | -0.021 |
av | -0.020 |
Token | Owen |
Token ID | 22605 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
ash | +0.144 |
idget | +0.140 |
Which | +0.139 |
Good | +0.138 |
ksh | +0.138 |
Neg logit contributions | |
jewels | -0.049 |
coins | -0.046 |
arrest | -0.043 |
pe | -0.042 |
breath | -0.042 |
Token | asked |
Token ID | 1965 |
Feature activation | -1.48e+00 |
Pos logit contributions | |
Which | +0.019 |
Good | +0.018 |
Time | +0.018 |
Why | +0.018 |
Time | +0.018 |
Neg logit contributions | |
endant | -0.039 |
av | -0.037 |
jewels | -0.037 |
brace | -0.037 |
arrest | -0.036 |
Token | his |
Token ID | 465 |
Feature activation | -9.94e-01 |
Pos logit contributions | |
Which | +0.063 |
Where | +0.061 |
Time | +0.061 |
ash | +0.061 |
Ready | +0.061 |
Neg logit contributions | |
jewels | -0.019 |
av | -0.018 |
coins | -0.016 |
arrest | -0.016 |
aches | -0.015 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
Which | +0.033 |
ash | +0.033 |
Time | +0.033 |
Good | +0.032 |
Why | +0.032 |
Neg logit contributions | |
jewels | -0.024 |
av | -0.023 |
endant | -0.023 |
coins | -0.022 |
brace | -0.022 |
Token | why |
Token ID | 1521 |
Feature activation | -1.57e-01 |
Pos logit contributions | |
Time | +0.025 |
Which | +0.025 |
Ready | +0.024 |
Good | +0.024 |
Where | +0.024 |
Neg logit contributions | |
av | -0.035 |
jewels | -0.033 |
endant | -0.032 |
coins | -0.031 |
aches | -0.031 |
Token | was |
Token ID | 373 |
Feature activation | -2.45e-01 |
Pos logit contributions | |
Which | +0.038 |
ash | +0.035 |
Time | +0.035 |
Good | +0.035 |
idget | +0.034 |
Neg logit contributions | |
endant | -0.050 |
av | -0.049 |
jewels | -0.049 |
arrest | -0.049 |
brace | -0.047 |
Token | a |
Token ID | 257 |
Feature activation | -1.52e-01 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.007 |
ash | +0.007 |
Time | +0.007 |
idget | +0.007 |
Neg logit contributions | |
endant | -0.007 |
av | -0.007 |
jewels | -0.006 |
arrest | -0.006 |
brace | -0.006 |
Token | m |
Token ID | 285 |
Feature activation | +2.35e-01 |
Pos logit contributions | |
Which | +0.004 |
ash | +0.004 |
Good | +0.004 |
idget | +0.004 |
Time | +0.004 |
Neg logit contributions | |
endant | -0.004 |
av | -0.004 |
jewels | -0.004 |
arrest | -0.004 |
brace | -0.004 |
Token | op |
Token ID | 404 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
endant | +0.007 |
jewels | +0.007 |
av | +0.007 |
arrest | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.006 |
Time | -0.006 |
ash | -0.006 |
Why | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +1.11e+00 |
Pos logit contributions | |
Which | +0.042 |
Time | +0.040 |
Good | +0.040 |
Ready | +0.038 |
Where | +0.038 |
Neg logit contributions | |
endant | -0.039 |
arrest | -0.038 |
av | -0.038 |
jewels | -0.037 |
pe | -0.037 |
Token | The |
Token ID | 383 |
Feature activation | -3.49e+00 |
Pos logit contributions | |
endant | +0.036 |
jewels | +0.034 |
av | +0.034 |
arrest | +0.033 |
brace | +0.033 |
Neg logit contributions | |
Which | -0.028 |
Good | -0.027 |
Time | -0.026 |
Time | -0.026 |
Why | -0.026 |
Token | m |
Token ID | 285 |
Feature activation | -1.59e+00 |
Pos logit contributions | |
idget | +0.117 |
Which | +0.115 |
ash | +0.114 |
Would | +0.113 |
Ready | +0.112 |
Neg logit contributions | |
breath | -0.062 |
pe | -0.061 |
coins | -0.060 |
high | -0.058 |
bul | -0.058 |
Token | op |
Token ID | 404 |
Feature activation | -7.54e-01 |
Pos logit contributions | |
Which | +0.053 |
Ready | +0.051 |
Good | +0.050 |
Where | +0.049 |
Time | +0.049 |
Neg logit contributions | |
endant | -0.038 |
ink | -0.035 |
pe | -0.035 |
arrest | -0.034 |
aches | -0.034 |
Token | was |
Token ID | 373 |
Feature activation | -2.08e-01 |
Pos logit contributions | |
Which | +0.016 |
Why | +0.015 |
Good | +0.015 |
ash | +0.015 |
Time | +0.014 |
Neg logit contributions | |
endant | -0.027 |
arrest | -0.026 |
av | -0.026 |
jewels | -0.026 |
brace | -0.026 |
Token | very |
Token ID | 845 |
Feature activation | +5.38e-01 |
Pos logit contributions | |
Which | +0.005 |
Why | +0.005 |
when | +0.004 |
over | +0.004 |
Time | +0.004 |
Neg logit contributions | |
arrest | -0.007 |
endant | -0.007 |
av | -0.007 |
brace | -0.007 |
jewels | -0.007 |
Token | happy |
Token ID | 3772 |
Feature activation | +6.65e-01 |
Pos logit contributions | |
arrest | +0.018 |
endant | +0.017 |
brace | +0.017 |
av | +0.016 |
jewels | +0.016 |
Neg logit contributions | |
Good | -0.012 |
Clean | -0.012 |
Time | -0.012 |
Which | -0.012 |
Time | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | +4.31e-01 |
Pos logit contributions | |
endant | +0.002 |
av | +0.002 |
jewels | +0.001 |
arrest | +0.001 |
hy | +0.001 |
Neg logit contributions | |
Which | -0.003 |
Time | -0.002 |
Good | -0.002 |
ash | -0.002 |
idget | -0.002 |
Token |
|
Token ID | 198 |
Feature activation | +1.02e+00 |
Pos logit contributions | |
endant | +0.013 |
av | +0.013 |
arrest | +0.013 |
jewels | +0.013 |
brace | +0.012 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.010 |
ash | -0.010 |
Time | -0.010 |
idget | -0.010 |
Token | â |
Token ID | 22940 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
arrest | +0.027 |
pe | +0.027 |
endant | +0.026 |
hy | +0.026 |
av | +0.026 |
Neg logit contributions | |
idget | -0.028 |
Which | -0.027 |
ash | -0.027 |
Good | -0.027 |
ting | -0.026 |
Token | € |
Token ID | 26391 |
Feature activation | +1.47e-01 |
Pos logit contributions | |
Which | +0.013 |
Where | +0.012 |
Good | +0.011 |
Time | +0.011 |
Why | +0.011 |
Neg logit contributions | |
endant | -0.019 |
pe | -0.019 |
arrest | -0.019 |
hy | -0.019 |
av | -0.018 |
Token | � |
Token ID | 129 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
endant | +0.005 |
av | +0.005 |
jewels | +0.005 |
brace | +0.004 |
arrest | +0.004 |
Neg logit contributions | |
Which | -0.004 |
Good | -0.004 |
Time | -0.004 |
Why | -0.004 |
Time | -0.004 |
Token | � |
Token ID | 241 |
Feature activation | -3.44e+00 |
Pos logit contributions | |
Which | +0.035 |
Time | +0.031 |
Good | +0.031 |
Where | +0.030 |
Which | +0.029 |
Neg logit contributions | |
arrest | -0.048 |
endant | -0.047 |
pe | -0.047 |
hy | -0.045 |
aches | -0.045 |
Token | H |
Token ID | 39 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
ash | +0.083 |
idget | +0.082 |
ting | +0.072 |
ning | +0.071 |
DJ | +0.070 |
Neg logit contributions | |
pe | -0.103 |
hy | -0.096 |
arrest | -0.094 |
� | -0.086 |
curly | -0.085 |
Token | urry |
Token ID | 16682 |
Feature activation | -2.37e+00 |
Pos logit contributions | |
jewels | +0.018 |
av | +0.018 |
endant | +0.017 |
brace | +0.017 |
arrest | +0.017 |
Neg logit contributions | |
ash | -0.018 |
Good | -0.018 |
Time | -0.018 |
Which | -0.017 |
idget | -0.017 |
Token | up |
Token ID | 510 |
Feature activation | +2.78e-01 |
Pos logit contributions | |
Which | +0.072 |
Time | +0.067 |
Where | +0.066 |
Good | +0.066 |
Why | +0.066 |
Neg logit contributions | |
arrest | -0.062 |
jewels | -0.062 |
endant | -0.062 |
av | -0.060 |
coins | -0.058 |
Token | , |
Token ID | 11 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
endant | +0.010 |
av | +0.009 |
brace | +0.009 |
jewels | +0.009 |
arrest | +0.008 |
Neg logit contributions | |
when | -0.007 |
Good | -0.006 |
Which | -0.006 |
over | -0.006 |
Time | -0.006 |
Token | Tim |
Token ID | 5045 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Which | +0.047 |
ash | +0.044 |
Where | +0.043 |
Good | +0.042 |
idget | +0.042 |
Neg logit contributions | |
jewels | -0.043 |
endant | -0.042 |
arrest | -0.042 |
av | -0.042 |
coins | -0.040 |
Token |
|
Token ID | 198 |
Feature activation | -1.24e+00 |
Pos logit contributions | |
rated | +0.038 |
Which | +0.038 |
stations | +0.036 |
ash | +0.036 |
Time | +0.035 |
Neg logit contributions | |
� | -0.033 |
endant | -0.032 |
av | -0.032 |
hy | -0.031 |
brace | -0.030 |
Token |
|
Token ID | 198 |
Feature activation | -7.45e-01 |
Pos logit contributions | |
rated | +0.043 |
Which | +0.041 |
ksh | +0.040 |
stations | +0.040 |
ash | +0.039 |
Neg logit contributions | |
� | -0.023 |
pe | -0.022 |
arrest | -0.022 |
ir | -0.022 |
endant | -0.022 |
Token | â |
Token ID | 22940 |
Feature activation | -7.32e-01 |
Pos logit contributions | |
rated | +0.023 |
idget | +0.021 |
ash | +0.020 |
Which | +0.020 |
Good | +0.020 |
Neg logit contributions | |
arrest | -0.016 |
pe | -0.016 |
aches | -0.015 |
ink | -0.015 |
� | -0.015 |
Token | € |
Token ID | 26391 |
Feature activation | -5.57e-01 |
Pos logit contributions | |
Which | +0.018 |
Where | +0.016 |
Time | +0.015 |
Good | +0.015 |
Why | +0.014 |
Neg logit contributions | |
endant | -0.025 |
hy | -0.024 |
pe | -0.024 |
agged | -0.023 |
arrest | -0.023 |
Token | � |
Token ID | 129 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
Which | +0.017 |
Good | +0.016 |
Time | +0.016 |
Where | +0.016 |
ash | +0.016 |
Neg logit contributions | |
endant | -0.015 |
arrest | -0.014 |
av | -0.014 |
jewels | -0.014 |
brace | -0.014 |
Token | � |
Token ID | 241 |
Feature activation | -3.42e+00 |
Pos logit contributions | |
Which | +0.044 |
Where | +0.039 |
Time | +0.039 |
Good | +0.039 |
Which | +0.037 |
Neg logit contributions | |
arrest | -0.059 |
endant | -0.059 |
pe | -0.058 |
hy | -0.057 |
aches | -0.056 |
Token | That |
Token ID | 2504 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
idget | +0.091 |
ash | +0.081 |
ting | +0.078 |
nurses | +0.076 |
Which | +0.074 |
Neg logit contributions | |
pe | -0.097 |
hy | -0.094 |
arrest | -0.087 |
� | -0.086 |
endant | -0.083 |
Token | â |
Token ID | 22940 |
Feature activation | +2.42e-01 |
Pos logit contributions | |
Which | +0.033 |
Where | +0.032 |
idget | +0.032 |
Time | +0.030 |
Why | +0.030 |
Neg logit contributions | |
endant | -0.048 |
av | -0.048 |
jewels | -0.047 |
brace | -0.047 |
coins | -0.046 |
Token | € |
Token ID | 26391 |
Feature activation | +5.42e-01 |
Pos logit contributions | |
endant | +0.008 |
hy | +0.008 |
av | +0.008 |
arrest | +0.008 |
pe | +0.008 |
Neg logit contributions | |
Which | -0.006 |
Where | -0.005 |
Good | -0.005 |
idget | -0.005 |
Time | -0.005 |
Token | ™ |
Token ID | 8151 |
Feature activation | -3.77e-02 |
Pos logit contributions | |
endant | +0.017 |
arrest | +0.016 |
av | +0.016 |
jewels | +0.016 |
brace | +0.015 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.014 |
Time | -0.013 |
Where | -0.013 |
Why | -0.013 |
Token | s |
Token ID | 82 |
Feature activation | -9.88e-01 |
Pos logit contributions | |
ash | +0.001 |
Good | +0.001 |
Which | +0.001 |
Time | +0.001 |
Time | +0.001 |
Neg logit contributions | |
endant | -0.001 |
jewels | -0.001 |
arrest | -0.001 |
av | -0.001 |
brace | -0.001 |
Token | Mom |
Token ID | 29252 |
Feature activation | -1.52e+00 |
Pos logit contributions | |
ting | +0.034 |
idget | +0.034 |
ash | +0.033 |
Good | +0.033 |
rated | +0.032 |
Neg logit contributions | |
kins | -0.026 |
pe | -0.021 |
aches | -0.021 |
coins | -0.021 |
brace | -0.021 |
Token | says |
Token ID | 1139 |
Feature activation | +2.63e-01 |
Pos logit contributions | |
Which | +0.045 |
Good | +0.042 |
Where | +0.042 |
Time | +0.042 |
ash | +0.040 |
Neg logit contributions | |
endant | -0.042 |
av | -0.040 |
arrest | -0.040 |
jewels | -0.040 |
brace | -0.039 |
Token | , |
Token ID | 11 |
Feature activation | -8.79e-01 |
Pos logit contributions | |
endant | +0.008 |
arrest | +0.007 |
jewels | +0.007 |
av | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.007 |
Time | -0.007 |
Why | -0.007 |
Time | -0.007 |
Token | " |
Token ID | 366 |
Feature activation | -4.03e-01 |
Pos logit contributions | |
ash | +0.020 |
Which | +0.020 |
idget | +0.020 |
Time | +0.019 |
Good | +0.019 |
Neg logit contributions | |
av | -0.028 |
endant | -0.028 |
jewels | -0.028 |
arrest | -0.027 |
brace | -0.026 |
Token | Bro |
Token ID | 15783 |
Feature activation | -6.81e-01 |
Pos logit contributions | |
idget | +0.009 |
ash | +0.009 |
Good | +0.009 |
Which | +0.008 |
over | +0.008 |
Neg logit contributions | |
arrest | -0.013 |
pe | -0.013 |
brace | -0.012 |
av | -0.012 |
endant | -0.012 |
Token | ccoli |
Token ID | 34544 |
Feature activation | -3.41e+00 |
Pos logit contributions | |
Which | +0.017 |
Time | +0.016 |
Where | +0.016 |
Good | +0.016 |
Why | +0.015 |
Neg logit contributions | |
endant | -0.022 |
av | -0.022 |
jewels | -0.021 |
arrest | -0.020 |
brace | -0.020 |
Token | is |
Token ID | 318 |
Feature activation | -5.66e-01 |
Pos logit contributions | |
Which | +0.106 |
idget | +0.101 |
Where | +0.098 |
Time | +0.098 |
Good | +0.096 |
Neg logit contributions | |
av | -0.084 |
jewels | -0.083 |
endant | -0.081 |
arrest | -0.081 |
brace | -0.079 |
Token | good |
Token ID | 922 |
Feature activation | -3.20e-01 |
Pos logit contributions | |
Which | +0.018 |
Good | +0.018 |
Time | +0.017 |
Why | +0.017 |
Where | +0.017 |
Neg logit contributions | |
endant | -0.014 |
arrest | -0.014 |
jewels | -0.013 |
av | -0.013 |
brace | -0.013 |
Token | for |
Token ID | 329 |
Feature activation | +4.05e-01 |
Pos logit contributions | |
Which | +0.009 |
Where | +0.008 |
Time | +0.008 |
Good | +0.008 |
idget | +0.008 |
Neg logit contributions | |
av | -0.009 |
endant | -0.009 |
jewels | -0.009 |
arrest | -0.009 |
brace | -0.009 |
Token | you |
Token ID | 345 |
Feature activation | +1.34e-01 |
Pos logit contributions | |
endant | +0.012 |
jewels | +0.011 |
arrest | +0.011 |
av | +0.011 |
brace | +0.011 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.011 |
Time | -0.011 |
Why | -0.011 |
Where | -0.011 |
Token | . |
Token ID | 13 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
endant | +0.004 |
arrest | +0.004 |
jewels | +0.004 |
av | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.003 |
Good | -0.003 |
Time | -0.003 |
Where | -0.003 |
Why | -0.003 |
Token | |
Token ID | 220 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
Which | +0.059 |
Where | +0.058 |
idget | +0.057 |
Time | +0.057 |
rated | +0.056 |
Neg logit contributions | |
endant | -0.048 |
arrest | -0.047 |
pe | -0.045 |
brace | -0.045 |
� | -0.045 |
Token |
|
Token ID | 198 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Which | +0.053 |
Good | +0.050 |
Time | +0.050 |
ash | +0.048 |
Why | +0.048 |
Neg logit contributions | |
endant | -0.064 |
av | -0.061 |
jewels | -0.060 |
arrest | -0.060 |
brace | -0.059 |
Token |
|
Token ID | 198 |
Feature activation | -1.30e+00 |
Pos logit contributions | |
Which | +0.034 |
idget | +0.032 |
Good | +0.032 |
ash | +0.032 |
Where | +0.031 |
Neg logit contributions | |
endant | -0.031 |
pe | -0.030 |
arrest | -0.030 |
av | -0.029 |
brace | -0.029 |
Token | One |
Token ID | 3198 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
idget | +0.039 |
ting | +0.036 |
rated | +0.036 |
Where | +0.035 |
Clean | +0.034 |
Neg logit contributions | |
pe | -0.033 |
arrest | -0.029 |
brace | -0.029 |
aches | -0.029 |
hy | -0.029 |
Token | day |
Token ID | 1110 |
Feature activation | -2.09e+00 |
Pos logit contributions | |
Which | +0.041 |
idget | +0.040 |
Where | +0.039 |
Ready | +0.038 |
Which | +0.038 |
Neg logit contributions | |
hy | -0.042 |
av | -0.041 |
high | -0.041 |
jewels | -0.040 |
endant | -0.040 |
Token | , |
Token ID | 11 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
idget | +0.101 |
ksh | +0.098 |
Which | +0.097 |
rated | +0.096 |
ash | +0.096 |
Neg logit contributions | |
ls | -0.016 |
coins | -0.016 |
kins | -0.015 |
arrest | -0.014 |
jewels | -0.013 |
Token | on |
Token ID | 319 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
ash | +0.122 |
idget | +0.121 |
Which | +0.119 |
Good | +0.117 |
rated | +0.117 |
Neg logit contributions | |
coins | -0.059 |
kins | -0.057 |
arrest | -0.056 |
jewels | -0.056 |
ls | -0.054 |
Token | their |
Token ID | 511 |
Feature activation | +1.06e+00 |
Pos logit contributions | |
Which | +0.031 |
Good | +0.030 |
Time | +0.030 |
Why | +0.029 |
Where | +0.029 |
Neg logit contributions | |
endant | -0.034 |
av | -0.032 |
jewels | -0.032 |
arrest | -0.031 |
brace | -0.030 |
Token | latest |
Token ID | 3452 |
Feature activation | +6.46e-01 |
Pos logit contributions | |
endant | +0.036 |
av | +0.035 |
jewels | +0.034 |
arrest | +0.034 |
brace | +0.033 |
Neg logit contributions | |
Which | -0.025 |
Good | -0.023 |
Time | -0.023 |
Where | -0.023 |
Why | -0.023 |
Token | adventure |
Token ID | 8855 |
Feature activation | -8.02e-02 |
Pos logit contributions | |
endant | +0.020 |
av | +0.019 |
jewels | +0.019 |
arrest | +0.019 |
brace | +0.018 |
Neg logit contributions | |
Which | -0.017 |
ash | -0.016 |
Time | -0.016 |
Good | -0.016 |
Time | -0.015 |
Token | , |
Token ID | 11 |
Feature activation | -2.69e+00 |
Pos logit contributions | |
Which | +0.002 |
Time | +0.002 |
Good | +0.002 |
ash | +0.002 |
Why | +0.002 |
Neg logit contributions | |
endant | -0.002 |
arrest | -0.002 |
av | -0.002 |
jewels | -0.002 |
brace | -0.002 |
Token | " |
Token ID | 366 |
Feature activation | -1.53e+00 |
Pos logit contributions | |
ash | +0.042 |
idget | +0.040 |
stations | +0.040 |
Which | +0.039 |
rated | +0.038 |
Neg logit contributions | |
av | -0.041 |
jewels | -0.038 |
pe | -0.036 |
endant | -0.036 |
� | -0.036 |
Token | What |
Token ID | 2061 |
Feature activation | -1.05e+00 |
Pos logit contributions | |
idget | +0.021 |
ash | +0.020 |
rated | +0.018 |
Clean | +0.018 |
inter | +0.017 |
Neg logit contributions | |
av | -0.065 |
jewels | -0.063 |
endant | -0.062 |
arrest | -0.060 |
brace | -0.060 |
Token | do |
Token ID | 466 |
Feature activation | +1.51e+00 |
Pos logit contributions | |
Which | +0.029 |
idget | +0.027 |
Time | +0.027 |
Where | +0.027 |
Good | +0.027 |
Neg logit contributions | |
endant | -0.031 |
av | -0.030 |
jewels | -0.030 |
arrest | -0.029 |
brace | -0.029 |
Token | you |
Token ID | 345 |
Feature activation | +3.41e-01 |
Pos logit contributions | |
endant | +0.048 |
jewels | +0.043 |
arrest | +0.042 |
brace | +0.042 |
agged | +0.041 |
Neg logit contributions | |
Which | -0.043 |
Good | -0.041 |
Time | -0.040 |
Why | -0.039 |
Time | -0.038 |
Token | think |
Token ID | 892 |
Feature activation | -1.73e-01 |
Pos logit contributions | |
endant | +0.011 |
jewels | +0.011 |
av | +0.011 |
arrest | +0.011 |
brace | +0.010 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.008 |
Time | -0.008 |
Why | -0.008 |
ash | -0.008 |
Token | , |
Token ID | 11 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
Which | +0.005 |
Good | +0.005 |
Time | +0.005 |
Why | +0.004 |
ash | +0.004 |
Neg logit contributions | |
endant | -0.005 |
arrest | -0.005 |
jewels | -0.005 |
av | -0.005 |
brace | -0.005 |
Token | Baby |
Token ID | 14801 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
Ready | +0.090 |
Which | +0.088 |
stations | +0.088 |
ash | +0.087 |
idget | +0.086 |
Neg logit contributions | |
av | -0.096 |
jewels | -0.093 |
endant | -0.088 |
coins | -0.087 |
aches | -0.086 |
Token | ?", |
Token ID | 35379 |
Feature activation | -1.04e+00 |
Pos logit contributions | |
Which | +0.054 |
Where | +0.051 |
Ready | +0.050 |
Time | +0.050 |
idget | +0.048 |
Neg logit contributions | |
av | -0.047 |
endant | -0.045 |
jewels | -0.045 |
aches | -0.042 |
kins | -0.041 |
Token | and |
Token ID | 290 |
Feature activation | -1.65e+00 |
Pos logit contributions | |
Which | +0.026 |
ash | +0.025 |
idget | +0.024 |
Time | +0.024 |
Ready | +0.024 |
Neg logit contributions | |
av | -0.033 |
endant | -0.032 |
jewels | -0.032 |
arrest | -0.031 |
brace | -0.030 |
Token | Baby |
Token ID | 14801 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
Which | +0.038 |
Good | +0.036 |
Time | +0.035 |
ash | +0.035 |
Where | +0.034 |
Neg logit contributions | |
endant | -0.056 |
av | -0.054 |
jewels | -0.054 |
arrest | -0.053 |
brace | -0.052 |
Token | said |
Token ID | 531 |
Feature activation | -1.92e-01 |
Pos logit contributions | |
Which | +0.050 |
Good | +0.049 |
Time | +0.048 |
Why | +0.047 |
ash | +0.047 |
Neg logit contributions | |
endant | -0.053 |
arrest | -0.051 |
jewels | -0.050 |
av | -0.050 |
brace | -0.048 |
Token | the |
Token ID | 262 |
Feature activation | -7.27e-01 |
Pos logit contributions | |
Which | +0.013 |
Good | +0.012 |
Time | +0.012 |
Where | +0.012 |
Why | +0.012 |
Neg logit contributions | |
endant | -0.016 |
av | -0.015 |
arrest | -0.015 |
jewels | -0.015 |
brace | -0.014 |
Token | m |
Token ID | 285 |
Feature activation | +2.67e-01 |
Pos logit contributions | |
Which | +0.018 |
Good | +0.017 |
Time | +0.017 |
Where | +0.017 |
Why | +0.017 |
Neg logit contributions | |
endant | -0.024 |
arrest | -0.022 |
av | -0.022 |
jewels | -0.022 |
brace | -0.022 |
Token | op |
Token ID | 404 |
Feature activation | -9.08e-01 |
Pos logit contributions | |
jewels | +0.009 |
av | +0.009 |
brace | +0.009 |
arrest | +0.008 |
endant | +0.008 |
Neg logit contributions | |
ash | -0.006 |
Good | -0.006 |
Which | -0.006 |
idget | -0.006 |
Time | -0.006 |
Token | helped |
Token ID | 4193 |
Feature activation | -2.01e+00 |
Pos logit contributions | |
Why | +0.016 |
ash | +0.015 |
Time | +0.015 |
Which | +0.015 |
Time | +0.015 |
Neg logit contributions | |
endant | -0.035 |
jewels | -0.033 |
av | -0.033 |
brace | -0.033 |
arrest | -0.033 |
Token | the |
Token ID | 262 |
Feature activation | -2.64e+00 |
Pos logit contributions | |
Which | +0.055 |
Good | +0.053 |
Time | +0.053 |
Why | +0.052 |
Where | +0.052 |
Neg logit contributions | |
endant | -0.061 |
jewels | -0.057 |
av | -0.056 |
arrest | -0.056 |
brace | -0.053 |
Token | little |
Token ID | 1310 |
Feature activation | -3.39e+00 |
Pos logit contributions | |
Which | +0.070 |
ash | +0.068 |
idget | +0.068 |
Good | +0.067 |
Time | +0.063 |
Neg logit contributions | |
av | -0.077 |
coins | -0.076 |
jewels | -0.076 |
arrest | -0.073 |
brace | -0.070 |
Token | girl |
Token ID | 2576 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
Which | +0.090 |
Good | +0.087 |
idget | +0.085 |
ash | +0.083 |
Time | +0.083 |
Neg logit contributions | |
coins | -0.101 |
av | -0.098 |
jewels | -0.097 |
brace | -0.090 |
breath | -0.090 |
Token | dry |
Token ID | 5894 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.023 |
Time | +0.022 |
ash | +0.022 |
Why | +0.022 |
Neg logit contributions | |
endant | -0.034 |
jewels | -0.033 |
av | -0.033 |
arrest | -0.033 |
brace | -0.032 |
Token | off |
Token ID | 572 |
Feature activation | +2.89e-02 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.022 |
Time | +0.022 |
Why | +0.022 |
Where | +0.022 |
Neg logit contributions | |
endant | -0.027 |
av | -0.026 |
arrest | -0.026 |
jewels | -0.026 |
brace | -0.025 |
Token | with |
Token ID | 351 |
Feature activation | +2.08e-01 |
Pos logit contributions | |
endant | +0.001 |
agged | +0.001 |
jewels | +0.001 |
arrest | +0.001 |
av | +0.001 |
Neg logit contributions | |
over | -0.001 |
when | -0.000 |
Why | -0.000 |
Where | -0.000 |
Clean | -0.000 |
Token | a |
Token ID | 257 |
Feature activation | -3.20e-01 |
Pos logit contributions | |
endant | +0.007 |
arrest | +0.007 |
pe | +0.007 |
agged | +0.006 |
av | +0.006 |
Neg logit contributions | |
Which | -0.005 |
Where | -0.005 |
Time | -0.005 |
Good | -0.005 |
Why | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +5.68e-01 |
Pos logit contributions | |
Which | +0.021 |
Good | +0.020 |
Time | +0.020 |
ash | +0.019 |
idget | +0.019 |
Neg logit contributions | |
endant | -0.012 |
av | -0.011 |
jewels | -0.011 |
arrest | -0.011 |
pe | -0.010 |
Token |
|
Token ID | 198 |
Feature activation | +4.48e-01 |
Pos logit contributions | |
endant | +0.018 |
av | +0.017 |
arrest | +0.017 |
jewels | +0.017 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.013 |
ash | -0.013 |
idget | -0.013 |
Time | -0.013 |
Token | â |
Token ID | 22940 |
Feature activation | -5.53e-01 |
Pos logit contributions | |
pe | +0.010 |
arrest | +0.009 |
hy | +0.009 |
aches | +0.009 |
av | +0.009 |
Neg logit contributions | |
idget | -0.015 |
Which | -0.014 |
ash | -0.014 |
Good | -0.014 |
stations | -0.013 |
Token | € |
Token ID | 26391 |
Feature activation | +4.21e-01 |
Pos logit contributions | |
Which | +0.014 |
Where | +0.012 |
Good | +0.012 |
Time | +0.012 |
idget | +0.011 |
Neg logit contributions | |
endant | -0.018 |
pe | -0.018 |
hy | -0.018 |
arrest | -0.017 |
jewels | -0.017 |
Token | � |
Token ID | 129 |
Feature activation | -1.17e+00 |
Pos logit contributions | |
av | +0.015 |
endant | +0.015 |
jewels | +0.015 |
brace | +0.015 |
arrest | +0.014 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.008 |
Time | -0.008 |
Time | -0.008 |
Why | -0.008 |
Token | � |
Token ID | 241 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
Which | +0.030 |
Good | +0.027 |
Time | +0.027 |
Where | +0.026 |
Why | +0.025 |
Neg logit contributions | |
endant | -0.037 |
arrest | -0.037 |
pe | -0.036 |
hy | -0.035 |
jewels | -0.035 |
Token | Dad |
Token ID | 46270 |
Feature activation | +2.24e-01 |
Pos logit contributions | |
idget | +0.084 |
ash | +0.080 |
ting | +0.076 |
DJ | +0.072 |
nurses | +0.072 |
Neg logit contributions | |
pe | -0.098 |
hy | -0.091 |
arrest | -0.085 |
high | -0.082 |
curly | -0.080 |
Token | , |
Token ID | 11 |
Feature activation | -2.61e+00 |
Pos logit contributions | |
endant | +0.007 |
arrest | +0.007 |
av | +0.006 |
jewels | +0.006 |
brace | +0.006 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.006 |
Time | -0.006 |
Why | -0.005 |
Where | -0.005 |
Token | let |
Token ID | 1309 |
Feature activation | -1.85e+00 |
Pos logit contributions | |
ash | +0.061 |
idget | +0.061 |
Which | +0.058 |
ksh | +0.058 |
tap | +0.058 |
Neg logit contributions | |
jewels | -0.083 |
coins | -0.081 |
av | -0.078 |
aches | -0.077 |
endant | -0.076 |
Token | 's |
Token ID | 338 |
Feature activation | -7.08e-01 |
Pos logit contributions | |
Which | +0.056 |
stations | +0.054 |
Where | +0.053 |
idget | +0.053 |
rhythms | +0.053 |
Neg logit contributions | |
arrest | -0.042 |
av | -0.041 |
aches | -0.041 |
pe | -0.040 |
coins | -0.039 |
Token | fly |
Token ID | 6129 |
Feature activation | -2.94e-01 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.013 |
Time | +0.013 |
Why | +0.013 |
Where | +0.013 |
Neg logit contributions | |
endant | -0.026 |
av | -0.025 |
jewels | -0.025 |
arrest | -0.024 |
brace | -0.024 |
Token | I |
Token ID | 314 |
Feature activation | +5.86e-01 |
Pos logit contributions | |
endant | +0.027 |
av | +0.026 |
jewels | +0.026 |
arrest | +0.025 |
hy | +0.024 |
Neg logit contributions | |
Which | -0.021 |
Time | -0.020 |
ash | -0.020 |
idget | -0.019 |
Where | -0.019 |
Token | have |
Token ID | 423 |
Feature activation | +6.70e-02 |
Pos logit contributions | |
av | +0.021 |
endant | +0.021 |
brace | +0.021 |
jewels | +0.021 |
agged | +0.020 |
Neg logit contributions | |
Good | -0.012 |
Time | -0.012 |
Which | -0.012 |
Why | -0.011 |
Clean | -0.011 |
Token | to |
Token ID | 284 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
endant | +0.002 |
hy | +0.002 |
brace | +0.002 |
agged | +0.002 |
pe | +0.002 |
Neg logit contributions | |
Which | -0.001 |
Where | -0.001 |
Time | -0.001 |
Good | -0.001 |
Why | -0.001 |
Token | buy |
Token ID | 2822 |
Feature activation | -1.11e+00 |
Pos logit contributions | |
Which | +0.004 |
Time | +0.004 |
Why | +0.004 |
Good | +0.004 |
Time | +0.004 |
Neg logit contributions | |
endant | -0.009 |
jewels | -0.008 |
av | -0.008 |
brace | -0.008 |
arrest | -0.008 |
Token | a |
Token ID | 257 |
Feature activation | -2.85e+00 |
Pos logit contributions | |
Which | +0.034 |
Time | +0.033 |
idget | +0.032 |
Good | +0.032 |
ash | +0.032 |
Neg logit contributions | |
jewels | -0.028 |
av | -0.028 |
endant | -0.028 |
arrest | -0.027 |
coins | -0.027 |
Token | new |
Token ID | 649 |
Feature activation | -3.36e+00 |
Pos logit contributions | |
idget | +0.103 |
Why | +0.102 |
ting | +0.099 |
Kids | +0.099 |
Why | +0.099 |
Neg logit contributions | |
coins | -0.058 |
endant | -0.056 |
jewels | -0.056 |
av | -0.054 |
coin | -0.051 |
Token | one |
Token ID | 530 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
Kids | +0.107 |
idget | +0.107 |
Where | +0.105 |
Time | +0.104 |
Why | +0.103 |
Neg logit contributions | |
coins | -0.083 |
jewels | -0.080 |
av | -0.075 |
endant | -0.075 |
pe | -0.074 |
Token | ." |
Token ID | 526 |
Feature activation | +5.13e-02 |
Pos logit contributions | |
Time | +0.042 |
Which | +0.041 |
idget | +0.041 |
Good | +0.040 |
Kids | +0.039 |
Neg logit contributions | |
jewels | -0.038 |
endant | -0.038 |
av | -0.037 |
coins | -0.036 |
aches | -0.034 |
Token |
|
Token ID | 198 |
Feature activation | -4.25e-01 |
Pos logit contributions | |
endant | +0.001 |
av | +0.001 |
brace | +0.001 |
jewels | +0.001 |
� | +0.001 |
Neg logit contributions | |
Which | -0.002 |
ash | -0.002 |
Time | -0.001 |
stations | -0.001 |
idget | -0.001 |
Token |
|
Token ID | 198 |
Feature activation | +1.96e-01 |
Pos logit contributions | |
Which | +0.012 |
ash | +0.011 |
Good | +0.011 |
Time | +0.011 |
idget | +0.011 |
Neg logit contributions | |
endant | -0.011 |
av | -0.011 |
arrest | -0.011 |
jewels | -0.010 |
brace | -0.010 |
Token | L |
Token ID | 43 |
Feature activation | +5.78e-01 |
Pos logit contributions | |
brace | +0.005 |
endant | +0.005 |
av | +0.005 |
arrest | +0.005 |
aches | +0.005 |
Neg logit contributions | |
ash | -0.006 |
Good | -0.006 |
idget | -0.005 |
ting | -0.005 |
Which | -0.005 |
Token | ". |
Token ID | 1911 |
Feature activation | -9.82e-01 |
Pos logit contributions | |
Which | +0.026 |
Time | +0.024 |
Where | +0.023 |
Good | +0.023 |
idget | +0.022 |
Neg logit contributions | |
endant | -0.032 |
jewels | -0.031 |
av | -0.031 |
arrest | -0.030 |
brace | -0.030 |
Token | He |
Token ID | 679 |
Feature activation | -1.29e-03 |
Pos logit contributions | |
Which | +0.029 |
ash | +0.026 |
Where | +0.025 |
Why | +0.025 |
Time | +0.025 |
Neg logit contributions | |
endant | -0.025 |
hy | -0.025 |
jewels | -0.025 |
arrest | -0.025 |
av | -0.024 |
Token | handed |
Token ID | 10158 |
Feature activation | -1.41e+00 |
Pos logit contributions | |
Which | +0.000 |
Good | +0.000 |
Time | +0.000 |
Where | +0.000 |
Why | +0.000 |
Neg logit contributions | |
endant | -0.000 |
arrest | -0.000 |
jewels | -0.000 |
av | -0.000 |
hy | -0.000 |
Token | the |
Token ID | 262 |
Feature activation | +2.91e-01 |
Pos logit contributions | |
Which | +0.041 |
Good | +0.039 |
Time | +0.039 |
ash | +0.038 |
Why | +0.038 |
Neg logit contributions | |
endant | -0.039 |
av | -0.038 |
jewels | -0.038 |
arrest | -0.037 |
brace | -0.036 |
Token | squash |
Token ID | 34613 |
Feature activation | -1.02e+00 |
Pos logit contributions | |
endant | +0.009 |
arrest | +0.008 |
jewels | +0.008 |
av | +0.008 |
brace | +0.008 |
Neg logit contributions | |
Which | -0.008 |
Good | -0.008 |
Time | -0.008 |
Where | -0.008 |
Why | -0.008 |
Token | to |
Token ID | 284 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
Which | +0.028 |
Good | +0.026 |
Time | +0.026 |
ash | +0.025 |
Where | +0.025 |
Neg logit contributions | |
endant | -0.031 |
av | -0.030 |
jewels | -0.030 |
arrest | -0.029 |
brace | -0.028 |
Token | Olivia |
Token ID | 33911 |
Feature activation | -1.54e+00 |
Pos logit contributions | |
Which | +0.091 |
ash | +0.088 |
Good | +0.085 |
Time | +0.084 |
Ready | +0.081 |
Neg logit contributions | |
arrest | -0.092 |
jewels | -0.091 |
av | -0.090 |
endant | -0.089 |
brace | -0.088 |
Token | and |
Token ID | 290 |
Feature activation | -9.46e-01 |
Pos logit contributions | |
Which | +0.050 |
Time | +0.048 |
Good | +0.046 |
Where | +0.046 |
Why | +0.045 |
Neg logit contributions | |
av | -0.038 |
endant | -0.038 |
jewels | -0.037 |
arrest | -0.037 |
brace | -0.035 |
Token | gave |
Token ID | 2921 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Which | +0.027 |
Good | +0.026 |
Time | +0.026 |
Where | +0.025 |
Why | +0.025 |
Neg logit contributions | |
endant | -0.027 |
av | -0.026 |
jewels | -0.026 |
arrest | -0.026 |
brace | -0.025 |
Token | her |
Token ID | 607 |
Feature activation | +6.95e-02 |
Pos logit contributions | |
Which | +0.066 |
Time | +0.063 |
Good | +0.062 |
Why | +0.062 |
ash | +0.062 |
Neg logit contributions | |
jewels | -0.037 |
av | -0.036 |
brace | -0.035 |
coins | -0.035 |
endant | -0.034 |
Token | a |
Token ID | 257 |
Feature activation | -5.43e-01 |
Pos logit contributions | |
endant | +0.002 |
av | +0.002 |
jewels | +0.002 |
arrest | +0.002 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.002 |
Time | -0.002 |
Good | -0.002 |
ash | -0.002 |
Where | -0.002 |
Token | carry |
Token ID | 3283 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
Time | +0.028 |
Which | +0.028 |
Good | +0.028 |
Ready | +0.026 |
Kids | +0.026 |
Neg logit contributions | |
av | -0.026 |
endant | -0.025 |
jewels | -0.025 |
arrest | -0.024 |
aches | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | -3.07e-01 |
Pos logit contributions | |
Which | +0.005 |
ash | +0.005 |
Why | +0.005 |
Where | +0.005 |
over | +0.005 |
Neg logit contributions | |
endant | -0.007 |
arrest | -0.006 |
hy | -0.006 |
jewels | -0.006 |
av | -0.006 |
Token | laundry |
Token ID | 25724 |
Feature activation | -1.80e+00 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.008 |
Time | +0.008 |
ash | +0.007 |
Where | +0.007 |
Neg logit contributions | |
endant | -0.009 |
av | -0.009 |
jewels | -0.009 |
arrest | -0.009 |
brace | -0.009 |
Token | to |
Token ID | 284 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
Which | +0.034 |
ash | +0.032 |
Why | +0.031 |
idget | +0.031 |
Where | +0.031 |
Neg logit contributions | |
endant | -0.068 |
arrest | -0.065 |
jewels | -0.064 |
av | -0.064 |
brace | -0.063 |
Token | the |
Token ID | 262 |
Feature activation | -2.28e+00 |
Pos logit contributions | |
Which | +0.042 |
Why | +0.040 |
Time | +0.040 |
Where | +0.040 |
Good | +0.039 |
Neg logit contributions | |
endant | -0.052 |
jewels | -0.046 |
agged | -0.045 |
av | -0.045 |
hy | -0.045 |
Token | washing |
Token ID | 20518 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
rated | +0.083 |
ash | +0.083 |
idget | +0.082 |
tap | +0.077 |
Good | +0.076 |
Neg logit contributions | |
av | -0.047 |
coins | -0.047 |
arrest | -0.045 |
jewels | -0.042 |
brace | -0.039 |
Token | machine |
Token ID | 4572 |
Feature activation | -1.99e+00 |
Pos logit contributions | |
Good | +0.108 |
Which | +0.105 |
Time | +0.100 |
ksh | +0.098 |
idget | +0.097 |
Neg logit contributions | |
kins | -0.080 |
coins | -0.076 |
av | -0.074 |
arrest | -0.071 |
pe | -0.070 |
Token | . |
Token ID | 13 |
Feature activation | +1.09e-02 |
Pos logit contributions | |
Which | +0.045 |
Good | +0.042 |
Time | +0.042 |
Where | +0.040 |
Why | +0.039 |
Neg logit contributions | |
endant | -0.069 |
av | -0.067 |
jewels | -0.067 |
arrest | -0.066 |
brace | -0.064 |
Token | Tim |
Token ID | 5045 |
Feature activation | -7.56e-01 |
Pos logit contributions | |
endant | +0.000 |
av | +0.000 |
arrest | +0.000 |
jewels | +0.000 |
brace | +0.000 |
Neg logit contributions | |
Which | -0.000 |
Time | -0.000 |
Good | -0.000 |
ash | -0.000 |
Where | -0.000 |
Token | my |
Token ID | 1820 |
Feature activation | -4.67e-01 |
Pos logit contributions | |
Which | +0.014 |
Good | +0.013 |
Time | +0.013 |
Where | +0.013 |
Why | +0.012 |
Neg logit contributions | |
endant | -0.029 |
av | -0.028 |
jewels | -0.028 |
arrest | -0.028 |
brace | -0.027 |
Token | was |
Token ID | 373 |
Feature activation | -1.23e+00 |
Pos logit contributions | |
Which | +0.009 |
Good | +0.009 |
Time | +0.009 |
Why | +0.008 |
ash | +0.008 |
Neg logit contributions | |
endant | -0.018 |
jewels | -0.017 |
arrest | -0.017 |
av | -0.017 |
hy | -0.016 |
Token |
|
Token ID | 198 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
ash | +0.027 |
stations | +0.027 |
Which | +0.027 |
tap | +0.026 |
idget | +0.026 |
Neg logit contributions | |
av | -0.014 |
endant | -0.014 |
jewels | -0.014 |
hy | -0.012 |
coins | -0.012 |
Token |
|
Token ID | 198 |
Feature activation | -6.07e-02 |
Pos logit contributions | |
ash | +0.006 |
idget | +0.006 |
Which | +0.006 |
stations | +0.006 |
rated | +0.006 |
Neg logit contributions | |
endant | -0.005 |
jewels | -0.005 |
hy | -0.005 |
av | -0.005 |
arrest | -0.005 |
Token | â |
Token ID | 22940 |
Feature activation | -5.64e-01 |
Pos logit contributions | |
idget | +0.002 |
ash | +0.002 |
stations | +0.002 |
ting | +0.002 |
inter | +0.002 |
Neg logit contributions | |
endant | -0.001 |
hy | -0.001 |
jewels | -0.001 |
av | -0.001 |
arrest | -0.001 |
Token | € |
Token ID | 26391 |
Feature activation | +5.36e-01 |
Pos logit contributions | |
Which | +0.014 |
Where | +0.012 |
Time | +0.012 |
Good | +0.012 |
Why | +0.011 |
Neg logit contributions | |
endant | -0.019 |
hy | -0.018 |
pe | -0.018 |
arrest | -0.018 |
av | -0.018 |
Token | � |
Token ID | 129 |
Feature activation | -1.40e+00 |
Pos logit contributions | |
av | +0.018 |
endant | +0.018 |
jewels | +0.018 |
brace | +0.018 |
aches | +0.017 |
Neg logit contributions | |
Which | -0.012 |
Good | -0.012 |
Time | -0.011 |
Time | -0.011 |
Where | -0.011 |
Token | � |
Token ID | 241 |
Feature activation | -3.35e+00 |
Pos logit contributions | |
Which | +0.036 |
Time | +0.032 |
Good | +0.032 |
Where | +0.031 |
Which | +0.030 |
Neg logit contributions | |
endant | -0.046 |
arrest | -0.045 |
pe | -0.043 |
hy | -0.043 |
jewels | -0.042 |
Token | M |
Token ID | 44 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
ash | +0.080 |
idget | +0.077 |
nurses | +0.069 |
ting | +0.067 |
stations | +0.066 |
Neg logit contributions | |
hy | -0.100 |
pe | -0.095 |
arrest | -0.093 |
endant | -0.087 |
curly | -0.085 |
Token | um |
Token ID | 388 |
Feature activation | -6.91e-03 |
Pos logit contributions | |
endant | +0.013 |
jewels | +0.013 |
arrest | +0.013 |
av | +0.013 |
brace | +0.013 |
Neg logit contributions | |
Which | -0.012 |
Good | -0.011 |
Time | -0.011 |
ash | -0.011 |
Why | -0.011 |
Token | , |
Token ID | 11 |
Feature activation | -1.47e+00 |
Pos logit contributions | |
Good | +0.000 |
Which | +0.000 |
Time | +0.000 |
Time | +0.000 |
Why | +0.000 |
Neg logit contributions | |
endant | -0.000 |
arrest | -0.000 |
agged | -0.000 |
av | -0.000 |
jewels | -0.000 |
Token | look |
Token ID | 804 |
Feature activation | -1.97e+00 |
Pos logit contributions | |
Which | +0.039 |
ash | +0.038 |
idget | +0.037 |
Time | +0.037 |
Good | +0.037 |
Neg logit contributions | |
endant | -0.043 |
jewels | -0.042 |
av | -0.042 |
arrest | -0.040 |
coins | -0.039 |
Token | ! |
Token ID | 0 |
Feature activation | -4.83e-01 |
Pos logit contributions | |
Time | +0.055 |
Which | +0.055 |
Good | +0.052 |
Ready | +0.052 |
Kids | +0.051 |
Neg logit contributions | |
jewels | -0.057 |
endant | -0.056 |
av | -0.056 |
coins | -0.054 |
brace | -0.051 |
Token | " |
Token ID | 366 |
Feature activation | -3.06e+00 |
Pos logit contributions | |
ash | +0.103 |
Which | +0.100 |
idget | +0.097 |
stations | +0.097 |
rated | +0.093 |
Neg logit contributions | |
hy | -0.061 |
arrest | -0.059 |
� | -0.058 |
curly | -0.057 |
hips | -0.056 |
Token | What |
Token ID | 2061 |
Feature activation | -1.68e+00 |
Pos logit contributions | |
inter | +0.065 |
idget | +0.065 |
ash | +0.064 |
habit | +0.059 |
rated | +0.058 |
Neg logit contributions | |
pe | -0.089 |
arrest | -0.087 |
hy | -0.086 |
Chuck | -0.081 |
curly | -0.079 |
Token | are |
Token ID | 389 |
Feature activation | -6.77e-01 |
Pos logit contributions | |
idget | +0.046 |
Which | +0.045 |
Where | +0.044 |
Time | +0.043 |
ash | +0.043 |
Neg logit contributions | |
av | -0.049 |
endant | -0.047 |
jewels | -0.047 |
brace | -0.045 |
arrest | -0.045 |
Token | you |
Token ID | 345 |
Feature activation | -7.76e-01 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.023 |
Time | +0.023 |
idget | +0.023 |
ash | +0.022 |
Neg logit contributions | |
endant | -0.015 |
av | -0.014 |
jewels | -0.014 |
arrest | -0.014 |
brace | -0.013 |
Token | making |
Token ID | 1642 |
Feature activation | -8.62e-01 |
Pos logit contributions | |
Which | +0.025 |
Good | +0.023 |
Where | +0.023 |
idget | +0.023 |
Time | +0.023 |
Neg logit contributions | |
av | -0.019 |
arrest | -0.019 |
endant | -0.019 |
jewels | -0.018 |
aches | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | -3.34e+00 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.022 |
Time | +0.022 |
Where | +0.022 |
ash | +0.022 |
Neg logit contributions | |
endant | -0.025 |
av | -0.025 |
jewels | -0.025 |
arrest | -0.024 |
brace | -0.023 |
Token | Mama |
Token ID | 40084 |
Feature activation | -1.60e+00 |
Pos logit contributions | |
Which | +0.094 |
ash | +0.089 |
Where | +0.088 |
idget | +0.086 |
Ready | +0.085 |
Neg logit contributions | |
jewels | -0.085 |
coins | -0.082 |
arrest | -0.080 |
aches | -0.079 |
av | -0.078 |
Token | ?" |
Token ID | 1701 |
Feature activation | -2.73e+00 |
Pos logit contributions | |
Which | +0.052 |
Time | +0.049 |
Where | +0.049 |
Ready | +0.048 |
ash | +0.047 |
Neg logit contributions | |
av | -0.040 |
endant | -0.038 |
jewels | -0.038 |
aches | -0.036 |
arrest | -0.035 |
Token | asked |
Token ID | 1965 |
Feature activation | -3.26e+00 |
Pos logit contributions | |
ash | +0.078 |
Which | +0.077 |
stations | +0.072 |
Ready | +0.072 |
idget | +0.072 |
Neg logit contributions | |
arrest | -0.068 |
pe | -0.067 |
jewels | -0.067 |
av | -0.067 |
brace | -0.066 |
Token | Michael |
Token ID | 3899 |
Feature activation | -1.08e+00 |
Pos logit contributions | |
Which | +0.097 |
Ready | +0.089 |
ash | +0.088 |
Good | +0.085 |
Where | +0.085 |
Neg logit contributions | |
pe | -0.080 |
jewels | -0.079 |
coins | -0.079 |
av | -0.079 |
aches | -0.077 |
Token | . |
Token ID | 13 |
Feature activation | -3.10e+00 |
Pos logit contributions | |
Which | +0.030 |
Time | +0.028 |
Good | +0.027 |
Ready | +0.026 |
ash | +0.026 |
Neg logit contributions | |
endant | -0.032 |
av | -0.032 |
jewels | -0.031 |
brace | -0.031 |
hy | -0.030 |
Token | m |
Token ID | 285 |
Feature activation | +6.83e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
agged | +0.017 |
av | +0.017 |
jewels | +0.017 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.014 |
Time | -0.014 |
Time | -0.014 |
Clean | -0.014 |
Token | op |
Token ID | 404 |
Feature activation | -8.87e-01 |
Pos logit contributions | |
jewels | +0.022 |
av | +0.022 |
brace | +0.021 |
endant | +0.021 |
arrest | +0.021 |
Neg logit contributions | |
ash | -0.017 |
Which | -0.016 |
Good | -0.016 |
idget | -0.016 |
Time | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
Which | +0.019 |
ash | +0.018 |
Why | +0.018 |
Good | +0.017 |
Time | +0.017 |
Neg logit contributions | |
endant | -0.031 |
av | -0.030 |
jewels | -0.030 |
arrest | -0.030 |
brace | -0.029 |
Token | They |
Token ID | 1119 |
Feature activation | -3.02e-01 |
Pos logit contributions | |
idget | +0.041 |
rated | +0.041 |
ting | +0.041 |
ash | +0.040 |
ing | +0.040 |
Neg logit contributions | |
endant | -0.027 |
� | -0.026 |
av | -0.026 |
jewels | -0.025 |
arrest | -0.024 |
Token | use |
Token ID | 779 |
Feature activation | -8.65e-01 |
Pos logit contributions | |
Which | +0.006 |
Why | +0.006 |
Good | +0.006 |
Time | +0.006 |
ash | +0.005 |
Neg logit contributions | |
endant | -0.011 |
av | -0.011 |
jewels | -0.011 |
arrest | -0.011 |
brace | -0.010 |
Token | the |
Token ID | 262 |
Feature activation | -3.34e+00 |
Pos logit contributions | |
Which | +0.024 |
Good | +0.023 |
Time | +0.023 |
Where | +0.022 |
ash | +0.022 |
Neg logit contributions | |
endant | -0.025 |
av | -0.024 |
arrest | -0.024 |
jewels | -0.024 |
brace | -0.023 |
Token | m |
Token ID | 285 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
Good | +0.098 |
Which | +0.096 |
Kids | +0.096 |
idget | +0.095 |
Time | +0.095 |
Neg logit contributions | |
coins | -0.088 |
pe | -0.081 |
jewels | -0.081 |
endant | -0.077 |
aches | -0.076 |
Token | op |
Token ID | 404 |
Feature activation | -8.26e-01 |
Pos logit contributions | |
Which | +0.049 |
Good | +0.046 |
Where | +0.046 |
Time | +0.045 |
Ready | +0.045 |
Neg logit contributions | |
endant | -0.042 |
arrest | -0.038 |
aches | -0.038 |
pe | -0.038 |
av | -0.036 |
Token | to |
Token ID | 284 |
Feature activation | -1.33e+00 |
Pos logit contributions | |
Which | +0.018 |
ash | +0.018 |
Why | +0.017 |
over | +0.017 |
Good | +0.017 |
Neg logit contributions | |
endant | -0.028 |
av | -0.027 |
arrest | -0.027 |
jewels | -0.027 |
brace | -0.026 |
Token | make |
Token ID | 787 |
Feature activation | -2.12e+00 |
Pos logit contributions | |
Which | +0.025 |
Why | +0.025 |
Time | +0.024 |
Where | +0.023 |
ash | +0.023 |
Neg logit contributions | |
endant | -0.051 |
av | -0.048 |
jewels | -0.048 |
arrest | -0.046 |
agged | -0.046 |
Token | bubbles |
Token ID | 25037 |
Feature activation | -7.56e-01 |
Pos logit contributions | |
Which | +0.068 |
idget | +0.063 |
Kids | +0.063 |
Time | +0.063 |
Good | +0.063 |
Neg logit contributions | |
coins | -0.054 |
brace | -0.054 |
av | -0.054 |
jewels | -0.053 |
aches | -0.053 |
Token | was |
Token ID | 373 |
Feature activation | +8.62e-02 |
Pos logit contributions | |
Which | +0.027 |
Good | +0.025 |
ash | +0.025 |
Time | +0.024 |
idget | +0.024 |
Neg logit contributions | |
endant | -0.039 |
jewels | -0.038 |
arrest | -0.038 |
av | -0.038 |
brace | -0.037 |
Token | a |
Token ID | 257 |
Feature activation | +3.68e-02 |
Pos logit contributions | |
endant | +0.003 |
jewels | +0.003 |
arrest | +0.003 |
av | +0.003 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
Where | -0.002 |
Why | -0.002 |
Token | girl |
Token ID | 2576 |
Feature activation | +7.29e-01 |
Pos logit contributions | |
endant | +0.001 |
av | +0.001 |
jewels | +0.001 |
arrest | +0.001 |
brace | +0.001 |
Neg logit contributions | |
Which | -0.001 |
ash | -0.001 |
Good | -0.001 |
Time | -0.001 |
idget | -0.001 |
Token | named |
Token ID | 3706 |
Feature activation | +2.57e-01 |
Pos logit contributions | |
endant | +0.014 |
arrest | +0.014 |
av | +0.013 |
jewels | +0.013 |
brace | +0.013 |
Neg logit contributions | |
Which | -0.027 |
Good | -0.026 |
Time | -0.026 |
Ready | -0.026 |
idget | -0.026 |
Token | Jane |
Token ID | 12091 |
Feature activation | -5.19e-01 |
Pos logit contributions | |
endant | +0.008 |
av | +0.008 |
jewels | +0.007 |
arrest | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.007 |
Time | -0.007 |
Good | -0.007 |
ash | -0.006 |
Why | -0.006 |
Token | . |
Token ID | 13 |
Feature activation | +2.39e+00 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.015 |
Ready | +0.015 |
Time | +0.014 |
Which | +0.014 |
Neg logit contributions | |
endant | -0.015 |
brace | -0.014 |
av | -0.014 |
jewels | -0.014 |
arrest | -0.014 |
Token | She |
Token ID | 1375 |
Feature activation | +7.92e-01 |
Pos logit contributions | |
endant | +0.065 |
av | +0.063 |
jewels | +0.062 |
arrest | +0.062 |
brace | +0.060 |
Neg logit contributions | |
Which | -0.071 |
Good | -0.068 |
Time | -0.067 |
ash | -0.066 |
Where | -0.066 |
Token | was |
Token ID | 373 |
Feature activation | -3.23e-01 |
Pos logit contributions | |
endant | +0.028 |
av | +0.027 |
jewels | +0.026 |
arrest | +0.026 |
brace | +0.025 |
Neg logit contributions | |
Which | -0.018 |
Good | -0.017 |
Time | -0.017 |
Why | -0.017 |
Where | -0.017 |
Token | very |
Token ID | 845 |
Feature activation | +7.20e-01 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.007 |
Why | +0.007 |
Time | +0.007 |
Where | +0.007 |
Neg logit contributions | |
endant | -0.011 |
arrest | -0.010 |
jewels | -0.010 |
av | -0.010 |
pe | -0.010 |
Token | lazy |
Token ID | 16931 |
Feature activation | +1.42e-01 |
Pos logit contributions | |
endant | +0.023 |
arrest | +0.023 |
jewels | +0.022 |
brace | +0.022 |
av | +0.022 |
Neg logit contributions | |
Good | -0.017 |
Clean | -0.017 |
Time | -0.016 |
Time | -0.016 |
Which | -0.016 |
Token | and |
Token ID | 290 |
Feature activation | -3.05e-01 |
Pos logit contributions | |
jewels | +0.003 |
av | +0.003 |
endant | +0.003 |
arrest | +0.003 |
coins | +0.003 |
Neg logit contributions | |
Which | -0.005 |
Time | -0.005 |
Ready | -0.005 |
Good | -0.004 |
idget | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.003 |
ash | +0.003 |
Time | +0.003 |
idget | +0.003 |
Neg logit contributions | |
endant | -0.004 |
arrest | -0.004 |
av | -0.004 |
jewels | -0.004 |
brace | -0.004 |
Token | The |
Token ID | 464 |
Feature activation | +3.56e-01 |
Pos logit contributions | |
arrest | +0.014 |
brace | +0.013 |
av | +0.013 |
endant | +0.013 |
aches | +0.013 |
Neg logit contributions | |
ash | -0.015 |
Good | -0.015 |
Which | -0.015 |
idget | -0.015 |
Time | -0.014 |
Token | little |
Token ID | 1310 |
Feature activation | +5.43e-01 |
Pos logit contributions | |
endant | +0.011 |
jewels | +0.011 |
av | +0.011 |
arrest | +0.011 |
brace | +0.010 |
Neg logit contributions | |
Which | -0.009 |
ash | -0.009 |
Good | -0.009 |
Time | -0.009 |
idget | -0.009 |
Token | girl |
Token ID | 2576 |
Feature activation | +9.67e-02 |
Pos logit contributions | |
jewels | +0.022 |
endant | +0.022 |
av | +0.022 |
brace | +0.021 |
arrest | +0.021 |
Neg logit contributions | |
Which | -0.009 |
ash | -0.009 |
Good | -0.009 |
Time | -0.008 |
idget | -0.008 |
Token | put |
Token ID | 1234 |
Feature activation | +1.62e+00 |
Pos logit contributions | |
endant | +0.004 |
av | +0.004 |
arrest | +0.004 |
jewels | +0.004 |
hy | +0.004 |
Neg logit contributions | |
Clean | -0.002 |
Which | -0.002 |
over | -0.002 |
Good | -0.001 |
Why | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +2.76e+00 |
Pos logit contributions | |
arrest | +0.063 |
endant | +0.063 |
hy | +0.060 |
vern | +0.059 |
pe | +0.058 |
Neg logit contributions | |
over | -0.033 |
Which | -0.032 |
What | -0.030 |
Where | -0.029 |
Why | -0.028 |
Token | fake |
Token ID | 8390 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
arrest | +0.074 |
hy | +0.071 |
agged | +0.071 |
aches | +0.068 |
onna | +0.067 |
Neg logit contributions | |
Which | -0.079 |
What | -0.079 |
Where | -0.079 |
end | -0.077 |
Why | -0.073 |
Token | gem |
Token ID | 16840 |
Feature activation | +6.38e-01 |
Pos logit contributions | |
hy | +0.038 |
arrest | +0.038 |
agged | +0.035 |
aches | +0.035 |
endant | +0.034 |
Neg logit contributions | |
Which | -0.047 |
over | -0.045 |
Where | -0.045 |
when | -0.044 |
What | -0.044 |
Token | in |
Token ID | 287 |
Feature activation | +9.98e-01 |
Pos logit contributions | |
arrest | +0.028 |
endant | +0.027 |
hy | +0.026 |
av | +0.025 |
vern | +0.025 |
Neg logit contributions | |
over | -0.011 |
when | -0.010 |
across | -0.008 |
ing | -0.008 |
Which | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | +1.14e+00 |
Pos logit contributions | |
endant | +0.044 |
agged | +0.039 |
aches | +0.039 |
av | +0.039 |
ls | +0.038 |
Neg logit contributions | |
when | -0.018 |
over | -0.018 |
Where | -0.017 |
Why | -0.017 |
What | -0.016 |
Token | pocket |
Token ID | 10000 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
aches | +0.030 |
arrest | +0.028 |
av | +0.028 |
pe | +0.027 |
endant | +0.027 |
Neg logit contributions | |
Clean | -0.034 |
Which | -0.034 |
Which | -0.032 |
Good | -0.031 |
Where | -0.031 |
Token | said |
Token ID | 531 |
Feature activation | +1.48e+00 |
Pos logit contributions | |
endant | +0.027 |
arrest | +0.027 |
av | +0.027 |
pe | +0.026 |
hy | +0.026 |
Neg logit contributions | |
Which | -0.017 |
Clean | -0.016 |
over | -0.015 |
Where | -0.015 |
Why | -0.015 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e-01 |
Pos logit contributions | |
endant | +0.049 |
arrest | +0.047 |
� | +0.042 |
agged | +0.042 |
jewels | +0.042 |
Neg logit contributions | |
Which | -0.037 |
Good | -0.036 |
Why | -0.035 |
Which | -0.034 |
over | -0.034 |
Token | " |
Token ID | 366 |
Feature activation | -2.09e-01 |
Pos logit contributions | |
Which | +0.002 |
ash | +0.002 |
Time | +0.002 |
Good | +0.002 |
idget | +0.002 |
Neg logit contributions | |
endant | -0.004 |
av | -0.004 |
jewels | -0.004 |
arrest | -0.004 |
brace | -0.003 |
Token | Wow |
Token ID | 22017 |
Feature activation | +1.62e-01 |
Pos logit contributions | |
ash | +0.005 |
idget | +0.005 |
Which | +0.005 |
Good | +0.005 |
inter | +0.005 |
Neg logit contributions | |
arrest | -0.006 |
brace | -0.006 |
av | -0.006 |
jewels | -0.006 |
pe | -0.006 |
Token | ! |
Token ID | 0 |
Feature activation | +5.82e-01 |
Pos logit contributions | |
endant | +0.004 |
jewels | +0.004 |
av | +0.004 |
arrest | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.005 |
Time | -0.005 |
Good | -0.005 |
Where | -0.005 |
Why | -0.005 |
Token | Can |
Token ID | 1680 |
Feature activation | +2.56e+00 |
Pos logit contributions | |
endant | +0.018 |
av | +0.017 |
jewels | +0.017 |
arrest | +0.017 |
hy | +0.017 |
Neg logit contributions | |
Which | -0.015 |
Time | -0.014 |
ash | -0.014 |
idget | -0.014 |
Where | -0.014 |
Token | you |
Token ID | 345 |
Feature activation | +8.71e-01 |
Pos logit contributions | |
endant | +0.099 |
agged | +0.094 |
av | +0.094 |
aches | +0.092 |
jewels | +0.092 |
Neg logit contributions | |
Which | -0.054 |
Why | -0.052 |
Which | -0.051 |
Good | -0.051 |
Why | -0.049 |
Token | help |
Token ID | 1037 |
Feature activation | -3.10e-01 |
Pos logit contributions | |
endant | +0.031 |
av | +0.029 |
agged | +0.028 |
jewels | +0.028 |
kins | +0.028 |
Neg logit contributions | |
Which | -0.019 |
Why | -0.019 |
when | -0.018 |
Clean | -0.018 |
Where | -0.018 |
Token | me |
Token ID | 502 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.008 |
Time | +0.008 |
ash | +0.007 |
idget | +0.007 |
Neg logit contributions | |
endant | -0.010 |
av | -0.010 |
jewels | -0.009 |
arrest | -0.009 |
brace | -0.009 |
Token | lock |
Token ID | 5793 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
endant | +0.017 |
jewels | +0.016 |
av | +0.016 |
arrest | +0.016 |
brace | +0.015 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.014 |
Why | -0.014 |
Where | -0.014 |
Time | -0.014 |
Token | my |
Token ID | 616 |
Feature activation | -2.93e-01 |
Pos logit contributions | |
Which | +0.012 |
Good | +0.012 |
Time | +0.012 |
Why | +0.011 |
ash | +0.011 |
Neg logit contributions | |
endant | -0.010 |
av | -0.010 |
arrest | -0.010 |
jewels | -0.010 |
brace | -0.009 |
Token | . |
Token ID | 13 |
Feature activation | -2.96e-01 |
Pos logit contributions | |
Which | +0.010 |
Good | +0.009 |
ash | +0.009 |
Time | +0.009 |
Why | +0.009 |
Neg logit contributions | |
endant | -0.020 |
arrest | -0.019 |
jewels | -0.019 |
av | -0.019 |
brace | -0.018 |
Token | It |
Token ID | 632 |
Feature activation | -4.28e-02 |
Pos logit contributions | |
Time | +0.008 |
idget | +0.008 |
ash | +0.008 |
Which | +0.008 |
Where | +0.008 |
Neg logit contributions | |
endant | -0.008 |
jewels | -0.008 |
av | -0.008 |
arrest | -0.008 |
hy | -0.008 |
Token | 's |
Token ID | 338 |
Feature activation | -3.58e-02 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Why | +0.001 |
ash | +0.001 |
Neg logit contributions | |
endant | -0.002 |
av | -0.002 |
jewels | -0.002 |
arrest | -0.002 |
brace | -0.001 |
Token | pretty |
Token ID | 2495 |
Feature activation | +2.53e-01 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Why | +0.001 |
Where | +0.001 |
Neg logit contributions | |
arrest | -0.001 |
endant | -0.001 |
av | -0.001 |
jewels | -0.001 |
hy | -0.001 |
Token | . |
Token ID | 13 |
Feature activation | -1.07e-02 |
Pos logit contributions | |
endant | +0.009 |
arrest | +0.009 |
av | +0.009 |
jewels | +0.008 |
brace | +0.008 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.005 |
Time | -0.005 |
ash | -0.005 |
Why | -0.005 |
Token | Can |
Token ID | 1680 |
Feature activation | +2.47e+00 |
Pos logit contributions | |
ash | +0.000 |
idget | +0.000 |
Time | +0.000 |
Which | +0.000 |
Where | +0.000 |
Neg logit contributions | |
endant | -0.000 |
jewels | -0.000 |
av | -0.000 |
arrest | -0.000 |
hy | -0.000 |
Token | I |
Token ID | 314 |
Feature activation | +5.34e-01 |
Pos logit contributions | |
endant | +0.096 |
agged | +0.094 |
jewels | +0.091 |
av | +0.090 |
arrest | +0.088 |
Neg logit contributions | |
Why | -0.052 |
Which | -0.050 |
Why | -0.048 |
Which | -0.047 |
What | -0.046 |
Token | play |
Token ID | 711 |
Feature activation | +6.56e-01 |
Pos logit contributions | |
av | +0.018 |
endant | +0.018 |
jewels | +0.018 |
arrest | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.012 |
Good | -0.012 |
Why | -0.011 |
Clean | -0.011 |
Time | -0.011 |
Token | with |
Token ID | 351 |
Feature activation | +6.90e-01 |
Pos logit contributions | |
endant | +0.019 |
av | +0.018 |
jewels | +0.018 |
arrest | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.019 |
Good | -0.018 |
Time | -0.018 |
Why | -0.017 |
Where | -0.017 |
Token | it |
Token ID | 340 |
Feature activation | -3.98e-01 |
Pos logit contributions | |
endant | +0.021 |
arrest | +0.020 |
jewels | +0.020 |
av | +0.020 |
hy | +0.019 |
Neg logit contributions | |
Which | -0.019 |
Why | -0.018 |
Good | -0.017 |
Where | -0.017 |
What | -0.017 |
Token | later |
Token ID | 1568 |
Feature activation | -6.46e-02 |
Pos logit contributions | |
Which | +0.010 |
Good | +0.009 |
Time | +0.009 |
Why | +0.009 |
ash | +0.009 |
Neg logit contributions | |
endant | -0.013 |
arrest | -0.013 |
jewels | -0.013 |
av | -0.013 |
brace | -0.012 |
Token | , |
Token ID | 11 |
Feature activation | +3.25e-01 |
Pos logit contributions | |
endant | +0.055 |
arrest | +0.053 |
av | +0.052 |
jewels | +0.052 |
brace | +0.052 |
Neg logit contributions | |
Good | -0.036 |
Time | -0.036 |
Which | -0.035 |
Why | -0.034 |
Time | -0.034 |
Token | there |
Token ID | 612 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
endant | +0.008 |
jewels | +0.008 |
av | +0.008 |
arrest | +0.008 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.010 |
Good | -0.010 |
Time | -0.010 |
ash | -0.010 |
idget | -0.009 |
Token | lived |
Token ID | 5615 |
Feature activation | +1.51e-03 |
Pos logit contributions | |
Which | +0.034 |
ash | +0.031 |
Time | +0.031 |
Good | +0.031 |
idget | +0.031 |
Neg logit contributions | |
endant | -0.047 |
av | -0.046 |
jewels | -0.046 |
arrest | -0.046 |
brace | -0.044 |
Token | a |
Token ID | 257 |
Feature activation | -2.13e-02 |
Pos logit contributions | |
endant | +0.000 |
jewels | +0.000 |
arrest | +0.000 |
av | +0.000 |
brace | +0.000 |
Neg logit contributions | |
Which | -0.000 |
Good | -0.000 |
Time | -0.000 |
Where | -0.000 |
Why | -0.000 |
Token | 3 |
Token ID | 513 |
Feature activation | +1.74e+00 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Where | +0.001 |
ash | +0.001 |
Neg logit contributions | |
endant | -0.001 |
av | -0.001 |
jewels | -0.001 |
arrest | -0.001 |
brace | -0.001 |
Token | year |
Token ID | 614 |
Feature activation | +2.32e+00 |
Pos logit contributions | |
endant | +0.053 |
jewels | +0.049 |
av | +0.048 |
arrest | +0.048 |
brace | +0.048 |
Neg logit contributions | |
Which | -0.045 |
Time | -0.044 |
ash | -0.044 |
Why | -0.043 |
Good | -0.043 |
Token | old |
Token ID | 1468 |
Feature activation | -1.75e-01 |
Pos logit contributions | |
arrest | +0.074 |
� | +0.072 |
agged | +0.070 |
endant | +0.069 |
brace | +0.068 |
Neg logit contributions | |
ash | -0.051 |
Clean | -0.050 |
ing | -0.049 |
over | -0.048 |
Time | -0.048 |
Token | called |
Token ID | 1444 |
Feature activation | +7.43e-01 |
Pos logit contributions | |
Which | +0.003 |
Good | +0.003 |
Time | +0.003 |
Why | +0.003 |
Where | +0.003 |
Neg logit contributions | |
endant | -0.007 |
arrest | -0.006 |
av | -0.006 |
jewels | -0.006 |
brace | -0.006 |
Token | Lucy |
Token ID | 22162 |
Feature activation | -1.45e+00 |
Pos logit contributions | |
endant | +0.024 |
arrest | +0.022 |
jewels | +0.022 |
av | +0.022 |
brace | +0.022 |
Neg logit contributions | |
Good | -0.018 |
Which | -0.018 |
Time | -0.018 |
Time | -0.017 |
ash | -0.017 |
Token | . |
Token ID | 13 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
Which | +0.044 |
Ready | +0.044 |
Time | +0.043 |
ash | +0.041 |
Good | +0.041 |
Neg logit contributions | |
jewels | -0.039 |
endant | -0.039 |
arrest | -0.038 |
hy | -0.037 |
av | -0.037 |
Token | One |
Token ID | 1881 |
Feature activation | -5.80e-01 |
Pos logit contributions | |
endant | +0.044 |
av | +0.042 |
jewels | +0.042 |
arrest | +0.042 |
brace | +0.040 |
Neg logit contributions | |
Which | -0.045 |
Good | -0.043 |
Time | -0.043 |
ash | -0.042 |
Where | -0.042 |
Token | he |
Token ID | 339 |
Feature activation | -4.14e-01 |
Pos logit contributions | |
Which | +0.002 |
Good | +0.002 |
Where | +0.002 |
Time | +0.002 |
Why | +0.002 |
Neg logit contributions | |
endant | -0.002 |
arrest | -0.002 |
av | -0.002 |
jewels | -0.002 |
brace | -0.002 |
Token | knew |
Token ID | 2993 |
Feature activation | +9.16e-02 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.008 |
Where | +0.008 |
Time | +0.008 |
Why | +0.008 |
Neg logit contributions | |
endant | -0.015 |
av | -0.015 |
arrest | -0.015 |
jewels | -0.014 |
agged | -0.014 |
Token | he |
Token ID | 339 |
Feature activation | +5.50e-01 |
Pos logit contributions | |
endant | +0.003 |
arrest | +0.003 |
agged | +0.003 |
brace | +0.003 |
av | +0.003 |
Neg logit contributions | |
Which | -0.003 |
Where | -0.002 |
Good | -0.002 |
Why | -0.002 |
Time | -0.002 |
Token | had |
Token ID | 550 |
Feature activation | -8.80e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
av | +0.018 |
jewels | +0.018 |
brace | +0.018 |
Neg logit contributions | |
Which | -0.013 |
Good | -0.012 |
Time | -0.012 |
Where | -0.012 |
Why | -0.012 |
Token | to |
Token ID | 284 |
Feature activation | -1.86e-01 |
Pos logit contributions | |
Which | +0.024 |
Time | +0.022 |
Good | +0.022 |
Where | +0.022 |
Why | +0.022 |
Neg logit contributions | |
endant | -0.028 |
arrest | -0.026 |
av | -0.026 |
jewels | -0.025 |
brace | -0.025 |
Token | share |
Token ID | 2648 |
Feature activation | +6.25e-01 |
Pos logit contributions | |
Time | +0.003 |
Why | +0.003 |
Time | +0.003 |
Good | +0.003 |
Which | +0.003 |
Neg logit contributions | |
endant | -0.007 |
av | -0.007 |
jewels | -0.007 |
agged | -0.006 |
brace | -0.006 |
Token | this |
Token ID | 428 |
Feature activation | +1.03e+00 |
Pos logit contributions | |
endant | +0.021 |
arrest | +0.020 |
hy | +0.019 |
agged | +0.019 |
� | +0.019 |
Neg logit contributions | |
Which | -0.016 |
over | -0.015 |
Why | -0.015 |
Where | -0.015 |
What | -0.015 |
Token | special |
Token ID | 2041 |
Feature activation | +9.92e-01 |
Pos logit contributions | |
endant | +0.030 |
arrest | +0.030 |
av | +0.029 |
jewels | +0.028 |
hy | +0.028 |
Neg logit contributions | |
Which | -0.028 |
Good | -0.026 |
Time | -0.026 |
Where | -0.026 |
Why | -0.026 |
Token | discovery |
Token ID | 9412 |
Feature activation | +4.72e-01 |
Pos logit contributions | |
endant | +0.043 |
av | +0.041 |
arrest | +0.041 |
jewels | +0.041 |
brace | +0.040 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.012 |
Time | -0.012 |
Where | -0.012 |
Why | -0.012 |
Token | with |
Token ID | 351 |
Feature activation | +9.14e-01 |
Pos logit contributions | |
endant | +0.018 |
arrest | +0.017 |
av | +0.016 |
agged | +0.016 |
jewels | +0.016 |
Neg logit contributions | |
Which | -0.009 |
over | -0.009 |
Why | -0.009 |
ash | -0.009 |
when | -0.009 |
Token | the |
Token ID | 262 |
Feature activation | +6.10e-01 |
Pos logit contributions | |
endant | +0.030 |
arrest | +0.026 |
hy | +0.026 |
brace | +0.025 |
av | +0.025 |
Neg logit contributions | |
Which | -0.023 |
Where | -0.023 |
Why | -0.023 |
when | -0.022 |
over | -0.022 |
Token | flowers |
Token ID | 12734 |
Feature activation | +1.66e-01 |
Pos logit contributions | |
endant | +0.023 |
arrest | +0.022 |
av | +0.022 |
jewels | +0.022 |
brace | +0.021 |
Neg logit contributions | |
Which | -0.022 |
Good | -0.021 |
Time | -0.021 |
Where | -0.020 |
Why | -0.020 |
Token | . |
Token ID | 13 |
Feature activation | -2.65e-01 |
Pos logit contributions | |
endant | +0.006 |
arrest | +0.006 |
av | +0.006 |
jewels | +0.006 |
brace | +0.006 |
Neg logit contributions | |
Which | -0.003 |
Time | -0.003 |
Why | -0.003 |
Good | -0.003 |
Where | -0.003 |
Token | He |
Token ID | 679 |
Feature activation | +6.79e-01 |
Pos logit contributions | |
Which | +0.010 |
ash | +0.010 |
Time | +0.010 |
idget | +0.009 |
stations | +0.009 |
Neg logit contributions | |
av | -0.005 |
endant | -0.005 |
jewels | -0.005 |
arrest | -0.004 |
brace | -0.004 |
Token | wanted |
Token ID | 2227 |
Feature activation | +7.78e-01 |
Pos logit contributions | |
endant | +0.023 |
arrest | +0.022 |
av | +0.022 |
jewels | +0.022 |
brace | +0.021 |
Neg logit contributions | |
Which | -0.016 |
Good | -0.015 |
Time | -0.015 |
Why | -0.015 |
Where | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | +3.89e-01 |
Pos logit contributions | |
endant | +0.031 |
arrest | +0.029 |
agged | +0.029 |
hy | +0.028 |
� | +0.028 |
Neg logit contributions | |
Which | -0.016 |
over | -0.014 |
Why | -0.014 |
Where | -0.014 |
Time | -0.013 |
Token | gather |
Token ID | 6431 |
Feature activation | +1.21e+00 |
Pos logit contributions | |
endant | +0.015 |
jewels | +0.014 |
av | +0.014 |
agged | +0.014 |
arrest | +0.014 |
Neg logit contributions | |
Which | -0.007 |
Why | -0.007 |
over | -0.006 |
Where | -0.006 |
What | -0.006 |
Token | them |
Token ID | 606 |
Feature activation | +2.05e-03 |
Pos logit contributions | |
arrest | +0.047 |
endant | +0.046 |
hy | +0.044 |
pe | +0.043 |
� | +0.043 |
Neg logit contributions | |
over | -0.023 |
Which | -0.023 |
Why | -0.021 |
What | -0.020 |
Where | -0.020 |
Token | for |
Token ID | 329 |
Feature activation | +1.31e+00 |
Pos logit contributions | |
arrest | +0.000 |
endant | +0.000 |
hy | +0.000 |
agged | +0.000 |
av | +0.000 |
Neg logit contributions | |
over | -0.000 |
Which | -0.000 |
when | -0.000 |
ash | -0.000 |
Why | -0.000 |
Token | his |
Token ID | 465 |
Feature activation | +6.01e-01 |
Pos logit contributions | |
endant | +0.049 |
hy | +0.044 |
arrest | +0.042 |
av | +0.041 |
agged | +0.041 |
Neg logit contributions | |
Which | -0.028 |
Where | -0.027 |
What | -0.027 |
Why | -0.026 |
when | -0.026 |
Token | mom |
Token ID | 1995 |
Feature activation | -7.35e-01 |
Pos logit contributions | |
endant | +0.017 |
arrest | +0.017 |
agged | +0.017 |
hy | +0.016 |
aches | +0.016 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.015 |
Why | -0.014 |
Where | -0.014 |
Clean | -0.014 |
Token | my |
Token ID | 1820 |
Feature activation | -9.76e-01 |
Pos logit contributions | |
Which | +0.015 |
Time | +0.015 |
Good | +0.015 |
Where | +0.014 |
Ready | +0.013 |
Neg logit contributions | |
endant | -0.026 |
av | -0.026 |
jewels | -0.026 |
brace | -0.025 |
arrest | -0.025 |
Token | wonder |
Token ID | 4240 |
Feature activation | -3.63e-01 |
Pos logit contributions | |
Which | +0.002 |
Why | +0.002 |
Good | +0.002 |
Time | +0.002 |
What | +0.002 |
Neg logit contributions | |
endant | -0.003 |
agged | -0.003 |
av | -0.003 |
jewels | -0.003 |
arrest | -0.002 |
Token | what |
Token ID | 644 |
Feature activation | +3.69e-04 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.006 |
Why | +0.006 |
Where | +0.006 |
ash | +0.006 |
Neg logit contributions | |
endant | -0.014 |
arrest | -0.013 |
av | -0.013 |
jewels | -0.013 |
brace | -0.013 |
Token | other |
Token ID | 584 |
Feature activation | +5.72e-01 |
Pos logit contributions | |
endant | +0.000 |
arrest | +0.000 |
av | +0.000 |
jewels | +0.000 |
brace | +0.000 |
Neg logit contributions | |
Which | -0.000 |
Good | -0.000 |
Time | -0.000 |
Where | -0.000 |
Why | -0.000 |
Token | surprises |
Token ID | 24072 |
Feature activation | +4.41e-01 |
Pos logit contributions | |
endant | +0.019 |
arrest | +0.018 |
av | +0.018 |
jewels | +0.018 |
brace | +0.018 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.013 |
Time | -0.013 |
Where | -0.012 |
Why | -0.012 |
Token | he |
Token ID | 339 |
Feature activation | +1.46e+00 |
Pos logit contributions | |
endant | +0.015 |
arrest | +0.015 |
agged | +0.014 |
av | +0.014 |
brace | +0.013 |
Neg logit contributions | |
over | -0.010 |
when | -0.009 |
Which | -0.009 |
Why | -0.009 |
Good | -0.009 |
Token | would |
Token ID | 561 |
Feature activation | +1.43e+00 |
Pos logit contributions | |
endant | +0.053 |
arrest | +0.053 |
av | +0.051 |
brace | +0.050 |
jewels | +0.050 |
Neg logit contributions | |
Which | -0.030 |
Where | -0.028 |
Why | -0.028 |
Good | -0.028 |
Time | -0.027 |
Token | find |
Token ID | 1064 |
Feature activation | -4.93e-01 |
Pos logit contributions | |
endant | +0.059 |
agged | +0.056 |
av | +0.056 |
jewels | +0.054 |
brace | +0.053 |
Neg logit contributions | |
Why | -0.025 |
Which | -0.023 |
Where | -0.023 |
over | -0.023 |
when | -0.022 |
Token | . |
Token ID | 13 |
Feature activation | +1.36e-01 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.008 |
Why | +0.008 |
ash | +0.007 |
over | +0.007 |
Neg logit contributions | |
endant | -0.020 |
arrest | -0.019 |
brace | -0.019 |
av | -0.019 |
jewels | -0.018 |
Token | He |
Token ID | 679 |
Feature activation | +9.94e-01 |
Pos logit contributions | |
endant | +0.004 |
av | +0.004 |
jewels | +0.004 |
arrest | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.003 |
Good | -0.003 |
Time | -0.003 |
ash | -0.003 |
Where | -0.003 |
Token | knew |
Token ID | 2993 |
Feature activation | +1.40e-01 |
Pos logit contributions | |
endant | +0.036 |
av | +0.036 |
arrest | +0.035 |
agged | +0.034 |
jewels | +0.033 |
Neg logit contributions | |
Which | -0.020 |
over | -0.018 |
Where | -0.018 |
Good | -0.018 |
Why | -0.018 |
Token | it |
Token ID | 340 |
Feature activation | +9.80e-02 |
Pos logit contributions | |
endant | +0.005 |
agged | +0.005 |
arrest | +0.005 |
brace | +0.004 |
av | +0.004 |
Neg logit contributions | |
Which | -0.003 |
when | -0.003 |
why | -0.003 |
Where | -0.003 |
over | -0.003 |
Token | back |
Token ID | 736 |
Feature activation | -1.02e-01 |
Pos logit contributions | |
Which | +0.000 |
Good | +0.000 |
ash | +0.000 |
Where | +0.000 |
Time | +0.000 |
Neg logit contributions | |
endant | -0.000 |
arrest | -0.000 |
av | -0.000 |
jewels | -0.000 |
aches | -0.000 |
Token | . |
Token ID | 13 |
Feature activation | +7.31e-02 |
Pos logit contributions | |
Which | +0.002 |
Good | +0.002 |
Time | +0.002 |
Where | +0.002 |
Why | +0.002 |
Neg logit contributions | |
endant | -0.004 |
jewels | -0.003 |
av | -0.003 |
arrest | -0.003 |
brace | -0.003 |
Token | But |
Token ID | 887 |
Feature activation | +1.72e-01 |
Pos logit contributions | |
endant | +0.003 |
jewels | +0.003 |
aches | +0.003 |
arrest | +0.003 |
av | +0.003 |
Neg logit contributions | |
Which | -0.001 |
Good | -0.001 |
Why | -0.001 |
Why | -0.001 |
Time | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | -5.51e-01 |
Pos logit contributions | |
endant | +0.006 |
agged | +0.006 |
arrest | +0.006 |
av | +0.006 |
vern | +0.005 |
Neg logit contributions | |
Which | -0.004 |
Why | -0.004 |
when | -0.004 |
Where | -0.004 |
over | -0.004 |
Token | dog |
Token ID | 3290 |
Feature activation | +3.30e-01 |
Pos logit contributions | |
Which | +0.016 |
ash | +0.015 |
Good | +0.015 |
idget | +0.015 |
Time | +0.015 |
Neg logit contributions | |
endant | -0.015 |
jewels | -0.015 |
arrest | -0.015 |
av | -0.015 |
brace | -0.014 |
Token | did |
Token ID | 750 |
Feature activation | +1.19e+00 |
Pos logit contributions | |
endant | +0.012 |
av | +0.012 |
jewels | +0.012 |
arrest | +0.011 |
vern | +0.011 |
Neg logit contributions | |
Why | -0.007 |
Which | -0.007 |
Where | -0.006 |
when | -0.006 |
over | -0.006 |
Token | not |
Token ID | 407 |
Feature activation | +2.06e-03 |
Pos logit contributions | |
endant | +0.029 |
av | +0.026 |
jewels | +0.024 |
agged | +0.023 |
arrest | +0.023 |
Neg logit contributions | |
Why | -0.043 |
Which | -0.042 |
over | -0.041 |
Where | -0.041 |
when | -0.041 |
Token | like |
Token ID | 588 |
Feature activation | +6.37e-01 |
Pos logit contributions | |
endant | +0.000 |
av | +0.000 |
jewels | +0.000 |
arrest | +0.000 |
brace | +0.000 |
Neg logit contributions | |
Which | -0.000 |
Good | -0.000 |
Time | -0.000 |
Where | -0.000 |
ash | -0.000 |
Token | that |
Token ID | 326 |
Feature activation | -5.64e-01 |
Pos logit contributions | |
endant | +0.021 |
av | +0.019 |
arrest | +0.019 |
jewels | +0.019 |
agged | +0.018 |
Neg logit contributions | |
Which | -0.016 |
Why | -0.016 |
Where | -0.015 |
Time | -0.015 |
Good | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | +7.23e-01 |
Pos logit contributions | |
Which | +0.014 |
Good | +0.014 |
idget | +0.013 |
Time | +0.013 |
ash | +0.013 |
Neg logit contributions | |
jewels | -0.017 |
av | -0.017 |
endant | -0.017 |
brace | -0.017 |
arrest | -0.017 |
Token | He |
Token ID | 679 |
Feature activation | +9.95e-01 |
Pos logit contributions | |
endant | +0.025 |
arrest | +0.025 |
jewels | +0.025 |
av | +0.024 |
aches | +0.024 |
Neg logit contributions | |
Which | -0.017 |
Good | -0.016 |
Where | -0.016 |
Why | -0.015 |
Time | -0.015 |
Token | a |
Token ID | 257 |
Feature activation | +8.48e-02 |
Pos logit contributions | |
endant | +0.007 |
av | +0.006 |
arrest | +0.006 |
jewels | +0.006 |
pe | +0.006 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.006 |
Time | -0.006 |
Time | -0.006 |
Why | -0.006 |
Token | voice |
Token ID | 3809 |
Feature activation | -5.65e-01 |
Pos logit contributions | |
endant | +0.002 |
arrest | +0.002 |
av | +0.002 |
jewels | +0.002 |
brace | +0.002 |
Neg logit contributions | |
Which | -0.002 |
Time | -0.002 |
Good | -0.002 |
Where | -0.002 |
Why | -0.002 |
Token | spoke |
Token ID | 5158 |
Feature activation | -1.94e-01 |
Pos logit contributions | |
Which | +0.016 |
Good | +0.015 |
ash | +0.015 |
Time | +0.015 |
idget | +0.014 |
Neg logit contributions | |
endant | -0.016 |
jewels | -0.016 |
av | -0.016 |
arrest | -0.016 |
brace | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | -9.13e-01 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.004 |
Time | +0.004 |
ash | +0.004 |
Where | +0.004 |
Neg logit contributions | |
endant | -0.007 |
av | -0.006 |
jewels | -0.006 |
arrest | -0.006 |
brace | -0.006 |
Token | her |
Token ID | 607 |
Feature activation | -8.96e-01 |
Pos logit contributions | |
Which | +0.023 |
Why | +0.023 |
Where | +0.023 |
What | +0.022 |
Good | +0.022 |
Neg logit contributions | |
endant | -0.032 |
jewels | -0.028 |
av | -0.028 |
arrest | -0.028 |
agged | -0.027 |
Token | , |
Token ID | 11 |
Feature activation | +4.85e-01 |
Pos logit contributions | |
Which | +0.023 |
Good | +0.022 |
Time | +0.022 |
ash | +0.021 |
Where | +0.021 |
Neg logit contributions | |
endant | -0.028 |
jewels | -0.027 |
av | -0.027 |
arrest | -0.027 |
brace | -0.026 |
Token | telling |
Token ID | 5149 |
Feature activation | +5.93e-01 |
Pos logit contributions | |
endant | +0.018 |
arrest | +0.018 |
av | +0.018 |
jewels | +0.018 |
brace | +0.017 |
Neg logit contributions | |
Which | -0.009 |
Good | -0.009 |
Time | -0.008 |
Why | -0.008 |
Where | -0.008 |
Token | her |
Token ID | 607 |
Feature activation | +7.19e-01 |
Pos logit contributions | |
endant | +0.020 |
arrest | +0.018 |
av | +0.017 |
jewels | +0.017 |
pe | +0.017 |
Neg logit contributions | |
Which | -0.015 |
Good | -0.014 |
Why | -0.014 |
Time | -0.014 |
Where | -0.014 |
Token | to |
Token ID | 284 |
Feature activation | -1.84e-01 |
Pos logit contributions | |
endant | +0.024 |
arrest | +0.023 |
av | +0.023 |
jewels | +0.022 |
brace | +0.022 |
Neg logit contributions | |
Which | -0.017 |
Good | -0.016 |
Time | -0.016 |
Where | -0.016 |
Why | -0.015 |
Token | look |
Token ID | 804 |
Feature activation | -1.12e+00 |
Pos logit contributions | |
Why | +0.003 |
Time | +0.003 |
Time | +0.003 |
over | +0.003 |
why | +0.003 |
Neg logit contributions | |
endant | -0.007 |
av | -0.007 |
jewels | -0.007 |
agged | -0.007 |
ls | -0.006 |
Token | up |
Token ID | 510 |
Feature activation | +5.04e-01 |
Pos logit contributions | |
Which | +0.029 |
Time | +0.029 |
Good | +0.028 |
Ready | +0.027 |
Where | +0.027 |
Neg logit contributions | |
jewels | -0.034 |
endant | -0.033 |
av | -0.033 |
brace | -0.032 |
coins | -0.031 |
Token | opened |
Token ID | 4721 |
Feature activation | -3.46e-01 |
Pos logit contributions | |
endant | +0.008 |
jewels | +0.007 |
av | +0.007 |
arrest | +0.007 |
brace | +0.007 |
Neg logit contributions | |
Which | -0.007 |
Good | -0.007 |
Time | -0.007 |
ash | -0.007 |
Why | -0.007 |
Token | her |
Token ID | 607 |
Feature activation | +3.94e-01 |
Pos logit contributions | |
Which | +0.009 |
Good | +0.008 |
Why | +0.008 |
over | +0.008 |
Where | +0.008 |
Neg logit contributions | |
endant | -0.011 |
av | -0.011 |
arrest | -0.010 |
hy | -0.010 |
jewels | -0.010 |
Token | eyes |
Token ID | 2951 |
Feature activation | -3.59e-01 |
Pos logit contributions | |
av | +0.009 |
arrest | +0.009 |
pe | +0.009 |
endant | +0.008 |
aches | +0.008 |
Neg logit contributions | |
Which | -0.013 |
Good | -0.013 |
Time | -0.012 |
Clean | -0.012 |
ash | -0.012 |
Token | and |
Token ID | 290 |
Feature activation | -6.48e-02 |
Pos logit contributions | |
Which | +0.011 |
Good | +0.011 |
Time | +0.011 |
ash | +0.011 |
Where | +0.010 |
Neg logit contributions | |
endant | -0.009 |
jewels | -0.009 |
av | -0.009 |
arrest | -0.009 |
brace | -0.008 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.82e+00 |
Pos logit contributions | |
Which | +0.002 |
Good | +0.002 |
Time | +0.002 |
Where | +0.001 |
Why | +0.001 |
Neg logit contributions | |
endant | -0.002 |
av | -0.002 |
arrest | -0.002 |
jewels | -0.002 |
brace | -0.002 |
Token | a |
Token ID | 257 |
Feature activation | +1.88e-01 |
Pos logit contributions | |
Which | +0.054 |
Time | +0.052 |
ash | +0.052 |
Good | +0.052 |
Where | +0.050 |
Neg logit contributions | |
endant | -0.049 |
jewels | -0.048 |
av | -0.048 |
arrest | -0.047 |
brace | -0.046 |
Token | friendly |
Token ID | 8030 |
Feature activation | +2.31e-01 |
Pos logit contributions | |
endant | +0.005 |
av | +0.004 |
jewels | +0.004 |
arrest | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.006 |
Time | -0.006 |
ash | -0.006 |
Why | -0.006 |
Token | ghost |
Token ID | 10905 |
Feature activation | -8.26e-01 |
Pos logit contributions | |
endant | +0.008 |
arrest | +0.007 |
aches | +0.007 |
jewels | +0.007 |
av | +0.007 |
Neg logit contributions | |
Good | -0.005 |
Which | -0.005 |
Time | -0.005 |
Time | -0.005 |
Why | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | +1.42e+00 |
Pos logit contributions | |
Which | +0.024 |
Time | +0.022 |
ash | +0.021 |
Which | +0.021 |
Good | +0.021 |
Neg logit contributions | |
endant | -0.025 |
arrest | -0.024 |
jewels | -0.024 |
brace | -0.023 |
hy | -0.023 |
Token | The |
Token ID | 383 |
Feature activation | +1.58e-01 |
Pos logit contributions | |
endant | +0.049 |
jewels | +0.046 |
aches | +0.045 |
av | +0.045 |
arrest | +0.045 |
Neg logit contributions | |
Good | -0.034 |
Time | -0.033 |
Which | -0.033 |
Why | -0.033 |
Why | -0.032 |
Token | ghost |
Token ID | 10905 |
Feature activation | +5.80e-01 |
Pos logit contributions | |
endant | +0.005 |
jewels | +0.005 |
arrest | +0.005 |
av | +0.005 |
brace | +0.005 |
Neg logit contributions | |
Which | -0.004 |
ash | -0.004 |
Good | -0.004 |
Time | -0.004 |
idget | -0.004 |
Token | very |
Token ID | 845 |
Feature activation | +6.51e-01 |
Pos logit contributions | |
Which | +0.022 |
Good | +0.021 |
Time | +0.021 |
Where | +0.020 |
Why | +0.020 |
Neg logit contributions | |
endant | -0.023 |
av | -0.022 |
jewels | -0.022 |
arrest | -0.022 |
brace | -0.021 |
Token | happy |
Token ID | 3772 |
Feature activation | +5.95e-01 |
Pos logit contributions | |
av | +0.021 |
endant | +0.021 |
arrest | +0.020 |
jewels | +0.020 |
brace | +0.020 |
Neg logit contributions | |
Time | -0.016 |
Good | -0.016 |
Time | -0.015 |
Clean | -0.015 |
over | -0.015 |
Token | . |
Token ID | 13 |
Feature activation | -3.58e-01 |
Pos logit contributions | |
endant | +0.020 |
jewels | +0.019 |
av | +0.019 |
arrest | +0.019 |
brace | +0.018 |
Neg logit contributions | |
Which | -0.014 |
Good | -0.013 |
Time | -0.013 |
ash | -0.013 |
idget | -0.013 |
Token | From |
Token ID | 3574 |
Feature activation | -5.68e-01 |
Pos logit contributions | |
Which | +0.009 |
Good | +0.009 |
Time | +0.009 |
ash | +0.009 |
Where | +0.008 |
Neg logit contributions | |
endant | -0.011 |
av | -0.011 |
jewels | -0.011 |
arrest | -0.011 |
brace | -0.010 |
Token | that |
Token ID | 326 |
Feature activation | -1.57e+00 |
Pos logit contributions | |
Which | +0.011 |
Why | +0.011 |
Good | +0.011 |
Time | +0.010 |
Where | +0.010 |
Neg logit contributions | |
endant | -0.021 |
av | -0.021 |
arrest | -0.021 |
jewels | -0.020 |
brace | -0.020 |
Token | day |
Token ID | 1110 |
Feature activation | -4.34e-02 |
Pos logit contributions | |
Which | +0.021 |
Good | +0.018 |
Time | +0.018 |
Where | +0.017 |
ash | +0.017 |
Neg logit contributions | |
endant | -0.069 |
av | -0.068 |
jewels | -0.067 |
arrest | -0.067 |
brace | -0.066 |
Token | on |
Token ID | 319 |
Feature activation | +8.37e-01 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.001 |
Where | +0.001 |
Why | +0.001 |
Neg logit contributions | |
endant | -0.001 |
av | -0.001 |
jewels | -0.001 |
arrest | -0.001 |
brace | -0.001 |
Token | the |
Token ID | 262 |
Feature activation | +1.45e-01 |
Pos logit contributions | |
endant | +0.035 |
agged | +0.031 |
jewels | +0.030 |
arrest | +0.030 |
av | +0.030 |
Neg logit contributions | |
when | -0.016 |
Time | -0.015 |
Good | -0.014 |
over | -0.014 |
Why | -0.014 |
Token | lady |
Token ID | 10846 |
Feature activation | -1.53e-01 |
Pos logit contributions | |
endant | +0.005 |
av | +0.004 |
arrest | +0.004 |
jewels | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.004 |
Good | -0.004 |
Time | -0.004 |
Why | -0.003 |
Where | -0.003 |
Token | was |
Token ID | 373 |
Feature activation | -1.19e+00 |
Pos logit contributions | |
Good | +0.003 |
Which | +0.003 |
Why | +0.003 |
over | +0.003 |
ash | +0.003 |
Neg logit contributions | |
endant | -0.006 |
av | -0.006 |
jewels | -0.006 |
arrest | -0.006 |
brace | -0.005 |
Token | known |
Token ID | 1900 |
Feature activation | -2.11e-01 |
Pos logit contributions | |
Which | +0.035 |
Good | +0.033 |
Time | +0.033 |
Why | +0.032 |
Where | +0.032 |
Neg logit contributions | |
endant | -0.033 |
av | -0.032 |
jewels | -0.032 |
arrest | -0.032 |
brace | -0.030 |
Token | up |
Token ID | 510 |
Feature activation | +1.50e+00 |
Pos logit contributions | |
endant | +0.003 |
arrest | +0.003 |
av | +0.003 |
jewels | +0.003 |
brace | +0.003 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Time | -0.002 |
Why | -0.002 |
Where | -0.002 |
Token | and |
Token ID | 290 |
Feature activation | -1.81e-01 |
Pos logit contributions | |
endant | +0.065 |
arrest | +0.060 |
ocket | +0.058 |
brace | +0.058 |
agged | +0.058 |
Neg logit contributions | |
over | -0.030 |
when | -0.026 |
across | -0.021 |
Why | -0.020 |
out | -0.020 |
Token | went |
Token ID | 1816 |
Feature activation | -5.84e-01 |
Pos logit contributions | |
Which | +0.005 |
Time | +0.005 |
Good | +0.005 |
ash | +0.005 |
Where | +0.005 |
Neg logit contributions | |
endant | -0.005 |
jewels | -0.005 |
av | -0.005 |
arrest | -0.005 |
brace | -0.005 |
Token | outside |
Token ID | 2354 |
Feature activation | -7.96e-01 |
Pos logit contributions | |
Which | +0.013 |
Good | +0.013 |
Time | +0.012 |
Why | +0.012 |
Where | +0.012 |
Neg logit contributions | |
endant | -0.020 |
jewels | -0.019 |
arrest | -0.019 |
av | -0.019 |
brace | -0.018 |
Token | to |
Token ID | 284 |
Feature activation | -9.28e-01 |
Pos logit contributions | |
Which | +0.019 |
Good | +0.019 |
Time | +0.018 |
Why | +0.018 |
ash | +0.018 |
Neg logit contributions | |
endant | -0.026 |
av | -0.025 |
jewels | -0.025 |
arrest | -0.024 |
brace | -0.024 |
Token | the |
Token ID | 262 |
Feature activation | -2.02e-01 |
Pos logit contributions | |
Which | +0.024 |
Time | +0.023 |
Good | +0.022 |
ash | +0.022 |
Where | +0.022 |
Neg logit contributions | |
arrest | -0.028 |
endant | -0.028 |
av | -0.028 |
jewels | -0.028 |
brace | -0.026 |
Token | park |
Token ID | 3952 |
Feature activation | -1.20e-01 |
Pos logit contributions | |
Which | +0.006 |
ash | +0.005 |
idget | +0.005 |
Good | +0.005 |
Time | +0.005 |
Neg logit contributions | |
endant | -0.006 |
jewels | -0.006 |
av | -0.006 |
arrest | -0.006 |
brace | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -3.72e-01 |
Pos logit contributions | |
Which | +0.003 |
Good | +0.002 |
Time | +0.002 |
Why | +0.002 |
ash | +0.002 |
Neg logit contributions | |
endant | -0.004 |
av | -0.004 |
arrest | -0.004 |
jewels | -0.004 |
brace | -0.004 |
Token | Lucy |
Token ID | 22162 |
Feature activation | -7.00e-01 |
Pos logit contributions | |
Which | +0.010 |
Time | +0.009 |
ash | +0.009 |
Why | +0.009 |
Good | +0.009 |
Neg logit contributions | |
endant | -0.011 |
arrest | -0.011 |
av | -0.011 |
jewels | -0.011 |
hy | -0.010 |
Token | saw |
Token ID | 2497 |
Feature activation | -1.50e+00 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.014 |
Time | +0.014 |
Why | +0.014 |
ash | +0.014 |
Neg logit contributions | |
endant | -0.025 |
av | -0.024 |
jewels | -0.024 |
arrest | -0.023 |
brace | -0.023 |
Token | the |
Token ID | 262 |
Feature activation | -9.38e-02 |
Pos logit contributions | |
Which | +0.040 |
Good | +0.038 |
Time | +0.037 |
Why | +0.037 |
Where | +0.037 |
Neg logit contributions | |
endant | -0.046 |
arrest | -0.044 |
av | -0.044 |
jewels | -0.043 |
brace | -0.042 |
Token | it |
Token ID | 340 |
Feature activation | -1.07e+00 |
Pos logit contributions | |
Which | +0.016 |
Good | +0.015 |
Time | +0.015 |
Why | +0.015 |
Where | +0.015 |
Neg logit contributions | |
endant | -0.018 |
av | -0.018 |
jewels | -0.018 |
arrest | -0.017 |
brace | -0.017 |
Token | 's |
Token ID | 338 |
Feature activation | -5.21e-01 |
Pos logit contributions | |
Which | +0.023 |
Where | +0.020 |
Time | +0.018 |
What | +0.018 |
Why | +0.018 |
Neg logit contributions | |
endant | -0.039 |
arrest | -0.039 |
av | -0.038 |
jewels | -0.037 |
brace | -0.037 |
Token | time |
Token ID | 640 |
Feature activation | -2.74e-01 |
Pos logit contributions | |
Which | +0.014 |
Where | +0.013 |
Good | +0.013 |
idget | +0.012 |
Ready | +0.012 |
Neg logit contributions | |
av | -0.016 |
endant | -0.016 |
jewels | -0.015 |
arrest | -0.015 |
aches | -0.015 |
Token | to |
Token ID | 284 |
Feature activation | -2.27e-01 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.006 |
Time | +0.006 |
Where | +0.006 |
Why | +0.006 |
Neg logit contributions | |
endant | -0.009 |
jewels | -0.009 |
av | -0.009 |
arrest | -0.009 |
brace | -0.008 |
Token | stop |
Token ID | 2245 |
Feature activation | -4.58e-01 |
Pos logit contributions | |
Which | +0.005 |
Good | +0.005 |
Time | +0.005 |
Where | +0.005 |
ash | +0.005 |
Neg logit contributions | |
endant | -0.008 |
arrest | -0.007 |
av | -0.007 |
jewels | -0.007 |
brace | -0.007 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.55e-01 |
Pos logit contributions | |
Which | +0.013 |
Time | +0.012 |
Good | +0.012 |
Where | +0.012 |
ash | +0.012 |
Neg logit contributions | |
endant | -0.013 |
arrest | -0.013 |
av | -0.013 |
jewels | -0.013 |
brace | -0.012 |
Token | now |
Token ID | 783 |
Feature activation | -3.99e-01 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.004 |
Time | +0.004 |
Where | +0.004 |
ash | +0.004 |
Neg logit contributions | |
endant | -0.005 |
av | -0.005 |
jewels | -0.005 |
arrest | -0.005 |
brace | -0.004 |
Token | ." |
Token ID | 526 |
Feature activation | -1.73e+00 |
Pos logit contributions | |
Which | +0.008 |
Good | +0.008 |
Time | +0.008 |
Why | +0.008 |
ash | +0.008 |
Neg logit contributions | |
endant | -0.014 |
jewels | -0.014 |
av | -0.014 |
arrest | -0.013 |
brace | -0.013 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
Which | +0.054 |
ash | +0.054 |
rated | +0.049 |
idget | +0.049 |
Time | +0.049 |
Neg logit contributions | |
endant | -0.039 |
hy | -0.039 |
brace | -0.039 |
arrest | -0.039 |
jewels | -0.037 |
Token |
|
Token ID | 198 |
Feature activation | -9.75e-01 |
Pos logit contributions | |
ash | +0.054 |
Which | +0.053 |
ksh | +0.051 |
idget | +0.050 |
rated | +0.050 |
Neg logit contributions | |
arrest | -0.038 |
endant | -0.038 |
pe | -0.037 |
brace | -0.037 |
hy | -0.036 |
Token | Ch |
Token ID | 1925 |
Feature activation | -3.40e-01 |
Pos logit contributions | |
ash | +0.024 |
idget | +0.022 |
inter | +0.022 |
ksh | +0.022 |
Which | +0.021 |
Neg logit contributions | |
brace | -0.029 |
arrest | -0.028 |
pe | -0.028 |
endant | -0.027 |
vern | -0.027 |
Token | were |
Token ID | 547 |
Feature activation | +5.62e-01 |
Pos logit contributions | |
endant | +0.006 |
arrest | +0.006 |
av | +0.005 |
jewels | +0.005 |
agged | +0.005 |
Neg logit contributions | |
Which | -0.005 |
Why | -0.004 |
Time | -0.004 |
Where | -0.004 |
Good | -0.004 |
Token | very |
Token ID | 845 |
Feature activation | +1.57e+00 |
Pos logit contributions | |
arrest | +0.019 |
endant | +0.018 |
agged | +0.017 |
� | +0.017 |
av | +0.016 |
Neg logit contributions | |
over | -0.014 |
Which | -0.014 |
Why | -0.013 |
Where | -0.013 |
Time | -0.013 |
Token | pretty |
Token ID | 2495 |
Feature activation | +1.13e-01 |
Pos logit contributions | |
arrest | +0.053 |
endant | +0.046 |
agged | +0.045 |
� | +0.045 |
av | +0.044 |
Neg logit contributions | |
Time | -0.038 |
Which | -0.037 |
over | -0.036 |
Where | -0.036 |
Why | -0.036 |
Token | and |
Token ID | 290 |
Feature activation | +1.10e+00 |
Pos logit contributions | |
endant | +0.004 |
arrest | +0.004 |
av | +0.004 |
jewels | +0.004 |
brace | +0.004 |
Neg logit contributions | |
Which | -0.002 |
Good | -0.002 |
Why | -0.002 |
Time | -0.002 |
Where | -0.002 |
Token | colorful |
Token ID | 20239 |
Feature activation | +3.13e-01 |
Pos logit contributions | |
arrest | +0.036 |
endant | +0.034 |
agged | +0.033 |
av | +0.031 |
ir | +0.031 |
Neg logit contributions | |
Which | -0.029 |
Why | -0.027 |
Where | -0.027 |
Time | -0.027 |
What | -0.026 |
Token | . |
Token ID | 13 |
Feature activation | +1.63e-01 |
Pos logit contributions | |
endant | +0.012 |
arrest | +0.011 |
av | +0.011 |
jewels | +0.011 |
brace | +0.011 |
Neg logit contributions | |
Which | -0.006 |
Good | -0.005 |
Why | -0.005 |
Where | -0.005 |
Time | -0.005 |
Token |
|
Token ID | 198 |
Feature activation | -9.00e-03 |
Pos logit contributions | |
endant | +0.005 |
av | +0.005 |
jewels | +0.005 |
arrest | +0.005 |
brace | +0.005 |
Neg logit contributions | |
Which | -0.004 |
ash | -0.004 |
Time | -0.004 |
Good | -0.004 |
idget | -0.004 |
Token |
|
Token ID | 198 |
Feature activation | +9.40e-02 |
Pos logit contributions | |
Which | +0.000 |
Good | +0.000 |
Time | +0.000 |
ash | +0.000 |
Why | +0.000 |
Neg logit contributions | |
endant | -0.000 |
av | -0.000 |
arrest | -0.000 |
jewels | -0.000 |
brace | -0.000 |
Token | " |
Token ID | 1 |
Feature activation | -5.30e-01 |
Pos logit contributions | |
arrest | +0.003 |
endant | +0.003 |
pe | +0.003 |
jewels | +0.003 |
av | +0.003 |
Neg logit contributions | |
Which | -0.002 |
ash | -0.002 |
idget | -0.002 |
Good | -0.002 |
ksh | -0.002 |
Token | Look |
Token ID | 8567 |
Feature activation | -1.93e-01 |
Pos logit contributions | |
ash | +0.012 |
idget | +0.011 |
Good | +0.010 |
rated | +0.010 |
Clean | +0.010 |
Neg logit contributions | |
brace | -0.019 |
jewels | -0.018 |
pe | -0.018 |
av | -0.018 |
endant | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | -6.44e-02 |
Pos logit contributions | |
Which | +0.007 |
Time | +0.007 |
Good | +0.007 |
Where | +0.007 |
Why | +0.006 |
Neg logit contributions | |
endant | -0.004 |
jewels | -0.004 |
av | -0.004 |
brace | -0.004 |
arrest | -0.004 |
Token | the |
Token ID | 262 |
Feature activation | -7.59e-01 |
Pos logit contributions | |
Which | +0.030 |
Good | +0.029 |
Time | +0.029 |
ash | +0.028 |
Where | +0.028 |
Neg logit contributions | |
endant | -0.028 |
av | -0.026 |
jewels | -0.026 |
arrest | -0.026 |
brace | -0.025 |
Token | park |
Token ID | 3952 |
Feature activation | +4.80e-01 |
Pos logit contributions | |
ash | +0.026 |
rated | +0.025 |
idget | +0.024 |
ksh | +0.024 |
Clean | +0.023 |
Neg logit contributions | |
av | -0.018 |
endant | -0.017 |
jewels | -0.016 |
arrest | -0.016 |
brace | -0.016 |
Token | with |
Token ID | 351 |
Feature activation | -5.36e-02 |
Pos logit contributions | |
endant | +0.015 |
av | +0.014 |
jewels | +0.014 |
arrest | +0.014 |
brace | +0.013 |
Neg logit contributions | |
Which | -0.013 |
Good | -0.012 |
Time | -0.012 |
Why | -0.012 |
Where | -0.012 |
Token | her |
Token ID | 607 |
Feature activation | -1.71e-01 |
Pos logit contributions | |
Which | +0.002 |
Good | +0.002 |
Time | +0.002 |
Where | +0.001 |
Why | +0.001 |
Neg logit contributions | |
endant | -0.002 |
arrest | -0.001 |
av | -0.001 |
jewels | -0.001 |
brace | -0.001 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.62e+00 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.004 |
Time | +0.004 |
Where | +0.004 |
Why | +0.004 |
Neg logit contributions | |
endant | -0.005 |
arrest | -0.005 |
av | -0.005 |
jewels | -0.005 |
brace | -0.005 |
Token | my |
Token ID | 1820 |
Feature activation | -1.84e+00 |
Pos logit contributions | |
Ready | +0.049 |
Time | +0.049 |
Good | +0.049 |
Which | +0.048 |
idget | +0.045 |
Neg logit contributions | |
av | -0.044 |
jewels | -0.039 |
brace | -0.038 |
endant | -0.037 |
coins | -0.036 |
Token | and |
Token ID | 290 |
Feature activation | -1.16e+00 |
Pos logit contributions | |
Which | +0.060 |
Time | +0.058 |
Good | +0.058 |
Ready | +0.056 |
Where | +0.054 |
Neg logit contributions | |
av | -0.048 |
jewels | -0.044 |
brace | -0.043 |
arrest | -0.043 |
endant | -0.042 |
Token | daddy |
Token ID | 35822 |
Feature activation | -1.86e+00 |
Pos logit contributions | |
Which | +0.034 |
ash | +0.032 |
Good | +0.032 |
Time | +0.032 |
idget | +0.031 |
Neg logit contributions | |
endant | -0.032 |
jewels | -0.032 |
av | -0.032 |
arrest | -0.031 |
brace | -0.030 |
Token | . |
Token ID | 13 |
Feature activation | -1.06e+00 |
Pos logit contributions | |
Which | +0.062 |
Time | +0.061 |
Good | +0.060 |
Ready | +0.057 |
Where | +0.055 |
Neg logit contributions | |
av | -0.047 |
pe | -0.044 |
jewels | -0.044 |
brace | -0.043 |
arrest | -0.042 |
Token | They |
Token ID | 1119 |
Feature activation | +4.25e-01 |
Pos logit contributions | |
ash | +0.039 |
rated | +0.036 |
Which | +0.036 |
stations | +0.035 |
idget | +0.035 |
Neg logit contributions | |
� | -0.021 |
endant | -0.019 |
av | -0.018 |
jewels | -0.017 |
brace | -0.017 |
Token | played |
Token ID | 2826 |
Feature activation | +5.69e-01 |
Pos logit contributions | |
endant | +0.013 |
arrest | +0.013 |
av | +0.013 |
jewels | +0.013 |
brace | +0.012 |
Neg logit contributions | |
Which | -0.011 |
Good | -0.010 |
Time | -0.010 |
Why | -0.010 |
Where | -0.010 |
Token | was |
Token ID | 373 |
Feature activation | -1.75e+00 |
Pos logit contributions | |
Which | +0.006 |
Good | +0.005 |
Time | +0.005 |
Why | +0.005 |
Where | +0.005 |
Neg logit contributions | |
endant | -0.008 |
arrest | -0.007 |
av | -0.007 |
jewels | -0.007 |
brace | -0.007 |
Token | working |
Token ID | 1762 |
Feature activation | -5.65e-01 |
Pos logit contributions | |
Which | +0.046 |
Good | +0.043 |
Time | +0.042 |
ash | +0.041 |
Where | +0.041 |
Neg logit contributions | |
endant | -0.055 |
jewels | -0.053 |
av | -0.053 |
arrest | -0.052 |
brace | -0.050 |
Token | , |
Token ID | 11 |
Feature activation | -5.91e-01 |
Pos logit contributions | |
Which | +0.011 |
Good | +0.010 |
Why | +0.010 |
Time | +0.010 |
ash | +0.010 |
Neg logit contributions | |
endant | -0.022 |
arrest | -0.021 |
av | -0.020 |
jewels | -0.020 |
brace | -0.020 |
Token | his |
Token ID | 465 |
Feature activation | -1.46e+00 |
Pos logit contributions | |
Which | +0.014 |
Good | +0.014 |
Why | +0.014 |
Time | +0.013 |
Where | +0.013 |
Neg logit contributions | |
endant | -0.020 |
av | -0.019 |
jewels | -0.018 |
arrest | -0.018 |
agged | -0.018 |
Token | little |
Token ID | 1310 |
Feature activation | -2.30e+00 |
Pos logit contributions | |
Which | +0.039 |
Good | +0.037 |
Time | +0.036 |
Where | +0.035 |
ash | +0.035 |
Neg logit contributions | |
endant | -0.045 |
av | -0.043 |
jewels | -0.043 |
arrest | -0.043 |
brace | -0.041 |
Token | face |
Token ID | 1986 |
Feature activation | -1.91e+00 |
Pos logit contributions | |
Which | +0.069 |
Time | +0.065 |
Good | +0.065 |
Where | +0.064 |
Why | +0.064 |
Neg logit contributions | |
endant | -0.063 |
jewels | -0.062 |
av | -0.061 |
arrest | -0.059 |
brace | -0.058 |
Token | gl |
Token ID | 1278 |
Feature activation | -3.39e-01 |
Pos logit contributions | |
Which | +0.051 |
Time | +0.048 |
Good | +0.048 |
Why | +0.047 |
Where | +0.047 |
Neg logit contributions | |
endant | -0.057 |
av | -0.056 |
jewels | -0.055 |
arrest | -0.055 |
brace | -0.053 |
Token | owed |
Token ID | 6972 |
Feature activation | -2.14e-01 |
Pos logit contributions | |
Which | +0.010 |
Good | +0.010 |
Time | +0.010 |
ash | +0.009 |
Where | +0.009 |
Neg logit contributions | |
endant | -0.009 |
av | -0.009 |
jewels | -0.009 |
arrest | -0.009 |
brace | -0.009 |
Token | with |
Token ID | 351 |
Feature activation | -2.75e-01 |
Pos logit contributions | |
Which | +0.006 |
Good | +0.005 |
Time | +0.005 |
ash | +0.005 |
Where | +0.005 |
Neg logit contributions | |
endant | -0.007 |
av | -0.006 |
jewels | -0.006 |
arrest | -0.006 |
brace | -0.006 |
Token | joy |
Token ID | 8716 |
Feature activation | -8.81e-01 |
Pos logit contributions | |
Which | +0.007 |
Good | +0.007 |
Time | +0.007 |
Where | +0.007 |
Why | +0.007 |
Neg logit contributions | |
endant | -0.009 |
av | -0.008 |
arrest | -0.008 |
aches | -0.008 |
pe | -0.008 |
Token | . |
Token ID | 13 |
Feature activation | -1.70e-01 |
Pos logit contributions | |
Which | +0.022 |
Good | +0.020 |
Time | +0.020 |
Where | +0.019 |
ash | +0.019 |
Neg logit contributions | |
endant | -0.029 |
jewels | -0.029 |
av | -0.029 |
arrest | -0.028 |
brace | -0.028 |
Token | having |
Token ID | 1719 |
Feature activation | +4.18e-02 |
Pos logit contributions | |
Why | +0.005 |
Which | +0.005 |
Good | +0.005 |
over | +0.005 |
Time | +0.005 |
Neg logit contributions | |
endant | -0.008 |
av | -0.007 |
arrest | -0.007 |
jewels | -0.007 |
aches | -0.007 |
Token | lots |
Token ID | 6041 |
Feature activation | +3.81e-01 |
Pos logit contributions | |
endant | +0.001 |
jewels | +0.001 |
av | +0.001 |
arrest | +0.001 |
brace | +0.001 |
Neg logit contributions | |
Which | -0.001 |
Time | -0.001 |
Good | -0.001 |
Where | -0.001 |
Why | -0.001 |
Token | of |
Token ID | 286 |
Feature activation | -1.72e-01 |
Pos logit contributions | |
endant | +0.012 |
av | +0.012 |
jewels | +0.012 |
arrest | +0.012 |
brace | +0.011 |
Neg logit contributions | |
Which | -0.009 |
Time | -0.009 |
Good | -0.009 |
ash | -0.009 |
Why | -0.009 |
Token | fun |
Token ID | 1257 |
Feature activation | -4.00e-01 |
Pos logit contributions | |
Which | +0.004 |
Good | +0.004 |
Time | +0.004 |
ash | +0.004 |
Why | +0.004 |
Neg logit contributions | |
endant | -0.006 |
jewels | -0.005 |
av | -0.005 |
arrest | -0.005 |
brace | -0.005 |
Token | . |
Token ID | 13 |
Feature activation | -9.04e-01 |
Pos logit contributions | |
Which | +0.012 |
Good | +0.012 |
idget | +0.012 |
Time | +0.011 |
Ready | +0.011 |
Neg logit contributions | |
arrest | -0.011 |
av | -0.011 |
jewels | -0.011 |
pe | -0.010 |
brace | -0.010 |
Token | |
Token ID | 220 |
Feature activation | -1.74e+00 |
Pos logit contributions | |
Time | +0.029 |
idget | +0.029 |
ash | +0.029 |
Which | +0.029 |
rated | +0.028 |
Neg logit contributions | |
endant | -0.019 |
� | -0.018 |
av | -0.018 |
jewels | -0.018 |
pe | -0.018 |
Token |
|
Token ID | 198 |
Feature activation | -2.62e-01 |
Pos logit contributions | |
Which | +0.049 |
Time | +0.046 |
Good | +0.045 |
ash | +0.044 |
Why | +0.044 |
Neg logit contributions | |
endant | -0.048 |
av | -0.046 |
jewels | -0.045 |
arrest | -0.044 |
pe | -0.044 |
Token | Suddenly |
Token ID | 38582 |
Feature activation | -1.89e-02 |
Pos logit contributions | |
Which | +0.007 |
ash | +0.007 |
Good | +0.007 |
idget | +0.007 |
Time | +0.007 |
Neg logit contributions | |
endant | -0.007 |
av | -0.007 |
arrest | -0.007 |
pe | -0.007 |
jewels | -0.007 |
Token | , |
Token ID | 11 |
Feature activation | -3.70e-01 |
Pos logit contributions | |
Which | +0.001 |
Good | +0.001 |
Time | +0.000 |
Time | +0.000 |
Why | +0.000 |
Neg logit contributions | |
endant | -0.001 |
arrest | -0.001 |
av | -0.001 |
brace | -0.001 |
jewels | -0.001 |
Token | one |
Token ID | 530 |
Feature activation | -1.44e+00 |
Pos logit contributions | |
Which | +0.011 |
Good | +0.010 |
Time | +0.010 |
Where | +0.010 |
Why | +0.010 |
Neg logit contributions | |
endant | -0.011 |
av | -0.010 |
arrest | -0.010 |
jewels | -0.010 |
brace | -0.010 |
Token | of |
Token ID | 286 |
Feature activation | +4.77e-01 |
Pos logit contributions | |
Which | +0.050 |
Good | +0.050 |
idget | +0.049 |
ksh | +0.048 |
Ready | +0.047 |
Neg logit contributions | |
jewels | -0.029 |
av | -0.028 |
hy | -0.028 |
endant | -0.028 |
coins | -0.027 |
Token | the |
Token ID | 262 |
Feature activation | +5.57e-01 |
Pos logit contributions | |
endant | +0.029 |
jewels | +0.025 |
av | +0.025 |
arrest | +0.025 |
pe | +0.025 |
Neg logit contributions | |
Which | -0.021 |
Why | -0.020 |
Where | -0.020 |
Time | -0.019 |
What | -0.019 |
Token | kitchen |
Token ID | 9592 |
Feature activation | -1.35e+00 |
Pos logit contributions | |
av | +0.017 |
endant | +0.017 |
jewels | +0.017 |
arrest | +0.017 |
brace | +0.016 |
Neg logit contributions | |
Which | -0.014 |
ash | -0.013 |
idget | -0.013 |
Time | -0.013 |
Good | -0.013 |
Token | . |
Token ID | 13 |
Feature activation | -9.78e-01 |
Pos logit contributions | |
Which | +0.033 |
Good | +0.032 |
Time | +0.031 |
idget | +0.030 |
ash | +0.030 |
Neg logit contributions | |
av | -0.044 |
endant | -0.044 |
jewels | -0.043 |
arrest | -0.042 |
brace | -0.042 |
Token | One |
Token ID | 1881 |
Feature activation | -9.58e-01 |
Pos logit contributions | |
ting | +0.030 |
tap | +0.029 |
ash | +0.029 |
Time | +0.029 |
Good | +0.029 |
Neg logit contributions | |
av | -0.022 |
endant | -0.022 |
jewels | -0.021 |
brace | -0.020 |
� | -0.020 |
Token | day |
Token ID | 1110 |
Feature activation | -1.09e-01 |
Pos logit contributions | |
Which | +0.020 |
idget | +0.019 |
Ready | +0.019 |
Where | +0.018 |
Good | +0.018 |
Neg logit contributions | |
av | -0.033 |
endant | -0.032 |
jewels | -0.032 |
kins | -0.032 |
aches | -0.032 |
Token | , |
Token ID | 11 |
Feature activation | -1.72e+00 |
Pos logit contributions | |
idget | +0.004 |
Which | +0.004 |
ash | +0.004 |
Good | +0.004 |
Time | +0.004 |
Neg logit contributions | |
jewels | -0.002 |
av | -0.002 |
endant | -0.002 |
coins | -0.002 |
arrest | -0.002 |
Token | mom |
Token ID | 1995 |
Feature activation | -5.16e-01 |
Pos logit contributions | |
ash | +0.062 |
Good | +0.060 |
idget | +0.060 |
Time | +0.059 |
Which | +0.058 |
Neg logit contributions | |
jewels | -0.035 |
av | -0.034 |
endant | -0.033 |
coins | -0.032 |
brace | -0.031 |
Token | asked |
Token ID | 1965 |
Feature activation | -1.21e+00 |
Pos logit contributions | |
Which | +0.015 |
Good | +0.015 |
ash | +0.014 |
Time | +0.014 |
Where | +0.014 |
Neg logit contributions | |
endant | -0.014 |
av | -0.014 |
jewels | -0.013 |
arrest | -0.013 |
brace | -0.013 |
Token | them |
Token ID | 606 |
Feature activation | -3.55e-01 |
Pos logit contributions | |
Which | +0.039 |
Good | +0.038 |
idget | +0.038 |
Ready | +0.038 |
Time | +0.038 |
Neg logit contributions | |
av | -0.029 |
jewels | -0.027 |
coins | -0.026 |
arrest | -0.026 |
brace | -0.026 |
Token | to |
Token ID | 284 |
Feature activation | -9.64e-01 |
Pos logit contributions | |
Time | +0.010 |
Which | +0.010 |
Good | +0.010 |
ash | +0.010 |
idget | +0.009 |
Neg logit contributions | |
av | -0.010 |
jewels | -0.010 |
endant | -0.010 |
coins | -0.009 |
brace | -0.009 |
Token | complete |
Token ID | 1844 |
Feature activation | -4.37e-01 |
Pos logit contributions | |
Why | +0.018 |
Which | +0.017 |
Time | +0.017 |
What | +0.016 |
Where | +0.016 |
Neg logit contributions | |
endant | -0.040 |
jewels | -0.036 |
brace | -0.036 |
agged | -0.035 |
av | -0.035 |
Token | � |
Token ID | 129 |
Feature activation | -1.15e+00 |
Pos logit contributions | |
av | +0.012 |
jewels | +0.012 |
endant | +0.012 |
brace | +0.011 |
coins | +0.011 |
Neg logit contributions | |
Good | -0.009 |
Time | -0.008 |
Time | -0.008 |
Which | -0.008 |
Clean | -0.008 |
Token | � |
Token ID | 241 |
Feature activation | -2.27e+00 |
Pos logit contributions | |
Which | +0.030 |
Good | +0.028 |
Time | +0.027 |
Where | +0.027 |
ash | +0.026 |
Neg logit contributions | |
endant | -0.036 |
arrest | -0.035 |
av | -0.034 |
jewels | -0.034 |
brace | -0.034 |
Token | What |
Token ID | 2061 |
Feature activation | -1.58e+00 |
Pos logit contributions | |
idget | +0.045 |
ash | +0.045 |
Which | +0.042 |
Good | +0.040 |
ting | +0.039 |
Neg logit contributions | |
pe | -0.075 |
arrest | -0.073 |
hy | -0.072 |
endant | -0.071 |
� | -0.068 |
Token | is |
Token ID | 318 |
Feature activation | -7.74e-01 |
Pos logit contributions | |
Which | +0.043 |
Good | +0.041 |
Time | +0.040 |
Where | +0.039 |
ash | +0.039 |
Neg logit contributions | |
endant | -0.047 |
av | -0.046 |
jewels | -0.045 |
arrest | -0.045 |
brace | -0.044 |
Token | it |
Token ID | 340 |
Feature activation | -1.55e+00 |
Pos logit contributions | |
Which | +0.024 |
Time | +0.024 |
ash | +0.024 |
idget | +0.024 |
Good | +0.024 |
Neg logit contributions | |
jewels | -0.019 |
endant | -0.019 |
av | -0.019 |
arrest | -0.019 |
coins | -0.018 |
Token | , |
Token ID | 11 |
Feature activation | -2.46e+00 |
Pos logit contributions | |
Which | +0.039 |
Good | +0.037 |
Time | +0.036 |
Why | +0.035 |
ash | +0.035 |
Neg logit contributions | |
endant | -0.050 |
jewels | -0.048 |
arrest | -0.048 |
av | -0.048 |
brace | -0.046 |
Token | M |
Token ID | 337 |
Feature activation | -8.52e-01 |
Pos logit contributions | |
Which | +0.061 |
ash | +0.058 |
Time | +0.058 |
Good | +0.058 |
Where | +0.057 |
Neg logit contributions | |
endant | -0.076 |
jewels | -0.075 |
av | -0.074 |
arrest | -0.071 |
brace | -0.071 |
Token | ummy |
Token ID | 13513 |
Feature activation | -1.28e+00 |
Pos logit contributions | |
Which | +0.023 |
Where | +0.021 |
Good | +0.021 |
Time | +0.021 |
Why | +0.020 |
Neg logit contributions | |
endant | -0.027 |
av | -0.026 |
arrest | -0.025 |
jewels | -0.025 |
aches | -0.024 |
Token | ? |
Token ID | 30 |
Feature activation | -3.13e-01 |
Pos logit contributions | |
Which | +0.034 |
Time | +0.032 |
Good | +0.032 |
Where | +0.032 |
idget | +0.031 |
Neg logit contributions | |
endant | -0.039 |
av | -0.038 |
jewels | -0.038 |
arrest | -0.037 |
brace | -0.035 |
Token | â |
Token ID | 22940 |
Feature activation | -3.74e-01 |
Pos logit contributions | |
Which | +0.007 |
Time | +0.007 |
ash | +0.006 |
idget | +0.006 |
Good | +0.006 |
Neg logit contributions | |
endant | -0.011 |
av | -0.010 |
jewels | -0.010 |
arrest | -0.010 |
hy | -0.010 |
Token | € |
Token ID | 26391 |
Feature activation | +5.21e-01 |
Pos logit contributions | |
Which | +0.009 |
Where | +0.008 |
Good | +0.008 |
Time | +0.008 |
Why | +0.007 |
Neg logit contributions | |
endant | -0.013 |
av | -0.012 |
arrest | -0.012 |
pe | -0.012 |
jewels | -0.012 |