Token | chief |
Token ID | 4039 |
Feature activation | -3.38e-02 |
Token | J |
Token ID | 449 |
Feature activation | -5.82e-03 |
Token | ens |
Token ID | 641 |
Feature activation | -5.92e-02 |
Token | St |
Token ID | 520 |
Feature activation | +2.62e-02 |
Token | ol |
Token ID | 349 |
Feature activation | -1.19e-01 |
Token | ten |
Token ID | 1452 |
Feature activation | +4.16e-01 |
Token | berg |
Token ID | 3900 |
Feature activation | +1.91e-02 |
Token | and |
Token ID | 290 |
Feature activation | -9.64e-03 |
Token | promised |
Token ID | 8072 |
Feature activation | -3.77e-02 |
Token | to |
Token ID | 284 |
Feature activation | -3.36e-02 |
Token | reiterate |
Token ID | 49852 |
Feature activation | +1.31e-02 |
Token | $ |
Token ID | 720 |
Feature activation | +1.37e-01 |
Token | 5 |
Token ID | 20 |
Feature activation | +2.85e-02 |
Token | million |
Token ID | 1510 |
Feature activation | +6.61e-02 |
Token | by |
Token ID | 416 |
Feature activation | +6.06e-02 |
Token | Z |
Token ID | 1168 |
Feature activation | +1.88e-02 |
Token | ill |
Token ID | 359 |
Feature activation | +4.15e-01 |
Token | ow |
Token ID | 322 |
Feature activation | -2.26e-02 |
Token | . |
Token ID | 13 |
Feature activation | -2.35e-02 |
Token | ( |
Token ID | 357 |
Feature activation | -2.67e-02 |
Token | H |
Token ID | 39 |
Feature activation | -8.20e-03 |
Token | ahn |
Token ID | 15386 |
Feature activation | -2.72e-02 |
Token | Reserved |
Token ID | 33876 |
Feature activation | +9.54e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.38e-02 |
Token | Rep |
Token ID | 1432 |
Feature activation | +1.44e-03 |
Token | rint |
Token ID | 22272 |
Feature activation | +6.79e-02 |
Token | ed |
Token ID | 276 |
Feature activation | +1.69e-01 |
Token | with |
Token ID | 351 |
Feature activation | +4.03e-01 |
Token | permission |
Token ID | 7170 |
Feature activation | -4.74e-03 |
Token | . |
Token ID | 13 |
Feature activation | -1.97e-02 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -4.50e-03 |
Token | C |
Token ID | 34 |
Feature activation | -1.52e-03 |
Token | ort |
Token ID | 419 |
Feature activation | +1.43e-02 |
Token | ness |
Token ID | 1108 |
Feature activation | -1.60e-02 |
Token | of |
Token ID | 286 |
Feature activation | +6.63e-03 |
Token | a |
Token ID | 257 |
Feature activation | +1.79e-03 |
Token | small |
Token ID | 1402 |
Feature activation | +1.13e-02 |
Token | c |
Token ID | 269 |
Feature activation | +2.88e-02 |
Token | ot |
Token ID | 313 |
Feature activation | +3.94e-01 |
Token | erie |
Token ID | 18287 |
Feature activation | -8.82e-03 |
Token | of |
Token ID | 286 |
Feature activation | +3.31e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.32e-02 |
Token | super |
Token ID | 2208 |
Feature activation | -2.89e-02 |
Token | - |
Token ID | 12 |
Feature activation | -1.57e-02 |
Token | with |
Token ID | 351 |
Feature activation | -2.43e-02 |
Token | the |
Token ID | 262 |
Feature activation | +9.82e-03 |
Token | mineral |
Token ID | 18352 |
Feature activation | -3.63e-03 |
Token | fe |
Token ID | 730 |
Feature activation | +5.43e-02 |
Token | ld |
Token ID | 335 |
Feature activation | +2.71e-01 |
Token | s |
Token ID | 82 |
Feature activation | +3.79e-01 |
Token | par |
Token ID | 1845 |
Feature activation | +6.45e-02 |
Token | , |
Token ID | 11 |
Feature activation | -2.35e-02 |
Token | and |
Token ID | 290 |
Feature activation | -5.47e-02 |
Token | low |
Token ID | 1877 |
Feature activation | -6.11e-02 |
Token | in |
Token ID | 287 |
Feature activation | -8.31e-02 |
Token | German |
Token ID | 2679 |
Feature activation | +5.89e-03 |
Token | Edu |
Token ID | 40766 |
Feature activation | -4.72e-02 |
Token | ard |
Token ID | 446 |
Feature activation | -1.30e-01 |
Token | Gut |
Token ID | 27549 |
Feature activation | +4.16e-02 |
Token | k |
Token ID | 74 |
Feature activation | +5.31e-02 |
Token | ne |
Token ID | 710 |
Feature activation | +3.78e-01 |
Token | cht |
Token ID | 21474 |
Feature activation | +1.75e-02 |
Token | into |
Token ID | 656 |
Feature activation | +3.70e-02 |
Token | a |
Token ID | 257 |
Feature activation | -7.88e-04 |
Token | coma |
Token ID | 33658 |
Feature activation | -1.79e-02 |
Token | last |
Token ID | 938 |
Feature activation | -7.59e-03 |
Token | slowly |
Token ID | 6364 |
Feature activation | +1.13e-01 |
Token | along |
Token ID | 1863 |
Feature activation | -2.35e-02 |
Token | the |
Token ID | 262 |
Feature activation | +5.17e-02 |
Token | city |
Token ID | 1748 |
Feature activation | -7.10e-03 |
Token | 's |
Token ID | 338 |
Feature activation | +1.03e-01 |
Token | broad |
Token ID | 3154 |
Feature activation | +3.76e-01 |
Token | bou |
Token ID | 35833 |
Feature activation | +1.58e-02 |
Token | lev |
Token ID | 2768 |
Feature activation | -2.03e-02 |
Token | ards |
Token ID | 1371 |
Feature activation | +1.26e-02 |
Token | in |
Token ID | 287 |
Feature activation | +1.97e-01 |
Token | support |
Token ID | 1104 |
Feature activation | +1.98e-02 |
Token | ctl |
Token ID | 34168 |
Feature activation | +1.79e-01 |
Token | restart |
Token ID | 15765 |
Feature activation | +4.62e-02 |
Token | network |
Token ID | 3127 |
Feature activation | +3.28e-03 |
Token | - |
Token ID | 12 |
Feature activation | +4.35e-02 |
Token | manager |
Token ID | 37153 |
Feature activation | +3.66e-02 |
Token | . |
Token ID | 13 |
Feature activation | +3.64e-01 |
Token | service |
Token ID | 15271 |
Feature activation | +1.26e-01 |
Token |
|
Token ID | 198 |
Feature activation | +6.01e-02 |
Token |
|
Token ID | 198 |
Feature activation | -9.95e-02 |
Token | You |
Token ID | 1639 |
Feature activation | -1.60e-02 |
Token | should |
Token ID | 815 |
Feature activation | -6.71e-03 |
Token | The |
Token ID | 464 |
Feature activation | -5.49e-03 |
Token | City |
Token ID | 2254 |
Feature activation | +3.99e-02 |
Token | of |
Token ID | 286 |
Feature activation | +6.99e-02 |
Token | Wh |
Token ID | 854 |
Feature activation | -3.34e-02 |
Token | itt |
Token ID | 715 |
Feature activation | +1.25e-01 |
Token | les |
Token ID | 829 |
Feature activation | +3.53e-01 |
Token | ea |
Token ID | 18213 |
Feature activation | -1.23e-02 |
Token | covers |
Token ID | 8698 |
Feature activation | -1.39e-01 |
Token | almost |
Token ID | 2048 |
Feature activation | -9.36e-02 |
Token | 500 |
Token ID | 5323 |
Feature activation | -1.31e-02 |
Token | square |
Token ID | 6616 |
Feature activation | -1.50e-01 |
Token | affect |
Token ID | 2689 |
Feature activation | +2.93e-03 |
Token | many |
Token ID | 867 |
Feature activation | +5.42e-03 |
Token | — |
Token ID | 851 |
Feature activation | +1.02e-02 |
Token | for |
Token ID | 329 |
Feature activation | +4.82e-03 |
Token | good |
Token ID | 922 |
Feature activation | -6.29e-03 |
Token | or |
Token ID | 393 |
Feature activation | +3.48e-01 |
Token | evil |
Token ID | 6181 |
Feature activation | +5.29e-02 |
Token | — |
Token ID | 851 |
Feature activation | -1.61e-02 |
Token | is |
Token ID | 318 |
Feature activation | +2.34e-02 |
Token | now |
Token ID | 783 |
Feature activation | +4.67e-03 |
Token | scaling |
Token ID | 20796 |
Feature activation | +1.52e-02 |
Token | information |
Token ID | 1321 |
Feature activation | -4.47e-02 |
Token | on |
Token ID | 319 |
Feature activation | +8.12e-03 |
Token | your |
Token ID | 534 |
Feature activation | +5.92e-02 |
Token | website |
Token ID | 3052 |
Feature activation | +1.01e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.61e-02 |
Token | please |
Token ID | 3387 |
Feature activation | +3.46e-01 |
Token | credit |
Token ID | 3884 |
Feature activation | +5.82e-02 |
Token | and |
Token ID | 290 |
Feature activation | +6.78e-02 |
Token | link |
Token ID | 2792 |
Feature activation | +2.31e-02 |
Token | to |
Token ID | 284 |
Feature activation | +1.91e-02 |
Token | this |
Token ID | 428 |
Feature activation | +4.71e-02 |
Token | ethical |
Token ID | 32949 |
Feature activation | +1.55e-04 |
Token | views |
Token ID | 5009 |
Feature activation | +2.04e-02 |
Token | , |
Token ID | 11 |
Feature activation | +9.40e-03 |
Token | takes |
Token ID | 2753 |
Feature activation | +2.23e-02 |
Token | there |
Token ID | 612 |
Feature activation | +3.27e-02 |
Token | to |
Token ID | 284 |
Feature activation | +3.43e-01 |
Token | be |
Token ID | 307 |
Feature activation | +1.13e-02 |
Token | normative |
Token ID | 46219 |
Feature activation | +1.24e-02 |
Token | facts |
Token ID | 6419 |
Feature activation | +5.81e-03 |
Token | which |
Token ID | 543 |
Feature activation | -5.28e-03 |
Token | can |
Token ID | 460 |
Feature activation | +1.68e-02 |
Token | can |
Token ID | 460 |
Feature activation | +3.49e-02 |
Token | 't |
Token ID | 470 |
Feature activation | -9.82e-03 |
Token | for |
Token ID | 329 |
Feature activation | +3.78e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.68e-02 |
Token | life |
Token ID | 1204 |
Feature activation | +1.42e-01 |
Token | of |
Token ID | 286 |
Feature activation | +3.38e-01 |
Token | me |
Token ID | 502 |
Feature activation | +3.49e-02 |
Token | remember |
Token ID | 3505 |
Feature activation | +3.90e-02 |
Token | anything |
Token ID | 1997 |
Feature activation | +1.31e-02 |
Token | that |
Token ID | 326 |
Feature activation | +1.59e-02 |
Token | preceded |
Token ID | 27165 |
Feature activation | -1.30e-02 |
Token | large |
Token ID | 1588 |
Feature activation | -2.34e-02 |
Token | open |
Token ID | 1280 |
Feature activation | -3.37e-02 |
Token | spaces |
Token ID | 9029 |
Feature activation | -7.45e-04 |
Token | and |
Token ID | 290 |
Feature activation | +6.72e-03 |
Token | pl |
Token ID | 458 |
Feature activation | -4.97e-03 |
Token | az |
Token ID | 1031 |
Feature activation | +3.34e-01 |
Token | as |
Token ID | 292 |
Feature activation | +2.89e-03 |
Token | on |
Token ID | 319 |
Feature activation | -6.68e-02 |
Token | three |
Token ID | 1115 |
Feature activation | -1.03e-02 |
Token | of |
Token ID | 286 |
Feature activation | +8.66e-02 |
Token | its |
Token ID | 663 |
Feature activation | -2.15e-03 |
Token | Read |
Token ID | 5569 |
Feature activation | +7.07e-02 |
Token | or |
Token ID | 393 |
Feature activation | +4.38e-02 |
Token | Share |
Token ID | 8734 |
Feature activation | -1.07e-01 |
Token | this |
Token ID | 428 |
Feature activation | +8.14e-02 |
Token | story |
Token ID | 1621 |
Feature activation | +7.50e-02 |
Token | : |
Token ID | 25 |
Feature activation | +3.31e-01 |
Token | http |
Token ID | 2638 |
Feature activation | +1.47e-02 |
Token | :// |
Token ID | 1378 |
Feature activation | +3.22e-02 |
Token | on |
Token ID | 261 |
Feature activation | +1.20e-01 |
Token | . |
Token ID | 13 |
Feature activation | -1.63e-02 |
Token | c |
Token ID | 66 |
Feature activation | +8.45e-02 |
Token | essays |
Token ID | 27126 |
Feature activation | -6.33e-02 |
Token | by |
Token ID | 416 |
Feature activation | +4.98e-02 |
Token | Scott |
Token ID | 4746 |
Feature activation | -5.72e-02 |
Token | Ric |
Token ID | 15868 |
Feature activation | +6.98e-02 |
Token | her |
Token ID | 372 |
Feature activation | +2.17e-01 |
Token | t |
Token ID | 83 |
Feature activation | +3.28e-01 |
Token | and |
Token ID | 290 |
Feature activation | +1.90e-01 |
Token | David |
Token ID | 3271 |
Feature activation | +6.48e-02 |
Token | Gordon |
Token ID | 11646 |
Feature activation | +7.33e-02 |
Token | ( |
Token ID | 357 |
Feature activation | +7.71e-02 |
Token | IS |
Token ID | 1797 |
Feature activation | -5.23e-02 |
Token | Sch |
Token ID | 3059 |
Feature activation | -1.35e-02 |
Token | oles |
Token ID | 4316 |
Feature activation | +1.11e-02 |
Token | , |
Token ID | 11 |
Feature activation | -3.57e-03 |
Token | Mark |
Token ID | 2940 |
Feature activation | +4.38e-02 |
Token | Raw |
Token ID | 16089 |
Feature activation | +9.06e-02 |
Token | l |
Token ID | 75 |
Feature activation | +3.20e-01 |
Token | inson |
Token ID | 7899 |
Feature activation | +3.87e-02 |
Token | , |
Token ID | 11 |
Feature activation | +1.84e-02 |
Token | John |
Token ID | 1757 |
Feature activation | +3.17e-02 |
Token | O |
Token ID | 440 |
Feature activation | -8.02e-02 |
Token | ' |
Token ID | 6 |
Feature activation | -1.53e-03 |
Token | businesses |
Token ID | 5692 |
Feature activation | -6.62e-03 |
Token | that |
Token ID | 326 |
Feature activation | +3.00e-02 |
Token | received |
Token ID | 2722 |
Feature activation | +2.31e-01 |
Token | Priv |
Token ID | 9243 |
Feature activation | -3.46e-02 |
Token | at |
Token ID | 265 |
Feature activation | +1.17e-02 |
Token | bank |
Token ID | 17796 |
Feature activation | +3.18e-01 |
Token | loans |
Token ID | 10021 |
Feature activation | +5.67e-02 |
Token | are |
Token ID | 389 |
Feature activation | -3.88e-03 |
Token | Vi |
Token ID | 16049 |
Feature activation | -6.88e-02 |
Token | aches |
Token ID | 3694 |
Feature activation | -2.34e-01 |
Token | lav |
Token ID | 18809 |
Feature activation | -5.35e-02 |
Token | . |
Token ID | 13 |
Feature activation | -6.50e-03 |
Token | The |
Token ID | 383 |
Feature activation | -1.16e-02 |
Token | event |
Token ID | 1785 |
Feature activation | +6.81e-03 |
Token | in |
Token ID | 287 |
Feature activation | +3.41e-02 |
Token | Am |
Token ID | 1703 |
Feature activation | +3.19e-02 |
Token | her |
Token ID | 372 |
Feature activation | +3.14e-01 |
Token | st |
Token ID | 301 |
Feature activation | -3.74e-02 |
Token | was |
Token ID | 373 |
Feature activation | -7.21e-03 |
Token | the |
Token ID | 262 |
Feature activation | +1.99e-02 |
Token | first |
Token ID | 717 |
Feature activation | +4.27e-02 |
Token | of |
Token ID | 286 |
Feature activation | +2.04e-02 |
Token | B |
Token ID | 33 |
Feature activation | +3.97e-02 |
Token | uk |
Token ID | 2724 |
Feature activation | -1.14e-01 |
Token | hari |
Token ID | 49573 |
Feature activation | -5.35e-04 |
Token | , |
Token ID | 11 |
Feature activation | +1.27e-02 |
Token | 5 |
Token ID | 642 |
Feature activation | +4.26e-02 |
Token | : |
Token ID | 25 |
Feature activation | +3.10e-01 |
Token | 58 |
Token ID | 3365 |
Feature activation | +4.03e-02 |
Token | : |
Token ID | 25 |
Feature activation | +2.74e-01 |
Token | 148 |
Token ID | 18294 |
Feature activation | +3.57e-02 |
Token |
|
Token ID | 198 |
Feature activation | +3.43e-03 |
Token |
|
Token ID | 198 |
Feature activation | -2.73e-02 |
Token | doi |
Token ID | 23899 |
Feature activation | -8.39e-04 |
Token | : |
Token ID | 25 |
Feature activation | -4.20e-03 |
Token | 10 |
Token ID | 838 |
Feature activation | -8.09e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.31e-01 |
Token | 10 |
Token ID | 940 |
Feature activation | -5.56e-02 |
Token | 71 |
Token ID | 4869 |
Feature activation | -5.79e-01 |
Token | / |
Token ID | 14 |
Feature activation | -1.86e-01 |
Token | Z |
Token ID | 57 |
Feature activation | +1.12e-02 |
Token | O |
Token ID | 46 |
Feature activation | +5.25e-02 |
Token | 130 |
Token ID | 12952 |
Feature activation | +1.93e-01 |
Token | 95 |
Token ID | 3865 |
Feature activation | +6.08e-02 |
Token | Books |
Token ID | 13661 |
Feature activation | -6.82e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Token | 2000 |
Token ID | 4751 |
Feature activation | -5.35e-02 |
Token | ), |
Token ID | 828 |
Feature activation | -2.39e-01 |
Token | my |
Token ID | 616 |
Feature activation | -7.30e-02 |
Token | biography |
Token ID | 26444 |
Feature activation | -4.11e-01 |
Token | of |
Token ID | 286 |
Feature activation | -6.51e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.51e-01 |
Token | great |
Token ID | 1049 |
Feature activation | -3.66e-02 |
Token | libertarian |
Token ID | 19466 |
Feature activation | -1.45e-01 |
Token | thinker |
Token ID | 45206 |
Feature activation | -2.46e-01 |
Token | iss |
Token ID | 747 |
Feature activation | -5.83e-02 |
Token | ar |
Token ID | 283 |
Feature activation | -2.05e-02 |
Token | of |
Token ID | 286 |
Feature activation | -9.13e-02 |
Token | Defense |
Token ID | 5947 |
Feature activation | -1.51e-02 |
Token | S |
Token ID | 311 |
Feature activation | -4.94e-03 |
Token | emy |
Token ID | 3065 |
Feature activation | -4.08e-01 |
Token | on |
Token ID | 261 |
Feature activation | -1.35e-02 |
Token | Tim |
Token ID | 5045 |
Feature activation | -7.09e-02 |
Token | oshenko |
Token ID | 43934 |
Feature activation | +1.63e-02 |
Token | and |
Token ID | 290 |
Feature activation | +7.00e-03 |
Token | Zh |
Token ID | 10511 |
Feature activation | +2.45e-03 |
Token | less |
Token ID | 1203 |
Feature activation | +1.77e-02 |
Token | as |
Token ID | 355 |
Feature activation | -5.58e-03 |
Token | possible |
Token ID | 1744 |
Feature activation | -8.62e-04 |
Token | so |
Token ID | 523 |
Feature activation | -3.82e-02 |
Token | try |
Token ID | 1949 |
Feature activation | -1.99e-03 |
Token | not |
Token ID | 407 |
Feature activation | -4.07e-01 |
Token | to |
Token ID | 284 |
Feature activation | -6.68e-02 |
Token | get |
Token ID | 651 |
Feature activation | -1.56e-02 |
Token | overly |
Token ID | 17698 |
Feature activation | -1.71e-03 |
Token | frustrated |
Token ID | 14718 |
Feature activation | +1.56e-03 |
Token | with |
Token ID | 351 |
Feature activation | -2.14e-02 |
Token | , |
Token ID | 11 |
Feature activation | -9.56e-02 |
Token | 055 |
Token ID | 47838 |
Feature activation | -5.58e-03 |
Token | , |
Token ID | 11 |
Feature activation | +6.42e-02 |
Token | and |
Token ID | 290 |
Feature activation | +1.44e-02 |
Token | JPMorgan |
Token ID | 43318 |
Feature activation | -1.09e-01 |
Token | Chase |
Token ID | 16346 |
Feature activation | -3.89e-01 |
Token | was |
Token ID | 373 |
Feature activation | +5.26e-02 |
Token | the |
Token ID | 262 |
Feature activation | +1.89e-04 |
Token | subject |
Token ID | 2426 |
Feature activation | +3.81e-02 |
Token | of |
Token ID | 286 |
Feature activation | +6.85e-02 |
Token | 20 |
Token ID | 1160 |
Feature activation | -1.68e-02 |
Token | functions |
Token ID | 5499 |
Feature activation | -6.92e-02 |
Token | using |
Token ID | 1262 |
Feature activation | +1.45e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.65e-01 |
Token | archived |
Token ID | 33962 |
Feature activation | -5.79e-02 |
Token | file |
Token ID | 2393 |
Feature activation | -1.86e-02 |
Token | from |
Token ID | 422 |
Feature activation | -3.85e-01 |
Token | S |
Token ID | 311 |
Feature activation | -8.54e-02 |
Token | 3 |
Token ID | 18 |
Feature activation | -3.05e-01 |
Token | bucket |
Token ID | 19236 |
Feature activation | -2.67e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.61e-02 |
Token | It |
Token ID | 632 |
Feature activation | +6.26e-03 |
Token | Trump |
Token ID | 1301 |
Feature activation | -4.54e-02 |
Token | House |
Token ID | 18102 |
Feature activation | +1.13e-02 |
Token | committee |
Token ID | 5583 |
Feature activation | -2.17e-01 |
Token | believes |
Token ID | 5804 |
Feature activation | -1.94e-02 |
Token | it |
Token ID | 340 |
Feature activation | -1.95e-01 |
Token | has |
Token ID | 468 |
Feature activation | -3.75e-01 |
Token | evidence |
Token ID | 2370 |
Feature activation | -2.20e-01 |
Token | Trump |
Token ID | 1301 |
Feature activation | -3.67e-02 |
Token | requested |
Token ID | 9167 |
Feature activation | +1.22e-01 |
Token | putting |
Token ID | 5137 |
Feature activation | -1.49e-01 |
Token | ally |
Token ID | 12525 |
Feature activation | -7.73e-02 |
Token | Ratings |
Token ID | 36826 |
Feature activation | +4.58e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.14e-03 |
Token |
|
Token ID | 198 |
Feature activation | -7.04e-02 |
Token |
|
Token ID | 198 |
Feature activation | +3.53e-02 |
Token | Sl |
Token ID | 11122 |
Feature activation | -2.60e-02 |
Token | ideshow |
Token ID | 42286 |
Feature activation | -3.60e-01 |
Token | ( |
Token ID | 357 |
Feature activation | -1.27e-02 |
Token | 2 |
Token ID | 17 |
Feature activation | +5.52e-02 |
Token | Images |
Token ID | 5382 |
Feature activation | -5.73e-02 |
Token | ) |
Token ID | 8 |
Feature activation | -5.53e-03 |
Token |
|
Token ID | 198 |
Feature activation | -6.84e-03 |
Token | par |
Token ID | 1582 |
Feature activation | +1.21e-02 |
Token | asy |
Token ID | 4107 |
Feature activation | +1.40e-02 |
Token | mp |
Token ID | 3149 |
Feature activation | -1.58e-02 |
Token | athetic |
Token ID | 18874 |
Feature activation | -7.76e-02 |
Token | resting |
Token ID | 19186 |
Feature activation | -7.66e-03 |
Token | tone |
Token ID | 8216 |
Feature activation | -3.58e-01 |
Token | in |
Token ID | 287 |
Feature activation | -1.07e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.57e-03 |
Token | evening |
Token ID | 6180 |
Feature activation | -9.03e-02 |
Token | during |
Token ID | 1141 |
Feature activation | +8.45e-03 |
Token | the |
Token ID | 262 |
Feature activation | +3.42e-02 |
Token | of |
Token ID | 286 |
Feature activation | -6.51e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.51e-01 |
Token | great |
Token ID | 1049 |
Feature activation | -3.66e-02 |
Token | libertarian |
Token ID | 19466 |
Feature activation | -1.45e-01 |
Token | thinker |
Token ID | 45206 |
Feature activation | -2.46e-01 |
Token | , |
Token ID | 11 |
Feature activation | -3.55e-01 |
Token | here |
Token ID | 994 |
Feature activation | -4.06e-02 |
Token | . |
Token ID | 13 |
Feature activation | -3.76e-02 |
Token |
|
Token ID | 198 |
Feature activation | -4.78e-03 |
Token |
|
Token ID | 198 |
Feature activation | -3.69e-02 |
Token | Read |
Token ID | 5569 |
Feature activation | +2.38e-01 |
Token | , |
Token ID | 11 |
Feature activation | -3.81e-02 |
Token | whilst |
Token ID | 14590 |
Feature activation | -3.48e-02 |
Token | at |
Token ID | 379 |
Feature activation | +3.85e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.20e-02 |
Token | same |
Token ID | 976 |
Feature activation | +1.71e-01 |
Token | time |
Token ID | 640 |
Feature activation | -3.55e-01 |
Token | providing |
Token ID | 4955 |
Feature activation | +7.55e-03 |
Token | us |
Token ID | 514 |
Feature activation | -3.40e-03 |
Token | with |
Token ID | 351 |
Feature activation | -5.29e-03 |
Token | more |
Token ID | 517 |
Feature activation | -3.57e-02 |
Token | than |
Token ID | 621 |
Feature activation | +6.46e-02 |
Token | bit |
Token ID | 1643 |
Feature activation | +2.76e-02 |
Token | stubborn |
Token ID | 24444 |
Feature activation | -2.22e-02 |
Token | ." |
Token ID | 526 |
Feature activation | -1.25e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.13e-02 |
Token | Every |
Token ID | 6109 |
Feature activation | +9.47e-03 |
Token | share |
Token ID | 2648 |
Feature activation | -3.55e-01 |
Token | makes |
Token ID | 1838 |
Feature activation | -3.20e-01 |
Token | Black |
Token ID | 2619 |
Feature activation | -2.73e-02 |
Token | Voice |
Token ID | 15282 |
Feature activation | -3.05e-02 |
Token | louder |
Token ID | 27089 |
Feature activation | +4.57e-02 |
Token | ! |
Token ID | 0 |
Feature activation | +4.59e-02 |
Token | winner |
Token ID | 8464 |
Feature activation | +1.83e-03 |
Token | was |
Token ID | 373 |
Feature activation | +7.81e-04 |
Token | Ar |
Token ID | 943 |
Feature activation | +4.61e-02 |
Token | lene |
Token ID | 29466 |
Feature activation | +8.33e-03 |
Token | Go |
Token ID | 1514 |
Feature activation | +7.84e-03 |
Token | le |
Token ID | 293 |
Feature activation | -3.55e-01 |
Token | mb |
Token ID | 2022 |
Feature activation | -7.14e-02 |
Token | iew |
Token ID | 769 |
Feature activation | +1.48e-02 |
Token | ski |
Token ID | 20545 |
Feature activation | +2.44e-02 |
Token | . |
Token ID | 13 |
Feature activation | -7.82e-03 |
Token | Read |
Token ID | 4149 |
Feature activation | -1.41e-01 |
Token | Virtual |
Token ID | 15595 |
Feature activation | +4.68e-03 |
Token | Console |
Token ID | 24371 |
Feature activation | +3.71e-02 |
Token | service |
Token ID | 2139 |
Feature activation | +4.71e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.19e-01 |
Token | which |
Token ID | 543 |
Feature activation | -7.18e-02 |
Token | brings |
Token ID | 6774 |
Feature activation | -3.48e-01 |
Token | you |
Token ID | 345 |
Feature activation | -1.65e-02 |
Token | great |
Token ID | 1049 |
Feature activation | +5.32e-02 |
Token | games |
Token ID | 1830 |
Feature activation | -1.09e-01 |
Token | created |
Token ID | 2727 |
Feature activation | -1.24e-01 |
Token | for |
Token ID | 329 |
Feature activation | -1.62e-01 |
Token | DOI |
Token ID | 40722 |
Feature activation | -2.50e-03 |
Token | : |
Token ID | 25 |
Feature activation | +1.99e-02 |
Token | 10 |
Token ID | 838 |
Feature activation | -9.54e-03 |
Token | . |
Token ID | 13 |
Feature activation | -6.87e-02 |
Token | 10 |
Token ID | 940 |
Feature activation | +7.13e-02 |
Token | 86 |
Token ID | 4521 |
Feature activation | -3.38e-01 |
Token | / |
Token ID | 14 |
Feature activation | +1.21e-01 |
Token | 34 |
Token ID | 2682 |
Feature activation | -3.75e-02 |
Token | 110 |
Token ID | 11442 |
Feature activation | -2.26e-02 |
Token | 7 |
Token ID | 22 |
Feature activation | +2.47e-02 |
Token |
|
Token ID | 198 |
Feature activation | -5.41e-03 |
Token | . |
Token ID | 13 |
Feature activation | -9.18e-03 |
Token | A |
Token ID | 317 |
Feature activation | +5.55e-02 |
Token | 5 |
Token ID | 642 |
Feature activation | -1.22e-02 |
Token | - |
Token ID | 12 |
Feature activation | +5.08e-02 |
Token | mic |
Token ID | 9383 |
Feature activation | -2.91e-02 |
Token | ron |
Token ID | 1313 |
Feature activation | -3.30e-01 |
Token | pin |
Token ID | 6757 |
Feature activation | -3.14e-02 |
Token | hole |
Token ID | 13207 |
Feature activation | -2.79e-02 |
Token | is |
Token ID | 318 |
Feature activation | +6.89e-03 |
Token | about |
Token ID | 546 |
Feature activation | +6.25e-03 |
Token | the |
Token ID | 262 |
Feature activation | +4.41e-02 |
Token | even |
Token ID | 772 |
Feature activation | +2.22e-02 |
Token | if |
Token ID | 611 |
Feature activation | -1.78e-02 |
Token | Lee |
Token ID | 5741 |
Feature activation | -4.92e-02 |
Token | Chung |
Token ID | 43915 |
Feature activation | +3.71e-02 |
Token | - |
Token ID | 12 |
Feature activation | -8.41e-02 |
Token | y |
Token ID | 88 |
Feature activation | -3.28e-01 |
Token | ong |
Token ID | 506 |
Feature activation | +2.08e-02 |
Token | might |
Token ID | 1244 |
Feature activation | +2.49e-03 |
Token | have |
Token ID | 423 |
Feature activation | +2.50e-02 |
Token | done |
Token ID | 1760 |
Feature activation | +4.15e-02 |
Token | better |
Token ID | 1365 |
Feature activation | +4.81e-03 |
Token | ] |
Token ID | 60 |
Feature activation | +6.78e-03 |
Token | :: |
Token ID | 3712 |
Feature activation | -1.54e-01 |
Token | B |
Token ID | 33 |
Feature activation | +3.14e-02 |
Token | old |
Token ID | 727 |
Feature activation | -1.32e-03 |
Token | ) |
Token ID | 8 |
Feature activation | -2.92e-02 |
Token | $ |
Token ID | 720 |
Feature activation | -3.25e-01 |
Token | Br |
Token ID | 9414 |
Feature activation | -8.51e-02 |
Token | ush |
Token ID | 1530 |
Feature activation | -1.84e-02 |
Token | 2 |
Token ID | 17 |
Feature activation | +1.42e-02 |
Token | = |
Token ID | 796 |
Feature activation | +1.47e-02 |
Token | New |
Token ID | 968 |
Feature activation | -9.56e-02 |
Token | delayed |
Token ID | 11038 |
Feature activation | -5.69e-02 |
Token | retirement |
Token ID | 10737 |
Feature activation | +3.90e-03 |
Token | , |
Token ID | 11 |
Feature activation | -1.92e-02 |
Token | see |
Token ID | 766 |
Feature activation | +2.97e-03 |
Token | Pr |
Token ID | 1736 |
Feature activation | -1.40e-02 |
Token | ud |
Token ID | 463 |
Feature activation | -3.23e-01 |
Token | ential |
Token ID | 1843 |
Feature activation | -3.40e-02 |
Token | 2017 |
Token ID | 2177 |
Feature activation | +5.18e-04 |
Token | .) |
Token ID | 2014 |
Feature activation | -1.65e-02 |
Token |
|
Token ID | 198 |
Feature activation | +2.48e-02 |
Token |
|
Token ID | 198 |
Feature activation | -3.57e-03 |
Token | Trump |
Token ID | 1301 |
Feature activation | -6.40e-02 |
Token | House |
Token ID | 18102 |
Feature activation | +5.31e-03 |
Token | committee |
Token ID | 5583 |
Feature activation | -1.83e-01 |
Token | believes |
Token ID | 5804 |
Feature activation | -1.30e-02 |
Token | it |
Token ID | 340 |
Feature activation | -1.53e-01 |
Token | has |
Token ID | 468 |
Feature activation | -3.22e-01 |
Token | evidence |
Token ID | 2370 |
Feature activation | -2.42e-01 |
Token | Trump |
Token ID | 1301 |
Feature activation | -6.54e-02 |
Token | requested |
Token ID | 9167 |
Feature activation | +1.38e-01 |
Token | putting |
Token ID | 5137 |
Feature activation | -1.54e-01 |
Token | ally |
Token ID | 12525 |
Feature activation | -9.51e-02 |
Token | possession |
Token ID | 7797 |
Feature activation | -1.15e-03 |
Token | , |
Token ID | 11 |
Feature activation | +1.87e-02 |
Token | or |
Token ID | 393 |
Feature activation | +7.47e-02 |
Token | tribe |
Token ID | 14893 |
Feature activation | -4.13e-03 |
Token | respecting |
Token ID | 30796 |
Feature activation | +1.95e-01 |
Token | a |
Token ID | 257 |
Feature activation | +1.72e-01 |
Token | relationship |
Token ID | 2776 |
Feature activation | -3.34e-03 |
Token | between |
Token ID | 1022 |
Feature activation | +8.99e-02 |
Token | persons |
Token ID | 6506 |
Feature activation | -3.23e-02 |
Token | of |
Token ID | 286 |
Feature activation | +1.77e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.94e-02 |
Token | Thank |
Token ID | 10449 |
Feature activation | -1.76e-02 |
Token | you |
Token ID | 345 |
Feature activation | -1.36e-01 |
Token | for |
Token ID | 329 |
Feature activation | -8.19e-02 |
Token | signing |
Token ID | 8415 |
Feature activation | -3.66e-02 |
Token | up |
Token ID | 510 |
Feature activation | -4.21e-03 |
Token | . |
Token ID | 13 |
Feature activation | +1.87e-01 |
Token | For |
Token ID | 1114 |
Feature activation | -1.60e-02 |
Token | more |
Token ID | 517 |
Feature activation | -2.51e-02 |
Token | from |
Token ID | 422 |
Feature activation | +1.55e-02 |
Token | The |
Token ID | 383 |
Feature activation | -2.17e-02 |
Token | Nation |
Token ID | 8741 |
Feature activation | -2.86e-02 |
Token | the |
Token ID | 262 |
Feature activation | +1.22e-02 |
Token | arrival |
Token ID | 10325 |
Feature activation | -1.46e-02 |
Token | of |
Token ID | 286 |
Feature activation | +6.81e-03 |
Token | Th |
Token ID | 536 |
Feature activation | +1.60e-02 |
Token | ier |
Token ID | 959 |
Feature activation | +9.59e-02 |
Token | ry |
Token ID | 563 |
Feature activation | +2.58e-01 |
Token | Henry |
Token ID | 8616 |
Feature activation | -1.13e-02 |
Token | . |
Token ID | 13 |
Feature activation | -2.96e-02 |
Token | It |
Token ID | 632 |
Feature activation | -2.02e-02 |
Token | has |
Token ID | 468 |
Feature activation | -1.16e-02 |
Token | picked |
Token ID | 6497 |
Feature activation | +5.76e-02 |
Token | Though |
Token ID | 7486 |
Feature activation | -4.63e-03 |
Token | I |
Token ID | 314 |
Feature activation | +3.24e-02 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.46e-02 |
Token | pretty |
Token ID | 2495 |
Feature activation | +1.49e-02 |
Token | middle |
Token ID | 3504 |
Feature activation | -2.91e-02 |
Token | of |
Token ID | 286 |
Feature activation | +1.83e-01 |
Token | the |
Token ID | 262 |
Feature activation | +1.73e-01 |
Token | road |
Token ID | 2975 |
Feature activation | -2.19e-02 |
Token | on |
Token ID | 319 |
Feature activation | +1.13e-02 |
Token | Tor |
Token ID | 4022 |
Feature activation | -5.12e-03 |
Token | chy |
Token ID | 29658 |
Feature activation | -2.40e-04 |
Token | ing |
Token ID | 278 |
Feature activation | -5.28e-02 |
Token | Time |
Token ID | 3862 |
Feature activation | -5.84e-02 |
Token | : |
Token ID | 25 |
Feature activation | +1.22e-02 |
Token | The |
Token ID | 383 |
Feature activation | -8.08e-04 |
Token | D |
Token ID | 360 |
Feature activation | -1.63e-02 |
Token | ich |
Token ID | 488 |
Feature activation | +2.13e-01 |
Token | otom |
Token ID | 43125 |
Feature activation | +2.64e-02 |
Token | izing |
Token ID | 2890 |
Feature activation | -2.22e-02 |
Token | Disc |
Token ID | 8444 |
Feature activation | -1.37e-02 |
Token | ourse |
Token ID | 9047 |
Feature activation | +3.01e-02 |
Token | of |
Token ID | 286 |
Feature activation | +1.36e-03 |
Token | that |
Token ID | 326 |
Feature activation | -1.18e-04 |
Token | sense |
Token ID | 2565 |
Feature activation | +9.28e-03 |
Token | of |
Token ID | 286 |
Feature activation | -4.83e-04 |
Token | the |
Token ID | 262 |
Feature activation | -3.12e-03 |
Token | unknown |
Token ID | 6439 |
Feature activation | -1.45e-02 |
Token | is |
Token ID | 318 |
Feature activation | -1.27e-02 |
Token | really |
Token ID | 1107 |
Feature activation | -2.28e-02 |
Token | cool |
Token ID | 3608 |
Feature activation | +1.63e-02 |
Token | . |
Token ID | 13 |
Feature activation | -7.54e-03 |
Token | Every |
Token ID | 3887 |
Feature activation | +4.63e-03 |
Token | map |
Token ID | 3975 |
Feature activation | +3.08e-02 |
Token | Al |
Token ID | 978 |
Feature activation | -2.14e-03 |
Token | P |
Token ID | 350 |
Feature activation | -6.46e-02 |
Token | urdy |
Token ID | 22876 |
Feature activation | +2.02e-02 |
Token | � |
Token ID | 447 |
Feature activation | +2.88e-03 |
Token | � |
Token ID | 247 |
Feature activation | +5.61e-03 |
Token | s |
Token ID | 82 |
Feature activation | +1.52e-02 |
Token | statue |
Token ID | 15207 |
Feature activation | +4.02e-02 |
Token | , |
Token ID | 11 |
Feature activation | +1.33e-02 |
Token | Queen |
Token ID | 7542 |
Feature activation | -1.63e-03 |
Token | � |
Token ID | 447 |
Feature activation | +1.53e-02 |
Token | � |
Token ID | 247 |
Feature activation | -2.85e-02 |
Token | you |
Token ID | 345 |
Feature activation | +8.57e-03 |
Token | don |
Token ID | 836 |
Feature activation | +1.20e-02 |
Token | 't |
Token ID | 470 |
Feature activation | -4.19e-03 |
Token | feel |
Token ID | 1254 |
Feature activation | +2.54e-02 |
Token | confident |
Token ID | 6563 |
Feature activation | +5.15e-02 |
Token | enough |
Token ID | 1576 |
Feature activation | -4.32e-03 |
Token | to |
Token ID | 284 |
Feature activation | -1.80e-02 |
Token | go |
Token ID | 467 |
Feature activation | +1.48e-02 |
Token | to |
Token ID | 284 |
Feature activation | -6.80e-03 |
Token | a |
Token ID | 257 |
Feature activation | -5.87e-03 |
Token | gym |
Token ID | 11550 |
Feature activation | +4.55e-02 |
Token | players |
Token ID | 1938 |
Feature activation | +3.24e-02 |
Token | from |
Token ID | 422 |
Feature activation | -2.76e-02 |
Token | other |
Token ID | 584 |
Feature activation | +6.67e-03 |
Token | team |
Token ID | 1074 |
Feature activation | +6.87e-03 |
Token | such |
Token ID | 884 |
Feature activation | -2.40e-02 |
Token | as |
Token ID | 355 |
Feature activation | -6.43e-04 |
Token | sc |
Token ID | 629 |
Feature activation | -3.08e-03 |
Token | a |
Token ID | 64 |
Feature activation | +4.63e-02 |
Token | . |
Token ID | 13 |
Feature activation | +2.03e-02 |
Token | If |
Token ID | 1002 |
Feature activation | +3.05e-02 |
Token | it |
Token ID | 340 |
Feature activation | -8.70e-02 |
Token | amount |
Token ID | 2033 |
Feature activation | -1.51e-02 |
Token | of |
Token ID | 286 |
Feature activation | +4.59e-03 |
Token | money |
Token ID | 1637 |
Feature activation | +1.02e-01 |
Token | she |
Token ID | 673 |
Feature activation | +3.16e-02 |
Token | receives |
Token ID | 11583 |
Feature activation | -2.04e-03 |
Token | from |
Token ID | 422 |
Feature activation | -9.02e-03 |
Token | the |
Token ID | 262 |
Feature activation | +2.59e-02 |
Token | petroleum |
Token ID | 30918 |
Feature activation | +1.46e-02 |
Token | industry |
Token ID | 2831 |
Feature activation | +1.37e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.34e-02 |
Token |
|
Token ID | 198 |
Feature activation | -5.62e-02 |
Token | е |
Token ID | 16843 |
Feature activation | -9.75e-02 |
Token | л |
Token ID | 30143 |
Feature activation | -5.90e-02 |
Token | � |
Token ID | 12466 |
Feature activation | -1.03e-01 |
Token | � |
Token ID | 110 |
Feature activation | -6.12e-02 |
Token | � |
Token ID | 12466 |
Feature activation | -1.01e-02 |
Token | � |
Token ID | 115 |
Feature activation | -8.62e-02 |
Token | а |
Token ID | 16142 |
Feature activation | -6.67e-02 |
Token | � |
Token ID | 140 |
Feature activation | +5.31e-02 |
Token | � |
Token ID | 123 |
Feature activation | -1.31e-01 |
Token | а |
Token ID | 16142 |
Feature activation | -3.40e-02 |
Token | я |
Token ID | 40623 |
Feature activation | +1.66e-02 |
Token | EN |
Token ID | 1677 |
Feature activation | -8.23e-03 |
Token | p |
Token ID | 79 |
Feature activation | -2.57e-03 |
Token | aul |
Token ID | 2518 |
Feature activation | +1.59e-02 |
Token | i |
Token ID | 72 |
Feature activation | +9.00e-03 |
Token | . |
Token ID | 13 |
Feature activation | +6.33e-03 |
Token | re |
Token ID | 260 |
Feature activation | -1.93e-01 |
Token | in |
Token ID | 259 |
Feature activation | -5.72e-02 |
Token | ik |
Token ID | 1134 |
Feature activation | +2.05e-02 |
Token | ain |
Token ID | 391 |
Feature activation | +2.94e-03 |
Token | en |
Token ID | 268 |
Feature activation | +3.06e-03 |
Token | @ |
Token ID | 2488 |
Feature activation | +6.07e-03 |
Token | the |
Token ID | 262 |
Feature activation | +5.58e-03 |
Token | deal |
Token ID | 1730 |
Feature activation | -1.30e-02 |
Token | , |
Token ID | 11 |
Feature activation | -7.43e-04 |
Token | anything |
Token ID | 1997 |
Feature activation | +3.03e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.21e-01 |
Token | bring |
Token ID | 2222 |
Feature activation | -1.54e-01 |
Token | an |
Token ID | 281 |
Feature activation | +9.89e-03 |
Token | end |
Token ID | 886 |
Feature activation | -9.83e-02 |
Token | to |
Token ID | 284 |
Feature activation | +6.68e-03 |
Token | this |
Token ID | 428 |
Feature activation | +6.26e-02 |
Token | hell |
Token ID | 5968 |
Feature activation | -1.74e-02 |
Token | protections |
Token ID | 15018 |
Feature activation | -5.36e-02 |
Token | of |
Token ID | 286 |
Feature activation | -2.27e-02 |
Token | the |
Token ID | 262 |
Feature activation | -2.24e-02 |
Token | Constitution |
Token ID | 7965 |
Feature activation | -1.42e-02 |
Token | . |
Token ID | 13 |
Feature activation | +4.05e-03 |
Token |
|
Token ID | 198 |
Feature activation | -8.83e-02 |
Token |
|
Token ID | 198 |
Feature activation | -6.71e-04 |
Token | In |
Token ID | 818 |
Feature activation | +9.88e-03 |
Token | the |
Token ID | 262 |
Feature activation | +3.28e-03 |
Token | opinion |
Token ID | 4459 |
Feature activation | +9.36e-04 |
Token | , |
Token ID | 11 |
Feature activation | -6.55e-03 |
Token | . |
Token ID | 13 |
Feature activation | +1.39e-02 |
Token | " |
Token ID | 366 |
Feature activation | +1.95e-02 |
Token | I |
Token ID | 40 |
Feature activation | +9.61e-03 |
Token | bought |
Token ID | 5839 |
Feature activation | -4.61e-02 |
Token | the |
Token ID | 262 |
Feature activation | -2.35e-03 |
Token | drugs |
Token ID | 5010 |
Feature activation | -9.61e-02 |
Token | to |
Token ID | 284 |
Feature activation | +3.12e-03 |
Token | enhance |
Token ID | 9494 |
Feature activation | +2.36e-02 |
Token | masturbation |
Token ID | 41054 |
Feature activation | +1.39e-02 |
Token | . |
Token ID | 13 |
Feature activation | +2.91e-03 |
Token | Because |
Token ID | 4362 |
Feature activation | -4.89e-02 |
Token | functions |
Token ID | 5499 |
Feature activation | -6.92e-02 |
Token | using |
Token ID | 1262 |
Feature activation | +1.45e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.65e-01 |
Token | archived |
Token ID | 33962 |
Feature activation | -5.79e-02 |
Token | file |
Token ID | 2393 |
Feature activation | -1.86e-02 |
Token | from |
Token ID | 422 |
Feature activation | -3.85e-01 |
Token | S |
Token ID | 311 |
Feature activation | -8.54e-02 |
Token | 3 |
Token ID | 18 |
Feature activation | -3.05e-01 |
Token | bucket |
Token ID | 19236 |
Feature activation | -2.67e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.61e-02 |
Token | It |
Token ID | 632 |
Feature activation | +6.26e-03 |
Token | iss |
Token ID | 747 |
Feature activation | -5.83e-02 |
Token | ar |
Token ID | 283 |
Feature activation | -2.05e-02 |
Token | of |
Token ID | 286 |
Feature activation | -9.13e-02 |
Token | Defense |
Token ID | 5947 |
Feature activation | -1.51e-02 |
Token | S |
Token ID | 311 |
Feature activation | -4.94e-03 |
Token | emy |
Token ID | 3065 |
Feature activation | -4.08e-01 |
Token | on |
Token ID | 261 |
Feature activation | -1.35e-02 |
Token | Tim |
Token ID | 5045 |
Feature activation | -7.09e-02 |
Token | oshenko |
Token ID | 43934 |
Feature activation | +1.63e-02 |
Token | and |
Token ID | 290 |
Feature activation | +7.00e-03 |
Token | Zh |
Token ID | 10511 |
Feature activation | +2.45e-03 |
Token | , |
Token ID | 11 |
Feature activation | -3.81e-02 |
Token | whilst |
Token ID | 14590 |
Feature activation | -3.48e-02 |
Token | at |
Token ID | 379 |
Feature activation | +3.85e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.20e-02 |
Token | same |
Token ID | 976 |
Feature activation | +1.71e-01 |
Token | time |
Token ID | 640 |
Feature activation | -3.55e-01 |
Token | providing |
Token ID | 4955 |
Feature activation | +7.55e-03 |
Token | us |
Token ID | 514 |
Feature activation | -3.40e-03 |
Token | with |
Token ID | 351 |
Feature activation | -5.29e-03 |
Token | more |
Token ID | 517 |
Feature activation | -3.57e-02 |
Token | than |
Token ID | 621 |
Feature activation | +6.46e-02 |
Token | bit |
Token ID | 1643 |
Feature activation | +2.76e-02 |
Token | stubborn |
Token ID | 24444 |
Feature activation | -2.22e-02 |
Token | ." |
Token ID | 526 |
Feature activation | -1.25e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -2.13e-02 |
Token | Every |
Token ID | 6109 |
Feature activation | +9.47e-03 |
Token | share |
Token ID | 2648 |
Feature activation | -3.55e-01 |
Token | makes |
Token ID | 1838 |
Feature activation | -3.20e-01 |
Token | Black |
Token ID | 2619 |
Feature activation | -2.73e-02 |
Token | Voice |
Token ID | 15282 |
Feature activation | -3.05e-02 |
Token | louder |
Token ID | 27089 |
Feature activation | +4.57e-02 |
Token | ! |
Token ID | 0 |
Feature activation | +4.59e-02 |
Token | DOI |
Token ID | 40722 |
Feature activation | -2.50e-03 |
Token | : |
Token ID | 25 |
Feature activation | +1.99e-02 |
Token | 10 |
Token ID | 838 |
Feature activation | -9.54e-03 |
Token | . |
Token ID | 13 |
Feature activation | -6.87e-02 |
Token | 10 |
Token ID | 940 |
Feature activation | +7.13e-02 |
Token | 86 |
Token ID | 4521 |
Feature activation | -3.38e-01 |
Token | / |
Token ID | 14 |
Feature activation | +1.21e-01 |
Token | 34 |
Token ID | 2682 |
Feature activation | -3.75e-02 |
Token | 110 |
Token ID | 11442 |
Feature activation | -2.26e-02 |
Token | 7 |
Token ID | 22 |
Feature activation | +2.47e-02 |
Token |
|
Token ID | 198 |
Feature activation | -5.41e-03 |