Token | a |
Token ID | 257 |
Feature activation | +9.63e-02 |
Token | little |
Token ID | 1310 |
Feature activation | -3.47e-02 |
Token | bit |
Token ID | 1643 |
Feature activation | +9.34e-02 |
Token | of |
Token ID | 286 |
Feature activation | -3.58e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.87e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.62e-01 |
Token | aving |
Token ID | 2703 |
Feature activation | +1.41e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.69e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.71e-01 |
Token | The |
Token ID | 464 |
Feature activation | +4.95e-02 |
Token | saw |
Token ID | 2497 |
Feature activation | -2.56e-02 |
Token | some |
Token ID | 617 |
Feature activation | +7.47e-02 |
Token | other |
Token ID | 584 |
Feature activation | +4.47e-02 |
Token | kids |
Token ID | 3988 |
Feature activation | -8.47e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.90e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.61e-01 |
Token | aving |
Token ID | 2703 |
Feature activation | +1.42e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.47e-01 |
Token | running |
Token ID | 2491 |
Feature activation | +1.25e-01 |
Token | around |
Token ID | 1088 |
Feature activation | -5.60e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-01 |
Token | listen |
Token ID | 6004 |
Feature activation | +7.96e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.82e-01 |
Token | He |
Token ID | 679 |
Feature activation | +2.34e-02 |
Token | always |
Token ID | 1464 |
Feature activation | -7.56e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.86e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.58e-01 |
Token | aved |
Token ID | 9586 |
Feature activation | +1.50e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.45e-01 |
Token | caused |
Token ID | 4073 |
Feature activation | +1.97e-01 |
Token | trouble |
Token ID | 5876 |
Feature activation | +1.15e-02 |
Token | wherever |
Token ID | 14530 |
Feature activation | -5.48e-02 |
Token | told |
Token ID | 1297 |
Feature activation | +9.03e-02 |
Token | Max |
Token ID | 5436 |
Feature activation | +1.12e-01 |
Token | to |
Token ID | 284 |
Feature activation | -1.34e-01 |
Token | stop |
Token ID | 2245 |
Feature activation | +3.50e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.88e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.57e-01 |
Token | aving |
Token ID | 2703 |
Feature activation | +1.39e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token | But |
Token ID | 887 |
Feature activation | -9.47e-02 |
Token | he |
Token ID | 339 |
Feature activation | +1.53e-02 |
Token | didn |
Token ID | 1422 |
Feature activation | +7.83e-02 |
Token | very |
Token ID | 845 |
Feature activation | -5.92e-02 |
Token | naughty |
Token ID | 45128 |
Feature activation | +1.42e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.43e-01 |
Token | always |
Token ID | 1464 |
Feature activation | -7.62e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.83e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.57e-01 |
Token | aving |
Token ID | 2703 |
Feature activation | +1.38e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token | One |
Token ID | 1881 |
Feature activation | +2.12e-02 |
Token | day |
Token ID | 1110 |
Feature activation | -2.11e-01 |
Token | she |
Token ID | 673 |
Feature activation | -6.23e-03 |
Token | became |
Token ID | 2627 |
Feature activation | +9.11e-02 |
Token | friendly |
Token ID | 8030 |
Feature activation | +1.13e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.46e-01 |
Token | well |
Token ID | 880 |
Feature activation | +4.08e-02 |
Token | - |
Token ID | 12 |
Feature activation | +5.76e-02 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.56e-01 |
Token | aved |
Token ID | 9586 |
Feature activation | +1.48e-01 |
Token | , |
Token ID | 11 |
Feature activation | -1.01e-01 |
Token | just |
Token ID | 655 |
Feature activation | +3.85e-02 |
Token | like |
Token ID | 588 |
Feature activation | -1.29e-02 |
Token | Buddy |
Token ID | 36896 |
Feature activation | +1.08e-01 |
Token | told |
Token ID | 1297 |
Feature activation | +9.16e-02 |
Token | him |
Token ID | 683 |
Feature activation | +4.22e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.33e-01 |
Token | stop |
Token ID | 2245 |
Feature activation | +3.30e-02 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.86e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.54e-01 |
Token | aving |
Token ID | 2703 |
Feature activation | +1.39e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.46e-01 |
Token | to |
Token ID | 284 |
Feature activation | -1.32e-01 |
Token | be |
Token ID | 307 |
Feature activation | -8.43e-02 |
Token | kind |
Token ID | 1611 |
Feature activation | +1.53e-01 |
Token | for |
Token ID | 329 |
Feature activation | -7.62e-04 |
Token | being |
Token ID | 852 |
Feature activation | +2.10e-02 |
Token | so |
Token ID | 523 |
Feature activation | -1.90e-01 |
Token | well |
Token ID | 880 |
Feature activation | +3.61e-02 |
Token | - |
Token ID | 12 |
Feature activation | +5.18e-02 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.51e-01 |
Token | aved |
Token ID | 9586 |
Feature activation | +1.42e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.45e-01 |
Token | Jack |
Token ID | 3619 |
Feature activation | +8.52e-02 |
Token | was |
Token ID | 373 |
Feature activation | +9.00e-03 |
Token | delighted |
Token ID | 20707 |
Feature activation | -3.41e-02 |
Token | be |
Token ID | 307 |
Feature activation | -8.55e-02 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.64e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.43e-01 |
Token | well |
Token ID | 880 |
Feature activation | +3.71e-02 |
Token | - |
Token ID | 12 |
Feature activation | +5.31e-02 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.50e-01 |
Token | aved |
Token ID | 9586 |
Feature activation | +1.44e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.84e-01 |
Token | The |
Token ID | 383 |
Feature activation | +7.23e-02 |
Token | end |
Token ID | 886 |
Feature activation | -1.01e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token | could |
Token ID | 714 |
Feature activation | -3.30e-02 |
Token | be |
Token ID | 307 |
Feature activation | -8.76e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.45e-01 |
Token | never |
Token ID | 1239 |
Feature activation | -1.13e-01 |
Token | mis |
Token ID | 2984 |
Feature activation | +1.80e-01 |
Token | beh |
Token ID | 20709 |
Feature activation | +3.47e-01 |
Token | aved |
Token ID | 9586 |
Feature activation | +1.40e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -7.83e-02 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.11e-01 |
Token | upon |
Token ID | 2402 |
Feature activation | -4.93e-02 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.57e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e-01 |
Token | " |
Token ID | 1 |
Feature activation | -4.13e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.35e-01 |
Token | like |
Token ID | 588 |
Feature activation | -1.49e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.03e-02 |
Token | frog |
Token ID | 21264 |
Feature activation | +3.37e-02 |
Token | likes |
Token ID | 7832 |
Feature activation | +5.15e-02 |
Token | you |
Token ID | 345 |
Feature activation | -2.79e-02 |
Token | table |
Token ID | 3084 |
Feature activation | -1.71e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.67e-01 |
Token | " |
Token ID | 1 |
Feature activation | -4.15e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.33e-01 |
Token | like |
Token ID | 588 |
Feature activation | -1.70e-02 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.65e-02 |
Token | has |
Token ID | 468 |
Feature activation | -2.46e-02 |
Token | some |
Token ID | 617 |
Feature activation | +7.48e-02 |
Token | mail |
Token ID | 6920 |
Feature activation | -4.26e-02 |
Token | laughed |
Token ID | 13818 |
Feature activation | +1.72e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.48e-01 |
Token | said |
Token ID | 531 |
Feature activation | +1.87e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.03e-01 |
Token | " |
Token ID | 366 |
Feature activation | -3.44e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.30e-01 |
Token | like |
Token ID | 588 |
Feature activation | -1.46e-02 |
Token | that |
Token ID | 326 |
Feature activation | -1.09e-01 |
Token | apple |
Token ID | 17180 |
Feature activation | -6.19e-02 |
Token | made |
Token ID | 925 |
Feature activation | +7.60e-02 |
Token | you |
Token ID | 345 |
Feature activation | -2.96e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +2.05e-02 |
Token | mom |
Token ID | 1995 |
Feature activation | -1.41e-02 |
Token | my |
Token ID | 1820 |
Feature activation | -8.38e-03 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e-01 |
Token | " |
Token ID | 366 |
Feature activation | -3.37e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.28e-01 |
Token | like |
Token ID | 588 |
Feature activation | -1.68e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.14e-02 |
Token | wave |
Token ID | 6769 |
Feature activation | +3.47e-02 |
Token | destroyed |
Token ID | 6572 |
Feature activation | +1.14e-01 |
Token | all |
Token ID | 477 |
Feature activation | +2.39e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.70e-02 |
Token | owner |
Token ID | 4870 |
Feature activation | -3.50e-02 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.48e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e-01 |
Token | " |
Token ID | 366 |
Feature activation | -3.60e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.26e-01 |
Token | like |
Token ID | 588 |
Feature activation | -1.99e-02 |
Token | you |
Token ID | 345 |
Feature activation | -3.61e-02 |
Token | two |
Token ID | 734 |
Feature activation | +6.16e-02 |
Token | are |
Token ID | 389 |
Feature activation | -7.99e-02 |
Token | friends |
Token ID | 2460 |
Feature activation | +3.18e-02 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.45e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.49e-01 |
Token | said |
Token ID | 531 |
Feature activation | +1.18e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e-01 |
Token | " |
Token ID | 366 |
Feature activation | -3.78e-02 |
Token | Looks |
Token ID | 41102 |
Feature activation | +3.23e-01 |
Token | like |
Token ID | 588 |
Feature activation | -2.05e-02 |
Token | you |
Token ID | 345 |
Feature activation | -3.64e-02 |
Token | like |
Token ID | 588 |
Feature activation | -2.05e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.56e-02 |
Token | wardrobe |
Token ID | 35593 |
Feature activation | -1.41e-01 |
Token | the |
Token ID | 262 |
Feature activation | +4.07e-02 |
Token | black |
Token ID | 2042 |
Feature activation | +1.37e-01 |
Token | mascara |
Token ID | 48430 |
Feature activation | +1.51e-01 |
Token | on |
Token ID | 319 |
Feature activation | +1.38e-02 |
Token | her |
Token ID | 607 |
Feature activation | +1.10e-01 |
Token | eyel |
Token ID | 29708 |
Feature activation | +3.18e-01 |
Token | ashes |
Token ID | 7465 |
Feature activation | +6.18e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e-01 |
Token | She |
Token ID | 1375 |
Feature activation | -8.75e-03 |
Token | makes |
Token ID | 1838 |
Feature activation | +1.16e-01 |
Token | a |
Token ID | 257 |
Feature activation | +9.87e-02 |
Token | long |
Token ID | 890 |
Feature activation | +4.88e-02 |
Token | until |
Token ID | 1566 |
Feature activation | -1.51e-01 |
Token | Chloe |
Token ID | 29476 |
Feature activation | +7.15e-02 |
Token | felt |
Token ID | 2936 |
Feature activation | +1.11e-01 |
Token | her |
Token ID | 607 |
Feature activation | +1.09e-01 |
Token | eyel |
Token ID | 29708 |
Feature activation | +3.15e-01 |
Token | ids |
Token ID | 2340 |
Feature activation | +7.84e-03 |
Token | getting |
Token ID | 1972 |
Feature activation | -2.14e-02 |
Token | heavy |
Token ID | 4334 |
Feature activation | +5.24e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e-01 |
Token | She |
Token ID | 1375 |
Feature activation | -1.05e-02 |
Token | fingers |
Token ID | 9353 |
Feature activation | +1.31e-02 |
Token | were |
Token ID | 547 |
Feature activation | -1.11e-02 |
Token | red |
Token ID | 2266 |
Feature activation | +5.88e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.48e-01 |
Token | bl |
Token ID | 698 |
Feature activation | +1.02e-01 |
Token | istered |
Token ID | 23187 |
Feature activation | +3.13e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.86e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.85e-02 |
Token | felt |
Token ID | 2936 |
Feature activation | +1.11e-01 |
Token | very |
Token ID | 845 |
Feature activation | -6.00e-02 |
Token | scared |
Token ID | 12008 |
Feature activation | +1.50e-01 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.79e-01 |
Token | pur |
Token ID | 1308 |
Feature activation | +2.43e-01 |
Token | red |
Token ID | 445 |
Feature activation | +1.72e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.37e-01 |
Token | l |
Token ID | 300 |
Feature activation | +1.77e-01 |
Token | icked |
Token ID | 9484 |
Feature activation | +3.13e-01 |
Token | Anna |
Token ID | 11735 |
Feature activation | +7.38e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +3.48e-02 |
Token | face |
Token ID | 1986 |
Feature activation | -5.91e-03 |
Token | . |
Token ID | 13 |
Feature activation | +1.92e-01 |
Token | Anna |
Token ID | 11735 |
Feature activation | +7.19e-02 |
Token | blanket |
Token ID | 18447 |
Feature activation | -1.09e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.51e-02 |
Token | ruined |
Token ID | 20484 |
Feature activation | +9.96e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.44e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.80e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.65e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.66e-01 |
Token | S |
Token ID | 50 |
Feature activation | +8.42e-02 |
Token | ara |
Token ID | 3301 |
Feature activation | +1.18e-03 |
Token | The |
Token ID | 383 |
Feature activation | +6.49e-02 |
Token | little |
Token ID | 1310 |
Feature activation | -4.24e-02 |
Token | boy |
Token ID | 2933 |
Feature activation | -7.11e-02 |
Token | liked |
Token ID | 8288 |
Feature activation | +8.56e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.40e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.80e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.51e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.39e-02 |
Token | man |
Token ID | 582 |
Feature activation | -1.09e-01 |
Token | 's |
Token ID | 338 |
Feature activation | +1.71e-02 |
Token | big |
Token ID | 1263 |
Feature activation | +2.18e-02 |
Token | dust |
Token ID | 8977 |
Feature activation | +4.16e-04 |
Token | onto |
Token ID | 4291 |
Feature activation | +6.36e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.61e-02 |
Token | l |
Token ID | 300 |
Feature activation | +1.53e-01 |
Token | ily |
Token ID | 813 |
Feature activation | +1.08e-01 |
Token | pad |
Token ID | 14841 |
Feature activation | -2.79e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.69e-02 |
Token | pond |
Token ID | 16723 |
Feature activation | -2.26e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.77e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token | They |
Token ID | 1119 |
Feature activation | +1.77e-02 |
Token | rested |
Token ID | 29263 |
Feature activation | +2.44e-02 |
Token | on |
Token ID | 319 |
Feature activation | +9.81e-03 |
Token | the |
Token ID | 262 |
Feature activation | +3.69e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -8.00e-02 |
Token | L |
Token ID | 43 |
Feature activation | +1.60e-01 |
Token | ily |
Token ID | 813 |
Feature activation | +1.13e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e-01 |
Token | They |
Token ID | 1119 |
Feature activation | +9.36e-03 |
Token | all |
Token ID | 477 |
Feature activation | +1.89e-02 |
Token | came |
Token ID | 1625 |
Feature activation | +3.97e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.40e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.52e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.52e-01 |
Token | attached |
Token ID | 7223 |
Feature activation | +6.79e-02 |
Token | ropes |
Token ID | 31001 |
Feature activation | -1.46e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.53e-02 |
Token |
|
Token ID | 198 |
Feature activation | -1.79e-01 |
Token | It |
Token ID | 1026 |
Feature activation | -1.02e-01 |
Token | was |
Token ID | 373 |
Feature activation | +2.79e-03 |
Token | an |
Token ID | 281 |
Feature activation | +1.28e-01 |
Token | amazing |
Token ID | 4998 |
Feature activation | -2.64e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | with |
Token ID | 351 |
Feature activation | +3.02e-02 |
Token | many |
Token ID | 867 |
Feature activation | -1.16e-02 |
Token | creatures |
Token ID | 8109 |
Feature activation | +2.17e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e-01 |
Token | plants |
Token ID | 6134 |
Feature activation | -2.89e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e-01 |
Token | be |
Token ID | 307 |
Feature activation | -9.10e-02 |
Token | part |
Token ID | 636 |
Feature activation | +3.68e-02 |
Token | of |
Token ID | 286 |
Feature activation | -4.06e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.79e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | family |
Token ID | 1641 |
Feature activation | -9.37e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e-01 |
Token | And |
Token ID | 843 |
Feature activation | -4.48e-02 |
Token | they |
Token ID | 484 |
Feature activation | +7.31e-03 |
Token | all |
Token ID | 477 |
Feature activation | +1.97e-02 |
Token | set |
Token ID | 900 |
Feature activation | -1.69e-02 |
Token | off |
Token ID | 572 |
Feature activation | -1.17e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.40e-01 |
Token | explore |
Token ID | 7301 |
Feature activation | -6.34e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.36e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.77e-01 |
Token | As |
Token ID | 1081 |
Feature activation | -3.91e-02 |
Token | they |
Token ID | 484 |
Feature activation | +3.64e-03 |
Token | walked |
Token ID | 6807 |
Feature activation | +1.34e-01 |
Token | , |
Token ID | 11 |
Feature activation | -1.06e-01 |
Token | make |
Token ID | 787 |
Feature activation | +5.89e-02 |
Token | it |
Token ID | 340 |
Feature activation | -9.72e-02 |
Token | safely |
Token ID | 11512 |
Feature activation | +1.29e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.41e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.42e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.49e-01 |
Token | he |
Token ID | 339 |
Feature activation | +7.50e-03 |
Token | explored |
Token ID | 18782 |
Feature activation | +4.66e-04 |
Token | it |
Token ID | 340 |
Feature activation | -9.70e-02 |
Token | for |
Token ID | 329 |
Feature activation | -5.95e-03 |
Token | in |
Token ID | 287 |
Feature activation | +2.91e-04 |
Token | the |
Token ID | 262 |
Feature activation | +3.48e-02 |
Token | park |
Token ID | 3952 |
Feature activation | -2.51e-01 |
Token | many |
Token ID | 867 |
Feature activation | -1.19e-02 |
Token | years |
Token ID | 812 |
Feature activation | -5.46e-02 |
Token | ago |
Token ID | 2084 |
Feature activation | -2.79e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.79e-01 |
Token | Toby |
Token ID | 37578 |
Feature activation | +9.48e-02 |
Token | was |
Token ID | 373 |
Feature activation | +3.23e-03 |
Token | amazed |
Token ID | 24562 |
Feature activation | +3.55e-03 |
Token | ! |
Token ID | 0 |
Feature activation | +1.31e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.74e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.88e-03 |
Token | on |
Token ID | 319 |
Feature activation | +1.11e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.33e-02 |
Token | tropical |
Token ID | 19690 |
Feature activation | +1.52e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | surrounded |
Token ID | 11191 |
Feature activation | +9.25e-02 |
Token | by |
Token ID | 416 |
Feature activation | -5.82e-02 |
Token | pink |
Token ID | 11398 |
Feature activation | +6.32e-02 |
Token | flaming |
Token ID | 39518 |
Feature activation | +1.85e-02 |
Token | os |
Token ID | 418 |
Feature activation | +1.39e-01 |
Token | " |
Token ID | 366 |
Feature activation | -4.09e-02 |
Token | It |
Token ID | 1026 |
Feature activation | -9.55e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.17e-03 |
Token | hidden |
Token ID | 7104 |
Feature activation | +1.28e-02 |
Token | long |
Token ID | 890 |
Feature activation | +3.85e-02 |
Token | ago |
Token ID | 2084 |
Feature activation | -2.79e-01 |
Token | , |
Token ID | 11 |
Feature activation | -1.08e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.47e-01 |
Token | only |
Token ID | 691 |
Feature activation | -3.35e-02 |
Token | seems |
Token ID | 2331 |
Feature activation | +7.85e-02 |
Token | fancy |
Token ID | 14996 |
Feature activation | +1.72e-02 |
Token | man |
Token ID | 582 |
Feature activation | -1.10e-01 |
Token | shared |
Token ID | 4888 |
Feature activation | +1.52e-01 |
Token | stories |
Token ID | 3923 |
Feature activation | +1.95e-02 |
Token | of |
Token ID | 286 |
Feature activation | -4.31e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.39e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | , |
Token ID | 11 |
Feature activation | -1.05e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.51e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.43e-02 |
Token | little |
Token ID | 1310 |
Feature activation | -4.16e-02 |
Token | girl |
Token ID | 2576 |
Feature activation | -5.67e-02 |
Token | shows |
Token ID | 2523 |
Feature activation | +5.96e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.24e-02 |
Token | way |
Token ID | 835 |
Feature activation | -1.43e-01 |
Token | to |
Token ID | 284 |
Feature activation | -1.37e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.33e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.79e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e-01 |
Token | And |
Token ID | 843 |
Feature activation | -4.49e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.30e-02 |
Token | key |
Token ID | 1994 |
Feature activation | -4.78e-02 |
Token | opens |
Token ID | 9808 |
Feature activation | -2.19e-02 |
Token | until |
Token ID | 1566 |
Feature activation | -1.57e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.78e-02 |
Token | found |
Token ID | 1043 |
Feature activation | -2.42e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.33e-02 |
Token | little |
Token ID | 1310 |
Feature activation | -4.13e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-01 |
Token | She |
Token ID | 1375 |
Feature activation | -2.18e-02 |
Token | was |
Token ID | 373 |
Feature activation | +3.09e-03 |
Token | so |
Token ID | 523 |
Feature activation | -1.96e-01 |
Token | happy |
Token ID | 3772 |
Feature activation | -5.41e-02 |
Token | want |
Token ID | 765 |
Feature activation | +1.44e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.37e-01 |
Token | know |
Token ID | 760 |
Feature activation | -7.42e-02 |
Token | about |
Token ID | 546 |
Feature activation | -1.17e-01 |
Token | this |
Token ID | 428 |
Feature activation | -8.98e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | ." |
Token ID | 526 |
Feature activation | +7.14e-02 |
Token | The |
Token ID | 383 |
Feature activation | +6.63e-02 |
Token | wealthy |
Token ID | 11574 |
Feature activation | +3.39e-02 |
Token | man |
Token ID | 582 |
Feature activation | -1.09e-01 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.47e-01 |
Token | boat |
Token ID | 8848 |
Feature activation | -1.35e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.73e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.78e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.79e-01 |
Token | The |
Token ID | 464 |
Feature activation | +4.19e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | was |
Token ID | 373 |
Feature activation | +4.56e-03 |
Token | beautiful |
Token ID | 4950 |
Feature activation | +5.04e-03 |
Token | and |
Token ID | 290 |
Feature activation | -1.52e-01 |
Token | it |
Token ID | 340 |
Feature activation | -9.47e-02 |
Token | gl |
Token ID | 1278 |
Feature activation | +5.56e-02 |
Token | ran |
Token ID | 4966 |
Feature activation | +1.44e-01 |
Token | outside |
Token ID | 2354 |
Feature activation | -9.77e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e-01 |
Token | explore |
Token ID | 7301 |
Feature activation | -6.26e-02 |
Token | her |
Token ID | 607 |
Feature activation | +9.74e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | ! |
Token ID | 0 |
Feature activation | +1.31e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | -7.99e-02 |
Token | M |
Token ID | 44 |
Feature activation | +1.49e-01 |
Token | andy |
Token ID | 10757 |
Feature activation | +3.63e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.45e-01 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.75e-01 |
Token | Sarah |
Token ID | 10490 |
Feature activation | +8.43e-02 |
Token | loved |
Token ID | 6151 |
Feature activation | +7.19e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.44e-02 |
Token | island |
Token ID | 7022 |
Feature activation | -2.78e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.51e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.72e-02 |
Token | spent |
Token ID | 3377 |
Feature activation | +9.06e-02 |
Token | many |
Token ID | 867 |
Feature activation | -1.17e-02 |
Token | hours |
Token ID | 2250 |
Feature activation | -1.12e-01 |
Token | looked |
Token ID | 3114 |
Feature activation | +3.37e-02 |
Token | underneath |
Token ID | 14638 |
Feature activation | +2.94e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.58e-02 |
Token | l |
Token ID | 300 |
Feature activation | +1.53e-01 |
Token | ily |
Token ID | 813 |
Feature activation | +1.09e-01 |
Token | pad |
Token ID | 14841 |
Feature activation | -2.78e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.77e-01 |
Token | Sure |
Token ID | 10889 |
Feature activation | +2.10e-02 |
Token | enough |
Token ID | 1576 |
Feature activation | -5.95e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.04e-01 |
Token | he |
Token ID | 339 |
Feature activation | +9.70e-03 |
Token | green |
Token ID | 4077 |
Feature activation | +6.14e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.52e-01 |
Token | has |
Token ID | 468 |
Feature activation | -2.09e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.56e-02 |
Token | for |
Token ID | 329 |
Feature activation | -2.33e-03 |
Token | ked |
Token ID | 9091 |
Feature activation | +2.41e-01 |
Token | tongue |
Token ID | 11880 |
Feature activation | +4.39e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-01 |
Token | Lily |
Token ID | 20037 |
Feature activation | +1.13e-01 |
Token | is |
Token ID | 318 |
Feature activation | -5.10e-02 |
Token | curious |
Token ID | 11040 |
Feature activation | +9.30e-02 |
Token | boy |
Token ID | 2933 |
Feature activation | -6.23e-02 |
Token | nodded |
Token ID | 14464 |
Feature activation | +9.19e-02 |
Token | his |
Token ID | 465 |
Feature activation | +1.37e-01 |
Token | head |
Token ID | 1182 |
Feature activation | +1.66e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.44e-01 |
Token | scam |
Token ID | 19126 |
Feature activation | +2.27e-01 |
Token | pered |
Token ID | 13653 |
Feature activation | +8.01e-02 |
Token | down |
Token ID | 866 |
Feature activation | +5.55e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.13e-02 |
Token | street |
Token ID | 4675 |
Feature activation | -2.03e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-01 |
Token | cat |
Token ID | 3797 |
Feature activation | +2.28e-04 |
Token | gr |
Token ID | 1036 |
Feature activation | +1.81e-01 |
Token | ump |
Token ID | 931 |
Feature activation | +7.78e-02 |
Token | ily |
Token ID | 813 |
Feature activation | +1.17e-01 |
Token | me |
Token ID | 502 |
Feature activation | -1.09e-01 |
Token | owed |
Token ID | 6972 |
Feature activation | +2.20e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.50e-01 |
Token | went |
Token ID | 1816 |
Feature activation | +7.62e-02 |
Token | away |
Token ID | 1497 |
Feature activation | -3.48e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.78e-01 |
Token | |
Token ID | 220 |
Feature activation | -1.28e-01 |
Token | Mar |
Token ID | 1526 |
Feature activation | +8.73e-02 |
Token | cy |
Token ID | 948 |
Feature activation | +7.54e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +2.22e-02 |
Token | ear |
Token ID | 1027 |
Feature activation | +2.83e-03 |
Token | , |
Token ID | 11 |
Feature activation | -1.02e-01 |
Token | � |
Token ID | 6184 |
Feature activation | +2.18e-01 |
Token | � |
Token ID | 95 |
Feature activation | +1.77e-01 |
Token | € |
Token ID | 26391 |
Feature activation | +8.25e-02 |
Token | � |
Token ID | 129 |
Feature activation | +1.49e-01 |
Token | � |
Token ID | 241 |
Feature activation | +1.00e-01 |
Token | It |
Token ID | 1026 |
Feature activation | -8.95e-02 |
Token | so |
Token ID | 523 |
Feature activation | -1.92e-01 |
Token | happy |
Token ID | 3772 |
Feature activation | -4.98e-02 |
Token | that |
Token ID | 326 |
Feature activation | -1.14e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.01e-02 |
Token | l |
Token ID | 300 |
Feature activation | +1.61e-01 |
Token | icked |
Token ID | 9484 |
Feature activation | +2.97e-01 |
Token | Max |
Token ID | 5436 |
Feature activation | +1.12e-01 |
Token | 's |
Token ID | 338 |
Feature activation | +2.19e-02 |
Token | face |
Token ID | 1986 |
Feature activation | -1.99e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token | Max |
Token ID | 5436 |
Feature activation | +1.12e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.82e-02 |
Token | root |
Token ID | 6808 |
Feature activation | -4.22e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.70e-03 |
Token | laughing |
Token ID | 14376 |
Feature activation | +1.19e-01 |
Token | too |
Token ID | 1165 |
Feature activation | -3.44e-02 |
Token | ! |
Token ID | 0 |
Feature activation | +1.31e-01 |
Token | |
Token ID | 220 |
Feature activation | -1.29e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.75e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.75e-01 |
Token | J |
Token ID | 41 |
Feature activation | +2.21e-01 |
Token | enny |
Token ID | 11870 |
Feature activation | +8.41e-02 |
Token | ally |
Token ID | 453 |
Feature activation | +6.09e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.03e-01 |
Token | why |
Token ID | 1521 |
Feature activation | -6.53e-02 |
Token | do |
Token ID | 466 |
Feature activation | -7.47e-02 |
Token | birds |
Token ID | 10087 |
Feature activation | -2.94e-02 |
Token | fly |
Token ID | 6129 |
Feature activation | +4.28e-02 |
Token | ? |
Token ID | 30 |
Feature activation | +1.34e-01 |
Token | â |
Token ID | 22940 |
Feature activation | +1.79e-01 |
Token | € |
Token ID | 26391 |
Feature activation | +7.30e-02 |
Token | Sally |
Token ID | 25737 |
Feature activation | +8.68e-02 |
Token | thought |
Token ID | 1807 |
Feature activation | +3.59e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.80e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.75e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.76e-01 |
Token | The |
Token ID | 464 |
Feature activation | +4.28e-02 |
Token | boy |
Token ID | 2933 |
Feature activation | -6.86e-02 |
Token | replied |
Token ID | 8712 |
Feature activation | +5.45e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.07e-01 |
Token | " |
Token ID | 366 |
Feature activation | -3.85e-02 |
Token | I |
Token ID | 40 |
Feature activation | +9.02e-02 |
Token | was |
Token ID | 373 |
Feature activation | +7.06e-03 |
Token | sailing |
Token ID | 28499 |
Feature activation | -3.82e-02 |
Token | pieces |
Token ID | 5207 |
Feature activation | -1.40e-02 |
Token | ! |
Token ID | 0 |
Feature activation | +1.50e-01 |
Token | It |
Token ID | 632 |
Feature activation | -9.17e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +2.60e-02 |
Token | fun |
Token ID | 1257 |
Feature activation | -1.47e-02 |
Token | ! |
Token ID | 0 |
Feature activation | +1.50e-01 |
Token | All |
Token ID | 1439 |
Feature activation | +8.15e-02 |
Token | you |
Token ID | 345 |
Feature activation | -2.78e-02 |
Token | have |
Token ID | 423 |
Feature activation | -4.27e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.31e-01 |
Token | do |
Token ID | 466 |
Feature activation | -7.20e-02 |
Token | ?" |
Token ID | 1701 |
Feature activation | +7.47e-03 |
Token |
|
Token ID | 198 |
Feature activation | -1.69e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.70e-01 |
Token | B |
Token ID | 33 |
Feature activation | +1.92e-01 |
Token | eth |
Token ID | 2788 |
Feature activation | +3.35e-02 |
Token | replied |
Token ID | 8712 |
Feature activation | +5.83e-02 |
Token | with |
Token ID | 351 |
Feature activation | +3.40e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.59e-02 |
Token | big |
Token ID | 1263 |
Feature activation | +2.63e-02 |
Token | smile |
Token ID | 8212 |
Feature activation | +2.17e-02 |
Token | on |
Token ID | 319 |
Feature activation | +1.25e-02 |
Token | dolls |
Token ID | 36062 |
Feature activation | -1.81e-02 |
Token | was |
Token ID | 373 |
Feature activation | +1.95e-02 |
Token | very |
Token ID | 845 |
Feature activation | -5.53e-02 |
Token | bad |
Token ID | 2089 |
Feature activation | +8.81e-02 |
Token | ," |
Token ID | 553 |
Feature activation | -3.31e-02 |
Token | she |
Token ID | 673 |
Feature activation | -4.23e-03 |
Token | said |
Token ID | 531 |
Feature activation | +2.88e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.88e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.62e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.64e-01 |
Token | Max |
Token ID | 11518 |
Feature activation | +1.13e-01 |
Token | job |
Token ID | 1693 |
Feature activation | -6.24e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.82e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.72e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.73e-01 |
Token | From |
Token ID | 4863 |
Feature activation | +5.74e-02 |
Token | that |
Token ID | 326 |
Feature activation | -1.14e-01 |
Token | day |
Token ID | 1110 |
Feature activation | -2.11e-01 |
Token | on |
Token ID | 319 |
Feature activation | +1.14e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.02e-01 |
Token | the |
Token ID | 262 |
Feature activation | +4.12e-02 |
Token | bird |
Token ID | 6512 |
Feature activation | -7.38e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.11e-01 |
Token | he |
Token ID | 339 |
Feature activation | +1.49e-02 |
Token | was |
Token ID | 373 |
Feature activation | +7.74e-03 |
Token | careful |
Token ID | 8161 |
Feature activation | +6.26e-03 |
Token | about |
Token ID | 546 |
Feature activation | -1.14e-01 |
Token | what |
Token ID | 644 |
Feature activation | -5.74e-02 |
Token | he |
Token ID | 339 |
Feature activation | +1.94e-02 |
Token | did |
Token ID | 750 |
Feature activation | -6.75e-03 |
Token | and |
Token ID | 290 |
Feature activation | -1.48e-01 |
Token | where |
Token ID | 810 |
Feature activation | -9.60e-02 |
Token | he |
Token ID | 339 |
Feature activation | +2.09e-02 |
Token | Once |
Token ID | 7454 |
Feature activation | -2.10e-01 |
Token | upon |
Token ID | 2402 |
Feature activation | -5.01e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.77e-02 |
Token | time |
Token ID | 640 |
Feature activation | -2.03e-01 |
Token | , |
Token ID | 11 |
Feature activation | -9.95e-02 |
Token | there |
Token ID | 612 |
Feature activation | -1.03e-01 |
Token | was |
Token ID | 373 |
Feature activation | +9.94e-03 |
Token | a |
Token ID | 257 |
Feature activation | +9.78e-02 |
Token | little |
Token ID | 1310 |
Feature activation | -3.84e-02 |
Token | pig |
Token ID | 12967 |
Feature activation | -1.04e-01 |
Token | who |
Token ID | 508 |
Feature activation | -4.40e-02 |
Token |
|
Token ID | 198 |
Feature activation | -1.69e-01 |
Token | After |
Token ID | 3260 |
Feature activation | -5.02e-02 |
Token | meals |
Token ID | 13840 |
Feature activation | -1.49e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.00e-01 |
Token | Annie |
Token ID | 25860 |
Feature activation | +3.24e-03 |
Token | would |
Token ID | 561 |
Feature activation | -3.79e-02 |
Token | take |
Token ID | 1011 |
Feature activation | +1.08e-01 |
Token | the |
Token ID | 262 |
Feature activation | +4.27e-02 |
Token | car |
Token ID | 1097 |
Feature activation | -4.82e-02 |
Token | outside |
Token ID | 2354 |
Feature activation | -9.06e-02 |
Token | with |
Token ID | 351 |
Feature activation | +3.65e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.81e-01 |
Token | She |
Token ID | 1375 |
Feature activation | -1.22e-02 |
Token | walked |
Token ID | 6807 |
Feature activation | +1.41e-01 |
Token | along |
Token ID | 1863 |
Feature activation | +6.04e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.91e-02 |
Token | path |
Token ID | 3108 |
Feature activation | -1.45e-01 |
Token | until |
Token ID | 1566 |
Feature activation | -1.55e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.18e-02 |
Token | saw |
Token ID | 2497 |
Feature activation | -3.45e-02 |
Token | a |
Token ID | 257 |
Feature activation | +9.53e-02 |
Token | delivery |
Token ID | 7585 |
Feature activation | -4.82e-02 |
Token | friend |
Token ID | 1545 |
Feature activation | +4.09e-02 |
Token | ." |
Token ID | 526 |
Feature activation | +7.53e-02 |
Token |
|
Token ID | 198 |
Feature activation | -1.59e-01 |
Token |
|
Token ID | 198 |
Feature activation | -1.62e-01 |
Token | The |
Token ID | 464 |
Feature activation | +5.45e-02 |
Token | ostr |
Token ID | 42387 |
Feature activation | -1.30e-01 |
Token | ich |
Token ID | 488 |
Feature activation | -5.70e-02 |
Token | heard |
Token ID | 2982 |
Feature activation | +5.28e-02 |
Token | Ben |
Token ID | 3932 |
Feature activation | +8.46e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +2.62e-02 |
Token | voice |
Token ID | 3809 |
Feature activation | -7.86e-02 |
Token | be |
Token ID | 307 |
Feature activation | -8.68e-02 |
Token | proud |
Token ID | 6613 |
Feature activation | +4.25e-02 |
Token | of |
Token ID | 286 |
Feature activation | -3.94e-02 |
Token | yourself |
Token ID | 3511 |
Feature activation | +5.51e-02 |
Token | !" |
Token ID | 2474 |
Feature activation | +2.27e-02 |
Token |
|
Token ID | 198 |
Feature activation | -1.70e-01 |
Token | Alex |
Token ID | 15309 |
Feature activation | +1.13e-01 |
Token | smiled |
Token ID | 13541 |
Feature activation | +1.50e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.46e-01 |
Token | said |
Token ID | 531 |
Feature activation | +1.42e-02 |
Token | , |
Token ID | 11 |
Feature activation | -1.03e-01 |
Token | couldn |
Token ID | 3521 |
Feature activation | -1.61e-02 |
Token | 't |
Token ID | 470 |
Feature activation | -4.46e-02 |
Token | see |
Token ID | 766 |
Feature activation | -1.34e-01 |
Token | what |
Token ID | 644 |
Feature activation | -5.85e-02 |
Token | was |
Token ID | 373 |
Feature activation | +6.57e-03 |
Token | inside |
Token ID | 2641 |
Feature activation | -1.21e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.80e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.37e-02 |
Token | tried |
Token ID | 3088 |
Feature activation | +6.35e-02 |
Token | to |
Token ID | 284 |
Feature activation | -1.39e-01 |
Token | get |
Token ID | 651 |
Feature activation | -1.82e-02 |
Token | rad |
Token ID | 2511 |
Feature activation | +1.76e-02 |
Token | ish |
Token ID | 680 |
Feature activation | +2.12e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.85e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.86e-02 |
Token | hopped |
Token ID | 45230 |
Feature activation | +1.75e-01 |
Token | to |
Token ID | 284 |
Feature activation | -1.36e-01 |
Token | the |
Token ID | 262 |
Feature activation | +3.77e-02 |
Token | rad |
Token ID | 2511 |
Feature activation | +1.69e-02 |
Token | ish |
Token ID | 680 |
Feature activation | +2.03e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.83e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.69e-02 |