Token | realised |
Token ID | 19169 |
Feature activation | +1.23e-01 |
Token | it |
Token ID | 340 |
Feature activation | +8.12e-02 |
Token | wasn |
Token ID | 2492 |
Feature activation | -3.83e-04 |
Token | 't |
Token ID | 470 |
Feature activation | -1.46e-01 |
Token | her |
Token ID | 607 |
Feature activation | +4.32e-02 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.07e+00 |
Token | after |
Token ID | 706 |
Feature activation | -1.86e-02 |
Token | all |
Token ID | 477 |
Feature activation | -7.60e-03 |
Token | . |
Token ID | 13 |
Feature activation | +7.45e-02 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +1.52e-01 |
Token | Once |
Token ID | 7454 |
Feature activation | -1.02e-01 |
Token | them |
Token ID | 606 |
Feature activation | +1.78e-01 |
Token | it |
Token ID | 340 |
Feature activation | +9.27e-02 |
Token | was |
Token ID | 373 |
Feature activation | +9.17e-02 |
Token | all |
Token ID | 477 |
Feature activation | +2.38e-03 |
Token | their |
Token ID | 511 |
Feature activation | +1.43e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.05e+00 |
Token | . |
Token ID | 13 |
Feature activation | +1.18e-01 |
Token | His |
Token ID | 2399 |
Feature activation | +3.61e-02 |
Token | friends |
Token ID | 2460 |
Feature activation | -5.27e-02 |
Token | were |
Token ID | 547 |
Feature activation | -3.35e-02 |
Token | so |
Token ID | 523 |
Feature activation | +1.24e-01 |
Token | ending |
Token ID | 7464 |
Feature activation | +8.46e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.68e-02 |
Token | no |
Token ID | 645 |
Feature activation | +3.26e-01 |
Token | one |
Token ID | 530 |
Feature activation | +4.09e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +4.34e-02 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.05e+00 |
Token | , |
Token ID | 11 |
Feature activation | +1.10e-01 |
Token | but |
Token ID | 475 |
Feature activation | -3.19e-01 |
Token | it |
Token ID | 340 |
Feature activation | +5.40e-02 |
Token | left |
Token ID | 1364 |
Feature activation | -1.08e-01 |
Token | the |
Token ID | 262 |
Feature activation | +6.26e-02 |
Token | it |
Token ID | 340 |
Feature activation | +4.61e-02 |
Token | was |
Token ID | 373 |
Feature activation | +4.26e-02 |
Token | Tim |
Token ID | 5045 |
Feature activation | -1.23e-01 |
Token | my |
Token ID | 1820 |
Feature activation | +4.44e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +3.20e-02 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.04e+00 |
Token | but |
Token ID | 475 |
Feature activation | -3.18e-01 |
Token | Tim |
Token ID | 5045 |
Feature activation | -1.15e-01 |
Token | my |
Token ID | 1820 |
Feature activation | +5.41e-02 |
Token | felt |
Token ID | 2936 |
Feature activation | +1.55e-01 |
Token | guilty |
Token ID | 6717 |
Feature activation | -2.02e-01 |
Token | and |
Token ID | 290 |
Feature activation | +7.65e-02 |
Token | it |
Token ID | 340 |
Feature activation | +5.60e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.67e-02 |
Token | his |
Token ID | 465 |
Feature activation | +6.56e-02 |
Token | own |
Token ID | 898 |
Feature activation | -2.17e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.03e+00 |
Token | . |
Token ID | 13 |
Feature activation | +4.69e-02 |
Token |
|
Token ID | 198 |
Feature activation | +7.52e-02 |
Token |
|
Token ID | 198 |
Feature activation | +7.70e-02 |
Token | Johnny |
Token ID | 44960 |
Feature activation | -4.07e-02 |
Token | smiled |
Token ID | 13541 |
Feature activation | +3.78e-02 |
Token | knew |
Token ID | 2993 |
Feature activation | -9.27e-02 |
Token | it |
Token ID | 340 |
Feature activation | +6.24e-02 |
Token | was |
Token ID | 373 |
Feature activation | +8.14e-02 |
Token | his |
Token ID | 465 |
Feature activation | +6.04e-02 |
Token | own |
Token ID | 898 |
Feature activation | -2.25e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.02e+00 |
Token | . |
Token ID | 13 |
Feature activation | +8.86e-02 |
Token | He |
Token ID | 679 |
Feature activation | +5.29e-02 |
Token | would |
Token ID | 561 |
Feature activation | +3.49e-01 |
Token | have |
Token ID | 423 |
Feature activation | -9.69e-02 |
Token | to |
Token ID | 284 |
Feature activation | +7.34e-02 |
Token | realized |
Token ID | 6939 |
Feature activation | +2.68e-01 |
Token | it |
Token ID | 340 |
Feature activation | +5.16e-02 |
Token | was |
Token ID | 373 |
Feature activation | +6.18e-02 |
Token | his |
Token ID | 465 |
Feature activation | +5.90e-02 |
Token | own |
Token ID | 898 |
Feature activation | -2.21e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.02e+00 |
Token | for |
Token ID | 329 |
Feature activation | +2.03e-02 |
Token | not |
Token ID | 407 |
Feature activation | +1.50e-02 |
Token | val |
Token ID | 1188 |
Feature activation | -2.19e-01 |
Token | uing |
Token ID | 4250 |
Feature activation | +2.87e-01 |
Token | her |
Token ID | 607 |
Feature activation | +2.57e-02 |
Token | it |
Token ID | 340 |
Feature activation | +3.41e-02 |
Token | was |
Token ID | 373 |
Feature activation | +5.19e-02 |
Token | all |
Token ID | 477 |
Feature activation | -3.25e-02 |
Token | Joe |
Token ID | 5689 |
Feature activation | -9.91e-02 |
Token | 's |
Token ID | 338 |
Feature activation | +4.47e-02 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.02e+00 |
Token | . |
Token ID | 13 |
Feature activation | +5.12e-02 |
Token | Joe |
Token ID | 5689 |
Feature activation | -9.84e-02 |
Token | tried |
Token ID | 3088 |
Feature activation | +1.51e-01 |
Token | to |
Token ID | 284 |
Feature activation | +8.39e-02 |
Token | talk |
Token ID | 1561 |
Feature activation | -6.63e-02 |
Token | told |
Token ID | 1297 |
Feature activation | +3.86e-02 |
Token | her |
Token ID | 607 |
Feature activation | -1.15e-02 |
Token | it |
Token ID | 340 |
Feature activation | +5.65e-02 |
Token | was |
Token ID | 373 |
Feature activation | +4.69e-02 |
Token | her |
Token ID | 607 |
Feature activation | +1.10e-03 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.02e+00 |
Token | because |
Token ID | 780 |
Feature activation | -1.26e-01 |
Token | she |
Token ID | 673 |
Feature activation | +4.98e-02 |
Token | dropped |
Token ID | 5710 |
Feature activation | -1.20e-01 |
Token | her |
Token ID | 607 |
Feature activation | +4.11e-03 |
Token | toy |
Token ID | 13373 |
Feature activation | +1.32e-01 |
Token | � |
Token ID | 6184 |
Feature activation | +2.61e-01 |
Token | � |
Token ID | 95 |
Feature activation | +2.73e-01 |
Token | € |
Token ID | 26391 |
Feature activation | -1.75e-01 |
Token | � |
Token ID | 129 |
Feature activation | -2.21e-01 |
Token | � |
Token ID | 241 |
Feature activation | +2.02e-01 |
Token | Be |
Token ID | 3856 |
Feature activation | +1.01e+00 |
Token | careful |
Token ID | 8161 |
Feature activation | +2.77e-01 |
Token | not |
Token ID | 407 |
Feature activation | +4.31e-02 |
Token | to |
Token ID | 284 |
Feature activation | +1.15e-01 |
Token | touch |
Token ID | 3638 |
Feature activation | -1.27e-02 |
Token | it |
Token ID | 340 |
Feature activation | +9.10e-02 |
Token | warned |
Token ID | 7728 |
Feature activation | +1.49e-01 |
Token | the |
Token ID | 262 |
Feature activation | +4.83e-02 |
Token | skeleton |
Token ID | 18328 |
Feature activation | -1.02e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.09e-01 |
Token | ' |
Token ID | 705 |
Feature activation | +6.32e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +1.01e+00 |
Token | careful |
Token ID | 8161 |
Feature activation | +2.53e-01 |
Token | ! |
Token ID | 0 |
Feature activation | +3.81e-02 |
Token | The |
Token ID | 383 |
Feature activation | -3.95e-02 |
Token | dark |
Token ID | 3223 |
Feature activation | -1.33e-01 |
Token | woods |
Token ID | 16479 |
Feature activation | +2.85e-01 |
Token | that |
Token ID | 326 |
Feature activation | +1.00e-01 |
Token | it |
Token ID | 340 |
Feature activation | +2.63e-02 |
Token | wasn |
Token ID | 2492 |
Feature activation | -5.10e-02 |
Token | 't |
Token ID | 470 |
Feature activation | -2.18e-01 |
Token | her |
Token ID | 607 |
Feature activation | -1.67e-03 |
Token | fault |
Token ID | 8046 |
Feature activation | +1.00e+00 |
Token | . |
Token ID | 13 |
Feature activation | +3.97e-02 |
Token | Finally |
Token ID | 9461 |
Feature activation | +4.88e-02 |
Token | , |
Token ID | 11 |
Feature activation | +7.62e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.25e-02 |
Token | family |
Token ID | 1641 |
Feature activation | -4.43e-01 |
Token | saying |
Token ID | 2282 |
Feature activation | +3.73e-01 |
Token | that |
Token ID | 326 |
Feature activation | +1.01e-01 |
Token | it |
Token ID | 340 |
Feature activation | +3.99e-02 |
Token | was |
Token ID | 373 |
Feature activation | +3.71e-02 |
Token | his |
Token ID | 465 |
Feature activation | +2.67e-02 |
Token | fault |
Token ID | 8046 |
Feature activation | +9.94e-01 |
Token | that |
Token ID | 326 |
Feature activation | +1.22e-01 |
Token | he |
Token ID | 339 |
Feature activation | -4.47e-02 |
Token | forgot |
Token ID | 16453 |
Feature activation | -9.44e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.29e-02 |
Token | folder |
Token ID | 9483 |
Feature activation | +3.26e-01 |
Token | awn |
Token ID | 3832 |
Feature activation | +1.68e-01 |
Token | â |
Token ID | 22940 |
Feature activation | +3.52e-01 |
Token | € |
Token ID | 26391 |
Feature activation | -1.76e-01 |
Token | ™ |
Token ID | 8151 |
Feature activation | -4.39e-01 |
Token | s |
Token ID | 82 |
Feature activation | -1.68e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +9.91e-01 |
Token | . |
Token ID | 13 |
Feature activation | +6.68e-02 |
Token | |
Token ID | 220 |
Feature activation | -1.66e-01 |
Token |
|
Token ID | 198 |
Feature activation | +6.31e-02 |
Token |
|
Token ID | 198 |
Feature activation | +5.15e-02 |
Token | The |
Token ID | 464 |
Feature activation | -1.17e-01 |
Token | everyone |
Token ID | 2506 |
Feature activation | -1.48e-01 |
Token | they |
Token ID | 484 |
Feature activation | +8.09e-03 |
Token | met |
Token ID | 1138 |
Feature activation | +1.32e-01 |
Token | : |
Token ID | 25 |
Feature activation | +4.49e-01 |
Token | ' |
Token ID | 705 |
Feature activation | +9.25e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.90e-01 |
Token | patient |
Token ID | 5827 |
Feature activation | +3.51e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.34e-01 |
Token | be |
Token ID | 307 |
Feature activation | +1.75e-01 |
Token | kind |
Token ID | 1611 |
Feature activation | +2.15e-01 |
Token | and |
Token ID | 290 |
Feature activation | +1.18e-01 |
Token | creature |
Token ID | 7185 |
Feature activation | +1.56e-02 |
Token | simply |
Token ID | 2391 |
Feature activation | +1.49e-01 |
Token | replied |
Token ID | 8712 |
Feature activation | +4.07e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.74e-01 |
Token | " |
Token ID | 366 |
Feature activation | +5.97e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.89e-01 |
Token | kind |
Token ID | 1611 |
Feature activation | +2.12e-01 |
Token | to |
Token ID | 284 |
Feature activation | +1.13e-01 |
Token | others |
Token ID | 1854 |
Feature activation | +6.52e-02 |
Token | in |
Token ID | 287 |
Feature activation | +5.96e-02 |
Token | the |
Token ID | 262 |
Feature activation | +9.67e-02 |
Token | had |
Token ID | 550 |
Feature activation | +1.24e-01 |
Token | told |
Token ID | 1297 |
Feature activation | +5.25e-02 |
Token | her |
Token ID | 607 |
Feature activation | +2.31e-02 |
Token | : |
Token ID | 25 |
Feature activation | +3.79e-01 |
Token | " |
Token ID | 366 |
Feature activation | +2.00e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.89e-01 |
Token | have |
Token ID | 14150 |
Feature activation | +3.51e-01 |
Token | , |
Token ID | 11 |
Feature activation | +5.39e-02 |
Token | little |
Token ID | 1310 |
Feature activation | +1.03e-01 |
Token | one |
Token ID | 530 |
Feature activation | -1.98e-02 |
Token | ". |
Token ID | 1911 |
Feature activation | -9.17e-02 |
Token | smiled |
Token ID | 13541 |
Feature activation | +6.19e-02 |
Token | and |
Token ID | 290 |
Feature activation | +1.39e-01 |
Token | said |
Token ID | 531 |
Feature activation | +1.61e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.52e-01 |
Token | " |
Token ID | 366 |
Feature activation | +2.37e-03 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.88e-01 |
Token | careful |
Token ID | 8161 |
Feature activation | +2.25e-01 |
Token | when |
Token ID | 618 |
Feature activation | -8.90e-02 |
Token | drawing |
Token ID | 8263 |
Feature activation | +6.32e-02 |
Token | , |
Token ID | 11 |
Feature activation | +7.82e-02 |
Token | okay |
Token ID | 8788 |
Feature activation | -8.85e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.89e-01 |
Token | He |
Token ID | 679 |
Feature activation | +1.33e-01 |
Token | said |
Token ID | 531 |
Feature activation | +1.69e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.03e-01 |
Token | " |
Token ID | 366 |
Feature activation | +5.02e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.88e-01 |
Token | smart |
Token ID | 4451 |
Feature activation | -1.22e-01 |
Token | and |
Token ID | 290 |
Feature activation | +7.92e-02 |
Token | always |
Token ID | 1464 |
Feature activation | +3.68e-01 |
Token | think |
Token ID | 892 |
Feature activation | -1.25e-02 |
Token | before |
Token ID | 878 |
Feature activation | -1.09e-01 |
Token | heard |
Token ID | 2982 |
Feature activation | +3.12e-01 |
Token | a |
Token ID | 257 |
Feature activation | +6.21e-02 |
Token | voice |
Token ID | 3809 |
Feature activation | +1.47e-01 |
Token | . |
Token ID | 13 |
Feature activation | +4.77e-02 |
Token | " |
Token ID | 366 |
Feature activation | -5.03e-02 |
Token | Be |
Token ID | 3856 |
Feature activation | +9.88e-01 |
Token | careful |
Token ID | 8161 |
Feature activation | +2.44e-01 |
Token | ," |
Token ID | 553 |
Feature activation | -8.24e-02 |
Token | it |
Token ID | 340 |
Feature activation | +6.69e-02 |
Token | said |
Token ID | 531 |
Feature activation | +1.02e-01 |
Token | . |
Token ID | 13 |
Feature activation | +8.52e-02 |
Token | quickly |
Token ID | 2952 |
Feature activation | -6.82e-02 |
Token | helped |
Token ID | 4193 |
Feature activation | -6.40e-02 |
Token | Tim |
Token ID | 5045 |
Feature activation | -2.10e-01 |
Token | my |
Token ID | 1820 |
Feature activation | -2.41e-03 |
Token | get |
Token ID | 651 |
Feature activation | -5.34e-02 |
Token | unst |
Token ID | 15014 |
Feature activation | -1.01e+00 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.28e-01 |
Token | . |
Token ID | 13 |
Feature activation | +4.24e-02 |
Token | She |
Token ID | 1375 |
Feature activation | -3.72e-03 |
Token | said |
Token ID | 531 |
Feature activation | +5.61e-02 |
Token | , |
Token ID | 11 |
Feature activation | +2.64e-02 |
Token | knows |
Token ID | 4206 |
Feature activation | -1.90e-02 |
Token | how |
Token ID | 703 |
Feature activation | -8.20e-02 |
Token | to |
Token ID | 284 |
Feature activation | +1.15e-02 |
Token | get |
Token ID | 651 |
Feature activation | -6.20e-02 |
Token | things |
Token ID | 1243 |
Feature activation | +5.88e-02 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.87e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.48e-01 |
Token | ." |
Token ID | 526 |
Feature activation | -8.22e-02 |
Token | So |
Token ID | 1406 |
Feature activation | -8.66e-02 |
Token | , |
Token ID | 11 |
Feature activation | +7.20e-02 |
Token | they |
Token ID | 484 |
Feature activation | -8.64e-02 |
Token | We |
Token ID | 1135 |
Feature activation | +1.08e-01 |
Token | 'll |
Token ID | 1183 |
Feature activation | +1.52e-01 |
Token | help |
Token ID | 1037 |
Feature activation | -1.66e-01 |
Token | you |
Token ID | 345 |
Feature activation | +3.05e-01 |
Token | get |
Token ID | 651 |
Feature activation | -4.30e-02 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.86e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.53e-01 |
Token | ." |
Token ID | 526 |
Feature activation | -1.69e-01 |
Token |
|
Token ID | 198 |
Feature activation | +5.99e-02 |
Token |
|
Token ID | 198 |
Feature activation | +6.18e-02 |
Token | But |
Token ID | 1537 |
Feature activation | -3.78e-01 |
Token | that |
Token ID | 326 |
Feature activation | +1.15e-01 |
Token | the |
Token ID | 262 |
Feature activation | +4.04e-02 |
Token | zipper |
Token ID | 48992 |
Feature activation | +6.82e-02 |
Token | had |
Token ID | 550 |
Feature activation | +1.04e-01 |
Token | become |
Token ID | 1716 |
Feature activation | +1.59e-01 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.79e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.68e-01 |
Token | . |
Token ID | 13 |
Feature activation | +4.92e-02 |
Token | She |
Token ID | 1375 |
Feature activation | -2.30e-02 |
Token | was |
Token ID | 373 |
Feature activation | +2.49e-02 |
Token | relieved |
Token ID | 22598 |
Feature activation | -1.66e-01 |
Token | they |
Token ID | 484 |
Feature activation | -4.98e-02 |
Token | didn |
Token ID | 1422 |
Feature activation | +6.42e-02 |
Token | 't |
Token ID | 470 |
Feature activation | -1.98e-01 |
Token | get |
Token ID | 651 |
Feature activation | -3.33e-02 |
Token | it |
Token ID | 340 |
Feature activation | +4.43e-02 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.47e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.65e-01 |
Token | . |
Token ID | 13 |
Feature activation | +7.33e-02 |
Token |
|
Token ID | 198 |
Feature activation | +7.27e-02 |
Token |
|
Token ID | 198 |
Feature activation | +7.32e-02 |
Token | Just |
Token ID | 5703 |
Feature activation | -2.85e-01 |
Token | could |
Token ID | 714 |
Feature activation | -1.08e-01 |
Token | help |
Token ID | 1037 |
Feature activation | -1.30e-01 |
Token | get |
Token ID | 651 |
Feature activation | -2.23e-02 |
Token | the |
Token ID | 262 |
Feature activation | +3.58e-02 |
Token | car |
Token ID | 1097 |
Feature activation | +3.15e-01 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.39e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +2.70e-01 |
Token | . |
Token ID | 13 |
Feature activation | +5.87e-02 |
Token |
|
Token ID | 198 |
Feature activation | +6.01e-02 |
Token |
|
Token ID | 198 |
Feature activation | +6.07e-02 |
Token | The |
Token ID | 464 |
Feature activation | -1.03e-01 |
Token | before |
Token ID | 878 |
Feature activation | -1.06e-01 |
Token | all |
Token ID | 477 |
Feature activation | -7.26e-03 |
Token | the |
Token ID | 262 |
Feature activation | +7.32e-02 |
Token | fur |
Token ID | 9230 |
Feature activation | +1.35e-01 |
Token | was |
Token ID | 373 |
Feature activation | +1.02e-01 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.14e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +3.18e-01 |
Token | ! |
Token ID | 0 |
Feature activation | +5.77e-02 |
Token |
|
Token ID | 198 |
Feature activation | +1.29e-01 |
Token |
|
Token ID | 198 |
Feature activation | +1.22e-01 |
Token | The |
Token ID | 464 |
Feature activation | -7.93e-02 |
Token | together |
Token ID | 1978 |
Feature activation | -5.00e-02 |
Token | to |
Token ID | 284 |
Feature activation | +5.85e-02 |
Token | get |
Token ID | 651 |
Feature activation | -2.04e-02 |
Token | the |
Token ID | 262 |
Feature activation | +2.76e-02 |
Token | bird |
Token ID | 6512 |
Feature activation | +4.75e-02 |
Token | unst |
Token ID | 15014 |
Feature activation | -9.00e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +3.07e-01 |
Token | and |
Token ID | 290 |
Feature activation | +1.27e-01 |
Token | freed |
Token ID | 13459 |
Feature activation | -4.84e-01 |
Token | it |
Token ID | 340 |
Feature activation | +8.33e-02 |
Token | from |
Token ID | 422 |
Feature activation | -1.93e-01 |
Token | scared |
Token ID | 12008 |
Feature activation | +1.99e-02 |
Token | of |
Token ID | 286 |
Feature activation | +4.20e-02 |
Token | the |
Token ID | 262 |
Feature activation | +5.39e-02 |
Token | cold |
Token ID | 4692 |
Feature activation | -1.39e-01 |
Token | por |
Token ID | 16964 |
Feature activation | -4.61e-01 |
Token | cel |
Token ID | 5276 |
Feature activation | -8.86e-01 |
Token | ain |
Token ID | 391 |
Feature activation | -1.76e-01 |
Token | bowl |
Token ID | 9396 |
Feature activation | +1.02e-01 |
Token | ! |
Token ID | 0 |
Feature activation | +3.61e-02 |
Token | |
Token ID | 220 |
Feature activation | -1.35e-01 |
Token |
|
Token ID | 198 |
Feature activation | +8.68e-02 |
Token | your |
Token ID | 534 |
Feature activation | +1.56e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +8.44e-01 |
Token | . |
Token ID | 13 |
Feature activation | -1.11e-01 |
Token | Sometimes |
Token ID | 8975 |
Feature activation | +2.37e-01 |
Token | things |
Token ID | 1243 |
Feature activation | -3.25e-02 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.80e-01 |
Token | that |
Token ID | 326 |
Feature activation | -6.29e-02 |
Token | we |
Token ID | 356 |
Feature activation | -1.98e-01 |
Token | cannot |
Token ID | 2314 |
Feature activation | -9.94e-02 |
Token | control |
Token ID | 1630 |
Feature activation | -2.96e-02 |
Token | . |
Token ID | 13 |
Feature activation | -1.29e-01 |
Token | Benny |
Token ID | 44275 |
Feature activation | +1.90e-02 |
Token | helped |
Token ID | 4193 |
Feature activation | -1.95e-02 |
Token | the |
Token ID | 262 |
Feature activation | +4.08e-02 |
Token | bear |
Token ID | 6842 |
Feature activation | -1.12e-01 |
Token | get |
Token ID | 651 |
Feature activation | -7.48e-03 |
Token | unst |
Token ID | 15014 |
Feature activation | -8.63e-01 |
Token | uck |
Token ID | 1347 |
Feature activation | +3.39e-01 |
Token | and |
Token ID | 290 |
Feature activation | +1.23e-01 |
Token | helped |
Token ID | 4193 |
Feature activation | +2.49e-02 |
Token | the |
Token ID | 262 |
Feature activation | +7.10e-02 |
Token | little |
Token ID | 1310 |
Feature activation | +2.00e-01 |
Token | grandma |
Token ID | 49890 |
Feature activation | -8.27e-02 |
Token | . |
Token ID | 13 |
Feature activation | -6.56e-02 |
Token | How |
Token ID | 1374 |
Feature activation | +4.19e-02 |
Token | did |
Token ID | 750 |
Feature activation | -9.49e-02 |
Token | this |
Token ID | 428 |
Feature activation | -2.10e-02 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.54e-01 |
Token | ?" |
Token ID | 1701 |
Feature activation | -3.03e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.55e-01 |
Token | asks |
Token ID | 7893 |
Feature activation | -1.64e-01 |
Token | . |
Token ID | 13 |
Feature activation | +9.94e-02 |
Token |
|
Token ID | 198 |
Feature activation | +2.11e-02 |
Token | find |
Token ID | 1064 |
Feature activation | -3.29e-01 |
Token | them |
Token ID | 606 |
Feature activation | +1.26e-05 |
Token | ? |
Token ID | 30 |
Feature activation | -1.23e-01 |
Token | What |
Token ID | 1867 |
Feature activation | -1.39e-01 |
Token | will |
Token ID | 481 |
Feature activation | +1.89e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.52e-01 |
Token | in |
Token ID | 287 |
Feature activation | -1.08e-01 |
Token | the |
Token ID | 262 |
Feature activation | -1.12e-01 |
Token | forest |
Token ID | 8222 |
Feature activation | -4.62e-02 |
Token | ? |
Token ID | 30 |
Feature activation | -1.16e-01 |
Token | <|endoftext|> |
Token ID | 50256 |
Feature activation | +6.61e-02 |
Token | magic |
Token ID | 5536 |
Feature activation | -1.29e-01 |
Token | . |
Token ID | 13 |
Feature activation | -5.14e-02 |
Token | Maybe |
Token ID | 6674 |
Feature activation | -4.05e-01 |
Token | it |
Token ID | 340 |
Feature activation | -9.45e-02 |
Token | will |
Token ID | 481 |
Feature activation | +1.95e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.52e-01 |
Token | again |
Token ID | 757 |
Feature activation | -2.11e-01 |
Token | ." |
Token ID | 526 |
Feature activation | -2.06e-01 |
Token |
|
Token ID | 198 |
Feature activation | -2.72e-02 |
Token |
|
Token ID | 198 |
Feature activation | -2.73e-02 |
Token | They |
Token ID | 2990 |
Feature activation | -5.38e-02 |
Token | 's |
Token ID | 338 |
Feature activation | -1.97e-01 |
Token | okay |
Token ID | 8788 |
Feature activation | -2.61e-01 |
Token | . |
Token ID | 13 |
Feature activation | -8.27e-02 |
Token | Acc |
Token ID | 6366 |
Feature activation | -1.75e-01 |
Token | idents |
Token ID | 3231 |
Feature activation | -2.19e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.48e-01 |
Token | . |
Token ID | 13 |
Feature activation | -8.87e-02 |
Token | Just |
Token ID | 2329 |
Feature activation | -3.71e-01 |
Token | be |
Token ID | 307 |
Feature activation | -4.38e-02 |
Token | more |
Token ID | 517 |
Feature activation | +2.56e-01 |
Token | careful |
Token ID | 8161 |
Feature activation | +5.35e-02 |
Token | I |
Token ID | 314 |
Feature activation | -1.39e-01 |
Token | did |
Token ID | 750 |
Feature activation | -9.14e-02 |
Token | not |
Token ID | 407 |
Feature activation | -1.92e-01 |
Token | mean |
Token ID | 1612 |
Feature activation | -1.10e-01 |
Token | to |
Token ID | 284 |
Feature activation | -1.41e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.46e-01 |
Token | it |
Token ID | 340 |
Feature activation | -9.15e-02 |
Token | ." |
Token ID | 526 |
Feature activation | -1.56e-01 |
Token |
|
Token ID | 198 |
Feature activation | -3.41e-02 |
Token |
|
Token ID | 198 |
Feature activation | -3.67e-02 |
Token | Mom |
Token ID | 29252 |
Feature activation | -8.08e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.79e-01 |
Token | buttons |
Token ID | 12163 |
Feature activation | +1.04e-02 |
Token | and |
Token ID | 290 |
Feature activation | -1.36e-01 |
Token | make |
Token ID | 787 |
Feature activation | -1.10e-01 |
Token | things |
Token ID | 1243 |
Feature activation | +5.62e-03 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.46e-01 |
Token | on |
Token ID | 319 |
Feature activation | +1.69e-02 |
Token | the |
Token ID | 262 |
Feature activation | -1.20e-01 |
Token | screen |
Token ID | 3159 |
Feature activation | -6.47e-02 |
Token | . |
Token ID | 13 |
Feature activation | -4.41e-02 |
Token | She |
Token ID | 1375 |
Feature activation | -1.29e-01 |
Token | , |
Token ID | 11 |
Feature activation | -8.37e-02 |
Token | Tom |
Token ID | 4186 |
Feature activation | -8.07e-02 |
Token | . |
Token ID | 13 |
Feature activation | -8.97e-02 |
Token | Acc |
Token ID | 6366 |
Feature activation | -1.61e-01 |
Token | idents |
Token ID | 3231 |
Feature activation | -1.85e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.46e-01 |
Token | . |
Token ID | 13 |
Feature activation | -9.18e-02 |
Token | I |
Token ID | 314 |
Feature activation | -1.40e-01 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.97e-01 |
Token | happy |
Token ID | 3772 |
Feature activation | -1.10e-01 |
Token | that |
Token ID | 326 |
Feature activation | -3.82e-02 |
Token | Fl |
Token ID | 1610 |
Feature activation | -2.82e-01 |
Token | oppy |
Token ID | 26696 |
Feature activation | +3.26e-02 |
Token | saw |
Token ID | 2497 |
Feature activation | +1.72e-01 |
Token | a |
Token ID | 257 |
Feature activation | -3.87e-02 |
Token | mar |
Token ID | 1667 |
Feature activation | +4.33e-02 |
Token | vell |
Token ID | 29333 |
Feature activation | -8.39e-01 |
Token | ous |
Token ID | 516 |
Feature activation | +1.25e-01 |
Token | view |
Token ID | 1570 |
Feature activation | -8.34e-02 |
Token | . |
Token ID | 13 |
Feature activation | +1.99e-02 |
Token | He |
Token ID | 679 |
Feature activation | -5.99e-02 |
Token | also |
Token ID | 635 |
Feature activation | +6.59e-02 |
Token | , |
Token ID | 11 |
Feature activation | -7.56e-02 |
Token | Anna |
Token ID | 11735 |
Feature activation | +2.58e-01 |
Token | . |
Token ID | 13 |
Feature activation | -4.31e-02 |
Token | Acc |
Token ID | 6366 |
Feature activation | -1.58e-01 |
Token | idents |
Token ID | 3231 |
Feature activation | -1.93e-01 |
Token | happen |
Token ID | 1645 |
Feature activation | -8.37e-01 |
Token | . |
Token ID | 13 |
Feature activation | -4.75e-02 |
Token | I |
Token ID | 314 |
Feature activation | -1.32e-01 |
Token | 'm |
Token ID | 1101 |
Feature activation | -1.88e-01 |
Token | not |
Token ID | 407 |
Feature activation | -1.52e-01 |
Token | angry |
Token ID | 7954 |
Feature activation | -2.22e-01 |
Token | . |
Token ID | 13 |
Feature activation | -7.24e-02 |
Token | It |
Token ID | 632 |
Feature activation | -3.14e-01 |
Token | was |
Token ID | 373 |
Feature activation | -9.48e-02 |
Token | not |
Token ID | 407 |
Feature activation | -1.50e-01 |
Token | your |
Token ID | 534 |
Feature activation | +2.17e-01 |
Token | fault |
Token ID | 8046 |
Feature activation | +8.82e-01 |
Token | . |
Token ID | 13 |
Feature activation | -6.36e-02 |
Token | He |
Token ID | 679 |
Feature activation | -1.09e-01 |
Token | was |
Token ID | 373 |
Feature activation | -9.77e-02 |
Token | a |
Token ID | 257 |
Feature activation | -9.95e-02 |
Token | mean |
Token ID | 1612 |
Feature activation | -9.83e-02 |
Token | saved |
Token ID | 7448 |
Feature activation | -2.48e-01 |
Token | , |
Token ID | 11 |
Feature activation | +7.47e-02 |
Token | and |
Token ID | 290 |
Feature activation | +4.86e-02 |
Token | finally |
Token ID | 3443 |
Feature activation | -3.13e-01 |
Token | had |
Token ID | 550 |
Feature activation | +8.79e-02 |
Token | enough |
Token ID | 1576 |
Feature activation | +6.74e-01 |
Token | money |
Token ID | 1637 |
Feature activation | +2.90e-02 |
Token | to |
Token ID | 284 |
Feature activation | +5.06e-02 |
Token | buy |
Token ID | 2822 |
Feature activation | -7.59e-02 |
Token | the |
Token ID | 262 |
Feature activation | -2.52e-02 |
Token | pink |
Token ID | 11398 |
Feature activation | +9.56e-02 |
Token | a |
Token ID | 257 |
Feature activation | +5.53e-02 |
Token | 3 |
Token ID | 513 |
Feature activation | +4.30e-01 |
Token | - |
Token ID | 12 |
Feature activation | -1.04e-01 |
Token | year |
Token ID | 1941 |
Feature activation | +4.17e-01 |
Token | - |
Token ID | 12 |
Feature activation | -1.29e-01 |
Token | old |
Token ID | 727 |
Feature activation | +5.88e-01 |
Token | boy |
Token ID | 2933 |
Feature activation | +1.68e-01 |
Token | who |
Token ID | 508 |
Feature activation | -1.28e-01 |
Token | had |
Token ID | 550 |
Feature activation | +1.27e-01 |
Token | a |
Token ID | 257 |
Feature activation | +5.99e-02 |
Token | new |
Token ID | 649 |
Feature activation | +3.57e-02 |
Token | He |
Token ID | 679 |
Feature activation | +5.56e-02 |
Token | was |
Token ID | 373 |
Feature activation | +6.93e-02 |
Token | stuck |
Token ID | 7819 |
Feature activation | +1.95e-02 |
Token | in |
Token ID | 287 |
Feature activation | +3.49e-02 |
Token | the |
Token ID | 262 |
Feature activation | +6.62e-02 |
Token | same |
Token ID | 976 |
Feature activation | +5.99e-01 |
Token | spot |
Token ID | 4136 |
Feature activation | +1.52e-01 |
Token | . |
Token ID | 13 |
Feature activation | +7.18e-02 |
Token | That |
Token ID | 1320 |
Feature activation | -2.46e-02 |
Token | was |
Token ID | 373 |
Feature activation | +6.04e-02 |
Token | the |
Token ID | 262 |
Feature activation | +5.76e-02 |
Token | walk |
Token ID | 2513 |
Feature activation | +9.48e-02 |
Token | , |
Token ID | 11 |
Feature activation | +3.18e-02 |
Token | he |
Token ID | 339 |
Feature activation | -1.02e-01 |
Token | noticed |
Token ID | 6810 |
Feature activation | +2.32e-01 |
Token | the |
Token ID | 262 |
Feature activation | +1.75e-03 |
Token | same |
Token ID | 976 |
Feature activation | +5.62e-01 |
Token | pencil |
Token ID | 21613 |
Feature activation | +1.30e-01 |
Token | he |
Token ID | 339 |
Feature activation | -1.03e-01 |
Token | had |
Token ID | 550 |
Feature activation | +8.27e-02 |
Token | seen |
Token ID | 1775 |
Feature activation | +1.25e-01 |
Token | earlier |
Token ID | 2961 |
Feature activation | -1.66e-01 |
Token | together |
Token ID | 1978 |
Feature activation | -7.68e-03 |
Token | . |
Token ID | 13 |
Feature activation | +1.20e-01 |
Token |
|
Token ID | 198 |
Feature activation | +1.52e-01 |
Token |
|
Token ID | 198 |
Feature activation | +1.44e-01 |
Token | M |
Token ID | 44 |
Feature activation | -1.86e-02 |
Token | andy |
Token ID | 10757 |
Feature activation | +8.49e-02 |
Token | was |
Token ID | 373 |
Feature activation | +7.47e-02 |
Token | so |
Token ID | 523 |
Feature activation | +1.20e-01 |
Token | happy |
Token ID | 3772 |
Feature activation | +7.98e-02 |
Token | that |
Token ID | 326 |
Feature activation | +1.67e-01 |
Token | her |
Token ID | 607 |
Feature activation | +3.95e-02 |
Token | and |
Token ID | 290 |
Feature activation | +7.05e-02 |
Token | said |
Token ID | 531 |
Feature activation | +5.49e-02 |
Token | , |
Token ID | 11 |
Feature activation | +7.23e-02 |
Token | " |
Token ID | 366 |
Feature activation | -6.03e-02 |
Token | That |
Token ID | 2504 |
Feature activation | -5.12e-02 |
Token | sounds |
Token ID | 5238 |
Feature activation | +2.46e-01 |
Token | like |
Token ID | 588 |
Feature activation | +4.50e-01 |
Token | a |
Token ID | 257 |
Feature activation | -3.21e-02 |
Token | wonderful |
Token ID | 7932 |
Feature activation | +1.21e-02 |
Token | idea |
Token ID | 2126 |
Feature activation | +3.44e-01 |
Token | ." |
Token ID | 526 |
Feature activation | -1.21e-01 |
Token | , |
Token ID | 11 |
Feature activation | +1.04e-01 |
Token | until |
Token ID | 1566 |
Feature activation | -1.52e-01 |
Token | she |
Token ID | 673 |
Feature activation | +1.89e-02 |
Token | knew |
Token ID | 2993 |
Feature activation | -8.50e-02 |
Token | all |
Token ID | 477 |
Feature activation | -3.22e-02 |
Token | about |
Token ID | 546 |
Feature activation | +1.99e-01 |
Token | it |
Token ID | 340 |
Feature activation | +7.67e-02 |
Token | . |
Token ID | 13 |
Feature activation | +6.96e-02 |
Token |
|
Token ID | 198 |
Feature activation | +8.97e-02 |
Token |
|
Token ID | 198 |
Feature activation | +9.08e-02 |
Token | The |
Token ID | 464 |
Feature activation | -9.18e-02 |
Token | playing |
Token ID | 2712 |
Feature activation | -1.60e-01 |
Token | outside |
Token ID | 2354 |
Feature activation | -2.28e-01 |
Token | or |
Token ID | 393 |
Feature activation | -1.29e-01 |
Token | reading |
Token ID | 3555 |
Feature activation | +9.94e-02 |
Token | the |
Token ID | 262 |
Feature activation | -8.43e-03 |
Token | magazine |
Token ID | 7093 |
Feature activation | +1.67e-01 |
Token | ?" |
Token ID | 1701 |
Feature activation | +6.78e-02 |
Token |
|
Token ID | 198 |
Feature activation | +8.29e-02 |
Token |
|
Token ID | 198 |
Feature activation | +7.65e-02 |
Token | L |
Token ID | 43 |
Feature activation | +7.94e-02 |
Token | ily |
Token ID | 813 |
Feature activation | -9.53e-02 |
Token | ay |
Token ID | 323 |
Feature activation | -3.70e-01 |
Token | ons |
Token ID | 684 |
Feature activation | +9.05e-02 |
Token | . |
Token ID | 13 |
Feature activation | +2.80e-02 |
Token | One |
Token ID | 1881 |
Feature activation | +3.11e-01 |
Token | day |
Token ID | 1110 |
Feature activation | -1.02e-01 |
Token | , |
Token ID | 11 |
Feature activation | +5.52e-02 |
Token | she |
Token ID | 673 |
Feature activation | -5.34e-02 |
Token | met |
Token ID | 1138 |
Feature activation | +9.06e-02 |
Token | a |
Token ID | 257 |
Feature activation | -3.31e-02 |
Token | nice |
Token ID | 3621 |
Feature activation | +9.94e-02 |
Token | boy |
Token ID | 2933 |
Feature activation | -2.14e-05 |
Token | girl |
Token ID | 2576 |
Feature activation | +1.50e-01 |
Token | named |
Token ID | 3706 |
Feature activation | -6.45e-02 |
Token | Lily |
Token ID | 20037 |
Feature activation | +6.85e-02 |
Token | . |
Token ID | 13 |
Feature activation | -3.29e-03 |
Token | She |
Token ID | 1375 |
Feature activation | -5.34e-02 |
Token | loved |
Token ID | 6151 |
Feature activation | +1.84e-02 |
Token | her |
Token ID | 607 |
Feature activation | -4.35e-02 |
Token | birthday |
Token ID | 10955 |
Feature activation | +7.24e-02 |
Token | because |
Token ID | 780 |
Feature activation | -2.68e-01 |
Token | she |
Token ID | 673 |
Feature activation | -9.22e-02 |
Token | always |
Token ID | 1464 |
Feature activation | +3.10e-01 |
Token | tried |
Token ID | 3088 |
Feature activation | +9.44e-02 |
Token | to |
Token ID | 284 |
Feature activation | +2.13e-02 |
Token | think |
Token ID | 892 |
Feature activation | -9.36e-02 |
Token | of |
Token ID | 286 |
Feature activation | -5.72e-02 |
Token | a |
Token ID | 257 |
Feature activation | -5.15e-02 |
Token | way |
Token ID | 835 |
Feature activation | -2.19e-01 |
Token | to |
Token ID | 284 |
Feature activation | +2.41e-02 |
Token | help |
Token ID | 1037 |
Feature activation | -1.81e-01 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.46e-02 |
Token | . |
Token ID | 13 |
Feature activation | +2.98e-02 |
Token |
|
Token ID | 198 |
Feature activation | +2.55e-02 |
Token | goal |
Token ID | 3061 |
Feature activation | +1.44e-01 |
Token | . |
Token ID | 13 |
Feature activation | +3.07e-02 |
Token | He |
Token ID | 679 |
Feature activation | -3.37e-02 |
Token | was |
Token ID | 373 |
Feature activation | -3.35e-02 |
Token | very |
Token ID | 845 |
Feature activation | -1.05e-01 |
Token | happy |
Token ID | 3772 |
Feature activation | +4.46e-03 |
Token | . |
Token ID | 13 |
Feature activation | +2.37e-02 |
Token | Luna |
Token ID | 23694 |
Feature activation | +1.81e-01 |
Token | was |
Token ID | 373 |
Feature activation | -2.56e-02 |
Token | a |
Token ID | 257 |
Feature activation | -4.52e-02 |
Token | little |
Token ID | 1310 |
Feature activation | +1.08e-01 |
Token | . |
Token ID | 13 |
Feature activation | -2.60e-02 |
Token | She |
Token ID | 1375 |
Feature activation | -6.68e-02 |
Token | asked |
Token ID | 1965 |
Feature activation | +1.10e-01 |
Token | her |
Token ID | 607 |
Feature activation | -9.21e-02 |
Token | mom |
Token ID | 1995 |
Feature activation | +5.64e-02 |
Token | and |
Token ID | 290 |
Feature activation | -3.68e-02 |
Token | dad |
Token ID | 9955 |
Feature activation | -1.30e-02 |
Token | , |
Token ID | 11 |
Feature activation | -2.99e-02 |
Token | but |
Token ID | 475 |
Feature activation | -4.26e-01 |
Token | they |
Token ID | 484 |
Feature activation | -1.38e-01 |
Token | did |
Token ID | 750 |
Feature activation | -9.38e-03 |
Token | and |
Token ID | 290 |
Feature activation | -2.35e-02 |
Token | make |
Token ID | 787 |
Feature activation | +2.42e-02 |
Token | loud |
Token ID | 7812 |
Feature activation | +2.53e-02 |
Token | noises |
Token ID | 26782 |
Feature activation | +3.03e-01 |
Token | . |
Token ID | 13 |
Feature activation | +1.07e-03 |
Token | He |
Token ID | 679 |
Feature activation | -6.74e-02 |
Token | kept |
Token ID | 4030 |
Feature activation | +4.01e-02 |
Token | his |
Token ID | 465 |
Feature activation | -3.69e-02 |
Token | truck |
Token ID | 7779 |
Feature activation | -5.46e-02 |
Token | in |
Token ID | 287 |
Feature activation | -1.22e-02 |
Token | his |
Token ID | 465 |
Feature activation | -2.38e-02 |
Token | He |
Token ID | 679 |
Feature activation | -1.01e-01 |
Token | could |
Token ID | 714 |
Feature activation | -2.27e-01 |
Token | fly |
Token ID | 6129 |
Feature activation | -2.55e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.52e-01 |
Token | save |
Token ID | 3613 |
Feature activation | -4.54e-01 |
Token | people |
Token ID | 661 |
Feature activation | -4.91e-01 |
Token | . |
Token ID | 13 |
Feature activation | -6.91e-02 |
Token | Tom |
Token ID | 4186 |
Feature activation | -1.03e-01 |
Token | and |
Token ID | 290 |
Feature activation | -1.46e-01 |
Token | Lily |
Token ID | 20037 |
Feature activation | -2.50e-02 |
Token | decided |
Token ID | 3066 |
Feature activation | -7.87e-02 |
Token | dangerous |
Token ID | 4923 |
Feature activation | -8.25e-02 |
Token | . |
Token ID | 13 |
Feature activation | -4.00e-02 |
Token | You |
Token ID | 921 |
Feature activation | +1.78e-01 |
Token | might |
Token ID | 1244 |
Feature activation | -2.02e-01 |
Token | get |
Token ID | 651 |
Feature activation | -1.14e-01 |
Token | hurt |
Token ID | 5938 |
Feature activation | -5.23e-01 |
Token | ," |
Token ID | 553 |
Feature activation | -2.35e-01 |
Token | Mom |
Token ID | 11254 |
Feature activation | +3.36e-02 |
Token | said |
Token ID | 531 |
Feature activation | -6.61e-02 |
Token | . |
Token ID | 13 |
Feature activation | +6.83e-02 |
Token |
|
Token ID | 198 |
Feature activation | +5.21e-02 |
Token | pillar |
Token ID | 41643 |
Feature activation | -5.02e-02 |
Token | home |
Token ID | 1363 |
Feature activation | -3.47e-01 |
Token | so |
Token ID | 523 |
Feature activation | +7.39e-02 |
Token | she |
Token ID | 673 |
Feature activation | +7.44e-03 |
Token | could |
Token ID | 714 |
Feature activation | -6.23e-02 |
Token | show |
Token ID | 905 |
Feature activation | -5.54e-01 |
Token | her |
Token ID | 607 |
Feature activation | +2.43e-02 |
Token | friends |
Token ID | 2460 |
Feature activation | -6.86e-02 |
Token | . |
Token ID | 13 |
Feature activation | +7.07e-02 |
Token | She |
Token ID | 1375 |
Feature activation | +2.32e-02 |
Token | carefully |
Token ID | 7773 |
Feature activation | +1.63e-03 |
Token | . |
Token ID | 13 |
Feature activation | -1.14e-01 |
Token | These |
Token ID | 2312 |
Feature activation | -5.07e-02 |
Token | are |
Token ID | 389 |
Feature activation | -2.25e-01 |
Token | surprise |
Token ID | 5975 |
Feature activation | -1.24e-01 |
Token | eggs |
Token ID | 9653 |
Feature activation | +1.59e-02 |
Token | !" |
Token ID | 2474 |
Feature activation | -5.13e-01 |
Token | she |
Token ID | 673 |
Feature activation | -1.60e-01 |
Token | says |
Token ID | 1139 |
Feature activation | -1.87e-01 |
Token | . |
Token ID | 13 |
Feature activation | +4.38e-02 |
Token | " |
Token ID | 366 |
Feature activation | -1.62e-01 |
Token | Someone |
Token ID | 28211 |
Feature activation | -4.69e-01 |
Token | friend |
Token ID | 1545 |
Feature activation | +2.09e-02 |
Token | . |
Token ID | 13 |
Feature activation | -3.14e-02 |
Token | Please |
Token ID | 4222 |
Feature activation | +2.02e-01 |
Token | don |
Token ID | 836 |
Feature activation | -2.87e-01 |
Token | 't |
Token ID | 470 |
Feature activation | -3.12e-01 |
Token | hurt |
Token ID | 5938 |
Feature activation | -5.30e-01 |
Token | her |
Token ID | 607 |
Feature activation | -9.58e-02 |
Token | , |
Token ID | 11 |
Feature activation | -3.31e-02 |
Token | please |
Token ID | 3387 |
Feature activation | +3.63e-01 |
Token | don |
Token ID | 836 |
Feature activation | -2.83e-01 |
Token | 't |
Token ID | 470 |
Feature activation | -3.06e-01 |