INDEX
    Explanations

    occurrences of quotation marks and parentheses in the text

    New Auto-Interp
    Negative Logits
    '));
    
    -0.83
    ]');
    -0.82
    ValueStyle
    -0.80
    }');
    -0.78
    `;
    
    -0.76
    %");
    -0.74
    ẵn
    -0.73
     ]];
    -0.73
    )");
    
    -0.72
     });
    
    -0.71
    POSITIVE LOGITS
     __('
    1.32
     _("
    1.27
    (__('
    1.22
    ("
    1.18
    (["
    1.16
    :@"
    1.16
    (("
    1.15
    ["
    1.13
    (('
    1.13
     "..\..\..\
    1.13
    Act Density 0.009%

    No Known Activations