INDEX
    Explanations
    New Auto-Interp
    Negative Logits
    -1.05
    /**
    -0.91
    <?
    -0.88
    
    
    -0.85
    /*
    -0.77
    <?
    
    -0.67
    <bos>
    -0.66
    #
    -0.63
    protected
    -0.60
    Transcripción
    -0.57
    POSITIVE LOGITS
     vintage
    2.24
     Vintage
    2.08
    Vintage
    2.02
    vintage
    2.00
    INTAGE
    1.48
     aen
    1.20
     antique
    1.14
     disagre
    1.13
     maneu
    1.13
     ftu
    1.11
    Act Density 0.129%

    No Known Activations