INDEX
Negative Logits
{0.96
{0.64
\{0.54
:
0.46
{,0.42
{//0.39
{.0.38
{
0.38
{\0.37
:
0.37
POSITIVE LOGITS
}\,\
0.44
],"
0.41
",(
0.40
",&
0.40
',['
0.39
"),(
0.39
","#
0.38
],"
0.38
","/
0.38
","
0.38
Activations Density 0.003%
{{ \{:
{, {// {.{
{\:
}\,\
],"
",(
",&
',['
"),(
","#
],"
","/
","