INDEX
Negative Logits
<bos>
-0.50
ir
-0.41
,
-0.40
:
-0.39
ff
-0.38
problem
-0.37
ContentAlignment
-0.37
by
-0.36
.
-0.36
(
-0.36
POSITIVE LOGITS
?>">
0.81
});*/
0.78
}}</
0.76
};*/
0.75
}*/
0.75
"}>
0.75
();*/
0.73
}*/
0.72
']],
0.71
}}}{0.70
Activations Density 0.911%