INDEX
Negative Logits
latter
0.84
}};
0.78
}];
0.76
};
0.75
};
0.70
"];
0.69
>;
0.68
'};
0.68
`;
0.68
}];
0.68
POSITIVE LOGITS
)
1.27
){1.03
&&
1.00
")
0.85
||
0.84
"){0.83
]
0.81
){//0.79
)
0.79
){0.78
Activations Density 0.050%
latter
}};
}];
};
};
"];
>;
'};
`;
}];
)
){&&
")
||
"){]
){//)
){