tool-call-verifier / best_metrics.json
Huamin's picture
Update model with binary classification (UNAUTHORIZED F1: 93.50%)
386b5c0 verified
{
"classification_report": {
"AUTHORIZED": {
"precision": 0.9037877897531266,
"recall": 0.9392273925756695,
"f1-score": 0.9211668545659526,
"support": 139191.0
},
"UNAUTHORIZED": {
"precision": 0.950093511979563,
"recall": 0.9204538309851105,
"f1-score": 0.9350388443092216,
"support": 174955.0
},
"accuracy": 0.9287719722676717,
"macro avg": {
"precision": 0.9269406508663448,
"recall": 0.9298406117803899,
"f1-score": 0.9281028494375871,
"support": 314146.0
},
"weighted avg": {
"precision": 0.9295764919238567,
"recall": 0.9287719722676717,
"f1-score": 0.9288924788474447,
"support": 314146.0
}
},
"accuracy": 0.9287719722676717,
"macro_f1": 0.9281028494375871,
"weighted_f1": 0.9288924788474447,
"unauthorized_avg_f1": 0.9350388443092216,
"unauthorized_precision": 0.950093511979563,
"unauthorized_recall": 0.9204538309851105,
"unauthorized_f1": 0.9350388443092216
}