KeivanR
/

Qwen2.5-1.5B-Instruct-Zero-Shot

KeivanR committed 9 days ago

Commit

5aa158a

verified ·

1 Parent(s): 0079aa1

Upload evaluation/evaluation_metrics.json with huggingface_hub

Files changed (1) hide show

evaluation/evaluation_metrics.json CHANGED Viewed

@@ -1,43 +1,43 @@
 {
   "overall": {
-    "accuracy": 0.06048387096774194,
-    "precision_macro": 0.25129020766791754,
-    "recall_macro": 0.41524017589800666,
-    "f1_macro": 0.2812384171233439
   },
   "per_class": {
     "precision": {
-      "games": 0.375,
-      "geometry": 0.10047846889952153,
-      "graphs": 0.16129032258064516,
-      "math": 0.26259541984732826,
-      "number theory": 0.3176470588235294,
       "other": 0.0,
-      "probabilities": 0.2413793103448276,
-      "strings": 0.44047619047619047,
-      "trees": 0.3627450980392157
     },
     "recall": {
-      "games": 0.13043478260869565,
-      "geometry": 0.6176470588235294,
-      "graphs": 0.514018691588785,
-      "math": 0.6825396825396826,
-      "number theory": 0.4153846153846154,
       "other": 0.0,
-      "probabilities": 0.3888888888888889,
-      "strings": 0.47435897435897434,
-      "trees": 0.5138888888888888
     },
     "f1": {
-      "games": 0.1935483870967742,
-      "geometry": 0.1728395061728395,
-      "graphs": 0.24553571428571427,
-      "math": 0.37927232635060637,
       "number theory": 0.36,
       "other": 0.0,
-      "probabilities": 0.2978723404255319,
-      "strings": 0.4567901234567901,
-      "trees": 0.42528735632183906
     }
   }
 }

 {
   "overall": {
+    "accuracy": 0.06,
+    "precision_macro": 0.25,
+    "recall_macro": 0.42,
+    "f1_macro": 0.28
   },
   "per_class": {
     "precision": {
+      "games": 0.38,
+      "geometry": 0.1,
+      "graphs": 0.16,
+      "math": 0.26,
+      "number theory": 0.32,
       "other": 0.0,
+      "probabilities": 0.24,
+      "strings": 0.44,
+      "trees": 0.36
     },
     "recall": {
+      "games": 0.13,
+      "geometry": 0.62,
+      "graphs": 0.51,
+      "math": 0.68,
+      "number theory": 0.42,
       "other": 0.0,
+      "probabilities": 0.39,
+      "strings": 0.47,
+      "trees": 0.51
     },
     "f1": {
+      "games": 0.19,
+      "geometry": 0.17,
+      "graphs": 0.25,
+      "math": 0.38,
       "number theory": 0.36,
       "other": 0.0,
+      "probabilities": 0.3,
+      "strings": 0.46,
+      "trees": 0.43
     }
   }
 }