phospho-app
/

PAphospho-AI-voice-lego-red-2

+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 0.6741573033707865,
+  "eval_steps": 500,
+  "global_step": 60,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.11235955056179775,
+      "grad_norm": 2.1474151611328125,
+      "learning_rate": 0.00019264940672148018,
+      "loss": 0.6606,
+      "step": 10
+    },
+    {
+      "epoch": 0.2247191011235955,
+      "grad_norm": 32.052978515625,
+      "learning_rate": 0.00015922352526649803,
+      "loss": 0.3779,
+      "step": 20
+    },
+    {
+      "epoch": 0.33707865168539325,
+      "grad_norm": 94.88410186767578,
+      "learning_rate": 0.00010825793454723325,
+      "loss": 0.3968,
+      "step": 30
+    },
+    {
+      "epoch": 0.449438202247191,
+      "grad_norm": 99.2090072631836,
+      "learning_rate": 5.484666416891109e-05,
+      "loss": 0.3301,
+      "step": 40
+    },
+    {
+      "epoch": 0.5617977528089888,
+      "grad_norm": 106.09911346435547,
+      "learning_rate": 1.4808059116167305e-05,
+      "loss": 0.3134,
+      "step": 50
+    },
+    {
+      "epoch": 0.6741573033707865,
+      "grad_norm": 217.75341796875,
+      "learning_rate": 0.0,
+      "loss": 0.3172,
+      "step": 60
+    },
+    {
+      "epoch": 0.6741573033707865,
+      "step": 60,
+      "total_flos": 8512833379000320.0,
+      "train_loss": 0.3993192434310913,
+      "train_runtime": 93.2679,
+      "train_samples_per_second": 41.172,
+      "train_steps_per_second": 0.643
+    }
+  ],
+  "logging_steps": 10,
+  "max_steps": 60,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 10000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 8512833379000320.0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": null
+}