MohamedAhmedAE commited on
Commit
73dd7eb
·
verified ·
1 Parent(s): e70f279

Training in progress, step 600, checkpoint

Browse files
last-checkpoint/optimizer.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:792ea85767dea8354213c046ddfc283c058438c9bd42b956b56d21b999bed010
3
  size 1598819130
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b11b4fbe976846a9b3278e44f225a63a67e85d625a57e67c37fa9ae5e307aace
3
  size 1598819130
last-checkpoint/scheduler.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5148b50590ba2eccaa9614d01e91c63955c36980943998f454561d580e8f60ba
3
  size 1064
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6f48b81368166faa6e913dbe50b345c1ff918742c19e7d11caea2dc2d9e56500
3
  size 1064
last-checkpoint/trainer_state.json CHANGED
@@ -2,9 +2,9 @@
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
- "epoch": 0.006114338122898196,
6
  "eval_steps": 1000,
7
- "global_step": 400,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
@@ -22,6 +22,13 @@
22
  "learning_rate": 4.99999995525116e-05,
23
  "loss": 0.0,
24
  "step": 400
 
 
 
 
 
 
 
25
  }
26
  ],
27
  "logging_steps": 200,
@@ -41,7 +48,7 @@
41
  "attributes": {}
42
  }
43
  },
44
- "total_flos": 121767624073170.0,
45
  "train_batch_size": 1,
46
  "trial_name": null,
47
  "trial_params": null
 
2
  "best_global_step": null,
3
  "best_metric": null,
4
  "best_model_checkpoint": null,
5
+ "epoch": 0.009171507184347295,
6
  "eval_steps": 1000,
7
+ "global_step": 600,
8
  "is_hyper_param_search": false,
9
  "is_local_process_zero": true,
10
  "is_world_process_zero": true,
 
22
  "learning_rate": 4.99999995525116e-05,
23
  "loss": 0.0,
24
  "step": 400
25
+ },
26
+ {
27
+ "epoch": 0.009171507184347295,
28
+ "grad_norm": NaN,
29
+ "learning_rate": 4.999999898290334e-05,
30
+ "loss": 0.0,
31
+ "step": 600
32
  }
33
  ],
34
  "logging_steps": 200,
 
48
  "attributes": {}
49
  }
50
  },
51
+ "total_flos": 179452957671360.0,
52
  "train_batch_size": 1,
53
  "trial_name": null,
54
  "trial_params": null