AjayP13 committed on
Commit
60673a0
·
verified ·
1 Parent(s): 9a0340f

Pushed by DataDreamer

Browse files

Update training_args.json

Files changed (1) hide show
  1. training_args.json +5 -5
training_args.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "output_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-05-13:09:26/data/train_matcher/train-matching-embedding/_checkpoints",
3
  "overwrite_output_dir": false,
4
  "do_train": false,
5
  "do_eval": true,
@@ -20,16 +20,16 @@
20
  "adam_beta2": 0.999,
21
  "adam_epsilon": 1e-08,
22
  "max_grad_norm": 1.0,
23
- "num_train_epochs": 3,
24
  "max_steps": -1,
25
- "lr_scheduler_type": "linear",
26
  "lr_scheduler_kwargs": {},
27
  "warmup_ratio": 0.0,
28
  "warmup_steps": 0,
29
  "log_level": "passive",
30
  "log_level_replica": "warning",
31
  "log_on_each_node": true,
32
- "logging_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-05-13:09:26/data/train_matcher/train-matching-embedding/_checkpoints/runs/Mar06_20-29-59_nlpgpu04.seas.upenn.edu",
33
  "logging_strategy": "steps",
34
  "logging_first_step": false,
35
  "logging_steps": 1,
@@ -70,7 +70,7 @@
70
  "remove_unused_columns": false,
71
  "label_names": null,
72
  "load_best_model_at_end": true,
73
- "metric_for_best_model": "eval_loss",
74
  "greater_is_better": true,
75
  "ignore_data_skip": false,
76
  "fsdp": [],
 
1
  {
2
+ "output_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-26-09:28:15/data/train_matcher_v2/train-matching-embedding/_checkpoints",
3
  "overwrite_output_dir": false,
4
  "do_train": false,
5
  "do_eval": true,
 
20
  "adam_beta2": 0.999,
21
  "adam_epsilon": 1e-08,
22
  "max_grad_norm": 1.0,
23
+ "num_train_epochs": 2,
24
  "max_steps": -1,
25
+ "lr_scheduler_type": "constant",
26
  "lr_scheduler_kwargs": {},
27
  "warmup_ratio": 0.0,
28
  "warmup_steps": 0,
29
  "log_level": "passive",
30
  "log_level_replica": "warning",
31
  "log_on_each_node": true,
32
+ "logging_dir": "/mnt/nlpgpu-io1/data/ajayp/output/fineinstructions/dated/2025-03-26-09:28:15/data/train_matcher_v2/train-matching-embedding/_checkpoints/runs/Mar28_23-33-16_nlpgpu10.seas.upenn.edu",
33
  "logging_strategy": "steps",
34
  "logging_first_step": false,
35
  "logging_steps": 1,
 
70
  "remove_unused_columns": false,
71
  "label_names": null,
72
  "load_best_model_at_end": true,
73
+ "metric_for_best_model": "eval_joint_metric",
74
  "greater_is_better": true,
75
  "ignore_data_skip": false,
76
  "fsdp": [],