RyanYr commited on
Commit
ef73fe0
·
verified ·
1 Parent(s): 68fe022

Save model at global step 40

Browse files
config.yaml CHANGED
@@ -63,7 +63,7 @@ actor_rollout_ref:
63
  lr_warmup_steps_ratio: 0
64
  min_lr_ratio: null
65
  warmup_style: constant
66
- total_training_steps: 400
67
  weight_decay: 0.01
68
  fsdp_config:
69
  wrap_policy:
@@ -147,7 +147,7 @@ custom_reward_function:
147
  trainer:
148
  balance_batch: true
149
  total_epochs: 100
150
- total_training_steps: 400
151
  project_name: value-LLM
152
  experiment_name: brm-dapo-llama3.2-3B-it_lr1e-6_rspL4096-beta0.002
153
  logger:
 
63
  lr_warmup_steps_ratio: 0
64
  min_lr_ratio: null
65
  warmup_style: constant
66
+ total_training_steps: 800
67
  weight_decay: 0.01
68
  fsdp_config:
69
  wrap_policy:
 
147
  trainer:
148
  balance_batch: true
149
  total_epochs: 100
150
+ total_training_steps: 800
151
  project_name: value-LLM
152
  experiment_name: brm-dapo-llama3.2-3B-it_lr1e-6_rspL4096-beta0.002
153
  logger:
data.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:47b1eb3307b0a3e4ad15ac7a14693b23d313cf327cb9bbd20cd4f8f181793ab3
3
  size 1492
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2ac703df2ea9887685ba1076ead9d06649af4d654947c84fbf72be54795654ee
3
  size 1492
extra_state_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1268e9aa07b5bf0b6e7f8a82bbef08667d9bf19c816443bc74909e8775f2aa8a
3
  size 14632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1ab08b34f7000fc99b714608686487f4b0ef5f419a1c23610e1c44c7aaad8137
3
  size 14632
extra_state_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:edb0d33891e39c7b6c62dd9b5af87516001ba3bf756d5fa8ae086b601ef00754
3
  size 14632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:af9fc86f6e469cb0834476b71b525358133f74ff5ee77ed4bce6eac57aa550ca
3
  size 14632
extra_state_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1f375391e56ced691d83d7960525e831c29dcae3ca70ef20db607d44e9dfdf95
3
  size 14632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d321ba942354b0228acd80bb829660d58c1006ff7e77e69386c788b91137c6b8
3
  size 14632
extra_state_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:6d50d61eaecff9490b24d2f7572a78f1896ed930081d60b40600a9b9bc4eb497
3
  size 14632
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:720ecba3014916b6c126dc326620e82c0dc2b8c061000f556b103b296edc5656
3
  size 14632
model_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c328e978022c414a9349da0a388ac1a2aeedae9d696b4f51962638e9d971a377
3
  size 3606904378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88bbbcce88a120658133d3bd17dd4b398bc710195dc8e022fab72524cb403b8a
3
  size 3606904378
model_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:3621d450be05b8cdc4a001e9000e8511167d22997aac4f70c2e3858b03d4c0b7
3
  size 3606904378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:05244404bd868e0eea5b56904355ac3a893756350bc492bc9fceeb6a9d29b583
3
  size 3606904378
model_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c73c2ba7e3c559eeab99fa66f6e61639648ad32dd99c04a7bbae6002a3ab0e50
3
  size 3606904378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d00f30935d09407d89d030a1080b622fa4e9d79cf25dd6ce3381c5d2e4fd983d
3
  size 3606904378
model_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c04dffaedf1cf155e9bd8759c48e71123660e5365797ac0b2f42c634b2051542
3
  size 3606904378
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a92814edb47ba3e517b3a6b27ab6afd62f71b9f9268a5af559ccd0090a966ddb
3
  size 3606904378
optim_world_size_4_rank_0.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5da0b6789ecafb1b910fb7722470aa5fa15db9ab8a5921a670c2865267f15b90
3
  size 6425526231
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ac28c3aa1c8e728a30dd42d32ae3f038598a9584221604f358ee6f2c53cb7d58
3
  size 6425526231
optim_world_size_4_rank_1.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4d07e4ea18b13151750fdb548610cfb983d62fc3e5bc85b33348b6c2b7dfc4e7
3
  size 6425526231
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:063280c83e0f63110920a52e595be7ebe087140cbf3d9563f0be985cbf5f8fb5
3
  size 6425526231
optim_world_size_4_rank_2.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:1e628c6be1366b2107760d0e3eff914970f4c3191d5fd89233cb5ca2ae617dd1
3
  size 6425526231
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d96c83791fe962212f4b9eaa7e73faab5e21303553d84d7d3eb62243a4d3fd59
3
  size 6425526231
optim_world_size_4_rank_3.pt CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:915b8e443d9a3964890bd6da3434538104cc36a9ba6e904afc6d30830a566e7a
3
  size 6425526231
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:45bf05404791e3710b1cff753681a14ca4125dbdb8a4bdf2c4cf65786d615961
3
  size 6425526231