Save model at global step 40
Browse files- config.yaml +2 -2
- data.pt +1 -1
- extra_state_world_size_4_rank_0.pt +1 -1
- extra_state_world_size_4_rank_1.pt +1 -1
- extra_state_world_size_4_rank_2.pt +1 -1
- extra_state_world_size_4_rank_3.pt +1 -1
- model_world_size_4_rank_0.pt +1 -1
- model_world_size_4_rank_1.pt +1 -1
- model_world_size_4_rank_2.pt +1 -1
- model_world_size_4_rank_3.pt +1 -1
- optim_world_size_4_rank_0.pt +1 -1
- optim_world_size_4_rank_1.pt +1 -1
- optim_world_size_4_rank_2.pt +1 -1
- optim_world_size_4_rank_3.pt +1 -1
config.yaml
CHANGED
@@ -63,7 +63,7 @@ actor_rollout_ref:
|
|
63 |
lr_warmup_steps_ratio: 0
|
64 |
min_lr_ratio: null
|
65 |
warmup_style: constant
|
66 |
-
total_training_steps:
|
67 |
weight_decay: 0.01
|
68 |
fsdp_config:
|
69 |
wrap_policy:
|
@@ -147,7 +147,7 @@ custom_reward_function:
|
|
147 |
trainer:
|
148 |
balance_batch: true
|
149 |
total_epochs: 100
|
150 |
-
total_training_steps:
|
151 |
project_name: value-LLM
|
152 |
experiment_name: brm-dapo-llama3.2-3B-it_lr1e-6_rspL4096-beta0.002
|
153 |
logger:
|
|
|
63 |
lr_warmup_steps_ratio: 0
|
64 |
min_lr_ratio: null
|
65 |
warmup_style: constant
|
66 |
+
total_training_steps: 800
|
67 |
weight_decay: 0.01
|
68 |
fsdp_config:
|
69 |
wrap_policy:
|
|
|
147 |
trainer:
|
148 |
balance_batch: true
|
149 |
total_epochs: 100
|
150 |
+
total_training_steps: 800
|
151 |
project_name: value-LLM
|
152 |
experiment_name: brm-dapo-llama3.2-3B-it_lr1e-6_rspL4096-beta0.002
|
153 |
logger:
|
data.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1492
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2ac703df2ea9887685ba1076ead9d06649af4d654947c84fbf72be54795654ee
|
3 |
size 1492
|
extra_state_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14632
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1ab08b34f7000fc99b714608686487f4b0ef5f419a1c23610e1c44c7aaad8137
|
3 |
size 14632
|
extra_state_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14632
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:af9fc86f6e469cb0834476b71b525358133f74ff5ee77ed4bce6eac57aa550ca
|
3 |
size 14632
|
extra_state_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14632
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d321ba942354b0228acd80bb829660d58c1006ff7e77e69386c788b91137c6b8
|
3 |
size 14632
|
extra_state_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 14632
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:720ecba3014916b6c126dc326620e82c0dc2b8c061000f556b103b296edc5656
|
3 |
size 14632
|
model_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3606904378
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:88bbbcce88a120658133d3bd17dd4b398bc710195dc8e022fab72524cb403b8a
|
3 |
size 3606904378
|
model_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3606904378
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:05244404bd868e0eea5b56904355ac3a893756350bc492bc9fceeb6a9d29b583
|
3 |
size 3606904378
|
model_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3606904378
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d00f30935d09407d89d030a1080b622fa4e9d79cf25dd6ce3381c5d2e4fd983d
|
3 |
size 3606904378
|
model_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 3606904378
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a92814edb47ba3e517b3a6b27ab6afd62f71b9f9268a5af559ccd0090a966ddb
|
3 |
size 3606904378
|
optim_world_size_4_rank_0.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6425526231
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ac28c3aa1c8e728a30dd42d32ae3f038598a9584221604f358ee6f2c53cb7d58
|
3 |
size 6425526231
|
optim_world_size_4_rank_1.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6425526231
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:063280c83e0f63110920a52e595be7ebe087140cbf3d9563f0be985cbf5f8fb5
|
3 |
size 6425526231
|
optim_world_size_4_rank_2.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6425526231
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d96c83791fe962212f4b9eaa7e73faab5e21303553d84d7d3eb62243a4d3fd59
|
3 |
size 6425526231
|
optim_world_size_4_rank_3.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 6425526231
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:45bf05404791e3710b1cff753681a14ca4125dbdb8a4bdf2c4cf65786d615961
|
3 |
size 6425526231
|