Upload folder using huggingface_hub
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- added_tokens.json +24 -0
- checkpoint-2000/added_tokens.json +24 -0
- checkpoint-2000/config.json +203 -0
- checkpoint-2000/generation_config.json +14 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt +3 -0
- checkpoint-2000/global_step2000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt +3 -0
added_tokens.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"</tool_call>": 151658,
|
3 |
+
"<tool_call>": 151657,
|
4 |
+
"<|box_end|>": 151649,
|
5 |
+
"<|box_start|>": 151648,
|
6 |
+
"<|endoftext|>": 151643,
|
7 |
+
"<|file_sep|>": 151664,
|
8 |
+
"<|fim_middle|>": 151660,
|
9 |
+
"<|fim_pad|>": 151662,
|
10 |
+
"<|fim_prefix|>": 151659,
|
11 |
+
"<|fim_suffix|>": 151661,
|
12 |
+
"<|im_end|>": 151645,
|
13 |
+
"<|im_start|>": 151644,
|
14 |
+
"<|image_pad|>": 151655,
|
15 |
+
"<|object_ref_end|>": 151647,
|
16 |
+
"<|object_ref_start|>": 151646,
|
17 |
+
"<|quad_end|>": 151651,
|
18 |
+
"<|quad_start|>": 151650,
|
19 |
+
"<|repo_name|>": 151663,
|
20 |
+
"<|video_pad|>": 151656,
|
21 |
+
"<|vision_end|>": 151653,
|
22 |
+
"<|vision_pad|>": 151654,
|
23 |
+
"<|vision_start|>": 151652
|
24 |
+
}
|
checkpoint-2000/added_tokens.json
ADDED
@@ -0,0 +1,24 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"</tool_call>": 151658,
|
3 |
+
"<tool_call>": 151657,
|
4 |
+
"<|box_end|>": 151649,
|
5 |
+
"<|box_start|>": 151648,
|
6 |
+
"<|endoftext|>": 151643,
|
7 |
+
"<|file_sep|>": 151664,
|
8 |
+
"<|fim_middle|>": 151660,
|
9 |
+
"<|fim_pad|>": 151662,
|
10 |
+
"<|fim_prefix|>": 151659,
|
11 |
+
"<|fim_suffix|>": 151661,
|
12 |
+
"<|im_end|>": 151645,
|
13 |
+
"<|im_start|>": 151644,
|
14 |
+
"<|image_pad|>": 151655,
|
15 |
+
"<|object_ref_end|>": 151647,
|
16 |
+
"<|object_ref_start|>": 151646,
|
17 |
+
"<|quad_end|>": 151651,
|
18 |
+
"<|quad_start|>": 151650,
|
19 |
+
"<|repo_name|>": 151663,
|
20 |
+
"<|video_pad|>": 151656,
|
21 |
+
"<|vision_end|>": 151653,
|
22 |
+
"<|vision_pad|>": 151654,
|
23 |
+
"<|vision_start|>": 151652
|
24 |
+
}
|
checkpoint-2000/config.json
ADDED
@@ -0,0 +1,203 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"_name_or_path": "/mnt/bn/tiktok-mm-4/aiic/users/brianli/prod/checkpoints/LLaVA-OV-Qwen2-Mammoth-VL-8B",
|
3 |
+
"add_faster_video": false,
|
4 |
+
"add_time_instruction": false,
|
5 |
+
"architectures": [
|
6 |
+
"LlavaQwenForCausalLM"
|
7 |
+
],
|
8 |
+
"attention_dropout": 0.0,
|
9 |
+
"bos_token_id": 151643,
|
10 |
+
"eos_token_id": 151645,
|
11 |
+
"faster_token_stride": 10,
|
12 |
+
"force_sample": false,
|
13 |
+
"hidden_act": "silu",
|
14 |
+
"hidden_size": 3584,
|
15 |
+
"image_aspect_ratio": "anyres_max_4",
|
16 |
+
"image_crop_resolution": null,
|
17 |
+
"image_grid_pinpoints": [
|
18 |
+
[
|
19 |
+
384,
|
20 |
+
384
|
21 |
+
],
|
22 |
+
[
|
23 |
+
384,
|
24 |
+
768
|
25 |
+
],
|
26 |
+
[
|
27 |
+
384,
|
28 |
+
1152
|
29 |
+
],
|
30 |
+
[
|
31 |
+
384,
|
32 |
+
1536
|
33 |
+
],
|
34 |
+
[
|
35 |
+
384,
|
36 |
+
1920
|
37 |
+
],
|
38 |
+
[
|
39 |
+
384,
|
40 |
+
2304
|
41 |
+
],
|
42 |
+
[
|
43 |
+
768,
|
44 |
+
384
|
45 |
+
],
|
46 |
+
[
|
47 |
+
768,
|
48 |
+
768
|
49 |
+
],
|
50 |
+
[
|
51 |
+
768,
|
52 |
+
1152
|
53 |
+
],
|
54 |
+
[
|
55 |
+
768,
|
56 |
+
1536
|
57 |
+
],
|
58 |
+
[
|
59 |
+
768,
|
60 |
+
1920
|
61 |
+
],
|
62 |
+
[
|
63 |
+
768,
|
64 |
+
2304
|
65 |
+
],
|
66 |
+
[
|
67 |
+
1152,
|
68 |
+
384
|
69 |
+
],
|
70 |
+
[
|
71 |
+
1152,
|
72 |
+
768
|
73 |
+
],
|
74 |
+
[
|
75 |
+
1152,
|
76 |
+
1152
|
77 |
+
],
|
78 |
+
[
|
79 |
+
1152,
|
80 |
+
1536
|
81 |
+
],
|
82 |
+
[
|
83 |
+
1152,
|
84 |
+
1920
|
85 |
+
],
|
86 |
+
[
|
87 |
+
1152,
|
88 |
+
2304
|
89 |
+
],
|
90 |
+
[
|
91 |
+
1536,
|
92 |
+
384
|
93 |
+
],
|
94 |
+
[
|
95 |
+
1536,
|
96 |
+
768
|
97 |
+
],
|
98 |
+
[
|
99 |
+
1536,
|
100 |
+
1152
|
101 |
+
],
|
102 |
+
[
|
103 |
+
1536,
|
104 |
+
1536
|
105 |
+
],
|
106 |
+
[
|
107 |
+
1536,
|
108 |
+
1920
|
109 |
+
],
|
110 |
+
[
|
111 |
+
1536,
|
112 |
+
2304
|
113 |
+
],
|
114 |
+
[
|
115 |
+
1920,
|
116 |
+
384
|
117 |
+
],
|
118 |
+
[
|
119 |
+
1920,
|
120 |
+
768
|
121 |
+
],
|
122 |
+
[
|
123 |
+
1920,
|
124 |
+
1152
|
125 |
+
],
|
126 |
+
[
|
127 |
+
1920,
|
128 |
+
1536
|
129 |
+
],
|
130 |
+
[
|
131 |
+
1920,
|
132 |
+
1920
|
133 |
+
],
|
134 |
+
[
|
135 |
+
1920,
|
136 |
+
2304
|
137 |
+
],
|
138 |
+
[
|
139 |
+
2304,
|
140 |
+
384
|
141 |
+
],
|
142 |
+
[
|
143 |
+
2304,
|
144 |
+
768
|
145 |
+
],
|
146 |
+
[
|
147 |
+
2304,
|
148 |
+
1152
|
149 |
+
],
|
150 |
+
[
|
151 |
+
2304,
|
152 |
+
1536
|
153 |
+
],
|
154 |
+
[
|
155 |
+
2304,
|
156 |
+
1920
|
157 |
+
],
|
158 |
+
[
|
159 |
+
2304,
|
160 |
+
2304
|
161 |
+
]
|
162 |
+
],
|
163 |
+
"image_split_resolution": null,
|
164 |
+
"initializer_range": 0.02,
|
165 |
+
"intermediate_size": 18944,
|
166 |
+
"max_position_embeddings": 32768,
|
167 |
+
"max_window_layers": 28,
|
168 |
+
"mm_hidden_size": 1152,
|
169 |
+
"mm_newline_position": "grid",
|
170 |
+
"mm_patch_merge_type": "spatial_unpad",
|
171 |
+
"mm_projector_lr": null,
|
172 |
+
"mm_projector_type": "mlp2x_gelu",
|
173 |
+
"mm_resampler_type": null,
|
174 |
+
"mm_spatial_pool_mode": "bilinear",
|
175 |
+
"mm_spatial_pool_stride": null,
|
176 |
+
"mm_tunable_parts": "mm_vision_tower,mm_mlp_adapter,mm_language_model",
|
177 |
+
"mm_use_im_patch_token": false,
|
178 |
+
"mm_use_im_start_end": false,
|
179 |
+
"mm_vision_select_feature": "patch",
|
180 |
+
"mm_vision_select_layer": -2,
|
181 |
+
"mm_vision_tower": "google/siglip-so400m-patch14-384",
|
182 |
+
"mm_vision_tower_lr": 2e-06,
|
183 |
+
"model_type": "qwen2",
|
184 |
+
"num_attention_heads": 28,
|
185 |
+
"num_hidden_layers": 28,
|
186 |
+
"num_key_value_heads": 4,
|
187 |
+
"pos_skipping_range": 4096,
|
188 |
+
"rms_norm_eps": 1e-06,
|
189 |
+
"rope_scaling": null,
|
190 |
+
"rope_theta": 1000000.0,
|
191 |
+
"sliding_window": 131072,
|
192 |
+
"tie_word_embeddings": false,
|
193 |
+
"tokenizer_model_max_length": 8192,
|
194 |
+
"tokenizer_padding_side": "right",
|
195 |
+
"torch_dtype": "bfloat16",
|
196 |
+
"transformers_version": "4.40.0.dev0",
|
197 |
+
"use_cache": false,
|
198 |
+
"use_mm_proj": true,
|
199 |
+
"use_pos_skipping": false,
|
200 |
+
"use_sliding_window": false,
|
201 |
+
"vision_tower_pretrained": null,
|
202 |
+
"vocab_size": 152064
|
203 |
+
}
|
checkpoint-2000/generation_config.json
ADDED
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"bos_token_id": 151643,
|
3 |
+
"do_sample": true,
|
4 |
+
"eos_token_id": [
|
5 |
+
151645,
|
6 |
+
151643
|
7 |
+
],
|
8 |
+
"pad_token_id": 151643,
|
9 |
+
"repetition_penalty": 1.05,
|
10 |
+
"temperature": 0.7,
|
11 |
+
"top_k": 20,
|
12 |
+
"top_p": 0.8,
|
13 |
+
"transformers_version": "4.40.0.dev0"
|
14 |
+
}
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e784eec9f44f1921f833f7db927454daad27d5920772db126c9d248eded5858c
|
3 |
+
size 1505698422
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:83c17212f58f9c499c8a81664aa0c02ccef09c2b43c1cb746b0dd18e4cbf9de3
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ab1f53cb50c04d61528c414baaa0cc0362bf2fa9e98fd4fa6aa5704765a56a8
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7196b53618aa1b048972d634b084ac4c1ee3f2788a91b08591f4153f87ca7876
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7ae60854326bf5e987f1c6bfadb8ca6792d10ca3749e2254f6d7ae227e17a133
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7c7bf4e03d0a993c0d9521b8effff93eecd4aa88ef39985f4fd076829fa174f8
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:08ed2a87e12693cfaace961512d879c89b0529b6b1e9273f24af856f4fa3a225
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b43a2d5376336f761f9f3274e7f9e2473e853e928cb4d30e9a4808b36343059
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a938b74892f7c54e56f226b105ef0a9707a035e27af1b5f458b8d13047a7f61c
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e469b66b15e1461c170f370f3be7d8dd31649b50b2c3da4c911c3e8a3e2f6ad3
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9b8a5cef74805cf2ce950dc96bf5a4e7c99d9dafd05a9485e2658bf31a31b624
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:71f868666eb7355289e6884089fc47eb7bd926fee94c7372f53ebfd909bf56b8
|
3 |
+
size 1505698422
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8f4c72d699163d24962ce891295af9b6da694bf1ac3bad8dce291a5e5aa616fe
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:62c8ecc09eac4bc57e826daa97cbf6b03b319a6672bea4803f01f82e2bd3737a
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4832166e62246993354d5c63e4d4415d177abd5ed60eee5427ff7bd943028ca9
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f752974379ed48d353c4e27b2895658bc8e8b14069f5073b3fdda034935ef2dc
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d40f5f15730bbba70bddb35aeafe466bca80468d350eccfbcf8dd5e17d2c8b
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:604225b4019516f6a1c3d595244bc54b87af993e756a5a4b0e1ba07fe68a66b9
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:89178ba1dfbb36afe119d00d5800bddd2e52826746ef8ee98cd0b21812a96b60
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3946c87020767bbb246fc78ba43d0a68f24cac7f813b9fc1e200ddf4bdb9b929
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:60451ccf87e35d1065fe58da16ac3be27eb78b46bc4119b4985f389e71500fbe
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8729b3e87651d30c0358d79c90cebecafc3a813e70bae2fb67cddee85cbc85e1
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:13771c95c975e4d2d4b1e22b20d1442117609b9dcb8d420a82fb912e99882314
|
3 |
+
size 1505698422
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:10757d4b3a152009441bc57d8cebc96b2f6ad376129d2e3ca1686fcd6e0f2fca
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b667938d7a648eabdf68221bdc9a469c562b0a3b35819c6e7cd44f937b0397b5
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e4886e711332c0e5f33cb90bbaa156b5dd32257b50042a4401210ffb62175571
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:53b6efc30fe25965905b46bbad5e49e157594ea72faaa28ac757fe09070a1dbc
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dc1935307096eb06d6f57bcd328e6b97ec455840aace02a6ba1b7cd39b3e2533
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1229cc89c9e978f0d7b9c906c7351ca78033fe3ff5a4509b5bb7c427e6413f3f
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98fc13e761e66441491f1bae147a1bac62a5d5caa83fe9f1bd29ea5002eceae5
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b653f93635549a74493847f3cb33b23c47132fd05a3b652f43c87eaf56d71cb
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:b531ef1e4442d3f4d1591c060567a958b0b406122c9b1aa2e009436e84a82919
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67be010dca55eb813d75c74a14622dd85831c149af7db0c39891196b36e7365d
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:101789c2d5f4cf0528fbf63bb1eecbae801cee081b674a5f8fc85498e5fbacfa
|
3 |
+
size 1505698422
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4c0626b9b2997f7a040150236a9d4be5cd9d662476cd850979b503ca7e7423e9
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:103c4598a5041ccae782b49a5b7052a8311560847183262d32b74bfad62297f7
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6efa88f71156d10bf6e61ac747c9262b8ba4a1bc3d742e98987d4aa4a37f235a
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:57790c925d3de7034010ce0fcefc9b28fdf22a2ca845d8615b17589a98a8f9d9
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7f95b14fff2bcdc36ac21f6069f5b08445b77ea17cae051724e9ca8e6fdda7a7
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dd420d3a5cd1c0d4c7e1d475bd15878b680b87382b62d34b663c8166c468d85c
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:21f1f438786017c703bd725da52f5f50715e60004d763d7f85370aa4bcfbe0ec
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:49884b83aa6e1f33b625f0e5a1a79c96c9144d414eb79de1ae16c66239747aa9
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddcf8c302ee7ca12f092dfb11b2d736e79da10f7226f8177a00bf206d8180fac
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:137d2e30b593637febf4a0860fa1ba66c729e4847d552d8f2c0d1207bffbd8a1
|
3 |
+
size 1505698442
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0b1b06562f9fe964049c4e1f259b20e3644926f521af412ba489b6f0b6e1ab1b
|
3 |
+
size 1505698422
|
checkpoint-2000/global_step2000/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a239363f13755e1355ed51835d3eaaaaf1f40243ad362627f9dcf9209de1d39f
|
3 |
+
size 1505698442
|