jiuhai committed on May 7

Commit

5d9fdf0

verified ·

1 Parent(s): 79ebdfb

Upload folder using huggingface_hub

Browse files

Files changed (30) hide show

checkpoint-19000/config.json +79 -0
checkpoint-19000/generation_config.json +6 -0
checkpoint-19000/model.safetensors +3 -0
checkpoint-19000/optimizer.pt +3 -0
checkpoint-19000/rng_state_0.pth +3 -0
checkpoint-19000/rng_state_1.pth +3 -0
checkpoint-19000/rng_state_2.pth +3 -0
checkpoint-19000/rng_state_3.pth +3 -0
checkpoint-19000/rng_state_4.pth +3 -0
checkpoint-19000/rng_state_5.pth +3 -0
checkpoint-19000/rng_state_6.pth +3 -0
checkpoint-19000/rng_state_7.pth +3 -0
checkpoint-19000/scheduler.pt +3 -0
checkpoint-19000/trainer_state.json +0 -0
checkpoint-19000/training_args.bin +3 -0
checkpoint-20000/config.json +79 -0
checkpoint-20000/generation_config.json +6 -0
checkpoint-20000/model.safetensors +3 -0
checkpoint-20000/optimizer.pt +3 -0
checkpoint-20000/rng_state_0.pth +3 -0
checkpoint-20000/rng_state_1.pth +3 -0
checkpoint-20000/rng_state_2.pth +3 -0
checkpoint-20000/rng_state_3.pth +3 -0
checkpoint-20000/rng_state_4.pth +3 -0
checkpoint-20000/rng_state_5.pth +3 -0
checkpoint-20000/rng_state_6.pth +3 -0
checkpoint-20000/rng_state_7.pth +3 -0
checkpoint-20000/scheduler.pt +3 -0
checkpoint-20000/trainer_state.json +0 -0
checkpoint-20000/training_args.bin +3 -0

checkpoint-19000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 2,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 128,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.1,
+  "repa_layers": "2",
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-19000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-19000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6144326a7c89a238b8a5728a2bb4d7e495cfa5f604ef0f5bc20a89128b1b1024
+size 4411759432

checkpoint-19000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3ec934a1d2e107e4bb8c4dc8b54f5d00fbfc689c8aaaf9647e2465cd8104f439
+size 6332050591

checkpoint-19000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f32834cd6fa8833497ee317351e8bd92140b42e322bbc0115d4b4b37ed58d4bc
+size 16389

checkpoint-19000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:95a13512bacf20dcc8134db2bdfcc167143318a0999e971892c590289db28c84
+size 16389

checkpoint-19000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:765096eb5f9213d328752c2e51b4beb6ef4a7cc7bc8f5c06929f5561d163433d
+size 16389

checkpoint-19000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ba20f7acaf426f0911480458241278d2ed8ac45881b6c9eec483a608cce85ec1
+size 16389

checkpoint-19000/rng_state_4.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f63d5298fb46bff7799bbb1c7de07e23ac92e940f84b3389c253601bf9049411
+size 16389

checkpoint-19000/rng_state_5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:83645ff5db2c307262ce73b44569c4db27f28082aaef9d22374c866b41c2c182
+size 16389

checkpoint-19000/rng_state_6.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2399e712b38badae75ef0924f2ded1aa1a017f6923505f9d3681191f44b37425
+size 16389

checkpoint-19000/rng_state_7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be063871626c47d466d1f0e8d0246a3808cf2c8112791c3490787609a3a49dbd
+size 16389

checkpoint-19000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c514e2fa22f1ec05f5c1eb9a9426d0db66f426a5951f0e7d5c30024338f9d9ee
+size 1465

checkpoint-19000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-19000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0c0f94e3977c9f10667c6558f8cde45a2d25ed9a32ba11183a3f9b1ffb8874d
+size 6481

checkpoint-20000/config.json ADDED Viewed

	@@ -0,0 +1,79 @@

+{
+  "ar_steps": 1,
+  "architectures": [
+    "DiffVLMDiffusion"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "condition_layer": -1,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 1536,
+  "image_token_id": 151655,
+  "img_cross_attention_dim": 2048,
+  "img_diffuser_depth": 2,
+  "img_ffn_dim_multiplier": null,
+  "img_hidden_size": 1536,
+  "img_multiple_of": 256,
+  "img_norm_eps": 1e-05,
+  "img_num_attention_heads": 12,
+  "img_num_kv_heads": 12,
+  "img_qk_norm": true,
+  "in_channels": 32,
+  "initializer_range": 0.02,
+  "inject_img_diffuser": false,
+  "input_size": 32,
+  "intermediate_size": 8960,
+  "layer_group_size": 7,
+  "layerwise_start_idx": 0,
+  "lora_alpha": 128,
+  "lora_bias": "none",
+  "lora_dropout": 0.05,
+  "lora_enable": false,
+  "lora_r": 64,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 28,
+  "model_type": "qwen2_vl",
+  "non_linearity": 1,
+  "norm_elementwise_affine": true,
+  "num_attention_heads": 12,
+  "num_hidden_layers": 28,
+  "num_key_value_heads": 2,
+  "patch_size": 1,
+  "repa_coeff": 0.1,
+  "repa_layers": "2",
+  "repa_shared": false,
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": {
+    "mrope_section": [
+      16,
+      24,
+      24
+    ],
+    "rope_type": "default",
+    "type": "default"
+  },
+  "rope_theta": 1000000.0,
+  "sample_size": 128,
+  "sampling_steps": 28,
+  "sliding_window": null,
+  "tie_word_embeddings": true,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.47.0",
+  "use_cache": true,
+  "use_repa": false,
+  "use_residual_attn": true,
+  "use_sliding_window": false,
+  "vae_path": "mit-han-lab/dc-ae-f32c32-in-1.0-diffusers",
+  "video_token_id": 151656,
+  "vision_config": {
+    "hidden_size": 1536,
+    "in_chans": 3,
+    "model_type": "qwen2_vl",
+    "spatial_patch_size": 14
+  },
+  "vision_end_token_id": 151653,
+  "vision_start_token_id": 151652,
+  "vision_token_id": 151654,
+  "vocab_size": 151936
+}

checkpoint-20000/generation_config.json ADDED Viewed

	@@ -0,0 +1,6 @@

+{
+  "_from_model_config": true,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "transformers_version": "4.47.0"
+}

checkpoint-20000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:68624365ec0341333330d8da4a7724ae5331bf5e447fd4186da3736d1d4ce838
+size 4411759432

checkpoint-20000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2e8e5d87624763bc232005bde21968d8b43e8fbb9bff2c95d47e207ceabdd509
+size 6332050591

checkpoint-20000/rng_state_0.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:091a066a8497bca04ac02c008c92b842286fd06b1d689d17f036c36d906f3a1d
+size 16389

checkpoint-20000/rng_state_1.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4ae95aac0102a46ef08b8460f940cfd69cb1891d84493d9cb77dee9f9a8f7076
+size 16389

checkpoint-20000/rng_state_2.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0ff002809b4b7760e8a734141510f12e3c88684ecaa5c94ec06a9424195f236
+size 16389

checkpoint-20000/rng_state_3.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7bb298fe8030ae0ec8b48aa5386603fe491a4d1f4fa9daac4214564f35e6d2f6
+size 16389

checkpoint-20000/rng_state_4.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:25806bd4ecf4dccd1d3394038ae3b548578eb3d84609740be67dfbb4097cf81e
+size 16389

checkpoint-20000/rng_state_5.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04a88b2bc0a760e8a9af73a15472580e7e004d8380b7360eb7aaa888d9a168bf
+size 16389

checkpoint-20000/rng_state_6.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:27c5451f352ce1d665dc562fbabd378d7bc35060eb1cd2a9c87a683147ba973a
+size 16389

checkpoint-20000/rng_state_7.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:e4f7c2d40bf3decc7c29649a7bbcbd72ab28a0048488cbb0678ff343879a50b6
+size 16389

checkpoint-20000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:316097d176c72b920fc8f57cc642dd3fcc80943e45ab12846b465890c925518c
+size 1465

checkpoint-20000/trainer_state.json ADDED Viewed

The diff for this file is too large to render. See raw diff

checkpoint-20000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f0c0f94e3977c9f10667c6558f8cde45a2d25ed9a32ba11183a3f9b1ffb8874d
+size 6481