---
# Run configuration for a `finetune`-stage training job (see `stage` below).
# NOTE(review): the nesting here was reconstructed from a whitespace-collapsed
# copy of this file using key ordering; confirm `dataset` and `model` are the
# only nested sections expected by the consumer.

# Dataset selection and sampling.
dataset:
  align_stage_components:
    - download/llava-laion-cc-sbu-558k/chat.json
    - download/llava-laion-cc-sbu-558k
  dataset_id: llava-v15
  dataset_resampled: true
  dataset_root_dir: data
  # NOTE(review): the two entries below live under different roots
  # (/local/home vs /share/edc/home) — confirm both are reachable from
  # every training node.
  finetune_stage_components:
    - /local/home/weizhiwang/data/MAmmoTH-VL-Instruct-12M/mammoth_si_10M_simple.jsonl
    - /share/edc/home/weizhiwang/data/MAmmoTH-VL-Instruct-12M/single_image_data
  max_num_images: 6
  min_num_images: 1
  train_num_samples: 200000
  type: llava-v15
  workers: 4

# Model and optimisation settings. Hyperparameters are grouped by key prefix:
# `align_*`, `finetune_*`, and `pretrain_*`.
model:
  align_epochs: 1
  align_global_batch_size: 256
  align_learning_rate: 0.001
  align_lr_scheduler_type: linear-warmup+cosine-decay
  align_max_grad_norm: 1.0
  align_max_steps: null
  align_per_device_batch_size: 16
  align_train_strategy: fsdp-shard-grad-op
  align_warmup_ratio: 0.03
  align_weight_decay: 0.0
  arch_specifier: full-align+729-avgpool
  enable_gradient_checkpointing: true
  enable_mixed_precision_training: true
  finetune_epochs: 1
  finetune_global_batch_size: 128
  finetune_learning_rate: 2.0e-05
  finetune_lr_scheduler_type: linear-warmup+cosine-decay
  finetune_max_grad_norm: 1.0
  finetune_max_steps: null
  finetune_per_device_batch_size: 2
  finetune_train_strategy: fsdp-full-shard
  finetune_warmup_ratio: 0.03
  finetune_weight_decay: 0.1
  image_resize_strategy: resize-naive
  llm_backbone_id: qwen2.5-1.5b-instruct
  llm_max_length: 4096
  model_id: qwen2.5-1.5b-instruct-continue-training-ccs-datacomp-mlm-filter-mammoth-10m
  pretrain_epochs: 1
  pretrain_global_batch_size: 512
  pretrain_learning_rate: 5.0e-05
  pretrain_lr_scheduler_type: linear-warmup+cosine-decay
  pretrain_max_grad_norm: 1.0
  pretrain_max_steps: null
  pretrain_per_device_batch_size: 16
  pretrain_train_strategy: fsdp-full-shard
  pretrain_warmup_ratio: 0.03
  pretrain_weight_decay: 0.01
  reduce_in_full_precision: false
  # NOTE(review): `type` says 7b while `llm_backbone_id` is a 1.5b model —
  # presumably just a config-family label; verify against the consumer.
  type: one-stage+7b
  vision_backbone_id: siglip-vit-so400m-384px

# Run-level settings.
mount_path: Qwen
# NOTE(review): checkpoint is read from /local/home while `run_root_dir` is
# under /share/edc/home — confirm this split is intentional.
pretrained_checkpoint: /local/home/weizhiwang/checkpoints/obelics+qwen2.5-1.5b-instruct-continue-training-ccs-datacomp-mlm-filter+stage-pretrain+x7/checkpoints/latest-checkpoint.pt
run_id: qwen2.5-1.5b-instruct-continue-training-ccs-datacomp-mlm-filter-mammoth-10m+stage-finetune+x7
run_root_dir: /share/edc/home/weizhiwang/checkpoints
seed: 7
stage: finetune
trackers:
  - jsonl
wandb_entity: null
wandb_project: mmpretrain