{ "data_path": "/h/pritam/pritam_ssd004/OUTPUTS/Video-LLM/Phase2/GenData/video_chat2_mistral/tp_random-random_erase-stage2/diverse_10.json", "media_root": "", "num_frames": 16, "yes_count": 500, "no_count": 750, "num_workers": 6, "batch_size": 2, "gradient_accumulation_steps": 4, "trainable_modules": [], "subset_size": -1, "init_lora_zero": false, "model_name_or_path": "/h/pritam/pritam_ssd004/.cache/huggingface/hub/VideoChat2_stage3_Mistral_7B", "model": { "lora_r": 128, "lora_alpha": 256, "lora_dropout": 0.05, "lora_bias": "none" }, "loss_alpha": 0.01, "loss_beta": 0.9, "loss_fn": "phrase_dpo_tkld", "optimizer": { "opt": "adamW", "lr": 2e-05, "opt_betas": [ 0.9, 0.999 ], "weight_decay": 0.02, "max_grad_norm": -1, "different_lr": { "enable": false, "module_names": [], "lr": 0.001 } }, "scheduler": { "sched": "cosine", "epochs": 1, "min_lr_multi": 0.01, "warmup_epochs": 0.0 }, "fp16": true, "gradient_checkpointing": true, "wandb": { "enable": true, "entity": "pritamqu", "project": "ViSA-VideoChat2" }, "dist_url": "env://", "device": "cuda", "output_dir": "/h/pritam/pritam_ssd004/OUTPUTS/Video-LLM/Phase2/ViSA/videochat2_mistral_7b/202503070207031433_phrase_dpo_tkld_2e-5_0.01_0.9_500_750_1_diverse_10_tp_random-random_erase_lora_128_256_cosine_lr_gradfix_dynamic", "resume": false, "debug": false, "log_freq": 1, "seed": 42, "save_latest": true, "auto_resume": true, "pretrained_path": "", "rank": 0, "world_size": 4, "gpu": 0, "distributed": true, "dist_backend": "nccl" }