pritamqu's picture
Upload folder using huggingface_hub
11aa5e5 verified
raw
history blame
1.68 kB
{
"data_path": "/h/pritam/pritam_ssd004/OUTPUTS/Video-LLM/Phase2/GenData/video_chat2_mistral/tp_random-random_erase-stage2/diverse_10.json",
"media_root": "",
"num_frames": 16,
"yes_count": 500,
"no_count": 750,
"num_workers": 6,
"batch_size": 2,
"gradient_accumulation_steps": 4,
"trainable_modules": [],
"subset_size": -1,
"init_lora_zero": false,
"model_name_or_path": "/h/pritam/pritam_ssd004/.cache/huggingface/hub/VideoChat2_stage3_Mistral_7B",
"model": {
"lora_r": 128,
"lora_alpha": 256,
"lora_dropout": 0.05,
"lora_bias": "none"
},
"loss_alpha": 0.01,
"loss_beta": 0.9,
"loss_fn": "phrase_dpo_tkld",
"optimizer": {
"opt": "adamW",
"lr": 2e-05,
"opt_betas": [
0.9,
0.999
],
"weight_decay": 0.02,
"max_grad_norm": -1,
"different_lr": {
"enable": false,
"module_names": [],
"lr": 0.001
}
},
"scheduler": {
"sched": "cosine",
"epochs": 1,
"min_lr_multi": 0.01,
"warmup_epochs": 0.0
},
"fp16": true,
"gradient_checkpointing": true,
"wandb": {
"enable": true,
"entity": "pritamqu",
"project": "ViSA-VideoChat2"
},
"dist_url": "env://",
"device": "cuda",
"output_dir": "/h/pritam/pritam_ssd004/OUTPUTS/Video-LLM/Phase2/ViSA/videochat2_mistral_7b/202503070207031433_phrase_dpo_tkld_2e-5_0.01_0.9_500_750_1_diverse_10_tp_random-random_erase_lora_128_256_cosine_lr_gradfix_dynamic",
"resume": false,
"debug": false,
"log_freq": 1,
"seed": 42,
"save_latest": true,
"auto_resume": true,
"pretrained_path": "",
"rank": 0,
"world_size": 4,
"gpu": 0,
"distributed": true,
"dist_backend": "nccl"
}