Gaie
/

TI2T_13B_RM_2392

Model card · Files and versions · Community

TI2T_13B_RM_2392/wandb/run-20241023_195332-5p9x2ymn/files/config.yaml

Gaie's picture

Add files using upload-large-folder tool

f7308d8 verified 2 months ago

2.53 kB

	# Run metadata section stored next to the user-supplied configuration.
	# The nesting here is rebuilt from the key/sequence order of a flattened
	# listing in which every key sat at the same level — TODO confirm against
	# the raw file in the run directory.
	_wandb:
	  value:
	    # Version-like scalars are quoted so they can never be retyped as numbers.
	    cli_version: "0.18.5"
	    m: []
	    python_version: "3.11.10"
	    # Table keyed by quoted integers. The meaning of each key and code is not
	    # stated in this file — presumably client telemetry; verify against the
	    # wandb client before relying on any entry.
	    t:
	      "1":
	        - 1
	        - 11
	        - 41
	        - 49
	        - 51
	        - 55
	        - 71
	        - 83
	        - 98
	        - 105
	      "2":
	        - 1
	        - 11
	        - 41
	        - 49
	        - 51
	        - 55
	        - 71
	        - 83
	        - 98
	        - 105
	      "3":
	        - 2
	        - 13
	        - 16
	        - 23
	        - 55
	        - 61
	      "4": "3.11.10"
	      "5": "0.18.5"
	      "6": "4.46.0.dev0"
	      "8":
	        - 5
	      "12": "0.18.5"
	      "13": linux-x86_64
	# Dataset settings: one group of eval_* keys and one matching group of
	# train_* keys (data files, dataset path, name, optional args, size, split,
	# subset, template). Entries set to null carry no value in this run.
	data_cfgs:
	  value:
	    eval_data_files: null
	    eval_datasets: /home/align-anything/datasets/40k_ti2t_filtered
	    eval_name: null
	    eval_optional_args: []
	    eval_size: null
	    eval_split: train
	    eval_subset: null
	    eval_template: AA_TI2T
	    train_data_files: null
	    train_datasets: /data/align-anything/jiayi/ti2t/refine_gen_wo_res/1021_13b_2000
	    train_name: null
	    train_optional_args: []
	    train_size: null
	    train_split: train
	    train_subset: null
	    train_template: AA_TI2T_Critique
	# Logging and output settings: logger type, project and run name, output
	# directory, and the save interval.
	logger_cfgs:
	  value:
	    cache_dir: null
	    log_project: align-anything
	    log_run_name: rm
	    log_type: wandb
	    output_dir: /data/align-anything/jiayi/ti2t/rm_10_22_ours_13b_2000
	    # Unit is not stated in this file — presumably optimizer steps; TODO confirm.
	    save_interval: 598
	# Model settings: checkpoint path, maximum length, and the remote-code flag.
	model_cfgs:
	  value:
	    model_max_length: 2048
	    model_name_or_path: /data/models/llava/llava-1.5-13b-hf
	    trust_remote_code: true
	# No special tokens are recorded for this run (explicit null).
	special_tokens:
	  value: null
	# Training hyperparameters recorded for the run: optimizer betas, precision
	# flags, epoch/eval schedule, freeze flags, batch sizes, learning-rate
	# schedule, regularization, seed, and weight decay.
	train_cfgs:
	  value:
	    adam_betas:
	      - 0.9
	      - 0.95
	    bf16: true
	    ds_cfgs: ds_z3_config.json
	    epochs: 5
	    eval_interval: 10
	    eval_strategy: epoch
	    fp16: false
	    freeze_language_model: false
	    freeze_mm_proj: false
	    freeze_vision_tower: true
	    gradient_accumulation_steps: 1
	    gradient_checkpointing: true
	    # Written with a decimal point in the mantissa: a bare `3e-05` matches
	    # only the YAML 1.2 float pattern, so YAML 1.1 loaders (PyYAML among
	    # them) would hand back the string "3e-05" instead of a number.
	    learning_rate: 3.0e-05
	    lr_scheduler_type: constant_with_warmup
	    lr_warmup_ratio: 0.03
	    per_device_eval_batch_size: 4
	    per_device_train_batch_size: 4
	    regularization: 0.001
	    seed: 42
	    weight_decay: 0