# Launch configuration: single machine, 8 processes, DeepSpeed, fp16.
# NOTE(review): the key set matches a Hugging Face Accelerate config file;
# confirm against the tool that actually consumes this file.
compute_environment: LOCAL_MACHINE
deepspeed_config:
  # NOTE(review): nesting restored on the assumption that every key between
  # `deepspeed_config` and `distributed_type` belongs to this section.
  deepspeed_multinode_launcher: standard
  gradient_accumulation_steps: 1
  gradient_clipping: 1.5
  offload_optimizer_device: none
  offload_param_device: none
  # Was `true`, which contradicts `zero_stage: 2` below; the name indicates a
  # ZeRO stage 3 option, so it is disabled to keep the section self-consistent.
  zero3_init_flag: false
  zero_stage: 2
  # NOTE(review): the two keys below look like DeepSpeed ZeRO communication
  # options; verify the launcher reads them from this section rather than
  # from a separate DeepSpeed JSON config.
  reduce_scatter: false
  overlap_comm: true
distributed_type: DEEPSPEED
downcast_bf16: 'no'
dynamo_backend: 'NO'
fsdp_config: {}
machine_rank: 0
# NOTE(review): hard-coded address/port; with `num_machines: 1` this host is
# presumably the only participant - confirm before reusing on another machine.
main_process_ip: 10.82.42.75
main_process_port: 22280
main_training_function: main
megatron_lm_config: {}
mixed_precision: fp16
num_machines: 1
num_processes: 8
rdzv_backend: static
same_network: true
use_cpu: false