---
# Launch settings: one local machine, one process, fp16 mixed precision.
# NOTE(review): the key set looks like a Hugging Face Accelerate config —
# confirm against the consuming tool before renaming or removing any key.
# Each setting sits on its own line; several `key: value` pairs on a single
# line do not parse as a YAML block mapping.

compute_environment: LOCAL_MACHINE
deepspeed_config: {}  # explicit empty mapping (not null)

# NOTE(review): MULTI_GPU is paired with `num_processes: 1` below — confirm
# that this combination is intended.
distributed_type: MULTI_GPU

# "no" / "yes" are quoted, so they load as strings rather than booleans.
downcast_bfloat16: "no"
fp16: "yes"

machine_rank: 0
main_process_ip: "127.0.0.1"
main_process_port: 29500
main_training_function: main

# Unquoted, so this loads as a float.
# NOTE(review): quote it if the consumer expects a version string.
meets_minimum_cuda_version: 11.7

# NOTE(review): presumably the same setting as `fp16` above — verify which
# of the two keys the consumer actually reads.
mixed_precision: fp16

num_machines: 1
num_processes: 1
use_cpu: false