# Launch topology and CPU threading.
# NOTE(review): key names look like Hugging Face Accelerate launch options;
# confirm which tool actually reads this file.
num_processes = 1
num_machines = 1
num_cpu_threads_per_process = 2

# Dynamo settings. "no" is deliberately left as a string rather than a TOML
# boolean; presumably the consumer treats it as a backend name, so verify
# before changing it.
dynamo_backend = "no"
dynamo_mode = "default"

mixed_precision = "bf16"