Commit 7645c660 (unverified), authored by Da Zheng, committed by GitHub
Browse files

fix launch. (#1822)


Co-authored-by: Ubuntu <ubuntu@ip-172-31-19-1.us-west-2.compute.internal>
parent 20734637
......@@ -64,9 +64,8 @@ def submit_jobs(args, udf_command):
torch_cmd = torch_cmd + ' ' + '--master_addr=' + str(hosts[0][0])
torch_cmd = torch_cmd + ' ' + '--master_port=' + str(1234)
for i in range(args.num_client):
node_id = int(i / client_count_per_machine)
ip, _ = hosts[node_id]
for node_id, host in enumerate(hosts):
ip, _ = host
new_torch_cmd = torch_cmd.replace('node_rank=0', 'node_rank='+str(node_id))
new_udf_command = udf_command.replace('python3', 'python3 ' + new_torch_cmd)
cmd = client_cmd + ' ' + new_udf_command
......
Markdown is supported
0% Try again or attach a new file.
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment