f"{detected_str} but ignoring it because one or several of --include/--exclude/--num_gpus/--num_nodes cl args were used. If you want to use CUDA_VISIBLE_DEVICES don't pass any of these arguments to deepspeed."
)
...
...
@@ -416,20 +412,17 @@ def main(args=None):
ifnotmulti_node_execandargs.num_nodes>1:
raiseValueError("Num nodes is >1 but no extra nodes available via hostfile")
f"Using hostfile at {args.hostfile} but host={first_host} was not reachable via ssh. If you are running with a single node please remove {args.hostfile} or setup passwordless ssh."