Exit the process with the subprocess's return code when utilizing the CLI

Former-commit-id: f6b62f00707baf582bc168c15886732ac5218524
This commit is contained in:
faddddeout 2024-06-27 09:58:00 +00:00
parent 58607ec1b0
commit 9a2e77a5d8

View File

@@ -91,7 +91,7 @@ def main():
master_addr = os.environ.get("MASTER_ADDR", "127.0.0.1")
master_port = os.environ.get("MASTER_PORT", str(random.randint(20001, 29999)))
logger.info("Initializing distributed tasks at: {}:{}".format(master_addr, master_port))
-subprocess.run(
+subproc = subprocess.run(
(
"torchrun --nnodes {nnodes} --node_rank {node_rank} --nproc_per_node {nproc_per_node} "
"--master_addr {master_addr} --master_port {master_port} {file_name} {args}"
@@ -106,6 +106,7 @@ def main():
),
shell=True,
)
+sys.exit(subproc.returncode)
else:
run_exp()
elif command == Command.WEBDEMO: