twitter-algorithm-ml/projects/twhin/scripts/run_in_docker.sh
2023-03-31 10:31:35 -05:00

10 lines
327 B
Bash

#! /bin/sh
torchrun \
--standalone \
--nnodes 1 \
--nproc_per_node $(echo $MACHINES_CONFIG | jq .chief.num_accelerators) \
/usr/src/app/tml/projects/twhin/run.py \
--config_yaml_path="/usr/src/app/tml/projects/twhin/config/local.yaml" \
--save_dir="gs://scratch-user.$USER.dp.gcp.twttr.net/twhin-training/$RANDOM"