meg HF staff committed on
Commit
b3e0a2b
·
verified ·
1 Parent(s): 9826ac5

Upload train.sh with huggingface_hub

Browse files
Files changed (1) hide show
  1. train.sh +5 -0
train.sh ADDED
@@ -0,0 +1,5 @@
 
 
 
 
 
 
#!/bin/bash
#
# Launch train.py under torchrun.
#
# Usage: train.sh NUM_PROC [train.py arguments...]
#   NUM_PROC  value handed to torchrun's --nproc_per_node option
#   ...       every remaining argument is forwarded unchanged to train.py
#
# Exits with status 2 (and a usage message on stderr) when NUM_PROC is
# missing or empty; otherwise the exit status is torchrun's.
set -euo pipefail

# Fail early with a clear message instead of starting torchrun with an empty
# --nproc_per_node= value. The value itself is not validated here; torchrun
# decides what it accepts.
if [[ $# -lt 1 || -z "$1" ]]; then
  printf 'Usage: %s NUM_PROC [train.py args...]\n' "${0##*/}" >&2
  exit 2
fi

NUM_PROC=$1
shift

# the localhost fixes are from https://github.com/pytorch/pytorch/issues/73320
# exec replaces this wrapper shell with torchrun, so signals sent to the
# script's PID and torchrun's exit status are not filtered through bash.
exec torchrun --rdzv_backend c10d --rdzv_endpoint localhost:0 \
  --nproc_per_node="$NUM_PROC" train.py "$@"