diff --git a/tools/benchmark/run_multi_nodes.sh b/tools/benchmark/run_multi_nodes.sh
new file mode 100755
index 0000000000000000000000000000000000000000..4a111999843a3ac64e11ba88cef20e768ad8653a
--- /dev/null
+++ b/tools/benchmark/run_multi_nodes.sh
@@ -0,0 +1,25 @@
+#!/usr/bin/env bash
+#
+# Runs tools/train.py with the ResNet50 config on several nodes through
+# paddle.distributed.launch, passing --gpus="0,1,2,3".
+#
+# tools/train.py and ./configs are relative paths, so start this script from
+# the directory that contains both.
+#
+# ALL_NODE_IPS and CUR_NODE_IPS may be overridden from the environment; the
+# values below are only defaults.
+
+set -euo pipefail
+
+# IP addresses of all nodes (comma-separated); change to match your environment.
+ALL_NODE_IPS="${ALL_NODE_IPS:-10.10.10.1,10.10.10.2}"
+# IP address of the current node; change to match your environment.
+CUR_NODE_IPS="${CUR_NODE_IPS:-10.10.10.1}"
+
+python -m paddle.distributed.launch \
+    --cluster_node_ips="${ALL_NODE_IPS}" \
+    --node_ip="${CUR_NODE_IPS}" \
+    --gpus="0,1,2,3" \
+    tools/train.py \
+    -c ./configs/ResNet/ResNet50.yaml \
+    -o print_interval=10
diff --git a/tools/benchmark/run_single_node.sh b/tools/benchmark/run_single_node.sh
new file mode 100755
index 0000000000000000000000000000000000000000..5ec44455700d821951da9ff5e51d50fd8e621b1d
--- /dev/null
+++ b/tools/benchmark/run_single_node.sh
@@ -0,0 +1,15 @@
+#!/usr/bin/env bash
+#
+# Runs tools/train.py with the ResNet50 config on a single node through
+# paddle.distributed.launch, passing --gpus="0,1,2,3".
+#
+# tools/train.py and ./configs are relative paths, so start this script from
+# the directory that contains both.
+
+set -euo pipefail
+
+python -m paddle.distributed.launch \
+    --gpus="0,1,2,3" \
+    tools/train.py \
+    -c ./configs/ResNet/ResNet50.yaml \
+    -o print_interval=10