未验证 提交 441d24d3 编写于 作者: S ShawnXuan 提交者: GitHub

Merge pull request #132 from Oneflow-Inc/args_ctrl_port

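Args ctrl port: add a `--ctrl_port` command-line argument (type int, default 50051) to the argument parsers, and have `InitNodes` call `flow.env.ctrl_port(args.ctrl_port)` instead of using the hard-coded port 12138.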
...@@ -52,6 +52,7 @@ def get_parser(parser=None): ...@@ -52,6 +52,7 @@ def get_parser(parser=None):
help='node/machine number for training') help='node/machine number for training')
parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'], parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'],
help='nodes ip list for training, devided by ",", length >= num_nodes') help='nodes ip list for training, devided by ",", length >= num_nodes')
parser.add_argument("--ctrl_port", type=int, default=50051, help='ctrl_port for multinode job')
parser.add_argument("--model", type=str, default="resnet50", parser.add_argument("--model", type=str, default="resnet50",
help="resnet50") help="resnet50")
......
...@@ -25,7 +25,7 @@ import oneflow as flow ...@@ -25,7 +25,7 @@ import oneflow as flow
def InitNodes(args): def InitNodes(args):
if args.num_nodes > 1: if args.num_nodes > 1:
assert args.num_nodes <= len(args.node_ips) assert args.num_nodes <= len(args.node_ips)
flow.env.ctrl_port(12138) flow.env.ctrl_port(args.ctrl_port)
nodes = [] nodes = []
for ip in args.node_ips[:args.num_nodes]: for ip in args.node_ips[:args.num_nodes]:
addr_dict = {} addr_dict = {}
......
...@@ -50,6 +50,7 @@ parser.add_argument('--num_nodes', type=int, default=1, ...@@ -50,6 +50,7 @@ parser.add_argument('--num_nodes', type=int, default=1,
help='node/machine number for training') help='node/machine number for training')
parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'], parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'],
help='nodes ip list for training, devided by ",", length >= num_nodes') help='nodes ip list for training, devided by ",", length >= num_nodes')
parser.add_argument("--ctrl_port", type=int, default=50051, help='ctrl_port for multinode job')
parser.add_argument('--hidden_units_num', type=int, default=7) parser.add_argument('--hidden_units_num', type=int, default=7)
parser.add_argument('--hidden_size', type=int, default=1024) parser.add_argument('--hidden_size', type=int, default=1024)
...@@ -189,7 +190,7 @@ def eval_job(): ...@@ -189,7 +190,7 @@ def eval_job():
def InitNodes(args): def InitNodes(args):
if args.num_nodes > 1: if args.num_nodes > 1:
assert args.num_nodes <= len(args.node_ips) assert args.num_nodes <= len(args.node_ips)
flow.env.ctrl_port(12138) flow.env.ctrl_port(args.ctrl_port)
nodes = [] nodes = []
for ip in args.node_ips[:args.num_nodes]: for ip in args.node_ips[:args.num_nodes]:
addr_dict = {} addr_dict = {}
......
...@@ -48,6 +48,7 @@ def get_parser(parser=None): ...@@ -48,6 +48,7 @@ def get_parser(parser=None):
help='node/machine number for training') help='node/machine number for training')
parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'], parser.add_argument('--node_ips', type=str_list, default=['192.168.1.13', '192.168.1.14'],
help='nodes ip list for training, devided by ",", length >= num_nodes') help='nodes ip list for training, devided by ",", length >= num_nodes')
parser.add_argument("--ctrl_port", type=int, default=50051, help='ctrl_port for multinode job')
# train # train
parser.add_argument("--learning_rate", type=float, default=1e-4, help="Learning rate") parser.add_argument("--learning_rate", type=float, default=1e-4, help="Learning rate")
......
...@@ -26,7 +26,7 @@ import oneflow as flow ...@@ -26,7 +26,7 @@ import oneflow as flow
def InitNodes(args): def InitNodes(args):
if args.num_nodes > 1: if args.num_nodes > 1:
assert args.num_nodes <= len(args.node_ips) assert args.num_nodes <= len(args.node_ips)
#flow.env.ctrl_port(12138) flow.env.ctrl_port(args.ctrl_port)
nodes = [] nodes = []
for ip in args.node_ips[:args.num_nodes]: for ip in args.node_ips[:args.num_nodes]:
addr_dict = {} addr_dict = {}
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册