提交 11d0faa2 编写于 作者: C chenguowei01

update train.py

上级 10ee66c7
@@ -197,7 +197,7 @@ def train(model,
avg_loss += loss.numpy()[0] avg_loss += loss.numpy()[0]
lr = optimizer.current_step_lr() lr = optimizer.current_step_lr()
num_steps += 1 num_steps += 1
if num_steps % log_steps == 0: if num_steps % log_steps == 0 and ParallelEnv().local_rank == 0:
avg_loss /= log_steps avg_loss /= log_steps
time_step = timer.elapsed_time() / log_steps time_step = timer.elapsed_time() / log_steps
remain_steps = total_steps - num_steps remain_steps = total_steps - num_steps
@@ -206,14 +206,14 @@ def train(model,
.format(epoch + 1, num_epochs, step + 1, steps_per_epoch, .format(epoch + 1, num_epochs, step + 1, steps_per_epoch,
avg_loss, lr, time_step, avg_loss, lr, time_step,
calculate_eta(remain_steps, time_step))) calculate_eta(remain_steps, time_step)))
avg_loss = 0.0
timer.restart()
if use_vdl: if use_vdl:
log_writer.add_scalar('Train/loss', avg_loss, num_steps) log_writer.add_scalar('Train/loss', avg_loss, num_steps)
log_writer.add_scalar('Train/lr', lr, num_steps) log_writer.add_scalar('Train/lr', lr, num_steps)
avg_loss = 0.0
timer.restart()
if ((epoch + 1) % save_interval_epochs == 0 if ((epoch + 1) % save_interval_epochs == 0
or epoch == num_epochs - 1) and ParallelEnv().local_rank == 0: or epoch + 1 == num_epochs) and ParallelEnv().local_rank == 0:
current_save_dir = os.path.join(save_dir, current_save_dir = os.path.join(save_dir,
"epoch_{}".format(epoch + 1)) "epoch_{}".format(epoch + 1))
if not os.path.isdir(current_save_dir): if not os.path.isdir(current_save_dir):
@@ -235,10 +235,12 @@ def train(model,
epoch_id=epoch + 1) epoch_id=epoch + 1)
if use_vdl: if use_vdl:
log_writer.add_scalar('Evaluate/mean_iou', mean_iou, log_writer.add_scalar('Evaluate/mean_iou', mean_iou,
num_steps) epoch + 1)
log_writer.add_scalar('Evaluate/mean_acc', mean_acc, log_writer.add_scalar('Evaluate/mean_acc', mean_acc,
num_steps) epoch + 1)
model.train() model.train()
if use_vdl:
log_writer.close()
def main(args): def main(args):
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册