opt reward model

65604ada · u010280923 · 887ca941 · 65604ada
隐藏空白更改
内联并排

Showing 1 changed file with 2 additions and 2 deletions

src/trainer.py src/trainer.py +2 -2

未找到文件。
--- a/src/trainer.py
+++ b/src/trainer.py
@@ -248,7 +248,7 @@ class rm_train_callback(pl.Callback):
                    to_save_dict = pl_module.state_dict()
                    my_save(
                        to_save_dict,
-                        f"{args.proj_dir}/rwkv-final.pth",
+                        f"{args.proj_dir}/rm-final.pth",
                    )
@@ -276,7 +276,7 @@ class rm_train_callback(pl.Callback):
                try:
                    my_save(
                        to_save_dict,
-                        f"{args.proj_dir}/rwkv-{args.epoch_begin + trainer.current_epoch}.pth",
+                        f"{args.proj_dir}/rm-{args.epoch_begin + trainer.current_epoch}.pth",
                    )
                except Exception as e:
                    print('Error\n\n', e, '\n\n')