From c012172f02dd2513b754137e20c328091b220c02 Mon Sep 17 00:00:00 2001 From: malin10 Date: Wed, 23 Sep 2020 14:30:46 +0800 Subject: [PATCH] test=develop, bug fix --- models/recall/word2vec/README.md | 9 ++++++--- models/recall/youtube_dnn/README.md | 4 ++-- 2 files changed, 8 insertions(+), 5 deletions(-) diff --git a/models/recall/word2vec/README.md b/models/recall/word2vec/README.md index 7f6ed752..88edf362 100644 --- a/models/recall/word2vec/README.md +++ b/models/recall/word2vec/README.md @@ -222,15 +222,18 @@ Infer phase2 of epoch 3 done, use time: 4.43099021912, global metrics: acc=[1.] ## 论文复现 1. 用原论文的完整数据复现论文效果需要在config.yaml修改超参: +``` - name: dataset_train batch_size: 100 # 1. 修改batch_size为100 type: DataLoader data_path: "{workspace}/data/all_train" # 2. 修改数据为全量训练数据 - word_count_dict_path: "{workspace}/data/all_dict/ word_count_dict.txt" # 3. 修改词表为全量词表 + word_count_dict_path: "{workspace}/data/all_dict/word_count_dict.txt" # 3. 修改词表为全量词表 data_converter: "{workspace}/w2v_reader.py" +- name: dataset_infer + data_path: "{workspace}/data/all_test" # 4. 修改数据为全量测试数据 + word_id_dict_path: "{workspace}/data/all_dict/word_id_dict.txt" # 5. 修改词表为全量词表 -- name: single_cpu_train - - epochs: # 4. 修改config.yaml中runner的epochs为5。 +``` 修改后运行方案:修改config.yaml中的'workspace'为config.yaml的目录位置,执行 ``` diff --git a/models/recall/youtube_dnn/README.md b/models/recall/youtube_dnn/README.md index d7ae92e2..7f44937f 100644 --- a/models/recall/youtube_dnn/README.md +++ b/models/recall/youtube_dnn/README.md @@ -8,7 +8,7 @@ ├── data.txt ├── test ├── data.txt -├── generate_ramdom_data # 随机训练数据生成文件 +├── generate_ramdom_data.py # 随机训练数据生成文件 ├── __init__.py ├── README.md # 文档 ├── model.py #模型文件 @@ -107,7 +107,7 @@ python infer.py --use_gpu 1 --test_epoch 19 --inference_model_dir ./inference_yo ``` ### 运行 ``` -python -m paddlerec.run -m paddlerec.models.recall.w2v +python -m paddlerec.run -m paddlerec.models.recall.youtube_dnn ``` ### 结果展示 -- GitLab