diff --git a/ppcls/configs/PULC/safety_helmet/PPLCNet_x1_0_distillation.yaml b/ppcls/configs/PULC/safety_helmet/PPLCNet_x1_0_distillation.yaml index fc1073d9b24584569a6dc14c4a5760436aa7497d..0fce89bc094b7c2311d0fae69b360ede0710cf21 100644 --- a/ppcls/configs/PULC/safety_helmet/PPLCNet_x1_0_distillation.yaml +++ b/ppcls/configs/PULC/safety_helmet/PPLCNet_x1_0_distillation.yaml @@ -26,27 +26,42 @@ Arch: pretrained_list: # if not null, its lengths should be same as models freeze_params_list: - - True + - False - False use_sync_bn: True models: - Teacher: - name: ResNet101_vd + name: PPLCNet_x1_0 class_num: *class_num - pretrained: pretrained/teacher_ResNet101_vd_0/ResNet101_vd/best_model + pretrained: True + use_ssld: True + return_stages: True + return_patterns: ["blocks3", "blocks4", "blocks5", "blocks6"] - Student: name: PPLCNet_x1_0 class_num: *class_num pretrained: True use_ssld: True + return_stages: True + return_patterns: ["blocks3", "blocks4", "blocks5", "blocks6"] infer_model_name: "Student" # loss function config for traing/eval process Loss: Train: + - DistillationGTCELoss: + weight: 1.0 + key: logits + model_names: ["Student", "Teacher"] - DistillationDMLLoss: weight: 1.0 + key: logits + model_name_pairs: + - ["Student", "Teacher"] + - DistillationDistanceLoss: + weight: 1.0 + key: "blocks4" model_name_pairs: - ["Student", "Teacher"] Eval: diff --git a/ppcls/configs/PULC/safety_helmet/search.yaml b/ppcls/configs/PULC/safety_helmet/search.yaml index f1787641efe3f8c7ec0994bbb0879e1bd463a26b..09bf2e9e5cdfe0008a2c0010a29d6a33a8d879a1 100644 --- a/ppcls/configs/PULC/safety_helmet/search.yaml +++ b/ppcls/configs/PULC/safety_helmet/search.yaml @@ -30,11 +30,7 @@ search_dict: - [0.0, 0.4, 0.4, 0.8, 0.8, 1.0] - [1.0, 1.0, 1.0, 1.0, 1.0, 1.0] teacher: - rm_keys: - - Arch.lr_mult_list - search_values: - - ResNet101_vd - - ResNet50_vd + algorithm: "udml" final_replace: Arch.lr_mult_list: Arch.models.1.Student.lr_mult_list