// create_ctr_reader_op.cc
// Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/operators/reader/ctr_reader.h"

#include "paddle/fluid/operators/reader/lod_tensor_blocking_queue.h"
#include "paddle/fluid/operators/reader/reader_op_registry.h"

namespace paddle {
namespace operators {
namespace reader {

// Operator that constructs a CTRReader and stores it in the ReaderHolder
// variable named by the "Out" output.
class CreateCTRReaderOp : public framework::OperatorBase {
 public:
  using framework::OperatorBase::OperatorBase;

 private:
  // Builds the CTRReader the first time the op runs.
  //
  // scope:     scope in which the "Out" and "blocking_queue" variables are
  //            looked up by name.
  // dev_place: not used by this operator.
  //
  // Enforce failures are raised when either variable cannot be found in
  // `scope`.
  void RunImpl(const framework::Scope& scope,
               const platform::Place& dev_place) const override {
    const std::string& out_name = Output("Out");
    auto* out_var = scope.FindVar(out_name);
    // FindVar yields a null pointer for an unknown name; fail with a clear
    // message instead of dereferencing it.
    PADDLE_ENFORCE_NOT_NULL(
        out_var, "No ReaderHolder variable with name %s found", out_name);
    auto* out = out_var->template GetMutable<framework::ReaderHolder>();
    // A reader is already installed in the holder: nothing left to do.
    if (out->Get() != nullptr) return;

    const std::string& queue_name = Input("blocking_queue");
    auto* queue_holder_var = scope.FindVar(queue_name);
    PADDLE_ENFORCE_NOT_NULL(
        queue_holder_var,
        "No LoDTensorBlockingQueueHolder variable with name %s found",
        queue_name);
    auto* queue_holder =
        queue_holder_var->template GetMutable<LoDTensorBlockingQueueHolder>();

    // Bind the attributes by reference: they are only forwarded to the
    // CTRReader constructor, so local copies of the strings and vectors are
    // unnecessary.
    const int thread_num = Attr<int>("thread_num");
    const int batch_size = Attr<int>("batch_size");
    const auto& sparse_slots = Attr<std::vector<std::string>>("sparse_slots");
    const auto& dense_slots = Attr<std::vector<std::string>>("dense_slots");
    const auto& file_type = Attr<std::string>("file_type");
    const auto& file_format = Attr<std::string>("file_format");
    const auto& file_list = Attr<std::vector<std::string>>("file_list");

    out->Reset(std::make_shared<CTRReader>(
        queue_holder->GetQueue(), batch_size, thread_num, file_type,
        file_format, dense_slots, sparse_slots, file_list));
  }
};

class CreateCTRReaderOpMaker : public FileReaderMakerBase {
 protected:
  void Apply() override {
    AddInput("blocking_queue",
             "Name of the `LoDTensorBlockingQueueHolder` variable");
Q
Qiao Longfei 已提交
62 63
    AddAttr<int>("thread_num", "the thread num to read data");
    AddAttr<int>("batch_size", "the batch size of read data");
Q
Qiao Longfei 已提交
64 65
    AddAttr<std::string>("file_type", "plain or gzip").SetDefault("plain");
    AddAttr<std::string>("file_format", "svm or csv").SetDefault("csv");
Q
Qiao Longfei 已提交
66 67 68
    AddAttr<std::vector<std::string>>("file_list",
                                      "The list of files that need to read");
    AddAttr<std::vector<std::string>>(
Q
Qiao Longfei 已提交
69 70 71 72
        "dense_slots", "the sparse slots id that should be extract from file")
        .SetDefault({});
    AddAttr<std::vector<std::string>>(
        "sparse_slots", "the sparse slots id that should be extract from file");
Q
Qiao Longfei 已提交
73 74 75 76 77 78 79 80 81 82 83 84 85 86 87

    AddComment(R"DOC(
			Create CTRReader to support read ctr data with cpp.
      )DOC");
  }
};

}  // namespace reader
}  // namespace operators
}  // namespace paddle

// Short alias for the namespace that holds the operator classes defined
// above, so the registration below stays readable.
namespace reader = ::paddle::operators::reader;

// Registers the operator under the name `create_ctr_reader`, pairing the
// operator implementation with its maker class. The macro itself is not
// defined in this file (presumably it comes from reader_op_registry.h).
REGISTER_FILE_READER_OPERATOR(create_ctr_reader, reader::CreateCTRReaderOp,
                              reader::CreateCTRReaderOpMaker);