scanner.cc 1.4 KB
Newer Older
Y
Yu Yang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30
//   Copyright (c) 2018 PaddlePaddle Authors. All Rights Reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License");
// you may not use this file except in compliance with the License.
// You may obtain a copy of the License at
//
//     http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software
// distributed under the License is distributed on an "AS IS" BASIS,
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
// See the License for the specific language governing permissions and
// limitations under the License.

#include "paddle/fluid/recordio/scanner.h"
#include "paddle/fluid/platform/enforce.h"

namespace paddle {
namespace recordio {
// Builds a scanner over a caller-supplied input stream and takes ownership of
// it. The stream must be non-null: Reset() dereferences it right away, so a
// null pointer is rejected here with an explicit error instead of being
// dereferenced.
Scanner::Scanner(std::unique_ptr<std::istream> &&stream)
    : stream_(std::move(stream)) {
  PADDLE_ENFORCE(stream_ != nullptr,
                 "Scanner requires a non-null input stream");
  // Rewind and load the first chunk so the scanner is immediately usable.
  Reset();
}

// Builds a scanner that reads from the file at `filename`.
//
// The file is opened in binary mode so that no platform newline translation
// is applied to the bytes handed to the chunk parser. An open failure is
// reported immediately: Reset() clears the stream's error flags, which would
// otherwise hide the failure and leave a scanner that merely looks empty.
Scanner::Scanner(const std::string &filename) {
  stream_.reset(new std::ifstream(filename, std::ios::in | std::ios::binary));
  PADDLE_ENFORCE(!stream_->fail(), "Cannot open file %s", filename.c_str());
  // Rewind and load the first chunk so the scanner is immediately usable.
  Reset();
}

void Scanner::Reset() {
F
fengjiayi 已提交
31
  stream_->clear();
Y
Yu Yang 已提交
32 33 34 35
  stream_->seekg(0, std::ios::beg);
  ParseNextChunk();
}

Y
Yu Yang 已提交
36
std::string Scanner::Next() {
Y
Yu Yang 已提交
37
  PADDLE_ENFORCE(!eof_, "StopIteration");
Y
Yu Yang 已提交
38
  auto rec = cur_chunk_.Record(offset_++);
Y
Yu Yang 已提交
39 40 41 42 43 44 45 46 47 48 49 50 51 52
  if (offset_ == cur_chunk_.NumRecords()) {
    ParseNextChunk();
  }
  return rec;
}

// Parses the next chunk from the stream into cur_chunk_ and resets the
// in-chunk record cursor. The end-of-input flag is set exactly when
// cur_chunk_.Parse() reports failure.
void Scanner::ParseNextChunk() {
  const bool parsed = cur_chunk_.Parse(*stream_);
  eof_ = !parsed;
  offset_ = 0;
}

// Reports whether Next() may be called, i.e. the end-of-input flag is not set.
bool Scanner::HasNext() const {
  const bool exhausted = eof_;
  return !exhausted;
}
}  // namespace recordio
}  // namespace paddle