/*******************************************************************************
 * Copyright 上海赜睿信息科技有限公司(Zilliz) - All Rights Reserved
 * Unauthorized copying of this file, via any medium is strictly prohibited.
 * Proprietary and confidential.
 ******************************************************************************/
#include "FaissExecutionEngine.h"

// NOTE(review): the angle-bracket include targets and the template arguments in
// this file were missing from the text under review. They are restored here from
// the symbols the code uses (LOG, faiss::index_factory, IndexIDMap::id_map,
// IndexFlat::xb, write_index, read_index, GetIndexBuilder, CpuCacheMgr).
// Confirm against the build before merging.
#include <easylogging++.h>
#include <faiss/AutoTune.h>
#include <faiss/MetaIndexes.h>
#include <faiss/IndexFlat.h>
#include <faiss/index_io.h>
#include <wrapper/Index.h>
#include <wrapper/IndexBuilder.h>
#include <cache/CpuCacheMgr.h>

#include "metrics/Metrics.h"

namespace zilliz {
namespace vecwise {
namespace engine {

// Creates an engine around a fresh index produced by faiss::index_factory for
// the given dimension and raw_index_type description.
//
// dimension         vector dimensionality handed to the factory
// location          path used by Serialize()/Load() and as the cache key
// build_index_type  index type requested from the builder in BuildIndex()
// raw_index_type    factory description string for the raw index
FaissExecutionEngine::FaissExecutionEngine(uint16_t dimension,
                                           const std::string& location,
                                           const std::string& build_index_type,
                                           const std::string& raw_index_type)
    : pIndex_(faiss::index_factory(dimension, raw_index_type.c_str())),
      location_(location),
      build_index_type_(build_index_type),
      raw_index_type_(raw_index_type) {
}

// Creates an engine around an already existing index; the remaining arguments
// are stored unchanged.
// NOTE(review): element type of the shared_ptr restored as faiss::Index - confirm.
FaissExecutionEngine::FaissExecutionEngine(std::shared_ptr<faiss::Index> index,
                                           const std::string& location,
                                           const std::string& build_index_type,
                                           const std::string& raw_index_type)
    : pIndex_(index),
      location_(location),
      build_index_type_(build_index_type),
      raw_index_type_(raw_index_type) {
}

// Forwards n vectors (xdata) with their ids (xids) to the wrapped index.
// Always returns Status::OK().
Status FaissExecutionEngine::AddWithIds(long n, const float *xdata, const long *xids) {
    pIndex_->add_with_ids(n, xdata, xids);
    return Status::OK();
}

// Number of vectors reported by the wrapped index (its ntotal).
size_t FaissExecutionEngine::Count() const {
    return static_cast<size_t>(pIndex_->ntotal);
}

// Count() * dimension * sizeof(float), i.e. the byte size of the stored vectors
// when each component is a float.
size_t FaissExecutionEngine::Size() const {
    return static_cast<size_t>(Count() * pIndex_->d) * sizeof(float);
}

// Currently computed exactly like Size(); delegating keeps the two in sync.
size_t FaissExecutionEngine::PhysicalSize() const {
    return Size();
}

// Writes the wrapped index to location_. Always returns Status::OK().
Status FaissExecutionEngine::Serialize() {
    write_index(pIndex_.get(), location_.c_str());
    return Status::OK();
}

// Makes the index stored at location_ the wrapped index.
//
// The CPU cache is consulted first. On a miss the index is read from disk,
// inserted into the cache, and the load duration, size and IO speed are
// reported to the metrics singleton.
//
// Returns Status::Error if the disk read yields no index, Status::OK() otherwise.
Status FaissExecutionEngine::Load() {
    auto index = zilliz::vecwise::cache::CpuCacheMgr::GetInstance()->GetIndex(location_);
    bool to_cache = false;
    auto start_time = METRICS_NOW_TIME;
    if (!index) {
        index = read_index(location_);
        if (!index) {
            // Without this guard the dereference below would be a null access.
            LOG(ERROR) << "Failed to read index from: " << location_;
            return Status::Error("Failed to read index from disk");
        }
        to_cache = true;
        LOG(DEBUG) << "Disk io from: " << location_;
    }

    pIndex_ = index->data();

    if (to_cache) {
        Cache();
        auto end_time = METRICS_NOW_TIME;
        auto total_time = METRICS_MICROSECONDS(start_time, end_time);

        // NOTE(review): the observer is named "...DurationSeconds" but is fed the
        // METRICS_MICROSECONDS result - confirm the intended unit.
        server::Metrics::GetInstance().FaissDiskLoadDurationSecondsHistogramObserve(total_time);

        // Reuse Size() instead of a hard-coded element size of 4.
        double total_size = static_cast<double>(Size());
        server::Metrics::GetInstance().FaissDiskLoadSizeBytesHistogramObserve(total_size);

        // server::Metrics::GetInstance().FaissDiskLoadIOSpeedHistogramObserve(total_size/double(total_time));
        if (total_time > 0) {
            // Skip the gauge for a zero duration so it is never set to inf/NaN.
            server::Metrics::GetInstance().FaissDiskLoadIOSpeedGaugeSet(total_size / double(total_time));
        }
    }
    return Status::OK();
}

// Appends every vector (and id) of the index stored at `location` to the
// wrapped index. The source index is taken from the CPU cache when present,
// otherwise read from disk.
//
// Returns Status::Error when `location` equals this engine's own location, when
// the source index cannot be obtained, or when it is not an ID-mapped index
// wrapping a flat index (both are required to reach xb and id_map).
// NOTE(review): cast targets restored as faiss::IndexIDMap / faiss::IndexFlat
// from the members accessed (index, id_map, xb) - confirm.
Status FaissExecutionEngine::Merge(const std::string& location) {
    if (location == location_) {
        return Status::Error("Cannot Merge Self");
    }

    auto to_merge = zilliz::vecwise::cache::CpuCacheMgr::GetInstance()->GetIndex(location);
    if (!to_merge) {
        to_merge = read_index(location);
    }
    if (!to_merge) {
        return Status::Error("Cannot load index to merge");
    }

    auto* file_index = dynamic_cast<faiss::IndexIDMap*>(to_merge->data().get());
    if (file_index == nullptr) {
        return Status::Error("Index to merge is not an ID-mapped index");
    }
    auto* flat_index = dynamic_cast<faiss::IndexFlat*>(file_index->index);
    if (flat_index == nullptr) {
        return Status::Error("Index to merge does not wrap a flat index");
    }

    pIndex_->add_with_ids(file_index->ntotal,
                          flat_index->xb.data(),
                          file_index->id_map.data());
    return Status::OK();
}

// Builds an index of type build_index_type_ from all vectors held by the
// wrapped index, wraps it in a new engine bound to `location`, serializes it
// there and returns the new engine.
//
// Returns a null pointer when the wrapped index is not an ID-mapped flat index
// or when the builder yields no index; the original code dereferenced null in
// those cases.
// NOTE(review): Operand and the cast targets were restored from usage - confirm.
ExecutionEnginePtr FaissExecutionEngine::BuildIndex(const std::string& location) {
    auto opd = std::make_shared<Operand>();
    opd->d = pIndex_->d;
    opd->index_type = build_index_type_;
    IndexBuilderPtr pBuilder = GetIndexBuilder(opd);

    auto* from_index = dynamic_cast<faiss::IndexIDMap*>(pIndex_.get());
    if (from_index == nullptr) {
        LOG(ERROR) << "BuildIndex: source index is not an ID-mapped index";
        return nullptr;
    }
    auto* flat_index = dynamic_cast<faiss::IndexFlat*>(from_index->index);
    if (flat_index == nullptr) {
        LOG(ERROR) << "BuildIndex: source index does not wrap a flat index";
        return nullptr;
    }

    auto index = pBuilder->build_all(from_index->ntotal,
                                     flat_index->xb.data(),
                                     from_index->id_map.data());
    if (!index) {
        LOG(ERROR) << "BuildIndex: builder returned no index";
        return nullptr;
    }

    ExecutionEnginePtr new_ee(new FaissExecutionEngine(index->data(), location, build_index_type_, raw_index_type_));
    new_ee->Serialize();
    return new_ee;
}

// Forwards a k-nearest search for n query vectors to the wrapped index, which
// fills `distances` and `labels`. Always returns Status::OK().
Status FaissExecutionEngine::Search(long n,
                                    const float *data,
                                    long k,
                                    float *distances,
                                    long *labels) const {
    pIndex_->search(n, data, k, distances, labels);
    return Status::OK();
}

// Inserts the wrapped index into the CPU cache under location_.
// Always returns Status::OK().
// NOTE(review): cached item type restored as the wrapper `Index` - confirm.
Status FaissExecutionEngine::Cache() {
    zilliz::vecwise::cache::CpuCacheMgr::GetInstance()->InsertItem(
        location_, std::make_shared<Index>(pIndex_));
    return Status::OK();
}

} // namespace engine
} // namespace vecwise
} // namespace zilliz