Schema.cpp 3.1 KB
Newer Older
C
cai.zhang 已提交
1 2 3 4 5 6 7 8 9 10 11 12 13
// Copyright (C) 2019-2020 Zilliz. All rights reserved.
//
// Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance
// with the License. You may obtain a copy of the License at
//
// http://www.apache.org/licenses/LICENSE-2.0
//
// Unless required by applicable law or agreed to in writing, software distributed under the License
// is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
// or implied. See the License for the specific language governing permissions and limitations under the License

#include "common/Schema.h"
#include <google/protobuf/text_format.h>
X
XuanYang-cn 已提交
14
#include <boost/lexical_cast.hpp>
15
#include "common/SystemProperty.h"
C
cai.zhang 已提交
16 17

namespace milvus {
X
XuanYang-cn 已提交
18 19 20 21 22 23 24 25 26 27 28 29

using std::string;

// Flattens a repeated protobuf KeyValuePair field into a key -> value map.
//
// Each key is expected to appear at most once: a repeated key trips the
// AssertInfo check below, whose message names the offending key.
static std::map<std::string, std::string>
RepeatedKeyValToMap(const google::protobuf::RepeatedPtrField<proto::common::KeyValuePair>& kvs) {
    std::map<std::string, std::string> mapping;
    for (const auto& kv : kvs) {
        AssertInfo(!mapping.count(kv.key()), "repeat key(" + kv.key() + ") in protobuf");
        // insert() never overwrites an existing entry, so the first value seen for a key is kept.
        mapping.insert({kv.key(), kv.value()});
    }
    return mapping;
}

C
cai.zhang 已提交
30 31 32 33
// Builds a Schema from its protobuf description.
//
// The auto-id flag is copied first, then the proto fields are visited in order:
//   * a field whose id is below 100 is handled as a system field: it must pass
//     SystemProperty::SystemFieldVerify and is NOT added to the schema;
//   * a field flagged as primary key records the offset it is about to occupy
//     (the current schema size); a second primary key trips an assertion;
//   * a vector field must carry a "dim" type param, parsed with boost::lexical_cast.
//     When the index params have no "metric_type", L2 is used for VECTOR_FLOAT and
//     Jaccard for every other vector type;
//   * any other field is added with just its name, id and data type.
std::shared_ptr<Schema>
Schema::ParseFrom(const milvus::proto::schema::CollectionSchema& schema_proto) {
    auto schema = std::make_shared<Schema>();
    schema->set_auto_id(schema_proto.autoid());

    for (const auto& field_proto : schema_proto.fields()) {
        auto field_name = FieldName(field_proto.name());
        auto field_id = FieldId(field_proto.fieldid());

        // System field ids: verify against the known system properties, then skip.
        if (field_id.get() < 100) {
            auto is_system = SystemProperty::Instance().SystemFieldVerify(field_name, field_id);
            AssertInfo(is_system,
                       "invalid system type: name(" + field_name.get() + "), id(" + std::to_string(field_id.get()) + ")");
            continue;
        }

        auto data_type = static_cast<DataType>(field_proto.data_type());

        if (field_proto.is_primary_key()) {
            AssertInfo(!schema->primary_key_offset_opt_.has_value(), "repetitive primary key");
            // The field has not been added yet, so the current size is the offset it will get.
            schema->primary_key_offset_opt_ = FieldOffset(schema->size());
        }

        // Non-vector fields need no extra parameters.
        if (!datatype_is_vector(data_type)) {
            schema->AddField(field_name, field_id, data_type);
            continue;
        }

        auto type_map = RepeatedKeyValToMap(field_proto.type_params());
        auto index_map = RepeatedKeyValToMap(field_proto.index_params());

        // Fill in a default metric when the index params do not name one.
        if (index_map.find("metric_type") == index_map.end()) {
            if (data_type == DataType::VECTOR_FLOAT) {
                index_map["metric_type"] = MetricTypeToName(MetricType::METRIC_L2);
            } else {
                index_map["metric_type"] = MetricTypeToName(MetricType::METRIC_Jaccard);
            }
        }

        AssertInfo(type_map.count("dim"), "dim not found");
        auto dim = boost::lexical_cast<int64_t>(type_map.at("dim"));
        AssertInfo(index_map.count("metric_type"), "index not found");
        auto metric_type = GetMetricType(index_map.at("metric_type"));

        schema->AddField(field_name, field_id, data_type, dim, metric_type);
    }
    return schema;
}
}  // namespace milvus