PrometheusMetrics.cpp 5.1 KB
Newer Older
Y
yu yunfeng 已提交
1 2 3 4 5 6 7
/*******************************************************************************
 * Copyright 上海赜睿信息科技有限公司(Zilliz) - All Rights Reserved
 * Unauthorized copying of this file, via any medium is strictly prohibited.
 * Proprietary and confidential.
 ******************************************************************************/

#include "PrometheusMetrics.h"
G
groot 已提交
8
#include "utils/Log.h"
Y
yu yunfeng 已提交
9
#include "SystemInfo.h"
Y
yu yunfeng 已提交
10

11

Y
yu yunfeng 已提交
12 13 14 15 16 17
namespace zilliz {
namespace vecwise {
namespace server {

ServerError
PrometheusMetrics::Init() {
G
groot 已提交
18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34
    try {
        ConfigNode &configNode = ServerConfig::GetInstance().GetConfig(CONFIG_METRIC);
        startup_ = configNode.GetValue(CONFIG_METRIC_IS_STARTUP) == "true" ? true : false;
        // Following should be read from config file.
        const std::string bind_address = configNode.GetChild(CONFIG_PROMETHEUS).GetValue(CONFIG_METRIC_PROMETHEUS_PORT);
        const std::string uri = std::string("/metrics");
        const std::size_t num_threads = 2;

        // Init Exposer
        exposer_ptr_ = std::make_shared<prometheus::Exposer>(bind_address, uri, num_threads);

        // Exposer Registry
        exposer_ptr_->RegisterCollectable(registry_);
    } catch (std::exception& ex) {
        SERVER_LOG_ERROR << "Failed to connect prometheus server: " << std::string(ex.what());
        return SERVER_UNEXPECTED_ERROR;
    }
Y
yu yunfeng 已提交
35 36

    return SERVER_SUCCESS;
Y
yu yunfeng 已提交
37 38 39

}

Y
fix  
yu yunfeng 已提交
40

Y
yu yunfeng 已提交
41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57
void
PrometheusMetrics::CPUUsagePercentSet()  {
    if(!startup_) return ;
    double usage_percent = server::SystemInfo::GetInstance().CPUPercent();
    CPU_usage_percent_.Set(usage_percent);
}

void
PrometheusMetrics::RAMUsagePercentSet() {
    if(!startup_) return ;
    double usage_percent = server::SystemInfo::GetInstance().MemoryPercent();
    RAM_usage_percent_.Set(usage_percent);
}

void
PrometheusMetrics::GPUPercentGaugeSet() {
    if(!startup_) return;
Y
fix  
yu yunfeng 已提交
58
    int numDevide = server::SystemInfo::GetInstance().num_device();
Y
yu yunfeng 已提交
59
    std::vector<unsigned int> values = server::SystemInfo::GetInstance().GPUPercent();
Y
fix  
yu yunfeng 已提交
60 61 62
//    for (int i = 0; i < numDevide; ++i) {
//        GPU_percent_gauges_[i].Set(static_cast<double>(values[i]));
//    }
Y
yu yunfeng 已提交
63 64 65 66 67 68 69 70 71 72 73 74 75 76
    if(numDevide >= 1) GPU0_percent_gauge_.Set(static_cast<double>(values[0]));
    if(numDevide >= 2) GPU1_percent_gauge_.Set(static_cast<double>(values[1]));
    if(numDevide >= 3) GPU2_percent_gauge_.Set(static_cast<double>(values[2]));
    if(numDevide >= 4) GPU3_percent_gauge_.Set(static_cast<double>(values[3]));
    if(numDevide >= 5) GPU4_percent_gauge_.Set(static_cast<double>(values[4]));
    if(numDevide >= 6) GPU5_percent_gauge_.Set(static_cast<double>(values[5]));
    if(numDevide >= 7) GPU6_percent_gauge_.Set(static_cast<double>(values[6]));
    if(numDevide >= 8) GPU7_percent_gauge_.Set(static_cast<double>(values[7]));

    // to do
}

void PrometheusMetrics::GPUMemoryUsageGaugeSet() {
    if(!startup_) return;
Y
fix  
yu yunfeng 已提交
77
    int numDevide = server::SystemInfo::GetInstance().num_device();
Y
yu yunfeng 已提交
78
    std::vector<unsigned long long> values = server::SystemInfo::GetInstance().GPUMemoryUsed();
Y
fix  
yu yunfeng 已提交
79
    constexpr unsigned long long MtoB = 1024*1024;
Y
yu yunfeng 已提交
80
    int numDevice = values.size();
Y
fix  
yu yunfeng 已提交
81 82 83
//    for (int i = 0; i < numDevice; ++i) {
//        GPU_memory_usage_gauges_[i].Set(values[i]/MtoB);
//    }
Y
yu yunfeng 已提交
84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102
    if(numDevice >=1) GPU0_memory_usage_gauge_.Set(values[0]/MtoB);
    if(numDevice >=2) GPU1_memory_usage_gauge_.Set(values[1]/MtoB);
    if(numDevice >=3) GPU2_memory_usage_gauge_.Set(values[2]/MtoB);
    if(numDevice >=4) GPU3_memory_usage_gauge_.Set(values[3]/MtoB);
    if(numDevice >=5) GPU4_memory_usage_gauge_.Set(values[4]/MtoB);
    if(numDevice >=6) GPU5_memory_usage_gauge_.Set(values[5]/MtoB);
    if(numDevice >=7) GPU6_memory_usage_gauge_.Set(values[6]/MtoB);
    if(numDevice >=8) GPU7_memory_usage_gauge_.Set(values[7]/MtoB);

    // to do
}
void PrometheusMetrics::AddVectorsPerSecondGaugeSet(int num_vector, int dim, double time) {
    // MB/s
    if(!startup_) return;

    long long MtoB = 1024*1024;
    long long size = num_vector * dim * 4;
    add_vectors_per_second_gauge_.Set(size/time/MtoB);

Y
yu yunfeng 已提交
103
}
Y
yu yunfeng 已提交
104
void PrometheusMetrics::QueryIndexTypePerSecondSet(std::string type, double value) {
Y
yu yunfeng 已提交
105
    if(!startup_) return;
Y
yu yunfeng 已提交
106 107 108 109 110 111 112 113 114 115 116 117 118 119 120 121
    if(type == "IVF"){
        query_index_IVF_type_per_second_gauge_.Set(value);
    } else if(type == "IDMap"){
        query_index_IDMAP_type_per_second_gauge_.Set(value);
    }

}
void PrometheusMetrics::ConnectionGaugeIncrement() {
    if(!startup_) return;
    connection_gauge_.Increment();
}
void PrometheusMetrics::ConnectionGaugeDecrement() {
    if(!startup_) return;
    connection_gauge_.Decrement();
}

Y
fix  
yu yunfeng 已提交
122 123 124 125 126 127 128 129 130 131 132 133 134 135 136 137
//void PrometheusMetrics::GpuPercentInit() {
//    int num_device = SystemInfo::GetInstance().num_device();
//    constexpr char device_number[] = "DeviceNum";
//    for(int i = 0; i < num_device; ++ i) {
//        GPU_percent_gauges_.emplace_back(GPU_percent_.Add({{device_number,std::to_string(i)}}));
//    }
//
//}
//void PrometheusMetrics::GpuMemoryInit() {
//    int num_device = SystemInfo::GetInstance().num_device();
//    constexpr char device_number[] = "DeviceNum";
//    for(int i = 0; i < num_device; ++ i) {
//        GPU_memory_usage_gauges_.emplace_back(GPU_memory_usage_.Add({{device_number,std::to_string(i)}}));
//    }
//}

Y
yu yunfeng 已提交
138 139 140 141

}
}
}