未验证 提交 a1837886 编写于 作者: J Jiawei Wang 提交者: GitHub

Merge pull request #108 from wangguibao/elastic_ctr

Fix elastic-ctr Serving OP
...@@ -62,7 +62,7 @@ ExternalProject_Add( ...@@ -62,7 +62,7 @@ ExternalProject_Add(
${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/paddle/include ${PADDLE_INSTALL_DIR}/include && ${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/paddle/include ${PADDLE_INSTALL_DIR}/include &&
${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/paddle/lib ${PADDLE_INSTALL_DIR}/lib && ${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/paddle/lib ${PADDLE_INSTALL_DIR}/lib &&
${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/third_party ${PADDLE_INSTALL_DIR}/third_party && ${CMAKE_COMMAND} -E copy_directory ${PADDLE_DOWNLOAD_DIR}/third_party ${PADDLE_INSTALL_DIR}/third_party &&
${CMAKE_COMMAND} -E copy ${PADDLE_INSTALL_DIR}/third_party/install/mkldnn/lib/libmkldnn.so.0 ${PADDLE_INSTALL_DIR}/third_party/install/mkldnn/lib/libmkldnn.so ${CMAKE_COMMAND} -E copy ${PADDLE_INSTALL_DIR}/third_party/install/mkldnn/lib/libmkldnn.so.1 ${PADDLE_INSTALL_DIR}/third_party/install/mkldnn/lib/libmkldnn.so
) )
INCLUDE_DIRECTORIES(${PADDLE_INCLUDE_DIR}) INCLUDE_DIRECTORIES(${PADDLE_INCLUDE_DIR})
......
...@@ -90,7 +90,7 @@ if (${WITH_MKL}) ...@@ -90,7 +90,7 @@ if (${WITH_MKL})
install(FILES install(FILES
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libmklml_intel.so ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libmklml_intel.so
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libiomp5.so ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libiomp5.so
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mkldnn/lib/libmkldnn.so.0 ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mkldnn/lib/libmkldnn.so.1
DESTINATION DESTINATION
${PADDLE_SERVING_INSTALL_DIR}/demo/serving/bin) ${PADDLE_SERVING_INSTALL_DIR}/demo/serving/bin)
endif() endif()
...@@ -105,13 +105,11 @@ def data_reader(data_file, samples, labels): ...@@ -105,13 +105,11 @@ def data_reader(data_file, samples, labels):
for i in range(0, len(features)): for i in range(0, len(features)):
if slots[i] in sample: if slots[i] in sample:
sample[slots[i]] = [ sample[slots[i]].append(int(features[i]) %
sample[slots[i]] + str2long(features[i]) % CTR_EMBEDDING_TABLE_SIZE)
CTR_EMBEDDING_TABLE_SIZE
]
else: else:
sample[slots[i]] = [ sample[slots[i]] = [
str2long(features[i]) % CTR_EMBEDDING_TABLE_SIZE int(features[i]) % CTR_EMBEDDING_TABLE_SIZE
] ]
for x in SLOTS: for x in SLOTS:
...@@ -142,11 +140,11 @@ if __name__ == "__main__": ...@@ -142,11 +140,11 @@ if __name__ == "__main__":
sys.exit(-1) sys.exit(-1)
ret = data_reader(sys.argv[4], samples, labels) ret = data_reader(sys.argv[4], samples, labels)
print(len(samples))
correct = 0 correct = 0
wrong_label_1_count = 0 wrong_label_1_count = 0
result_list = [] result_list = []
for i in range(0, len(samples) - BATCH_SIZE, BATCH_SIZE): #for i in range(0, len(samples) - BATCH_SIZE, BATCH_SIZE):
for i in range(0, len(samples), BATCH_SIZE):
api.clear() api.clear()
batch = samples[i:i + BATCH_SIZE] batch = samples[i:i + BATCH_SIZE]
instances = [] instances = []
...@@ -182,6 +180,4 @@ if __name__ == "__main__": ...@@ -182,6 +180,4 @@ if __name__ == "__main__":
pass pass
idx = idx + 1 idx = idx + 1
#print("Acc=%f" % (float(correct) / len(samples)))
print("auc = ", auc(labels, result_list) ) print("auc = ", auc(labels, result_list) )
...@@ -53,7 +53,7 @@ if (${WITH_MKL}) ...@@ -53,7 +53,7 @@ if (${WITH_MKL})
install(FILES install(FILES
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libmklml_intel.so ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libmklml_intel.so
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libiomp5.so ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mklml/lib/libiomp5.so
${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mkldnn/lib/libmkldnn.so.0 ${CMAKE_BINARY_DIR}/third_party/install/Paddle/third_party/install/mkldnn/lib/libmkldnn.so.1
DESTINATION DESTINATION
${PADDLE_SERVING_INSTALL_DIR}/elastic_ctr/serving/bin) ${PADDLE_SERVING_INSTALL_DIR}/elastic_ctr/serving/bin)
endif() endif()
...@@ -15,6 +15,7 @@ ...@@ -15,6 +15,7 @@
#include "elastic-ctr/serving/op/elastic_ctr_prediction_op.h" #include "elastic-ctr/serving/op/elastic_ctr_prediction_op.h"
#include <algorithm> #include <algorithm>
#include <string> #include <string>
#include <iomanip>
#include "cube/cube-api/include/cube_api.h" #include "cube/cube-api/include/cube_api.h"
#include "predictor/framework/infer.h" #include "predictor/framework/infer.h"
#include "predictor/framework/kv_manager.h" #include "predictor/framework/kv_manager.h"
...@@ -70,17 +71,65 @@ int ElasticCTRPredictionOp::inference() { ...@@ -70,17 +71,65 @@ int ElasticCTRPredictionOp::inference() {
return 0; return 0;
} }
Samples samples;
samples.resize(req->instances_size());
for (int i = 0; i < req->instances_size(); ++i) {
const ReqInstance &req_instance = req->instances(i);
for (int j = 0; j < req_instance.slots_size(); ++j) {
const Slot &slot = req_instance.slots(j);
for (int k = 0; k < slot.feasigns().size(); ++k) {
int slot_id = strtol(slot.slot_name().c_str(), NULL, 10);
samples[i][slot_id].push_back(slot.feasigns(k));
}
}
}
// Verify all request instances have same slots // Verify all request instances have same slots
int slot_num = req->instances(0).slots_size(); std::vector<int> slot_ids;
#if 1 for (auto x: samples[0]) {
LOG(INFO) << "slot_num =" << slot_num; slot_ids.push_back(x.first);
#endif }
for (int i = 1; i < req->instances_size(); ++i) { std::sort(slot_ids.begin(), slot_ids.end());
if (req->instances(i).slots_size() != slot_num) {
// use of slot_map:
//
// Example:
// slot_ids: 1, 20, 50, 100
//
// Then
// slot_map[1] = 0
// slot_map[20] = 1
// slot_map[50] = 2
// slot_map[100] = 3
//
// Later we use slot_map to index into lod_tenor array
//
std::map<int, int> slot_map;
int index = 0;
for (auto slot_id: slot_ids) {
slot_map[slot_id] = index;
++index;
}
for (size_t i = 1; i < samples.size(); ++i) {
if (samples[i].size() != slot_ids.size()) {
LOG(WARNING) << "Req " << i LOG(WARNING) << "Req " << i
<< " has different slot num with that of req 0"; << " has different slot num with that of req 0";
fill_response_with_message( fill_response_with_message(
res, -1, "Req intance has varying slot numbers"); res, -1, "Req intance has varying slot numbers");
return 0;
}
for (auto slot: samples[i]) {
int id = slot.first;
auto x = std::find(slot_ids.begin(), slot_ids.end(), id);
if (x == slot_ids.end()) {
std::ostringstream oss;
oss << "Req instance " << i << " has an outlier slot id: " << id;
fill_response_with_message(res, -1, oss.str().c_str());
return 0;
}
} }
} }
...@@ -115,30 +164,27 @@ int ElasticCTRPredictionOp::inference() { ...@@ -115,30 +164,27 @@ int ElasticCTRPredictionOp::inference() {
// Level of details of each feature slot // Level of details of each feature slot
std::vector<std::vector<size_t>> feature_slot_lods; std::vector<std::vector<size_t>> feature_slot_lods;
feature_slot_lods.resize(slot_num); feature_slot_lods.resize(slot_ids.size());
// Number of feature signs in each slot // Number of feature signs in each slot
std::vector<int> feature_slot_sizes; std::vector<int> feature_slot_sizes;
feature_slot_sizes.resize(slot_num); feature_slot_sizes.resize(slot_ids.size());
// Iterate over each feature slot // Iterate over each feature slot
for (int i = 0; i < slot_num; ++i) { for (auto slot_id: slot_ids) {
feature_slot_lods[i].push_back(0); feature_slot_lods[slot_map[slot_id]].push_back(0);
feature_slot_sizes[i] = 0; feature_slot_sizes[slot_map[slot_id]] = 0;
// Extract feature i values from each instance si // Extract feature i values from each instance si
for (int si = 0; si < sample_size; ++si) { for (size_t si = 0; si < samples.size(); ++si) {
#if 1 Sample &sample = samples[si];
LOG(INFO) << "slot " << i << " sample " << si; std::vector<int64_t> &slot = sample[slot_id];
#endif feature_slot_lods[slot_map[slot_id]].push_back(feature_slot_lods[slot_map[slot_id]].back() +
const ReqInstance &req_instance = req->instances(si); slot.size());
const Slot &slot = req_instance.slots(i); feature_slot_sizes[slot_map[slot_id]] += slot.size();
feature_slot_lods[i].push_back(feature_slot_lods[i].back() +
slot.feasigns_size());
feature_slot_sizes[i] += slot.feasigns_size();
for (int j = 0; j < slot.feasigns_size(); ++j) { for (size_t j = 0; j < slot.size(); ++j) {
keys.push_back(slot.feasigns(j)); keys.push_back(slot[j]);
} }
} }
} }
...@@ -234,10 +280,9 @@ int ElasticCTRPredictionOp::inference() { ...@@ -234,10 +280,9 @@ int ElasticCTRPredictionOp::inference() {
return 0; return 0;
} }
for (int i = 0; i < keys.size(); ++i) { for (size_t i = 0; i < keys.size(); ++i) {
std::ostringstream oss; std::ostringstream oss;
oss << keys[i] << ": "; oss << keys[i] << ": ";
const char *value = (values[i].buff.data());
if (values[i].buff.size() != if (values[i].buff.size() !=
sizeof(float) * CTR_PREDICTION_EMBEDDING_SIZE) { sizeof(float) * CTR_PREDICTION_EMBEDDING_SIZE) {
LOG(WARNING) << "Key " << keys[i] << " has values less than " LOG(WARNING) << "Key " << keys[i] << " has values less than "
...@@ -256,21 +301,20 @@ int ElasticCTRPredictionOp::inference() { ...@@ -256,21 +301,20 @@ int ElasticCTRPredictionOp::inference() {
// Fill feature embedding into feed tensors // Fill feature embedding into feed tensors
std::vector<paddle::PaddleTensor> lod_tensors; std::vector<paddle::PaddleTensor> lod_tensors;
lod_tensors.resize(slot_num); lod_tensors.resize(slot_ids.size());
const ReqInstance &instance = req->instances(0); for (auto slot_id: slot_ids) {
for (int i = 0; i < slot_num; ++i) { paddle::PaddleTensor &lod_tensor = lod_tensors[slot_map[slot_id]];
paddle::PaddleTensor &lod_tensor = lod_tensors[i];
char name[VARIABLE_NAME_LEN]; char name[VARIABLE_NAME_LEN];
snprintf(name, snprintf(name,
VARIABLE_NAME_LEN, VARIABLE_NAME_LEN,
"embedding_%s.tmp_0", "embedding_%d.tmp_0",
instance.slots(i).slot_name().c_str()); slot_id);
lod_tensor.name = std::string(name); lod_tensor.name = std::string(name);
lod_tensors[i].dtype = paddle::PaddleDType::FLOAT32; lod_tensor.dtype = paddle::PaddleDType::FLOAT32;
std::vector<std::vector<size_t>> &lod = lod_tensors[i].lod; std::vector<std::vector<size_t>> &lod = lod_tensor.lod;
lod.resize(1); lod.resize(1);
lod[0].push_back(0); lod[0].push_back(0);
} }
...@@ -278,11 +322,11 @@ int ElasticCTRPredictionOp::inference() { ...@@ -278,11 +322,11 @@ int ElasticCTRPredictionOp::inference() {
int base = 0; int base = 0;
// Iterate over all slots // Iterate over all slots
for (int i = 0; i < slot_num; ++i) { for (auto slot_id: slot_ids) {
paddle::PaddleTensor &lod_tensor = lod_tensors[i]; paddle::PaddleTensor &lod_tensor = lod_tensors[slot_map[slot_id]];
std::vector<std::vector<size_t>> &lod = lod_tensor.lod; std::vector<std::vector<size_t>> &lod = lod_tensor.lod;
lod[0] = feature_slot_lods[i]; lod[0] = feature_slot_lods[slot_map[slot_id]];
lod_tensor.shape = {lod[0].back(), CTR_PREDICTION_EMBEDDING_SIZE}; lod_tensor.shape = {lod[0].back(), CTR_PREDICTION_EMBEDDING_SIZE};
lod_tensor.data.Resize(lod[0].back() * sizeof(float) * lod_tensor.data.Resize(lod[0].back() * sizeof(float) *
...@@ -290,7 +334,7 @@ int ElasticCTRPredictionOp::inference() { ...@@ -290,7 +334,7 @@ int ElasticCTRPredictionOp::inference() {
int offset = 0; int offset = 0;
// Copy all slot i feature embeddings to lod_tensor[i] // Copy all slot i feature embeddings to lod_tensor[i]
for (uint32_t j = 0; j < feature_slot_sizes[i]; ++j) { for (uint32_t j = 0; j < feature_slot_sizes[slot_map[slot_id]]; ++j) {
float *data_ptr = static_cast<float *>(lod_tensor.data.data()) + offset; float *data_ptr = static_cast<float *>(lod_tensor.data.data()) + offset;
int idx = base + j; int idx = base + j;
...@@ -303,19 +347,24 @@ int ElasticCTRPredictionOp::inference() { ...@@ -303,19 +347,24 @@ int ElasticCTRPredictionOp::inference() {
return 0; return 0;
#else #else
// sizeof(float) * CTR_PREDICTION_EMBEDDING_SIZE = 36 // sizeof(float) * CTR_PREDICTION_EMBEDDING_SIZE = 36
#if 1
LOG(INFO) << "values[" << idx << "].buff.size != 36";
#endif
values[idx].buff.append(36, '0'); values[idx].buff.append(36, '0');
#endif #endif
} }
memcpy(data_ptr, values[idx].buff.data(), values[idx].buff.size()); memcpy(data_ptr, values[idx].buff.data(), values[idx].buff.size());
offset += CTR_PREDICTION_EMBEDDING_SIZE; offset += CTR_PREDICTION_EMBEDDING_SIZE;
} }
in->push_back(lod_tensor); in->push_back(lod_tensor);
// Bump base counter // Bump base counter
base += feature_slot_sizes[i]; base += feature_slot_sizes[slot_map[slot_id]];
} }
#else #else
// Fill all tensors // Fill all tensors
......
...@@ -41,6 +41,8 @@ class ElasticCTRPredictionOp ...@@ -41,6 +41,8 @@ class ElasticCTRPredictionOp
baidu::paddle_serving::predictor::elastic_ctr::Response> { baidu::paddle_serving::predictor::elastic_ctr::Response> {
public: public:
typedef std::vector<paddle::PaddleTensor> TensorVector; typedef std::vector<paddle::PaddleTensor> TensorVector;
typedef std::map<int, std::vector<int64_t>> Sample;
typedef std::vector<Sample> Samples;
DECLARE_OP(ElasticCTRPredictionOp); DECLARE_OP(ElasticCTRPredictionOp);
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册