Fix softmax bug

a3eb0c0b · hjchen2 · 5df51432 · a3eb0c0b · a3eb0c0b · a3eb0c0b
隐藏空白更改
内联 | 并排

Showing 3 changed files with 19 additions and 10 deletions

src/framework/tensor.h +3 -3

src/operators/math/softmax.cpp +1 -1

test/net/test_ocr.cpp +15 -6

未找到文件。
--- a/src/framework/tensor.h
+++ b/src/framework/tensor.h
@@ -148,8 +148,8 @@ class Tensor : public TensorBase {
    PADDLE_MOBILE_ENFORCE(
        (std::is_same<T, void>::value ||
         holder_->type().hash_code() == typeid(T).hash_code()),
-        "Tensor holds the wrong type, it holds %s",
-        this->holder_->type().name());
+        "Tensor holds the wrong type, it holds %s, requested %s",
+        this->holder_->type().name(), typeid(T).name());

    return reinterpret_cast<T *>(reinterpret_cast<uintptr_t>(holder_->ptr()) +
                                 offset_);
@@ -162,7 +162,7 @@ class Tensor : public TensorBase {
    PADDLE_MOBILE_ENFORCE(
        (std::is_same<T, void>::value ||
         holder_->type().hash_code() == typeid(T).hash_code()),
-        "Tensor holds the wrong type, it holds %s ,requested:%s",
+        "Tensor holds the wrong type, it holds %s, requested %s",
        this->holder_->type().name(), typeid(T).name());

    return reinterpret_cast<const T *>(

--- a/src/operators/math/softmax.cpp
+++ b/src/operators/math/softmax.cpp
@@ -128,7 +128,7 @@ void SoftmaxFuntor<CPU, float>::operator()(const framework::Tensor *X,
        x0 = vmulq_f32(x0, __inv_sum);
        x1 = vmulq_f32(x1, __inv_sum);
        vst1q_f32(output, x0);
-        vst1q_f32(output + 4, x0);
+        vst1q_f32(output + 4, x1);
      }
 #endif
      for (int i = 0; i < remain; ++i) {

--- a/test/net/test_ocr.cpp
+++ b/test/net/test_ocr.cpp
@@ -28,6 +28,7 @@ void load_images(const char *image_dir, const char *images_list,
    image_shapes->push_back(std::make_pair(height, width));
    image_names->push_back(filename);
  }
+  if_list.close();
 }

 int main(int argc, char **argv) {
@@ -53,7 +54,7 @@ int main(int argc, char **argv) {

  for (int i = 0; i < image_names.size(); i++) {
    std::string file_name = image_names[i];
-    std::vector<float> input;
+    std::vector<float> input_vec;
    std::vector<int64_t> dims{1, 1, 48, 512};
    dims[2] = image_shapes[i].first;
    dims[3] = image_shapes[i].second;
@@ -62,14 +63,22 @@ int main(int argc, char **argv) {
    std::cerr << "img_path: " << img_path << std::endl;
    std::cerr << "shape = [" << dims[0] << ", " << dims[1] << ", " << dims[2]
              << ", " << dims[3] << "]" << std::endl;
-    GetInput<float>(img_path, &input, dims);
+    GetInput<float>(img_path, &input_vec, dims);
+    framework::Tensor input(input_vec, framework::make_ddim(dims));
    // predict
-    auto output = paddle_mobile.Predict(input, dims);
+    paddle_mobile.Predict(input);
+    auto output_topk = paddle_mobile.Fetch("top_k_1.tmp_0");
+    auto output_indices = paddle_mobile.Fetch("cast_68.tmp_0");
    // print result
    std::cerr << file_name << std::endl;
-    std::cerr << output[0];
-    for (int j = 1; j < output.size(); ++j) {
-      std::cerr << " " << output[j];
+    std::cerr << output_topk->data<float>()[0];
+    for (int j = 1; j < output_topk->numel(); ++j) {
+      std::cerr << " " << output_topk->data<float>()[j];
+    }
+    std::cerr << std::endl;
+    std::cerr << output_indices->data<float>()[0];
+    for (int j = 1; j < output_indices->numel(); ++j) {
+      std::cerr << " " << output_indices->data<float>()[j];
    }
    std::cerr << std::endl;
  }