提交 875d0b57 编写于 作者: Y yejianwu

Update the fmax and clamp parameters in relu.cl

上级 eef80d7c
......@@ -10,7 +10,7 @@ __kernel void relu(__read_only image2d_t input,
const int pos = ch_blk * width + w;
DATA_TYPE4 in = READ_IMAGET(input, SAMPLER, (int2)(pos, hb));
- DATA_TYPE4 out = fmax(in, (DATA_TYPE4)0);
+ DATA_TYPE4 out = fmax(in, 0);
WRITE_IMAGET(output, (int2)(pos, hb), out);
}
......@@ -24,6 +24,6 @@ __kernel void relux(__read_only image2d_t input,
const int pos = ch_blk * width + w;
DATA_TYPE4 in = READ_IMAGET(input, SAMPLER, (int2)(pos, hb));
- DATA_TYPE4 out = clamp(in, (DATA_TYPE4)0, (DATA_TYPE4)max_limit);
+ DATA_TYPE4 out = clamp(in, 0, max_limit);
WRITE_IMAGET(output, (int2)(pos, hb), out);
}
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册