Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
Greenplum
Opencv
提交
6a6ccf60
O
Opencv
项目概览
Greenplum
/
Opencv
大约 1 年 前同步成功
通知
7
Star
0
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
O
Opencv
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
体验新版 GitCode,发现更多精彩内容 >>
提交
6a6ccf60
编写于
7月 21, 2015
作者:
M
Maksim Shabunin
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
v_extract universal intrinsic
上级
11c3fa52
变更
3
显示空白变更内容
内联
并排
Showing
3 changed files
with
44 additions
and
0 deletions
+44
-0
modules/hal/include/opencv2/hal/intrin_cpp.hpp
modules/hal/include/opencv2/hal/intrin_cpp.hpp
+14
-0
modules/hal/include/opencv2/hal/intrin_neon.hpp
modules/hal/include/opencv2/hal/intrin_neon.hpp
+19
-0
modules/hal/include/opencv2/hal/intrin_sse.hpp
modules/hal/include/opencv2/hal/intrin_sse.hpp
+11
-0
未找到文件。
modules/hal/include/opencv2/hal/intrin_cpp.hpp
浏览文件 @
6a6ccf60
...
...
@@ -566,6 +566,7 @@ inline v_reg<_Tp, n> v_combine_low(const v_reg<_Tp, n>& a, const v_reg<_Tp, n>&
c
.
s
[
i
]
=
a
.
s
[
i
];
c
.
s
[
i
+
(
n
/
2
)]
=
b
.
s
[
i
];
}
return
c
;
}
template
<
typename
_Tp
,
int
n
>
...
...
@@ -577,6 +578,7 @@ inline v_reg<_Tp, n> v_combine_high(const v_reg<_Tp, n>& a, const v_reg<_Tp, n>&
c
.
s
[
i
]
=
a
.
s
[
i
+
(
n
/
2
)];
c
.
s
[
i
+
(
n
/
2
)]
=
b
.
s
[
i
+
(
n
/
2
)];
}
return
c
;
}
template
<
typename
_Tp
,
int
n
>
...
...
@@ -592,6 +594,18 @@ inline void v_recombine(const v_reg<_Tp, n>& a, const v_reg<_Tp, n>& b,
}
}
/**
 * Portable fallback for v_extract: returns n consecutive lanes taken from the
 * concatenation {a, b}, starting at lane s of a.
 *
 *   result = { a[s], ..., a[n-1], b[0], ..., b[s-1] }
 *
 * Example for n = 4:
 *   s = 1  ->  { a1 a2 a3 b0 }
 *   s = 2  ->  { a2 a3 b0 b1 }
 *   s = 3  ->  { a3 b0 b1 b2 }
 *
 * This is the lane order produced by the NEON (vextq_*) and SSE
 * (byte shift + OR) implementations of v_extract for the same s. The
 * previous loops here returned { a[n-s..n-1], b[0..n-s-1] }, which only
 * agreed with those back ends when s == n/2.
 *
 * @tparam s   compile-time lane offset into a; must satisfy 0 <= s <= n,
 *             otherwise the loops index outside the lane arrays.
 * @tparam _Tp lane type.
 * @tparam n   number of lanes.
 * @param a    vector supplying the leading lanes of the result.
 * @param b    vector supplying the trailing lanes of the result.
 * @return     the extracted vector.
 */
template<int s, typename _Tp, int n>
inline v_reg<_Tp, n> v_extract(const v_reg<_Tp, n>& a, const v_reg<_Tp, n>& b)
{
    v_reg<_Tp, n> r;
    // Number of lanes that come from the upper part of a.
    const int shift = n - s;
    int i = 0;
    // Lanes [0, n-s): a[s] .. a[n-1]
    for (; i < shift; ++i)
        r.s[i] = a.s[i + s];
    // Lanes [n-s, n): b[0] .. b[s-1]
    for (; i < n; ++i)
        r.s[i] = b.s[i - shift];
    return r;
}
template
<
int
n
>
inline
v_reg
<
int
,
n
>
v_round
(
const
v_reg
<
float
,
n
>&
a
)
{
v_reg
<
int
,
n
>
c
;
...
...
modules/hal/include/opencv2/hal/intrin_neon.hpp
浏览文件 @
6a6ccf60
...
...
@@ -557,6 +557,8 @@ OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_uint16x8, ushort, u16)
// One OPENCV_HAL_IMPL_NEON_LOADSTORE_OP expansion per vector type:
// (vector type, scalar lane type, NEON intrinsic suffix).
// NOTE(review): the macro body is not visible in this view.
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_int16x8, short, s16)
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_uint32x4, unsigned, u32)
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_int32x4, int, s32)
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_uint64x2, uint64, u64)
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_int64x2, int64, s64)
OPENCV_HAL_IMPL_NEON_LOADSTORE_OP(v_float32x4, float, f32)
#define OPENCV_HAL_IMPL_NEON_REDUCE_OP_4(_Tpvec, scalartype, func, scalar_func) \
...
...
@@ -720,6 +722,23 @@ OPENCV_HAL_IMPL_NEON_UNPACKS(uint32x4, u32)
// OPENCV_HAL_IMPL_NEON_UNPACKS expansions: (vector type stem, NEON suffix).
// NOTE(review): the macro body is not visible in this view.
OPENCV_HAL_IMPL_NEON_UNPACKS(int32x4, s32)
OPENCV_HAL_IMPL_NEON_UNPACKS(float32x4, f32)
// Defines v_extract<s>(a, b) for the NEON vector wrapper v_<_Tpvec>.
//   _Tpvec - vector type stem, pasted after "v_" (e.g. uint8x16 -> v_uint8x16)
//   suffix - NEON intrinsic suffix, pasted after "vextq_" (e.g. u8 -> vextq_u8)
// The generated function forwards a.val, b.val and the template argument s
// to vextq_<suffix> and wraps the result. s is a template parameter because
// it is handed to the intrinsic as its lane-offset argument.
// Per ARM's VEXT documentation the result is lanes s..N-1 of a followed by
// lanes 0..s-1 of b (N = lane count) - TODO confirm against the ACLE reference.
#define OPENCV_HAL_IMPL_NEON_EXTRACT(_Tpvec, suffix) \
template <int s> \
inline v_##_Tpvec v_extract(const v_##_Tpvec& a, const v_##_Tpvec& b) \
{ \
return v_##_Tpvec(vextq_##suffix(a.val, b.val, s)); \
}
// v_extract for every 128-bit NEON vector wrapper: (vector type stem, NEON suffix).
OPENCV_HAL_IMPL_NEON_EXTRACT(uint8x16, u8)
OPENCV_HAL_IMPL_NEON_EXTRACT(int8x16, s8)
OPENCV_HAL_IMPL_NEON_EXTRACT(uint16x8, u16)
OPENCV_HAL_IMPL_NEON_EXTRACT(int16x8, s16)
OPENCV_HAL_IMPL_NEON_EXTRACT(uint32x4, u32)
OPENCV_HAL_IMPL_NEON_EXTRACT(int32x4, s32)
OPENCV_HAL_IMPL_NEON_EXTRACT(uint64x2, u64)
OPENCV_HAL_IMPL_NEON_EXTRACT(int64x2, s64)
OPENCV_HAL_IMPL_NEON_EXTRACT(float32x4, f32)
inline
v_int32x4
v_round
(
const
v_float32x4
&
a
)
{
static
const
int32x4_t
v_sign
=
vdupq_n_s32
(
1
<<
31
),
...
...
modules/hal/include/opencv2/hal/intrin_sse.hpp
浏览文件 @
6a6ccf60
...
...
@@ -1149,6 +1149,17 @@ OPENCV_HAL_IMPL_SSE_UNPACKS(v_int32x4, epi32, OPENCV_HAL_NOP, OPENCV_HAL_NOP)
// OPENCV_HAL_IMPL_SSE_UNPACKS expansions for the floating-point vectors:
// (vector type, SSE suffix, cast to __m128i, cast back from __m128i).
// NOTE(review): the macro body is not visible in this view.
OPENCV_HAL_IMPL_SSE_UNPACKS(v_float32x4, ps, _mm_castps_si128, _mm_castsi128_ps)
OPENCV_HAL_IMPL_SSE_UNPACKS(v_float64x2, pd, _mm_castpd_si128, _mm_castsi128_pd)
template
<
int
s
,
typename
_Tpvec
>
inline
_Tpvec
v_extract
(
const
_Tpvec
&
a
,
const
_Tpvec
&
b
)
{
const
int
w
=
sizeof
(
typename
_Tpvec
::
lane_type
);
const
int
n
=
_Tpvec
::
nlanes
;
__m128i
ra
,
rb
;
ra
=
_mm_srli_si128
(
a
.
val
,
s
*
w
);
rb
=
_mm_slli_si128
(
b
.
val
,
(
n
-
s
)
*
w
);
return
_Tpvec
(
_mm_or_si128
(
ra
,
rb
));
}
// Converts the packed floats in a to packed 32-bit integers using
// _mm_cvtps_epi32 and wraps the result in v_int32x4.
// NOTE(review): per Intel's documentation the conversion honours the current
// MXCSR rounding mode (round-to-nearest-even by default) - confirm that
// callers do not change it.
inline v_int32x4 v_round(const v_float32x4& a)
{
    const __m128i converted = _mm_cvtps_epi32(a.val);
    return v_int32x4(converted);
}
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录