Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
2dot5
ClickHouse
提交
eb5ebc79
C
ClickHouse
项目概览
2dot5
/
ClickHouse
通知
3
Star
0
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
DevOps
流水线
流水线任务
计划
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
C
ClickHouse
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
DevOps
DevOps
流水线
流水线任务
计划
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
流水线任务
提交
Issue看板
体验新版 GitCode,发现更多精彩内容 >>
提交
eb5ebc79
编写于
3月 05, 2013
作者:
M
Michael Kolupaev
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
clickhouse: added function extractURLParameter [#CONV-6788].
上级
24ffa945
变更
3
隐藏空白更改
内联
并排
Showing
3 changed file
with
88 addition
and
15 deletion
+88
-15
dbms/include/DB/Functions/FunctionsStringSearch.h
dbms/include/DB/Functions/FunctionsStringSearch.h
+8
-12
dbms/include/DB/Functions/FunctionsURL.h
dbms/include/DB/Functions/FunctionsURL.h
+79
-3
dbms/src/Functions/FunctionFactory.cpp
dbms/src/Functions/FunctionFactory.cpp
+1
-0
未找到文件。
dbms/include/DB/Functions/FunctionsStringSearch.h
浏览文件 @
eb5ebc79
...
...
@@ -358,16 +358,6 @@ struct ExtractImpl
prev_offset
=
cur_offset
;
}
}
static
void
constant
(
const
std
::
string
&
data
,
const
std
::
string
&
pattern
,
std
::
string
&
res
)
{
std
::
vector
<
UInt8
>
vdata
(
data
.
begin
(),
data
.
end
());
ColumnArray
::
Offsets_t
offsets
(
1
,
data
.
size
());
std
::
vector
<
UInt8
>
res_vdata
;
ColumnArray
::
Offsets_t
res_offsets
;
vector
(
vdata
,
offsets
,
pattern
,
res_vdata
,
res_offsets
);
res
=
std
::
string
(
res_vdata
.
begin
(),
res_vdata
.
end
()
-
1
);
}
};
...
...
@@ -487,8 +477,14 @@ public:
}
else
if
(
const
ColumnConstString
*
col
=
dynamic_cast
<
const
ColumnConstString
*>
(
&*
column
))
{
std
::
string
res
;
Impl
::
constant
(
col
->
getData
(),
col_needle
->
getData
(),
res
);
const
std
::
string
&
data
=
col
->
getData
();
std
::
vector
<
UInt8
>
vdata
(
data
.
c_str
(),
data
.
c_str
()
+
data
.
size
()
+
1
);
ColumnArray
::
Offsets_t
offsets
(
1
,
vdata
.
size
());
std
::
vector
<
UInt8
>
res_vdata
;
ColumnArray
::
Offsets_t
res_offsets
;
Impl
::
vector
(
vdata
,
offsets
,
col_needle
->
getData
(),
res_vdata
,
res_offsets
);
std
::
string
res
=
std
::
string
(
res_vdata
.
begin
(),
res_vdata
.
end
()
-
1
);
ColumnConstString
*
col_res
=
new
ColumnConstString
(
col
->
size
(),
res
);
block
.
getByPosition
(
result
).
column
=
col_res
;
...
...
dbms/include/DB/Functions/FunctionsURL.h
浏览文件 @
eb5ebc79
...
...
@@ -4,6 +4,7 @@
#include <DB/Columns/ColumnString.h>
#include <DB/Columns/ColumnConst.h>
#include <DB/Functions/FunctionsString.h>
#include "FunctionsStringSearch.h"
namespace
DB
...
...
@@ -256,6 +257,78 @@ struct ExtractWWW
};
/** Extracts the value of a named parameter from the query string of each URL.
  *
  * The parameter is looked up only after the first '?' of a row: either it starts
  * right after the '?' ("name="), or it is the first occurrence of "&name=" further on
  * (that search is not stopped at '#'). The value runs up to the next '&' or '#',
  * or to the end of the row if neither is present. Rows without a match yield an empty string.
  *
  * The C string functions used here rely on every row in `data` being zero-terminated.
  */
struct ExtractURLParameterImpl
{
    /** data, offsets         - input rows; row i starts at offsets[i - 1] (0 for the first row).
      * pattern               - parameter name; taken by value because '=' is appended to it.
      * res_data, res_offsets - output rows; each value is followed by a zero byte and
      *                         res_offsets[i] is the position just past that byte.
      */
    static void vector(const std::vector<UInt8> & data,
        const ColumnArray::Offsets_t & offsets,
        std::string pattern,
        std::vector<UInt8> & res_data, ColumnArray::Offsets_t & res_offsets)
    {
        res_data.reserve(data.size() / 5);
        res_offsets.resize(offsets.size());

        /// "name=" is matched right after '?', "&name=" anywhere later.
        pattern += '=';
        std::string later_pattern = '&' + pattern;

        const char * first_needle = pattern.c_str();
        size_t first_needle_len = pattern.size();
        const char * later_needle = later_pattern.c_str();
        size_t later_needle_len = later_pattern.size();

        size_t row_begin = 0;
        size_t written = 0;

        for (size_t row = 0; row < offsets.size(); ++row)
        {
            size_t row_end = offsets[row];
            const char * url = reinterpret_cast<const char *>(&data[row_begin]);

            /// Start of the parameter value, or NULL if the parameter is absent.
            const char * value = NULL;

            const char * query = strchr(url, '?');
            if (query != NULL)
            {
                ++query;
                if (strncmp(query, first_needle, first_needle_len) == 0)
                {
                    value = query + first_needle_len;
                }
                else
                {
                    value = strstr(query, later_needle);
                    if (value != NULL)
                        value += later_needle_len;
                }
            }

            /// Length of the value; stays zero when nothing was found.
            size_t value_len = 0;
            if (value != NULL)
            {
                const char * value_end = strpbrk(value, "&#");
                if (value_end == NULL)
                    value_end = value + strlen(value);
                value_len = value_end - value;
            }

            /// Room for the value plus its terminating zero.
            res_data.resize(written + value_len + 1);
            if (value != NULL)
                memcpy(&res_data[written], value, value_len);
            written += value_len;

            res_data[written] = 0;
            ++written;
            res_offsets[row] = written;

            row_begin = row_end;
        }
    }
};
/** Extract a piece of the string using Extractor.
*/
template
<
typename
Extractor
>
...
...
@@ -372,19 +445,22 @@ struct NameCutQueryString { static const char * get() { return "cutQueryStrin
/// Name holder used as a template argument: get() returns the string "cutFragment".
struct NameCutFragment
{
    static const char * get()
    {
        static const char name[] = "cutFragment";
        return name;
    }
};
/// Name holder used as a template argument: get() returns the string "cutQueryStringAndFragment".
struct NameCutQueryStringAndFragment
{
    static const char * get()
    {
        static const char name[] = "cutQueryStringAndFragment";
        return name;
    }
};
/// FunctionProtocol: FunctionStringToString instantiated with
/// ExtractSubstringImpl<ExtractProtocol> and the NameProtocol name holder.
/// NOTE(review): an identical typedef of FunctionProtocol appears again right after
/// NameExtractURLParameter; redeclaring a typedef to the same type is legal, but one
/// of the two copies is redundant.
typedef
FunctionStringToString
<
ExtractSubstringImpl
<
ExtractProtocol
>
,
NameProtocol
>
FunctionProtocol
;
/// Name holder used as a template argument: get() returns the string "extractURLParameter".
struct NameExtractURLParameter
{
    static const char * get()
    {
        static const char name[] = "extractURLParameter";
        return name;
    }
};
/** Function classes for the URL functions.
  * Each one pairs an implementation template with the Name* struct whose get()
  * returns the function's name string. Every typedef is declared exactly once.
  */

/// Built on ExtractSubstringImpl.
typedef FunctionStringToString<ExtractSubstringImpl<ExtractProtocol>, NameProtocol> FunctionProtocol;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractDomain<false> >, NameDomain> FunctionDomain;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractDomain<true> >, NameDomainWithoutWWW> FunctionDomainWithoutWWW;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractTopLevelDomain>, NameTopLevelDomain> FunctionTopLevelDomain;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractPath>, NamePath> FunctionPath;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractQueryString<true> >, NameQueryString> FunctionQueryString;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractFragment<true> >, NameFragment> FunctionFragment;
typedef FunctionStringToString<ExtractSubstringImpl<ExtractQueryStringAndFragment<true> >, NameQueryStringAndFragment> FunctionQueryStringAndFragment;

/// Built on CutSubstringImpl.
typedef FunctionStringToString<CutSubstringImpl<ExtractWWW>, NameCutWWW> FunctionCutWWW;
typedef FunctionStringToString<CutSubstringImpl<ExtractQueryString<false> >, NameCutQueryString> FunctionCutQueryString;
typedef FunctionStringToString<CutSubstringImpl<ExtractFragment<false> >, NameCutFragment> FunctionCutFragment;
typedef FunctionStringToString<CutSubstringImpl<ExtractQueryStringAndFragment<false> >, NameCutQueryStringAndFragment> FunctionCutQueryStringAndFragment;

/// Built on FunctionsStringSearchToString rather than FunctionStringToString;
/// ExtractURLParameterImpl::vector takes a pattern string in addition to the column data.
typedef FunctionsStringSearchToString<ExtractURLParameterImpl, NameExtractURLParameter> FunctionExtractURLParameter;
}
dbms/src/Functions/FunctionFactory.cpp
浏览文件 @
eb5ebc79
...
...
@@ -150,6 +150,7 @@ FunctionPtr FunctionFactory::get(
else
if
(
name
==
"cutQueryString"
)
return
new
FunctionCutQueryString
;
else
if
(
name
==
"cutFragment"
)
return
new
FunctionCutFragment
;
else
if
(
name
==
"cutQueryStringAndFragment"
)
return
new
FunctionCutQueryStringAndFragment
;
else
if
(
name
==
"extractURLParameter"
)
return
new
FunctionExtractURLParameter
;
else
if
(
name
==
"visibleWidth"
)
return
new
FunctionVisibleWidth
;
else
if
(
name
==
"toTypeName"
)
return
new
FunctionToTypeName
;
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录