Skip to content
体验新版
项目
组织
正在加载...
登录
切换导航
打开侧边栏
加钱居士.
foot
提交
e9d489ce
F
foot
项目概览
加钱居士.
/
foot
通知
3
Star
1
Fork
0
代码
文件
提交
分支
Tags
贡献者
分支图
Diff
Issue
0
列表
看板
标记
里程碑
合并请求
0
Wiki
0
Wiki
分析
仓库
DevOps
项目成员
Pages
F
foot
项目概览
项目概览
详情
发布
仓库
仓库
文件
提交
分支
标签
贡献者
分支图
比较
Issue
0
Issue
0
列表
看板
标记
里程碑
合并请求
0
合并请求
0
Pages
分析
分析
仓库分析
DevOps
Wiki
0
Wiki
成员
成员
收起侧边栏
关闭侧边栏
动态
分支图
创建新Issue
提交
Issue看板
前往新版Gitcode,体验更适合开发者的 AI 搜索 >>
提交
e9d489ce
编写于
3月 14, 2020
作者:
M
monomania
浏览文件
操作
浏览文件
下载
电子邮件补丁
差异文件
1.优化爬虫线程带出的bug
上级
97d249cd
变更
7
隐藏空白更改
内联
并排
Showing
7 changed files
with
56 additions
and
38 deletions
+56
-38
foot-spider/module/win007/proc/AsiaLastNewProcesser.go
foot-spider/module/win007/proc/AsiaLastNewProcesser.go
+8
-5
foot-spider/module/win007/proc/BaseFaceProcesser.go
foot-spider/module/win007/proc/BaseFaceProcesser.go
+8
-5
foot-spider/module/win007/proc/EuroLastProcesser.go
foot-spider/module/win007/proc/EuroLastProcesser.go
+8
-5
foot-spider/module/win007/proc/EuroTrackProcesser.go
foot-spider/module/win007/proc/EuroTrackProcesser.go
+8
-6
foot-spider/module/win007/proc/LeagueProcesser.go
foot-spider/module/win007/proc/LeagueProcesser.go
+8
-5
foot-spider/module/win007/proc/LeagueSeasonProcesser.go
foot-spider/module/win007/proc/LeagueSeasonProcesser.go
+8
-6
foot-spider/module/win007/proc/MatchHisProcesser.go
foot-spider/module/win007/proc/MatchHisProcesser.go
+8
-6
未找到文件。
foot-spider/module/win007/proc/AsiaLastNewProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -44,13 +44,14 @@ func (this *AsiaLastNewProcesser) Setup(temp *AsiaLastNewProcesser) {
func
(
this
*
AsiaLastNewProcesser
)
Startup
()
{
var
processer
*
AsiaLastNewProcesser
var
newSpider
*
spider
.
Spider
for
i
,
v
:=
range
this
.
MatchLastList
{
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer
=
GetAsiaLastNewProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"AsiaLastNewProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"AsiaLastNewProcesser"
+
strconv
.
Itoa
(
i
))
temp_flag
:=
v
.
Ext
[
win007
.
MODULE_FLAG
]
bytes
,
_
:=
json
.
Marshal
(
temp_flag
)
...
...
@@ -62,10 +63,12 @@ func (this *AsiaLastNewProcesser) Startup() {
url
:=
strings
.
Replace
(
win007
.
WIN007_ASIAODD_NEW_URL_PATTERN
,
"${matchId}"
,
win007_id
,
1
)
newSpider
=
newSpider
.
AddUrl
(
url
,
"json"
)
newSpider
.
SetDownloader
(
down
.
NewMAsiaLastApiDownloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
newSpider
.
SetDownloader
(
down
.
NewMAsiaLastApiDownloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
}
...
...
foot-spider/module/win007/proc/BaseFaceProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -49,13 +49,14 @@ func (this *BaseFaceProcesser) Setup(temp *BaseFaceProcesser) {
func
(
this
*
BaseFaceProcesser
)
Startup
()
{
var
processer
*
BaseFaceProcesser
var
newSpider
*
spider
.
Spider
for
i
,
v
:=
range
this
.
MatchLastList
{
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer
=
GetBaseFaceProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"BaseFaceProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"BaseFaceProcesser"
+
strconv
.
Itoa
(
i
))
temp_flag
:=
v
.
Ext
[
win007
.
MODULE_FLAG
]
bytes
,
_
:=
json
.
Marshal
(
temp_flag
)
...
...
@@ -67,11 +68,13 @@ func (this *BaseFaceProcesser) Startup() {
url
:=
strings
.
Replace
(
win007
.
WIN007_BASE_FACE_URL_PATTERN
,
"${matchId}"
,
win007_id
,
1
)
newSpider
=
newSpider
.
AddUrl
(
url
,
"html"
)
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
...
...
foot-spider/module/win007/proc/EuroLastProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -50,13 +50,14 @@ func (this *EuroLastProcesser) Setup(temp *EuroLastProcesser) {
func
(
this
*
EuroLastProcesser
)
Startup
()
{
var
processer
*
EuroLastProcesser
var
newSpider
*
spider
.
Spider
for
i
,
v
:=
range
this
.
MatchLastList
{
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer
=
GetEuroLastProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"EuroLastProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"EuroLastProcesser"
+
strconv
.
Itoa
(
i
))
temp_flag
:=
v
.
Ext
[
win007
.
MODULE_FLAG
]
bytes
,
_
:=
json
.
Marshal
(
temp_flag
)
...
...
@@ -68,10 +69,12 @@ func (this *EuroLastProcesser) Startup() {
url
:=
strings
.
Replace
(
win007
.
WIN007_EUROODD_URL_PATTERN
,
"${matchId}"
,
win007_id
,
1
)
newSpider
=
newSpider
.
AddUrl
(
url
,
"html"
)
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
100
,
2000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
100
,
2000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
}
...
...
foot-spider/module/win007/proc/EuroTrackProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -49,13 +49,14 @@ func (this *EuroTrackProcesser) Setup(temp *EuroTrackProcesser) {
func
(
this
*
EuroTrackProcesser
)
Startup
()
{
var
processer
*
EuroTrackProcesser
var
newSpider
*
spider
.
Spider
for
i
,
v
:=
range
this
.
MatchLastList
{
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer
=
GetEuroTrackProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"EuroTrackProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"EuroTrackProcesser"
+
strconv
.
Itoa
(
i
))
temp_flag
:=
v
.
Ext
[
win007
.
MODULE_FLAG
]
bytes
,
_
:=
json
.
Marshal
(
temp_flag
)
...
...
@@ -69,11 +70,12 @@ func (this *EuroTrackProcesser) Startup() {
url
:=
strings
.
Replace
(
base_url
,
"${cId}"
,
v
,
1
)
newSpider
=
newSpider
.
AddUrl
(
url
,
"html"
)
}
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10000
==
0
{
//10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
}
...
...
foot-spider/module/win007/proc/LeagueProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -46,6 +46,7 @@ func (this *LeagueProcesser) Startup() {
document
,
_
:=
GetDocument
(
sid_stat_url
)
var
processer
*
LeagueProcesser
var
newSpider
*
spider
.
Spider
document
.
Find
(
"a[href*='sid']"
)
.
Each
(
func
(
i
int
,
selection
*
goquery
.
Selection
)
{
sUrl
,
_
:=
selection
.
Attr
(
"href"
)
sId
:=
strings
.
Split
(
sUrl
,
"sid="
)[
1
]
...
...
@@ -58,16 +59,18 @@ func (this *LeagueProcesser) Startup() {
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
processer
=
GetLeagueProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"LeagueProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"LeagueProcesser"
+
strconv
.
Itoa
(
i
))
processer
.
sUrl_Id
[
win007
.
WIN007_BASE_URL
+
sUrl
]
=
sId
processer
.
sUrl_Name
[
win007
.
WIN007_BASE_URL
+
sUrl
]
=
sName
newSpider
=
newSpider
.
AddUrl
(
win007
.
WIN007_BASE_URL
+
sUrl
,
"html"
)
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
})
}
...
...
foot-spider/module/win007/proc/LeagueSeasonProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -49,6 +49,7 @@ func (this *LeagueSeasonProcesser) Startup() {
this
.
LeagueService
.
FindAll
(
&
leaguesList
)
//2.配置要抓取的路径
var
processer
*
LeagueSeasonProcesser
var
newSpider
*
spider
.
Spider
//index := 0
for
i
,
v
:=
range
leaguesList
{
//先不处理杯赛....
...
...
@@ -62,8 +63,8 @@ func (this *LeagueSeasonProcesser) Startup() {
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
processer
=
GetLeagueSeasonProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"LeagueSeasonProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"LeagueSeasonProcesser"
+
strconv
.
Itoa
(
i
))
url
:=
win007
.
WIN007_MATCH_HIS_PATTERN
if
v
.
SeasonCross
{
...
...
@@ -77,11 +78,12 @@ func (this *LeagueSeasonProcesser) Startup() {
processer
.
sUrl_leagueId
[
url
]
=
v
.
Id
newSpider
=
newSpider
.
AddUrl
(
url
,
"html"
)
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
}
...
...
foot-spider/module/win007/proc/MatchHisProcesser.go
浏览文件 @
e9d489ce
...
...
@@ -61,13 +61,14 @@ func (this *MatchHisProcesser) Startup() {
seasonList
:=
this
.
LeagueSeasonService
.
FindBySeason
(
this
.
Season
)
//2.配置要抓取的路径
var
processer
*
MatchHisProcesser
var
newSpider
*
spider
.
Spider
for
i
,
v
:=
range
seasonList
{
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
processer
=
GetMatchHisProcesser
()
processer
.
Setup
(
this
)
newSpider
=
spider
.
NewSpider
(
processer
,
"MatchHisProcesser"
+
strconv
.
Itoa
(
i
))
}
newSpider
:=
spider
.
NewSpider
(
processer
,
"MatchHisProcesser"
+
strconv
.
Itoa
(
i
))
url
:=
win007
.
WIN007_MATCH_HIS_PATTERN
url
=
strings
.
Replace
(
url
,
"${season}"
,
v
.
Season
,
1
)
...
...
@@ -81,11 +82,12 @@ func (this *MatchHisProcesser) Startup() {
processer
.
SUrl_Season
[
round_url
]
=
v
newSpider
=
newSpider
.
AddUrl
(
round_url
,
"html"
)
}
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
if
i
%
10
==
0
{
//10个联赛一个spider,总数1000多个联赛,最多100spider
newSpider
.
SetDownloader
(
down
.
NewMWin007Downloader
())
newSpider
=
newSpider
.
AddPipeline
(
pipeline
.
NewPipelineConsole
())
newSpider
.
SetSleepTime
(
"rand"
,
1000
,
20000
)
newSpider
.
SetThreadnum
(
1
)
.
Run
()
}
}
}
...
...
编辑
预览
Markdown
is supported
0%
请重试
或
添加新附件
.
添加附件
取消
You are about to add
0
people
to the discussion. Proceed with caution.
先完成此消息的编辑!
取消
想要评论请
注册
或
登录