提交 0f5187b1 编写于 作者: S shi.zeyuan

1.xx

上级 51600121
......@@ -2,6 +2,7 @@ package main
import (
"fmt"
"tesou.io/platform/foot-parent/foot-spider/launch"
"time"
)
......@@ -17,7 +18,8 @@ func main() {
fmt.Println(parse2)
//launch.Spider_match_his("2019")
//launch.Spider_History()
//launch.Spider_leagueSeason()
launch.Spider_match(0)
launch.Spider_baseFace(false)
fmt.Println(SingleThread)
......
......@@ -44,17 +44,15 @@ func (this *AsiaLastNewProcesser) Setup(temp *AsiaLastNewProcesser) {
func (this *AsiaLastNewProcesser) Startup() {
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "AsiaLastNewProcesser")
for i, v := range this.MatchLastList {
if !this.SingleThread && i%10000 == 0 { //10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer = GetAsiaLastNewProcesser()
processer.Setup(this)
newSpider = spider.NewSpider(processer, "AsiaLastNewProcesser"+strconv.Itoa(i))
}else{
processer = this
newSpider = spider.NewSpider(processer, "AsiaLastNewProcesser"+strconv.Itoa(i))
}
temp_flag := v.Ext[win007.MODULE_FLAG]
......
......@@ -49,17 +49,15 @@ func (this *BaseFaceProcesser) Setup(temp *BaseFaceProcesser) {
func (this *BaseFaceProcesser) Startup() {
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "BaseFaceProcesser")
for i, v := range this.MatchLastList {
if !this.SingleThread && i%10000 == 0 { //10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer = GetBaseFaceProcesser()
processer.Setup(this)
newSpider = spider.NewSpider(processer, "BaseFaceProcesser"+strconv.Itoa(i))
}else{
processer = this
newSpider = spider.NewSpider(processer, "BaseFaceProcesser"+strconv.Itoa(i))
}
temp_flag := v.Ext[win007.MODULE_FLAG]
......
......@@ -51,17 +51,15 @@ func (this *EuroLastProcesser) Setup(temp *EuroLastProcesser) {
func (this *EuroLastProcesser) Startup() {
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "EuroLastProcesser")
for i, v := range this.MatchLastList {
if !this.SingleThread && i%10000 == 0 { //10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer = GetEuroLastProcesser()
processer.Setup(this)
newSpider = spider.NewSpider(processer, "EuroLastProcesser"+strconv.Itoa(i))
}else{
processer = this
newSpider = spider.NewSpider(processer, "EuroLastProcesser"+strconv.Itoa(i))
}
temp_flag := v.Ext[win007.MODULE_FLAG]
......
......@@ -50,17 +50,15 @@ func (this *EuroTrackProcesser) Setup(temp *EuroTrackProcesser) {
func (this *EuroTrackProcesser) Startup() {
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "EuroTrackProcesser")
for i, v := range this.MatchLastList {
if !this.SingleThread &&i%10000 == 0 { //10000个比赛一个spider,一个赛季大概有30万场比赛,最多30spider
processer = GetEuroTrackProcesser()
processer.Setup(this)
newSpider = spider.NewSpider(processer, "EuroTrackProcesser"+strconv.Itoa(i))
}else{
processer = this
newSpider = spider.NewSpider(processer, "EuroTrackProcesser"+strconv.Itoa(i))
}
temp_flag := v.Ext[win007.MODULE_FLAG]
......
......@@ -49,8 +49,9 @@ func (this *LeagueSeasonProcesser) Startup() {
leaguesList := make([]*pojo.League, 0)
this.LeagueService.FindAll(&leaguesList)
//2.配置要抓取的路径
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "LeagueSeasonProcesser")
//index := 0
for i, v := range leaguesList {
//先不处理杯赛....
......
......@@ -61,8 +61,9 @@ func (this *MatchHisProcesser) Startup() {
//1.获取所有的联赛赛季信息
seasonList := this.LeagueSeasonService.FindBySeason(this.Season)
//2.配置要抓取的路径
processer := this
var newSpider *spider.Spider
processer := this
newSpider = spider.NewSpider(processer, "MatchHisProcesser")
for i, v := range seasonList {
if i%10 == 0 { //10个联赛一个spider,总数1000多个联赛,最多100spider
......
......@@ -36,16 +36,19 @@ type MatchLastProcesser struct {
}
// GetMatchLastProcesser allocates a new MatchLastProcesser, calls Init on it,
// and returns the pointer.
//
// The former leading `return &MatchLastProcesser{}` has been removed: it made
// the Init call unreachable, so callers received a processer on which Init
// had never run.
func GetMatchLastProcesser() *MatchLastProcesser {
	processer := &MatchLastProcesser{}
	// Run Init before handing the processer out so callers never see the
	// zero-value struct.
	processer.Init()
	return processer
}
func (this *MatchLastProcesser) Startup() {
//联赛数据
// Init sets the processer's working collections to fresh, empty (non-nil)
// values: the league list, the win007Id_leagueId_map lookup, and the match
// list.
func (this *MatchLastProcesser) Init() {
	// League data: empty league slice plus an empty string-to-string map.
	this.league_list = []*entity2.League{}
	this.win007Id_leagueId_map = map[string]string{}

	// Match data: empty match slice.
	this.matchLast_list = []*pojo.MatchLast{}
}
func (this *MatchLastProcesser) Startup() {
if this.MatchlastUrl == "" {
this.MatchlastUrl = "http://m.win007.com/phone/Schedule_0_0.txt"
}
......@@ -54,7 +57,7 @@ func (this *MatchLastProcesser) Startup() {
newSpider = newSpider.AddUrl(this.MatchlastUrl, "text")
newSpider.SetDownloader(down.NewMWin007Downloader())
newSpider = newSpider.AddPipeline(pipeline.NewPipelineConsole())
newSpider.SetSleepTime("rand",100,2000)
newSpider.SetSleepTime("rand", 100, 2000)
newSpider.SetThreadnum(1).Run()
}
......@@ -73,7 +76,7 @@ func (this *MatchLastProcesser) Process(p *page.Page) {
rawText_arr := strings.Split(rawText, "$$")
if len(rawText_arr) < 2 {
base.Log.Error("rawText:解析失败,rawTextArr长度小于所必需要的长度2,url:",request.Url,"内容:", rawText_arr)
base.Log.Error("rawText:解析失败,rawTextArr长度小于所必需要的长度2,url:", request.Url, "内容:", rawText_arr)
return
}
......@@ -88,9 +91,9 @@ func (this *MatchLastProcesser) Process(p *page.Page) {
match_str = rawText_arr[2]
}
base.Log.Info("日期:TODAY","联赛信息:", league_str)
base.Log.Info("日期:TODAY", "联赛信息:", league_str)
this.league_process(league_str)
base.Log.Info("日期:TODAY","比赛信息:", match_str)
base.Log.Info("日期:TODAY", "比赛信息:", match_str)
this.match_process(match_str)
now := time.Now()
......@@ -124,16 +127,16 @@ func (this *MatchLastProcesser) futrueMatch(date string) {
rawText_arr := strings.Split(rawText, "$")
if len(rawText_arr) < 2 {
base.Log.Error("rawText:解析失败,rawTextArr长度小于所必需要的长度2,url:",url,"内容:", rawText_arr)
base.Log.Error("rawText:解析失败,rawTextArr长度小于所必需要的长度2,url:", url, "内容:", rawText_arr)
return
}
league_str := rawText_arr[0]
match_str := rawText_arr[1]
base.Log.Info("日期:",date,"联赛信息:", league_str)
base.Log.Info("日期:", date, "联赛信息:", league_str)
this.league_process(league_str)
base.Log.Info("日期:",date,"比赛信息:", match_str)
base.Log.Info("日期:", date, "比赛信息:", match_str)
this.match_process(match_str)
}
......@@ -146,8 +149,6 @@ func (this *MatchLastProcesser) findParamVal(url string) string {
func (this *MatchLastProcesser) league_process(rawText string) {
league_arr := strings.Split(rawText, "!")
this.league_list = make([]*entity2.League, len(league_arr))
var index int
for _, v := range league_arr {
league_info_arr := strings.Split(v, "^")
if len(league_info_arr) < 3 {
......@@ -183,8 +184,8 @@ func (this *MatchLastProcesser) league_process(rawText string) {
i++
league.SName = league_info_arr[i]
this.league_list[index] = league
index++
//最后加入数据中
this.league_list = append(this.league_list, league)
}
}
......@@ -264,7 +265,7 @@ func (this *MatchLastProcesser) Finish() {
base.Log.Info(string(bytes))*/
exists := this.LeagueService.ExistById(v.Id)
if exists {
league_modify_list_slice = append(league_modify_list_slice,v)
league_modify_list_slice = append(league_modify_list_slice, v)
continue
}
league_list_slice = append(league_list_slice, v)
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册