提交 ce283903 编写于 作者: H hjdhnx

自动获取爬虫列表

上级 0ae5ff3e
......@@ -5,7 +5,7 @@
# Date : 2022/8/25
from flask import Flask, jsonify, abort,request,redirect,make_response,render_template
from js.rules import rule_list
from js.rules import getRules
from utils import error,parser
import sys
import codecs
......@@ -15,6 +15,8 @@ sys.stdout = codecs.getwriter("utf-8")(sys.stdout.detach())
# Create the Flask application object for this module.
app = Flask(__name__)
app.config["JSON_AS_ASCII"] = False # let jsonify return Chinese (non-ASCII) text in readable form
from utils.web import *
# Build the rule list once, when this module is loaded, and echo it to stdout.
rule_list = getRules()
print(rule_list)
def getParmas(key=None):
"""
......
......@@ -4,6 +4,17 @@
# Author: DaShenHan&道长-----先苦后甜,任凭晚风拂柳颜------
# Date : 2022/8/25
# Static list of rule names; currently holds a single entry.
rule_list = ['鸭奈飞']
import os
def getRules(base_path=None):
    """Return the names of the ``.js`` rule files found in a directory.

    Args:
        base_path: Directory to scan. When omitted, the directory that
            contains this module is used.

    Returns:
        A sorted list of file names with the trailing ``.js`` removed.

    Raises:
        OSError: If the directory cannot be listed.
    """
    if base_path is None:
        # Resolve relative to this file so the result does not depend on
        # the process's current working directory.
        base_path = os.path.dirname(os.path.abspath(__file__))
    suffix = '.js'
    # Slice the suffix off the end instead of using str.replace(), which
    # would also delete any '.js' occurring earlier in the name
    # (e.g. 'my.json.js' would become 'myon').
    # sorted() gives a deterministic order; os.listdir() order is arbitrary.
    return sorted(
        name[:-len(suffix)]
        for name in os.listdir(base_path)
        if str(name).endswith(suffix)
    )
if __name__ == '__main__':
    # Running this module directly prints the rule names that getRules() finds.
    print(getRules())
\ No newline at end of file
// Rule definition object for the site titled '蓝莓影视'.
// NOTE(review): the code that consumes this object is not visible here; the
// field notes below are read off the values and should be confirmed against
// the rule parser.
var rule = {
title:'蓝莓影视',
// URL template containing the 'fyclass' and 'fypage' placeholders
// (presumably category id and page number — TODO confirm).
url:'https://lanmeiguojiang.com/show/fyclass--------fypage---.html',
// Search path template containing '**' and 'fypage'
// (presumably the search keyword and page number — TODO confirm).
searchUrl:'/vodsearch/**----------fypage---.html',
ua:'MOBILE_UA',
// class_name and class_url each hold six '&'-separated entries; they appear
// to pair up positionally (label -> id) — verify against the consumer.
class_name:'电影&网剧&剧集&动漫&综艺&记录',
class_url:'20&1&2&3&4&23',
// '一级' ("level one"): ';'-separated selector expressions.
一级:'body a.module-poster-item.module-item;a&&title;.lazyload&&data-original;.module-item-note&&Text;a&&href',
// '二级' ("level two"): selector expressions keyed by title, img, desc, content, tabs and lists.
二级:{"title":"h1&&Text;.module-info-tag&&Text","img":".lazyload&&data-original","desc":".module-info-item:eq(1)&&Text;.module-info-item:eq(2)&&Text;.module-info-item:eq(3)&&Text","content":".module-info-introduction&&Text","tabs":".module-tab-item","lists":".module-play-list:eq(#id) a"},
// '搜索' ("search"): ';'-separated selector expressions.
搜索:'body .module-item;.module-card-item-title&&Text;.lazyload&&data-original;.module-item-note&&Text;a&&href;.module-info-item-content&&Text',
}
\ No newline at end of file
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册