// Site rule object for the '养端' source.
// Selector strings chain steps with '&&' and separate fields with ';'.
var rule = {
    title:'养端',
    host:'https://aaq48.com:33666',
    homeUrl:'/home/index.html',
    // 'fyclass' and 'fypage' look like placeholders substituted by the rule
    // engine (category id / page number) -- TODO confirm against the loader.
    url:'/home/vodlist/38/fyclass-fypage.html',
    headers:{
        'User-Agent':'MOBILE_UA'
    },
    timeout:5000, // presumably milliseconds -- confirm against the loader
    // Four ';'-separated fields. The first field had been corrupted by an
    // HTML-entity decode ('&dd;' became the single character U+2146), which
    // also swallowed the ';' separator; the literal '&&dd;' is restored here.
    class_parse:'.menu&&dl&&dd;a&&Text;a&&href;.*/(.*?)-',
    limit:5,
    play_parse:true,
    lazy:'',
    一级:'.channel-list&&dl;h3&&Text;img&&data-original;font&&Text;a&&href',
    二级:'*',
}
def getHeaders(url):
    """Return a fresh dict of default request headers.

    The result always carries ``User-Agent`` (the module-level ``PC_UA``),
    ``Accept`` and ``Accept-Language``.  When *url* is truthy it is also
    used as the ``Referer`` value; otherwise no ``Referer`` key is present.

    :param url: value to send as ``Referer``; falsy values omit the header.
    :return: a new ``dict`` each call, safe for the caller to mutate.
    """
    common = {
        "User-Agent": PC_UA,
        "Accept": "text/html,application/xhtml+xml,application/xml;q=0.9,image/avif,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9",
        "Accept-Language": "zh-CN,zh;q=0.8,zh-TW;q=0.7,zh-HK;q=0.5,en-US;q=0.3,en;q=0.2",
    }
    if not url:
        return common
    # Referer is placed first so key insertion order is unchanged.
    return {"Referer": url, **common}