__main__.py 15.5 KB
Newer Older
H
Hsury 已提交
1 2 3 4 5 6 7 8
#!/usr/bin/env python3.7
# -*- coding: utf-8 -*-

import argparse
import hashlib
import json
import math
import os
H
Hsury 已提交
9
import re
H
Hsury 已提交
10
import requests
H
Hsury 已提交
11
import shlex
H
Hsury 已提交
12
import signal
H
Hsury 已提交
13
import struct
H
Hsury 已提交
14
import sys
H
Hsury 已提交
15
import threading
H
Hsury 已提交
16
import time
H
Hsury 已提交
17
import traceback
H
Hsury 已提交
18
import types
W
wizardforcel 已提交
19 20 21
from BiliDriveEx import __version__
from BiliDriveEx.bilibili import Bilibili
from BiliDriveEx.encoder import Encoder
W
wizardforcel 已提交
22
from BiliDriveEx.util import *
H
Hsury 已提交
23

W
wizardforcel 已提交
24
# Module-wide Encoder instance: the handlers below call encode() on payloads
# before image_upload() and decode() on data returned by image_download().
encoder = Encoder()
H
Hsury 已提交
25

W
wizardforcel 已提交
26 27
def default_url(sha1):
    """Return the album image URL for the given SHA-1 hex digest."""
    return f"http://i0.hdslb.com/bfs/album/{sha1}.png"


def meta_string(url):
    """Return the short ``bdex://<sha1>`` form of an album image URL.

    Only URLs of the exact shape
    ``http(s)://i0.hdslb.com/bfs/album/<40 hex chars>.png`` are shortened;
    any other string is returned unchanged.
    """
    # Dots are escaped so that look-alike hosts or suffixes (for example
    # "i0xhdslb.com" or "<hash>xpng") are not mistaken for an album URL.
    match = re.match(
        r"^https?://i0\.hdslb\.com/bfs/album/([a-fA-F0-9]{40})\.png$", url
    )
    return "bdex://" + match.group(1) if match else url
H
Hsury 已提交
28

W
wizardforcel 已提交
29 30 31 32 33 34 35 36 37
def fetch_meta(s):
    """Download and decode the metadata that a meta string points to.

    Accepted forms of ``s``:

    * ``bdex://<40 hex chars>`` - fetched from ``default_url(<hash>)``.
    * ``bdrive://<40 hex chars>`` - the same URL with ``png`` replaced by
      ``x-ms-bmp``.
    * any string starting with ``http://`` or ``https://`` - fetched as-is.

    Returns:
        The value parsed from the decoded JSON payload, or ``None`` when ``s``
        has none of the accepted forms or when decoding/parsing fails.
    """
    bdex = re.match(r"^bdex://([a-fA-F0-9]{40})$", s)
    bdrive = re.match(r"^bdrive://([a-fA-F0-9]{40})$", s)
    if bdex:
        full_meta = image_download(default_url(bdex.group(1)))
    elif bdrive:
        full_meta = image_download(
            default_url(bdrive.group(1)).replace('png', 'x-ms-bmp')
        )
    elif s.startswith(("http://", "https://")):
        full_meta = image_download(s)
    else:
        return None
    try:
        return json.loads(encoder.decode(full_meta).decode("utf-8"))
    except Exception:
        # Any decode/parse failure means "no usable metadata"; unlike a bare
        # except, KeyboardInterrupt and SystemExit still propagate.
        return None

H
Hsury 已提交
46
def image_upload(data, cookies):
    """POST ``data`` to the bilibili drawImage upload endpoint.

    Args:
        data: File content, sent as the ``file_up`` part under a
            millisecond-timestamp ``.png`` file name.
        cookies: Cookies sent with the request.

    Returns:
        The decoded JSON response, or ``None`` if the request or the JSON
        decoding raised an exception.
    """
    url = "https://api.vc.bilibili.com/api/v1/drawImage/upload"
    headers = {
        'Origin': "https://t.bilibili.com",
        'Referer': "https://t.bilibili.com/",
        'User-Agent': "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.79 Safari/537.36",
    }
    files = {
        'file_up': (f"{int(time.time() * 1000)}.png", data),
    }
    # Kept under its own name so the ``data`` payload parameter is not shadowed.
    form_fields = {
        'biz': "draw",
        'category': "daily",
    }
    try:
        return requests.post(
            url,
            data=form_fields,
            headers=headers,
            cookies=cookies,
            files=files,
            timeout=300,
        ).json()
    except Exception:
        # Best-effort: callers treat None as "try again". KeyboardInterrupt
        # and SystemExit are deliberately not swallowed.
        return None

H
Hsury 已提交
66 67 68 69
def login_handle(args):
    """Log in with ``args.username`` / ``args.password`` and save the cookies.

    On a successful login the user info is fetched and the session cookies are
    written as JSON to ``cookies.json`` inside ``bundle_dir``. Nothing is
    written when the login call returns a falsy value.
    """
    client = Bilibili()
    logged_in = client.login(username=args.username, password=args.password)
    if not logged_in:
        return
    client.get_user_info()
    cookie_path = os.path.join(bundle_dir, "cookies.json")
    with open(cookie_path, "w", encoding="utf-8") as cookie_file:
        serialized = json.dumps(client.get_cookies(), ensure_ascii=False, indent=2)
        cookie_file.write(serialized)

H
Hsury 已提交
73
def upload_handle(args):
    """Upload ``args.file`` block by block, then upload a metadata image.

    Reads ``args.file`` (path), ``args.block_size`` (block size in MB) and
    ``args.thread`` (maximum number of upload threads running at once).

    Returns:
        The URL of the uploaded metadata image, or the URL already recorded
        in the history for this file. ``None`` if the file does not exist, is
        a directory, the cookies cannot be loaded, or an upload finally fails.
    """

    def core(index, block):
        """Worker: encode one block and upload it, retrying up to 10 times."""
        try:
            block_sha1 = calc_sha1(block)
            full_block = encoder.encode(block)
            full_block_sha1 = calc_sha1(full_block)
            url = is_skippable(full_block_sha1)
            if url:
                # The encoded block is already reachable on the server.
                log(f"分块{index + 1}/{block_num}上传完毕")
                block_dict[index] = {
                    'url': url,
                    'size': len(block),
                    'sha1': block_sha1,
                }
                return
            # log(f"分块{index + 1}/{block_num}开始上传")
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                response = image_upload(full_block, cookies)
                if response:
                    if response['code'] == 0:
                        url = response['data']['image_url']
                        log(f"分块{index + 1}/{block_num}上传完毕")
                        block_dict[index] = {
                            'url': url,
                            'size': len(block),
                            'sha1': block_sha1,
                        }
                        return
                    elif response['code'] == -4:
                        # The log message asks the user to log in again, so
                        # every other worker is stopped as well.
                        terminate_flag.set()
                        log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败, 请重新登录")
                        return
                # "第" separates the block total from the attempt number;
                # without it "1/3" + "2次" printed as "1/32次".
                log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败")
            # All 10 attempts failed: abort the whole upload.
            terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always signal completion so the dispatcher can start the next block.
            done_flag.release()

    def is_skippable(sha1):
        """Return the default URL for ``sha1`` if a HEAD request gives 200, else None."""
        url = default_url(sha1)
        headers = {
            'Referer': "http://t.bilibili.com/",
            'User-Agent': "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/79.0.3945.79 Safari/537.36",
        }
        for _ in range(5):
            try:
                response = requests.head(url, headers=headers, timeout=10)
                return url if response.status_code == 200 else None
            except Exception:
                # Best-effort probe: retry, and fall back to uploading.
                continue
        return None

    def write_history(first_4mb_sha1, meta_dict, url):
        """Record ``meta_dict`` (plus its ``url``) in history.json under ``first_4mb_sha1``."""
        history = read_history()
        history[first_4mb_sha1] = meta_dict
        history[first_4mb_sha1]['url'] = url
        with open(os.path.join(bundle_dir, "history.json"), "w", encoding="utf-8") as f:
            f.write(json.dumps(history, ensure_ascii=False, indent=2))

    start_time = time.time()
    file_name = args.file
    if not os.path.exists(file_name):
        log(f"文件{file_name}不存在")
        return None
    if os.path.isdir(file_name):
        log("暂不支持上传文件夹")
        return None
    log(f"上传: {os.path.basename(file_name)} ({size_string(os.path.getsize(file_name))})")
    # NOTE(review): the history is keyed on the SHA-1 of the first 4 MB only,
    # so two files sharing that prefix are treated as the same upload.
    first_4mb_sha1 = calc_sha1(read_in_chunk(file_name, chunk_size=4 * 1024 * 1024, chunk_number=1))
    history = read_history()
    if first_4mb_sha1 in history:
        url = history[first_4mb_sha1]['url']
        log(f"文件已于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(history[first_4mb_sha1]['time']))}上传, 共有{len(history[first_4mb_sha1]['block'])}个分块")
        log(f"META URL -> {meta_string(url)}")
        return url
    try:
        with open(os.path.join(bundle_dir, "cookies.json"), "r", encoding="utf-8") as f:
            cookies = json.loads(f.read())
    except Exception:
        log("Cookies加载失败, 请先登录")
        return None
    log(f"线程数: {args.thread}")
    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    thread_pool = []
    block_dict = {}
    block_num = math.ceil(os.path.getsize(file_name) / (args.block_size * 1024 * 1024))
    for index, block in enumerate(read_in_chunk(file_name, chunk_size=args.block_size * 1024 * 1024)):
        # Once args.thread workers have been started, wait for one to finish
        # before starting another.
        if len(thread_pool) >= args.thread:
            done_flag.acquire()
        if not terminate_flag.is_set():
            thread_pool.append(threading.Thread(target=core, args=(index, block)))
            thread_pool[-1].start()
        else:
            log("已终止上传, 等待线程回收")
            break
    for thread in thread_pool:
        thread.join()
    if terminate_flag.is_set():
        return None
    sha1 = calc_sha1(read_in_chunk(file_name))
    meta_dict = {
        'time': int(time.time()),
        'filename': os.path.basename(file_name),
        'size': os.path.getsize(file_name),
        'sha1': sha1,
        'block': [block_dict[i] for i in range(len(block_dict))],
    }
    meta = json.dumps(meta_dict, ensure_ascii=False).encode("utf-8")
    full_meta = encoder.encode(meta)
    for attempt in range(10):
        response = image_upload(full_meta, cookies)
        if response and response['code'] == 0:
            url = response['data']['image_url']
            log("元数据上传完毕")
            log(f"{meta_dict['filename']} ({size_string(meta_dict['size'])}) 上传完毕, 用时{time.time() - start_time:.1f}秒, 平均速度{size_string(meta_dict['size'] / (time.time() - start_time))}/s")
            log(f"META URL -> {meta_string(url)}")
            write_history(first_4mb_sha1, meta_dict, url)
            return url
        log(f"元数据第{attempt + 1}次上传失败")
    return None
H
Hsury 已提交
200 201

def download_handle(args):
    """Download the file described by the metadata at ``args.meta``.

    Reads ``args.meta`` (meta string or URL), ``args.file`` (optional target
    name), ``args.force`` (overwrite without asking) and ``args.thread``
    (maximum number of download threads running at once).

    When no target name is given, the file name stored in the metadata is
    reduced to its base name, so downloaded metadata cannot direct the write
    outside the current directory.

    Returns:
        The target file name if the file is complete and its SHA-1 matches
        the metadata, otherwise ``None``.
    """

    def core(index, block_dict):
        """Worker: download, verify and write one block, retrying up to 10 times."""
        try:
            # log(f"分块{index + 1}/{len(meta_dict['block'])}开始下载")
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                block = image_download(block_dict['url'])
                if not block:
                    # "第" separates the block total from the attempt number;
                    # without it "1/3" + "2次" printed as "1/32次".
                    log(f"分块{index + 1}/{len(meta_dict['block'])}第{attempt + 1}次下载失败")
                    continue
                block = encoder.decode(block)
                if calc_sha1(block) != block_dict['sha1']:
                    log(f"分块{index + 1}/{len(meta_dict['block'])}校验未通过")
                    continue
                # "with" releases the lock even if seek/write raises, so a
                # failing worker cannot leave the others blocked forever.
                with file_lock:
                    f.seek(block_offset(index))
                    f.write(block)
                log(f"分块{index + 1}/{len(meta_dict['block'])}下载完毕")
                return
            # All 10 attempts failed: abort the whole download.
            terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always signal completion so the dispatcher can start the next block.
            done_flag.release()

    def block_offset(index):
        """Return the byte offset of block ``index`` (sum of preceding block sizes)."""
        return sum(meta_dict['block'][i]['size'] for i in range(index))

    def is_overwritable(file_name):
        """Return True if ``--force`` was given or the user answers y/Y."""
        if args.force:
            return True
        return input("文件已存在, 是否覆盖? [y/N] ") in ["y", "Y"]

    start_time = time.time()
    meta_dict = fetch_meta(args.meta)
    if not meta_dict:
        log("元数据解析失败")
        return None
    # The metadata comes from the network; never trust a path component in it.
    file_name = args.file if args.file else os.path.basename(meta_dict['filename'])
    log(f"下载: {os.path.basename(file_name)} ({size_string(meta_dict['size'])}), 共有{len(meta_dict['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta_dict['time']))}")
    log(f"线程数: {args.thread}")
    download_block_list = []
    if os.path.exists(file_name):
        if os.path.getsize(file_name) == meta_dict['size'] and calc_sha1(read_in_chunk(file_name)) == meta_dict['sha1']:
            log("文件已存在, 且与服务器端内容一致")
            return file_name
        elif is_overwritable(file_name):
            # Keep blocks of the existing file whose hash already matches and
            # download only the rest.
            with open(file_name, "rb") as f:
                for index, block_dict in enumerate(meta_dict['block']):
                    f.seek(block_offset(index))
                    if calc_sha1(f.read(block_dict['size'])) != block_dict['sha1']:
                        # log(f"分块{index + 1}/{len(meta_dict['block'])}校验未通过")
                        download_block_list.append(index)
            log(f"{len(download_block_list)}/{len(meta_dict['block'])}个分块待下载")
        else:
            return None
    else:
        download_block_list = list(range(len(meta_dict['block'])))
    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    file_lock = threading.Lock()
    thread_pool = []
    with open(file_name, "r+b" if os.path.exists(file_name) else "wb") as f:
        for index in download_block_list:
            # Once args.thread workers have been started, wait for one to
            # finish before starting another.
            if len(thread_pool) >= args.thread:
                done_flag.acquire()
            if not terminate_flag.is_set():
                thread_pool.append(threading.Thread(target=core, args=(index, meta_dict['block'][index])))
                thread_pool[-1].start()
            else:
                log("已终止下载, 等待线程回收")
                break
        for thread in thread_pool:
            thread.join()
        if terminate_flag.is_set():
            return None
        # Cut off any tail left over from a longer pre-existing file.
        f.truncate(sum(block['size'] for block in meta_dict['block']))
    log(f"{os.path.basename(file_name)} ({size_string(meta_dict['size'])}) 下载完毕, 用时{time.time() - start_time:.1f}秒, 平均速度{size_string(meta_dict['size'] / (time.time() - start_time))}/s")
    sha1 = calc_sha1(read_in_chunk(file_name))
    if sha1 == meta_dict['sha1']:
        log("文件校验通过")
        return file_name
    log("文件校验未通过")
    return None
H
Hsury 已提交
295

H
Hsury 已提交
296 297 298 299 300 301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319
def info_handle(args):
    """Print the fields of the metadata referenced by ``args.meta``.

    Prints file name, size, SHA-1, upload time and block count, followed by
    one line per block, or a failure message when the metadata cannot be
    fetched or parsed.
    """
    meta = fetch_meta(args.meta)
    if not meta:
        print("元数据解析失败")
        return
    print(f"文件名: {meta['filename']}")
    print(f"大小: {size_string(meta['size'])}")
    print(f"SHA-1: {meta['sha1']}")
    print(f"上传时间: {time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta['time']))}")
    print(f"分块数: {len(meta['block'])}")
    for number, entry in enumerate(meta['block'], start=1):
        print(f"分块{number} ({size_string(entry['size'])}) URL: {entry['url']}")

def history_handle(args):
    """Print every entry of the upload history, or a notice when it is empty.

    Each entry takes two lines: a numbered summary, then the META URL
    indented to line up under the summary text.
    """
    records = read_history()
    if not records:
        print("暂无历史记录")
        return
    for number, entry in enumerate(records.values(), start=1):
        tag = f"[{number}]"
        indent = " " * len(tag)
        print(f"{tag} {entry['filename']} ({size_string(entry['size'])}), 共有{len(entry['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(entry['time']))}")
        print(f"{indent} META URL -> {meta_string(entry['url'])}")

def main():
    """Command-line entry point.

    With a sub-command on the command line, run it once and return. Without
    one, print the help text and start an interactive ``BiliDriveEx >`` shell
    that also accepts ``help``, ``version`` and ``exit``.
    """
    # Ctrl+C kills the process outright (signal 9) instead of raising
    # KeyboardInterrupt in the main thread.
    signal.signal(signal.SIGINT, lambda signum, frame: os.kill(os.getpid(), 9))
    parser = argparse.ArgumentParser(prog="BiliDriveEx", description="Make Bilibili A Great Cloud Storage!", formatter_class=argparse.RawDescriptionHelpFormatter)
    parser.add_argument("-v", "--version", action="version", version=f"BiliDriveEx version: {__version__}")
    subparsers = parser.add_subparsers()
    login_parser = subparsers.add_parser("login", help="log in to bilibili")
    login_parser.add_argument("username", help="your bilibili username")
    login_parser.add_argument("password", help="your bilibili password")
    login_parser.set_defaults(func=login_handle)
    upload_parser = subparsers.add_parser("upload", help="upload a file")
    upload_parser.add_argument("file", help="name of the file to upload")
    upload_parser.add_argument("-b", "--block-size", default=4, type=int, help="block size in MB")
    upload_parser.add_argument("-t", "--thread", default=4, type=int, help="upload thread number")
    upload_parser.set_defaults(func=upload_handle)
    download_parser = subparsers.add_parser("download", help="download a file")
    download_parser.add_argument("meta", help="meta url")
    download_parser.add_argument("file", nargs="?", default="", help="new file name")
    download_parser.add_argument("-f", "--force", action="store_true", help="force to overwrite if file exists")
    download_parser.add_argument("-t", "--thread", default=8, type=int, help="download thread number")
    download_parser.set_defaults(func=download_handle)
    info_parser = subparsers.add_parser("info", help="show meta info")
    info_parser.add_argument("meta", help="meta url")
    info_parser.set_defaults(func=info_handle)
    history_parser = subparsers.add_parser("history", help="show upload history")
    history_parser.set_defaults(func=history_handle)

    args = parser.parse_args()
    # Test for the sub-command explicitly instead of catching AttributeError
    # around the call: an AttributeError raised inside a handler must not be
    # mistaken for "no sub-command given".
    if hasattr(args, "func"):
        args.func(args)
        return

    # No sub-command: switch to the interactive shell and add its commands.
    # "help" and "version" re-parse the matching flag, which makes argparse
    # print the text and raise SystemExit (handled in the loop below).
    subparsers.add_parser("help", help="show this help message").set_defaults(func=lambda _: parser.parse_args(["--help"]).func())
    subparsers.add_parser("version", help="show program's version number").set_defaults(func=lambda _: parser.parse_args(["--version"]).func())
    subparsers.add_parser("exit", help="exit program").set_defaults(func=lambda _: os._exit(0))
    parser.print_help()
    while True:
        try:
            line = input("BiliDriveEx > ")
        except EOFError:
            # End of input (e.g. Ctrl+D or a closed pipe): leave the shell.
            return
        try:
            shell_args = parser.parse_args(shlex.split(line))
            func = getattr(shell_args, "func", None)
            if func is not None:
                func(shell_args)
        except SystemExit:
            # argparse exits after printing help/version/usage errors; inside
            # the shell that just ends the current command.
            continue
        except Exception:
            # Show what went wrong (including shlex quoting errors) instead
            # of silently discarding it, then keep the shell alive.
            traceback.print_exc()

# Run the CLI only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()