__main__.py 13.7 KB
Newer Older
H
Hsury 已提交
1 2 3 4 5 6 7 8
#!/usr/bin/env python3.7
# -*- coding: utf-8 -*-

import argparse
import hashlib
import json
import math
import os
H
Hsury 已提交
9
import re
H
Hsury 已提交
10
import requests
H
Hsury 已提交
11
import shlex
H
Hsury 已提交
12
import signal
H
Hsury 已提交
13
import struct
H
Hsury 已提交
14
import sys
H
Hsury 已提交
15
import threading
H
Hsury 已提交
16
import time
H
Hsury 已提交
17
import traceback
H
Hsury 已提交
18
import types
W
wizardforcel 已提交
19 20 21
from BiliDriveEx import __version__
from BiliDriveEx.bilibili import Bilibili
from BiliDriveEx.encoder import Encoder
W
wizardforcel 已提交
22
from BiliDriveEx.util import *
H
Hsury 已提交
23

W
wizardforcel 已提交
24
# Module-wide Encoder instance; fetch_meta and the upload/download handlers
# call its encode()/decode() methods.
encoder = Encoder()
W
wizardforcel 已提交
25
# Module-wide Bilibili client shared by fetch_meta and the command handlers.
api = Bilibili()
H
Hsury 已提交
26

W
wizardforcel 已提交
27 28
def fetch_meta(s):
    """Download and decode the metadata record that *s* points to.

    Accepted forms of *s*:

    * ``bdex://<40 hex digits>``: the URL is obtained from
      ``api.default_url``.
    * ``bdrive://<40 hex digits>``: same, with ``png`` replaced by
      ``x-ms-bmp`` in the resulting URL.
    * ``http://`` or ``https://`` URL: downloaded as given.

    Returns the decoded JSON value (a metadata dict for well-formed
    uploads), or ``None`` when *s* matches none of the forms above, the
    download returns nothing, or the payload is not valid UTF-8 JSON.
    """
    match = re.match(r"^(bdex|bdrive)://([a-fA-F0-9]{40})$", s)
    if match:
        scheme, sha1 = match.groups()
        url = api.default_url(sha1)
        if scheme == "bdrive":
            url = url.replace('png', 'x-ms-bmp')
    elif s.startswith(("http://", "https://")):
        url = s
    else:
        return None

    full_meta = image_download(url)
    if not full_meta:
        # Download failed; there is nothing to decode.
        return None
    try:
        return json.loads(encoder.decode(full_meta).decode("utf-8"))
    except Exception:
        # Any decoding problem means "not a usable metadata image". Catching
        # Exception (not everything) lets KeyboardInterrupt/SystemExit through.
        return None
H
Hsury 已提交
43

H
Hsury 已提交
44

H
Hsury 已提交
45
def login_handle(args):
    """Log in with ``args.username`` / ``args.password`` and log the user info.

    This function logs nothing itself when ``api.login`` returns a falsy
    value.
    """
    logged_in = api.login(username=args.username, password=args.password)
    if not logged_in:
        return
    user_info = api.get_user_info()
    log(user_info if user_info else "用户信息获取失败")
W
wizardforcel 已提交
50

W
wizardforcel 已提交
51 52 53
def cookies_handle(args):
    """Pass ``args.cookies`` to the API client, then log the user info."""
    api.set_cookies(args.cookies)
    user_info = api.get_user_info()
    if not user_info:
        log("用户信息获取失败")
        return
    log(user_info)
H
Hsury 已提交
56

W
wizardforcel 已提交
57 58 59 60 61
def userinfo_handle(args):
    """Log the current user's info, or a not-logged-in notice if there is none."""
    message = api.get_user_info() or "用户未登录"
    log(message)

H
Hsury 已提交
62
def upload_handle(args):
    """Upload ``args.file`` block by block, then upload its metadata record.

    The file is read in chunks of ``args.block_size`` MiB. Each chunk is
    encoded with ``encoder`` and handed to a worker thread; once
    ``args.thread`` workers have been started, a new one is only started after
    an earlier one has finished. When every block is stored, a JSON record
    (time, filename, size, sha1, block list) is encoded and uploaded the same
    way, and the result is written to the local history.

    Returns the metadata image URL on success, or the URL recorded in the
    history when the SHA-1 of the first 4 MiB chunk is already present there.
    Returns ``None`` when the file is missing or a directory, the options are
    invalid, the user is not logged in, or the upload was aborted or failed.
    """
    def core(index, block):
        """Worker: store one block and record its entry in ``block_dict``."""
        try:
            block_sha1 = calc_sha1(block)
            full_block = encoder.encode(block)
            full_block_sha1 = calc_sha1(full_block)
            url = api.exist(full_block_sha1)
            if url:
                # The encoded block is already available; reuse its URL.
                log(f"分块{index + 1}/{block_num}上传完毕")
                block_dict[index] = {
                    'url': url,
                    'size': len(block),
                    'sha1': block_sha1,
                }
                return
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                response = api.image_upload(full_block)
                if response:
                    if response['code'] == 0:
                        url = response['data']['image_url']
                        log(f"分块{index + 1}/{block_num}上传完毕")
                        block_dict[index] = {
                            'url': url,
                            'size': len(block),
                            'sha1': block_sha1,
                        }
                        return
                    elif response['code'] == -4:
                        # Reported to the user as "please log in again";
                        # retrying cannot help, so abort the whole upload.
                        terminate_flag.set()
                        log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败, 请重新登录")
                        return
                log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败")
            else:
                # All ten attempts failed.
                terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always signal completion so the dispatcher can start another worker.
            done_flag.release()

    start_time = time.time()
    file_name = args.file
    if not os.path.exists(file_name):
        log(f"文件{file_name}不存在")
        return
    if os.path.isdir(file_name):
        log("暂不支持上传文件夹")
        return
    log(f"上传: {os.path.basename(file_name)} ({size_string(os.path.getsize(file_name))})")
    # NOTE(review): the history is keyed on the hash of the first 4 MiB chunk
    # only, so two files sharing that prefix look identical here - confirm
    # this is intended.
    first_4mb_sha1 = calc_sha1(read_in_chunk(file_name, size=4 * 1024 * 1024, cnt=1))
    history = read_history()
    if first_4mb_sha1 in history:
        url = history[first_4mb_sha1]['url']
        log(f"文件已于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(history[first_4mb_sha1]['time']))}上传, 共有{len(history[first_4mb_sha1]['block'])}个分块")
        log(f"META URL -> {api.meta_string(url)}")
        return url

    if not api.get_user_info():
        log("账号未登录,请先登录")
        return

    if args.block_size < 1 or args.thread < 1:
        # A thread count below 1 would block forever on done_flag.acquire()
        # and a block size of 0 would divide by zero below.
        log("分块大小和线程数必须为正整数")
        return

    log(f"线程数: {args.thread}")
    block_bytes = args.block_size * 1024 * 1024
    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    thread_pool = []
    block_dict = {}
    block_num = math.ceil(os.path.getsize(file_name) / block_bytes)
    for index, block in enumerate(read_in_chunk(file_name, size=block_bytes)):
        if len(thread_pool) >= args.thread:
            # Wait for one running worker to finish before starting another.
            done_flag.acquire()
        if not terminate_flag.is_set():
            thread_pool.append(threading.Thread(target=core, args=(index, block)))
            thread_pool[-1].start()
        else:
            log("已终止上传, 等待线程回收")
            break
    for thread in thread_pool:
        thread.join()
    if terminate_flag.is_set():
        return

    sha1 = calc_sha1(read_in_chunk(file_name))
    meta_dict = {
        'time': int(time.time()),
        'filename': os.path.basename(file_name),
        'size': os.path.getsize(file_name),
        'sha1': sha1,
        'block': [block_dict[i] for i in range(len(block_dict))],
    }
    meta = json.dumps(meta_dict, ensure_ascii=False).encode("utf-8")
    full_meta = encoder.encode(meta)
    for attempt in range(10):
        response = api.image_upload(full_meta)
        if response and response['code'] == 0:
            url = response['data']['image_url']
            elapsed = time.time() - start_time
            log("元数据上传完毕")
            log(f"{meta_dict['filename']} ({size_string(meta_dict['size'])}) 上传完毕, 用时{elapsed:.1f}秒, 平均速度{size_string(meta_dict['size'] / elapsed)}/s")
            log(f"META URL -> {api.meta_string(url)}")
            write_history(first_4mb_sha1, meta_dict, url)
            return url
        log(f"元数据第{attempt + 1}次上传失败")
    return None
H
Hsury 已提交
167 168

def download_handle(args):
    """Download the file described by the metadata at ``args.meta``.

    The metadata is fetched with ``fetch_meta``. The output path is
    ``args.file`` when given, otherwise the base name of the ``filename``
    stored in the metadata. If the target already exists and matches the
    recorded size and SHA-1, nothing is downloaded. If it exists but differs,
    the user is asked for confirmation (skipped with ``args.force``) and only
    the blocks whose SHA-1 does not match are fetched again. Blocks are
    downloaded by worker threads and written at their offset in the file.

    Returns the output file name when the final SHA-1 check passes (or the
    file was already up to date), otherwise ``None``.
    """
    def core(index, block_dict):
        """Worker: fetch, verify and write one block (up to ten attempts)."""
        try:
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                block = image_download(block_dict['url'])
                if block:
                    block = encoder.decode(block)
                    if calc_sha1(block) == block_dict['sha1']:
                        # "with" releases the lock even if seek/write raises;
                        # a lock left held would hang every other worker.
                        with file_lock:
                            f.seek(block_offset(index))
                            f.write(block)
                        log(f"分块{index + 1}/{len(meta_dict['block'])}下载完毕")
                        return
                    else:
                        log(f"分块{index + 1}/{len(meta_dict['block'])}校验未通过")
                else:
                    log(f"分块{index + 1}/{len(meta_dict['block'])}第{attempt + 1}次下载失败")
            else:
                # All ten attempts failed.
                terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always signal completion so the dispatcher can start another worker.
            done_flag.release()

    def block_offset(index):
        """Return the byte offset of block *index* inside the output file."""
        return block_offsets[index]

    def is_overwritable(file_name):
        """Return True if the existing file may be overwritten."""
        if args.force:
            return True
        return input("文件已存在, 是否覆盖? [y/N] ") in ["y", "Y"]

    start_time = time.time()
    meta_dict = fetch_meta(args.meta)
    if not meta_dict:
        log("元数据解析失败")
        return
    # The stored filename comes from downloaded data: keep only its base name
    # so it cannot point outside the current directory.
    file_name = args.file if args.file else os.path.basename(meta_dict['filename'])
    log(f"下载: {os.path.basename(file_name)} ({size_string(meta_dict['size'])}), 共有{len(meta_dict['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta_dict['time']))}")

    if args.thread < 1:
        # A thread count below 1 would block forever on done_flag.acquire().
        log("线程数必须为正整数")
        return
    log(f"线程数: {args.thread}")

    # Compute every block's offset once instead of re-summing sizes per call.
    block_offsets = []
    total_size = 0
    for block_info in meta_dict['block']:
        block_offsets.append(total_size)
        total_size += block_info['size']

    download_block_list = []
    if os.path.exists(file_name):
        if os.path.getsize(file_name) == meta_dict['size'] and calc_sha1(read_in_chunk(file_name)) == meta_dict['sha1']:
            log("文件已存在, 且与服务器端内容一致")
            return file_name
        elif is_overwritable(file_name):
            # Keep the blocks that are already correct; re-fetch the others.
            with open(file_name, "rb") as f:
                for index, block_dict in enumerate(meta_dict['block']):
                    f.seek(block_offset(index))
                    if calc_sha1(f.read(block_dict['size'])) != block_dict['sha1']:
                        download_block_list.append(index)
            log(f"{len(download_block_list)}/{len(meta_dict['block'])}个分块待下载")
        else:
            return
    else:
        download_block_list = list(range(len(meta_dict['block'])))

    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    file_lock = threading.Lock()
    thread_pool = []
    with open(file_name, "r+b" if os.path.exists(file_name) else "wb") as f:
        for index in download_block_list:
            if len(thread_pool) >= args.thread:
                # Wait for one running worker to finish before starting another.
                done_flag.acquire()
            if not terminate_flag.is_set():
                thread_pool.append(threading.Thread(target=core, args=(index, meta_dict['block'][index])))
                thread_pool[-1].start()
            else:
                log("已终止下载, 等待线程回收")
                break
        for thread in thread_pool:
            thread.join()
        if terminate_flag.is_set():
            return
        # Drop any trailing bytes left over from a longer pre-existing file.
        f.truncate(total_size)

    elapsed = time.time() - start_time
    log(f"{os.path.basename(file_name)} ({size_string(meta_dict['size'])}) 下载完毕, 用时{elapsed:.1f}秒, 平均速度{size_string(meta_dict['size'] / elapsed)}/s")
    sha1 = calc_sha1(read_in_chunk(file_name))
    if sha1 == meta_dict['sha1']:
        log("文件校验通过")
        return file_name
    log("文件校验未通过")
    return None
H
Hsury 已提交
262

H
Hsury 已提交
263 264 265
def info_handle(args):
    """Fetch the metadata referenced by ``args.meta`` and print it."""
    meta_dict = fetch_meta(args.meta)
    if not meta_dict:
        print("元数据解析失败")
        return
    print_meta(meta_dict)

def history_handle(args):
    """Print every entry of the local upload history, numbered from 1."""
    history = read_history()
    if not history:
        print("暂无历史记录")
        return
    for number, entry in enumerate(history.values(), start=1):
        tag = f"[{number}]"
        print(f"{tag} {entry['filename']} ({size_string(entry['size'])}), 共有{len(entry['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(entry['time']))}")
        # Indent the second line so it lines up under the entry text.
        print(f"{' ' * len(tag)} META URL -> {api.meta_string(entry['url'])}")

def main():
    """Command-line entry point.

    With a subcommand on the command line, run its handler once and return.
    Without one, print the help text and start an interactive
    ``BiliDriveEx >`` shell that parses each input line with the same parser,
    extended by the shell-only commands ``help``, ``version`` and ``exit``.
    """
    # Ctrl-C kills the process outright, so worker threads cannot keep it alive.
    signal.signal(signal.SIGINT, lambda signum, frame: os.kill(os.getpid(), 9))
    parser = argparse.ArgumentParser(prog="BiliDriveEx", description="Make Bilibili A Great Cloud Storage!", formatter_class=argparse.RawDescriptionHelpFormatter)
    parser.add_argument("-v", "--version", action="version", version=f"BiliDriveEx version: {__version__}")
    subparsers = parser.add_subparsers()

    login_parser = subparsers.add_parser("login", help="log in to bilibili")
    login_parser.add_argument("username", help="your bilibili username")
    login_parser.add_argument("password", help="your bilibili password")
    login_parser.set_defaults(func=login_handle)

    cookies_parser = subparsers.add_parser("cookies", help="set cookies to bilibili")
    cookies_parser.add_argument("cookies", help="your bilibili cookies")
    cookies_parser.set_defaults(func=cookies_handle)

    userinfo_parser = subparsers.add_parser("userinfo", help="get userinfo")
    userinfo_parser.set_defaults(func=userinfo_handle)

    upload_parser = subparsers.add_parser("upload", help="upload a file")
    upload_parser.add_argument("file", help="name of the file to upload")
    upload_parser.add_argument("-b", "--block-size", default=4, type=int, help="block size in MB")
    upload_parser.add_argument("-t", "--thread", default=4, type=int, help="upload thread number")
    upload_parser.set_defaults(func=upload_handle)

    download_parser = subparsers.add_parser("download", help="download a file")
    download_parser.add_argument("meta", help="meta url")
    download_parser.add_argument("file", nargs="?", default="", help="new file name")
    download_parser.add_argument("-f", "--force", action="store_true", help="force to overwrite if file exists")
    download_parser.add_argument("-t", "--thread", default=8, type=int, help="download thread number")
    download_parser.set_defaults(func=download_handle)

    info_parser = subparsers.add_parser("info", help="show meta info")
    info_parser.add_argument("meta", help="meta url")
    info_parser.set_defaults(func=info_handle)

    history_parser = subparsers.add_parser("history", help="show upload history")
    history_parser.set_defaults(func=history_handle)

    args = parser.parse_args()
    handler = getattr(args, "func", None)
    if handler is not None:
        # One-shot mode. Checking for "func" explicitly (instead of catching
        # AttributeError) keeps an AttributeError raised inside a handler from
        # being mistaken for "no subcommand given".
        handler(args)
        return

    # No subcommand: fall into the interactive shell.
    subparsers.add_parser("help", help="show this help message").set_defaults(func=lambda _: parser.print_help())
    # The version action prints and then raises SystemExit, caught below.
    subparsers.add_parser("version", help="show program's version number").set_defaults(func=lambda _: parser.parse_args(["--version"]))
    subparsers.add_parser("exit", help="exit program").set_defaults(func=lambda _: os._exit(0))
    parser.print_help()
    while True:
        try:
            line = input("BiliDriveEx > ")
        except EOFError:
            # End of input (Ctrl-D or a closed pipe): leave the shell quietly.
            return
        try:
            args = parser.parse_args(shlex.split(line))
        except SystemExit:
            # argparse already printed its usage/error message; keep the shell alive.
            continue
        except ValueError as ex:
            # shlex.split rejects malformed input such as unbalanced quotes.
            print(ex)
            continue
        handler = getattr(args, "func", None)
        if handler is None:
            # Empty line or options only: nothing to run.
            continue
        try:
            handler(args)
        except SystemExit:
            pass
        except Exception:
            # Report the failure instead of hiding it, then keep the shell running.
            traceback.print_exc()

# Run the command-line interface only when this file is executed directly,
# not when it is imported.
if __name__ == "__main__":
    main()