__main__.py 14.0 KB
Newer Older
H
Hsury 已提交
1 2 3 4 5 6 7 8
#!/usr/bin/env python3.7
# -*- coding: utf-8 -*-

import argparse
import hashlib
import json
import math
import os
H
Hsury 已提交
9
import re
H
Hsury 已提交
10
import requests
H
Hsury 已提交
11
import shlex
H
Hsury 已提交
12
import signal
H
Hsury 已提交
13
import struct
H
Hsury 已提交
14
import sys
H
Hsury 已提交
15
import threading
H
Hsury 已提交
16
import time
H
Hsury 已提交
17
import traceback
H
Hsury 已提交
18
import types
W
wizardforcel 已提交
19 20 21
from BiliDriveEx import __version__
from BiliDriveEx.bilibili import Bilibili
from BiliDriveEx.encoder import Encoder
W
wizardforcel 已提交
22
from BiliDriveEx.util import *
H
Hsury 已提交
23

W
wizardforcel 已提交
24
# Module-wide codec instance: the handlers below call encoder.encode() on raw
# bytes before uploading them and encoder.decode() on downloaded payloads.
encoder = Encoder()
# Module-wide Bilibili client shared by every sub-command handler
# (login/cookies, existence checks, image uploads, meta URL formatting).
api = Bilibili()
H
Hsury 已提交
26

W
wizardforcel 已提交
27 28
def fetch_meta(s):
    """Download and decode the metadata document referenced by ``s``.

    Three reference forms are recognised:

    * ``bdex://<40 hex digits>``   - fetched from ``api.default_url(hash)``.
    * ``bdrive://<40 hex digits>`` - same URL with ``'png'`` replaced by
      ``'x-ms-bmp'``.
    * ``http://`` / ``https://``   - fetched as given.

    Args:
        s: The meta reference string.

    Returns:
        The value parsed from the decoded JSON payload (a dict for metadata
        written by ``upload_handle``), or ``None`` when ``s`` is not a
        recognised reference, nothing could be downloaded, or the payload
        cannot be decoded/parsed.
    """
    bdex = re.match(r"^bdex://([a-fA-F0-9]{40})$", s)
    bdrive = re.match(r"^bdrive://([a-fA-F0-9]{40})$", s)
    if bdex:
        full_meta = image_download(api.default_url(bdex.group(1)))
    elif bdrive:
        full_meta = image_download(
            api.default_url(bdrive.group(1)).replace('png', 'x-ms-bmp')
        )
    elif s.startswith(("http://", "https://")):
        full_meta = image_download(s)
    else:
        return None

    # A falsy download result means there is nothing to decode.
    if not full_meta:
        return None
    try:
        return json.loads(encoder.decode(full_meta).decode("utf-8"))
    except Exception:
        # Any decode/parse failure is reported to callers as "no metadata";
        # unlike a bare except this lets KeyboardInterrupt/SystemExit through.
        return None
H
Hsury 已提交
43

H
Hsury 已提交
44

H
Hsury 已提交
45
def login_handle(args):
    """Handle the ``login`` sub-command.

    Logs in with ``args.username`` / ``args.password``; when ``api.login``
    reports success, fetches the user info and logs it, or logs a failure
    message if the info cannot be retrieved. Nothing is logged here when
    ``api.login`` returns a falsy value.

    Args:
        args: Parsed argparse namespace with ``username`` and ``password``.
    """
    if not api.login(username=args.username, password=args.password):
        return
    info = api.get_user_info()
    if info:
        log_info(info)
    else:
        log("用户信息获取失败")
W
wizardforcel 已提交
50

W
wizardforcel 已提交
51 52 53 54 55
def cookies_handle(args):
    """Handle the ``cookies`` sub-command.

    Passes ``args.cookies`` to the API client, then fetches the user info
    and logs it; logs a failure message when no user info comes back.

    Args:
        args: Parsed argparse namespace with a ``cookies`` attribute.
    """
    api.set_cookies(args.cookies)
    user_info = api.get_user_info()
    if not user_info:
        log("用户信息获取失败")
        return
    log_info(user_info)
H
Hsury 已提交
56

H
Hsury 已提交
57
def upload_handle(args):
    """Handle the ``upload`` sub-command: split a file into blocks and upload them.

    The file is read in blocks of ``args.block_size`` MiB. Each block is
    encoded and uploaded by a worker thread, with at most ``args.thread``
    workers in flight. Once every block is stored, a JSON metadata document
    listing the blocks is encoded and uploaded, and the result is written to
    the local history.

    Args:
        args: Parsed argparse namespace with ``file``, ``block_size`` (MiB)
            and ``thread``.

    Returns:
        The URL of the uploaded metadata (or the URL recorded in the history
        when the file's first 4 MiB hash is already known), or ``None`` when
        the file is missing, is a directory, the account is not logged in, or
        the upload was terminated/failed.
    """
    def core(index, block):
        """Upload one block; sets ``terminate_flag`` on unrecoverable failure."""
        def record(url):
            log(f"分块{index + 1}/{block_num}上传完毕")
            block_dict[index] = {
                'url': url,
                'size': len(block),
                'sha1': block_sha1,
            }

        try:
            block_sha1 = calc_sha1(block)
            full_block = encoder.encode(block)
            full_block_sha1 = calc_sha1(full_block)
            # Skip the upload when the server already has this encoded block.
            url = api.exist(full_block_sha1)
            if url:
                record(url)
                return
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                response = api.image_upload(full_block)
                if response:
                    if response['code'] == 0:
                        record(response['data']['image_url'])
                        return
                    elif response['code'] == -4:
                        # This code aborts the whole upload; the message asks
                        # the user to log in again.
                        terminate_flag.set()
                        log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败, 请重新登录")
                        return
                log(f"分块{index + 1}/{block_num}第{attempt + 1}次上传失败")
            # All retries exhausted: abort the whole upload.
            terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always free a slot so the dispatcher loop can never block forever.
            done_flag.release()

    start_time = time.time()
    file_name = args.file
    if not os.path.exists(file_name):
        log(f"文件{file_name}不存在")
        return
    if os.path.isdir(file_name):
        log("暂不支持上传文件夹")
        return
    log(f"上传: {os.path.basename(file_name)} ({size_string(os.path.getsize(file_name))})")

    # The SHA-1 of the first 4 MiB is the key into the local upload history.
    first_4mb_sha1 = calc_sha1(read_in_chunk(file_name, size=4 * 1024 * 1024, cnt=1))
    history = read_history()
    if first_4mb_sha1 in history:
        previous = history[first_4mb_sha1]
        url = previous['url']
        log(f"文件已于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(previous['time']))}上传, 共有{len(previous['block'])}个分块")
        log(f"META URL -> {api.meta_string(url)}")
        return url

    if not api.get_user_info():
        log("账号未登录,请先登录")
        return

    # A thread count below 1 would block on done_flag before any worker
    # exists, so clamp it.
    thread_num = max(1, args.thread)
    log(f"线程数: {thread_num}")
    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    thread_pool = []
    block_dict = {}
    block_bytes = args.block_size * 1024 * 1024
    block_num = math.ceil(os.path.getsize(file_name) / block_bytes)
    for index, block in enumerate(read_in_chunk(file_name, size=block_bytes)):
        # Once the pool is full, wait for one worker to finish per new block.
        if len(thread_pool) >= thread_num:
            done_flag.acquire()
        if terminate_flag.is_set():
            log("已终止上传, 等待线程回收")
            break
        worker = threading.Thread(target=core, args=(index, block))
        thread_pool.append(worker)
        worker.start()
    for thread in thread_pool:
        thread.join()
    if terminate_flag.is_set():
        return

    sha1 = calc_sha1(read_in_chunk(file_name))
    meta_dict = {
        'time': int(time.time()),
        'filename': os.path.basename(file_name),
        'size': os.path.getsize(file_name),
        'sha1': sha1,
        'block': [block_dict[i] for i in range(len(block_dict))],
    }
    meta = json.dumps(meta_dict, ensure_ascii=False).encode("utf-8")
    full_meta = encoder.encode(meta)
    for attempt in range(10):
        response = api.image_upload(full_meta)
        if response and response['code'] == 0:
            url = response['data']['image_url']
            elapsed = time.time() - start_time
            log("元数据上传完毕")
            log(f"{meta_dict['filename']} ({size_string(meta_dict['size'])}) 上传完毕, 用时{elapsed:.1f}秒, 平均速度{size_string(meta_dict['size'] / elapsed)}/s")
            log(f"META URL -> {api.meta_string(url)}")
            write_history(first_4mb_sha1, meta_dict, url)
            return url
        log(f"元数据第{attempt + 1}次上传失败")
    return None
H
Hsury 已提交
162 163

def download_handle(args):
    """Handle the ``download`` sub-command: fetch a file described by a meta URL.

    The metadata is resolved with ``fetch_meta``. If the target file already
    exists and matches the metadata, nothing is downloaded. If it exists but
    differs, the user is asked (unless ``args.force``) whether to overwrite
    it, and only blocks whose SHA-1 does not match are fetched again. Blocks
    are downloaded by worker threads, at most ``args.thread`` at a time, and
    written at their offsets in the output file.

    Args:
        args: Parsed argparse namespace with ``meta``, ``file`` (may be
            empty), ``force`` and ``thread``.

    Returns:
        The path of the downloaded (or already matching) file, or ``None``
        when the metadata cannot be parsed, the user declines to overwrite,
        the download is terminated, or the final SHA-1 check fails.
    """
    def core(index, block_dict):
        """Download, verify and write one block, retrying up to 10 times."""
        try:
            for attempt in range(10):
                if terminate_flag.is_set():
                    return
                block = image_download(block_dict['url'])
                if block:
                    block = encoder.decode(block)
                    if calc_sha1(block) == block_dict['sha1']:
                        # seek+write must be atomic across workers; using the
                        # lock as a context manager releases it even if the
                        # write raises.
                        with file_lock:
                            f.seek(block_offsets[index])
                            f.write(block)
                        log(f"分块{index + 1}/{len(meta_dict['block'])}下载完毕")
                        return
                    else:
                        log(f"分块{index + 1}/{len(meta_dict['block'])}校验未通过")
                else:
                    log(f"分块{index + 1}/{len(meta_dict['block'])}第{attempt + 1}次下载失败")
            # All retries exhausted: abort the whole download.
            terminate_flag.set()
        except Exception:
            terminate_flag.set()
            traceback.print_exc()
        finally:
            # Always free a slot so the dispatcher loop can never block forever.
            done_flag.release()

    def is_overwritable(file_name):
        """Return True if the existing file may be overwritten."""
        return args.force or input("文件已存在, 是否覆盖? [y/N] ") in ["y", "Y"]

    start_time = time.time()
    meta_dict = fetch_meta(args.meta)
    if not meta_dict:
        log("元数据解析失败")
        return
    # The filename inside the metadata comes from the network; keep only its
    # final component so it cannot point outside the current directory.
    file_name = args.file if args.file else os.path.basename(meta_dict['filename'])
    log(f"下载: {os.path.basename(file_name)} ({size_string(meta_dict['size'])}), 共有{len(meta_dict['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta_dict['time']))}")

    # Byte offset of every block, computed once instead of re-summing the
    # preceding sizes on each lookup.
    block_offsets = []
    total_size = 0
    for entry in meta_dict['block']:
        block_offsets.append(total_size)
        total_size += entry['size']

    # A thread count below 1 would block on done_flag before any worker
    # exists, so clamp it.
    thread_num = max(1, args.thread)
    log(f"线程数: {thread_num}")

    download_block_list = []
    if os.path.exists(file_name):
        if os.path.getsize(file_name) == meta_dict['size'] and calc_sha1(read_in_chunk(file_name)) == meta_dict['sha1']:
            log("文件已存在, 且与服务器端内容一致")
            return file_name
        elif is_overwritable(file_name):
            # Re-download only the blocks whose on-disk content does not match.
            with open(file_name, "rb") as existing:
                for index, block_dict in enumerate(meta_dict['block']):
                    existing.seek(block_offsets[index])
                    if calc_sha1(existing.read(block_dict['size'])) != block_dict['sha1']:
                        download_block_list.append(index)
            log(f"{len(download_block_list)}/{len(meta_dict['block'])}个分块待下载")
        else:
            return
    else:
        download_block_list = list(range(len(meta_dict['block'])))

    done_flag = threading.Semaphore(0)
    terminate_flag = threading.Event()
    file_lock = threading.Lock()
    thread_pool = []
    with open(file_name, "r+b" if os.path.exists(file_name) else "wb") as f:
        for index in download_block_list:
            # Once the pool is full, wait for one worker to finish per new block.
            if len(thread_pool) >= thread_num:
                done_flag.acquire()
            if terminate_flag.is_set():
                log("已终止下载, 等待线程回收")
                break
            worker = threading.Thread(target=core, args=(index, meta_dict['block'][index]))
            thread_pool.append(worker)
            worker.start()
        for thread in thread_pool:
            thread.join()
        if terminate_flag.is_set():
            return
        # Drop any trailing bytes left over from a longer pre-existing file.
        f.truncate(total_size)

    elapsed = time.time() - start_time
    log(f"{os.path.basename(file_name)} ({size_string(meta_dict['size'])}) 下载完毕, 用时{elapsed:.1f}秒, 平均速度{size_string(meta_dict['size'] / elapsed)}/s")
    sha1 = calc_sha1(read_in_chunk(file_name))
    if sha1 == meta_dict['sha1']:
        log("文件校验通过")
        return file_name
    log("文件校验未通过")
    return None
H
Hsury 已提交
257

H
Hsury 已提交
258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276
def info_handle(args):
    """Handle the ``info`` sub-command: print the contents of a metadata document.

    Resolves ``args.meta`` with ``fetch_meta`` and prints the file name,
    size, SHA-1, upload time, block count and each block's size and URL.
    Prints a failure message instead when no metadata is returned.

    Args:
        args: Parsed argparse namespace with a ``meta`` attribute.
    """
    meta = fetch_meta(args.meta)
    if not meta:
        print("元数据解析失败")
        return
    print(f"文件名: {meta['filename']}")
    print(f"大小: {size_string(meta['size'])}")
    print(f"SHA-1: {meta['sha1']}")
    print(f"上传时间: {time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta['time']))}")
    print(f"分块数: {len(meta['block'])}")
    for number, entry in enumerate(meta['block'], start=1):
        print(f"分块{number} ({size_string(entry['size'])}) URL: {entry['url']}")

def history_handle(args):
    """Handle the ``history`` sub-command: list previously uploaded files.

    Prints one numbered entry per record returned by ``read_history`` (file
    name, size, block count, upload time) followed by its meta URL, or a
    notice when the history is empty.

    Args:
        args: Parsed argparse namespace (unused).
    """
    history = read_history()
    if not history:
        print("暂无历史记录")
        return
    for index, meta_dict in enumerate(history.values()):
        prefix = f"[{index + 1}]"
        print(f"{prefix} {meta_dict['filename']} ({size_string(meta_dict['size'])}), 共有{len(meta_dict['block'])}个分块, 上传于{time.strftime('%Y-%m-%d %H:%M:%S', time.localtime(meta_dict['time']))}")
        # Indent the second line so it lines up under the entry text.
        print(f"{' ' * len(prefix)} META URL -> {api.meta_string(meta_dict['url'])}")

def main():
    """Command-line entry point.

    Builds the argparse parser with the ``login``, ``cookies``, ``upload``,
    ``download``, ``info`` and ``history`` sub-commands. When a sub-command
    is given on the command line it is run once. Otherwise the help text is
    printed and an interactive ``BiliDriveEx >`` shell is started, which
    additionally understands ``help``, ``version`` and ``exit``.
    """
    # On Ctrl-C, send signal 9 to this process instead of raising
    # KeyboardInterrupt in the main thread.
    signal.signal(signal.SIGINT, lambda signum, frame: os.kill(os.getpid(), 9))
    parser = argparse.ArgumentParser(prog="BiliDriveEx", description="Make Bilibili A Great Cloud Storage!", formatter_class=argparse.RawDescriptionHelpFormatter)
    parser.add_argument("-v", "--version", action="version", version=f"BiliDriveEx version: {__version__}")
    subparsers = parser.add_subparsers()

    login_parser = subparsers.add_parser("login", help="log in to bilibili")
    login_parser.add_argument("username", help="your bilibili username")
    login_parser.add_argument("password", help="your bilibili password")
    login_parser.set_defaults(func=login_handle)

    cookies_parser = subparsers.add_parser("cookies", help="set cookies to bilibili")
    cookies_parser.add_argument("cookies", help="your bilibili cookies")
    cookies_parser.set_defaults(func=cookies_handle)

    upload_parser = subparsers.add_parser("upload", help="upload a file")
    upload_parser.add_argument("file", help="name of the file to upload")
    upload_parser.add_argument("-b", "--block-size", default=4, type=int, help="block size in MB")
    upload_parser.add_argument("-t", "--thread", default=4, type=int, help="upload thread number")
    upload_parser.set_defaults(func=upload_handle)

    download_parser = subparsers.add_parser("download", help="download a file")
    download_parser.add_argument("meta", help="meta url")
    download_parser.add_argument("file", nargs="?", default="", help="new file name")
    download_parser.add_argument("-f", "--force", action="store_true", help="force to overwrite if file exists")
    download_parser.add_argument("-t", "--thread", default=8, type=int, help="download thread number")
    download_parser.set_defaults(func=download_handle)

    info_parser = subparsers.add_parser("info", help="show meta info")
    info_parser.add_argument("meta", help="meta url")
    info_parser.set_defaults(func=info_handle)
    history_parser = subparsers.add_parser("history", help="show upload history")
    history_parser.set_defaults(func=history_handle)

    args = parser.parse_args()
    # Check for a sub-command explicitly rather than catching AttributeError
    # around the handler call, which would also hide AttributeErrors raised
    # inside the handler itself.
    if hasattr(args, "func"):
        args.func(args)
        return

    # No sub-command: switch to the interactive shell with its extra commands.
    subparsers.add_parser("help", help="show this help message").set_defaults(func=lambda _: parser.print_help())
    # The version action prints the version and raises SystemExit, which the
    # shell loop below absorbs.
    subparsers.add_parser("version", help="show program's version number").set_defaults(func=lambda _: parser.parse_args(["--version"]))
    subparsers.add_parser("exit", help="exit program").set_defaults(func=lambda _: os._exit(0))
    parser.print_help()

    while True:
        try:
            line = input("BiliDriveEx > ")
        except EOFError:
            # End of input (e.g. Ctrl-D or a closed pipe) leaves the shell.
            break
        try:
            shell_args = parser.parse_args(shlex.split(line))
        except ValueError as ex:
            # shlex.split rejects malformed input such as unbalanced quotes.
            print(ex)
            continue
        except SystemExit:
            # argparse exits on usage errors and on --help/--version; keep
            # the shell alive.
            continue
        func = getattr(shell_args, "func", None)
        if func is None:
            # Empty line or options without a sub-command.
            continue
        try:
            func(shell_args)
        except SystemExit:
            pass
        except Exception:
            # Report the failure instead of silently swallowing it, then
            # return to the prompt.
            traceback.print_exc()

# Run the command-line interface only when this file is executed as a script,
# not when it is imported.
if __name__ == "__main__":
    main()