一. 参考程式

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
from tkinter import *
from retrying import retry
import urllib3,time,sys,re,requests

headers = {
"Cookie": r'',
"User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36"
}

request_header = {
'Host': 'pan.baidu.com',
'Connection': 'keep-alive',
'Upgrade-Insecure-Requests': '1',
'Sec-Fetch-Dest': 'document',
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.9',
'Sec-Fetch-Site': 'same-site',
'Sec-Fetch-Mode': 'navigate',
'Referer': 'https://pan.baidu.com',
'Accept-Encoding': 'gzip, deflate, br',
'Accept-Language': 'zh-CN,zh;q=0.9,en;q=0.8,en-US;q=0.7,en-GB;q=0.6,ru;q=0.5',
}

urllib3.disable_warnings()
s = requests.session()
s.trust_env = False

@retry(stop_max_attempt_number=5, wait_fixed=1000)
def get_bdstoken():
url = 'https://pan.baidu.com/api/gettemplatevariable?clienttype=0&app_id=250528&web=1&fields=[%22bdstoken%22,%22token%22,%22uk%22,%22isdocuser%22,%22servertime%22]'
response = s.get(url=url, headers=request_header, timeout=20, allow_redirects=True, verify=False)
return response.json()['errno'] if response.json()['errno'] != 0 else response.json()['result']['bdstoken']

@retry(stop_max_attempt_number=5, wait_fixed=1000)
def get_dir_list(bdstoken):
url = 'https://pan.baidu.com/api/list?order=time&desc=1&showempty=0&web=1&page=1&num=1000&dir=%2Fupload&bdstoken=' + bdstoken
response = s.get(url=url, headers=request_header, timeout=15, allow_redirects=False, verify=False)
return response.json()['errno'] if response.json()['errno'] != 0 else response.json()['list']

@retry(stop_max_attempt_number=5, wait_fixed=1000)
def create_dir(dir_name, bdstoken):
url = 'https://pan.baidu.com/api/create?a=commit&bdstoken=' + bdstoken
post_data = {'path': "/"+dir_name, 'isdir': '1', 'block_list': '[]', }
response = s.post(url=url, headers=request_header, data=post_data, timeout=15, allow_redirects=False, verify=False)
return response.json()['errno']

@retry(stop_max_attempt_number=6, wait_fixed=2000)
def check_links(link_url, pass_code, bdstoken):
if pass_code:
t_str = str(int(round(time.time() * 1000)))
check_url = 'https://pan.baidu.com/share/verify?surl=' + link_url[25:48] + '&bdstoken=' + bdstoken + '&t=' + t_str + '&channel=chunlei&web=1&clienttype=0'
post_data = {'pwd': pass_code, 'vcode': '', 'vcode_str': '', }
response_post = s.post(url=check_url, headers=request_header, data=post_data, timeout=10, allow_redirects=False, verify=False)
if response_post.json()['errno'] == 0:
bdclnd = response_post.json()['randsk']
else:
return response_post.json()['errno']
if bool(re.search('BDCLND=', request_header['Cookie'], re.IGNORECASE)):
request_header['Cookie'] = re.sub(r'BDCLND=(\S+);?', r'BDCLND=' + bdclnd + ';', request_header['Cookie'])
else:
request_header['Cookie'] += ';BDCLND=' + bdclnd
response = s.get(url=link_url, headers=request_header, timeout=15, allow_redirects=True, verify=False).content.decode("utf-8")
shareid_list = re.findall('"shareid":(\\d+?),"', response)
user_id_list = re.findall('"share_uk":"(\\d+?)","', response)
fs_id_list = re.findall('"fs_id":(\\d+?),"', response)
info_title_list = re.findall('<title>(.+)</title>', response)
if not shareid_list:
return 1
elif not user_id_list:
return 2
elif not fs_id_list:
return info_title_list[0] if info_title_list else 3
else:
return [shareid_list[0], user_id_list[0], fs_id_list, info_title_list[0].replace("_免费高速下载|百度网盘-分享无限制","")]

@retry(stop_max_attempt_number=20, wait_fixed=2000)
def transfer_files(check_links_reason, dir_name, bdstoken):
url = 'https://pan.baidu.com/share/transfer?shareid=' + check_links_reason[0] + '&from=' + check_links_reason[1] + '&bdstoken=' + bdstoken + '&channel=chunlei&web=1&clienttype=0'
fs_id = ','.join(i for i in check_links_reason[2])
post_data = {'fsidlist': '[' + fs_id + ']', 'path': '/' + dir_name, }
response = s.post(url=url, headers=request_header, data=post_data, timeout=15, allow_redirects=False, verify=False)
return response.json()['errno']

def savebp(dir_name,url):
cookie = headers['Cookie']
user_agent = headers['User-Agent']
request_header['Cookie'] = cookie
request_header['User-Agent'] = user_agent
try:
if any([ord(word) not in range(256) for word in cookie]) or cookie.find('BAIDUID=') == -1:
sys.exit()
bdstoken = get_bdstoken()
if isinstance(bdstoken, int):
sys.exit()
dir_list_json = get_dir_list(bdstoken)
if type(dir_list_json) != list:
sys.exit()
dir_list = [dir_json['server_filename'] for dir_json in dir_list_json]
if dir_name and dir_name not in dir_list:
create_dir_reason = create_dir(dir_name, bdstoken)
if create_dir_reason != 0:
sys.exit()
url_code = url.replace("?pwd=", " ")
link_url_org, pass_code_org = re.sub(r'提取码*[::](.*)', r'\1', url_code.lstrip()).split(' ', maxsplit=1)
[link_url, pass_code] = [link_url_org.strip()[:47], pass_code_org.strip()[:4]]
check_links_reason = check_links(link_url, pass_code, bdstoken)
if isinstance(check_links_reason, list):
transfer_files_reason = transfer_files(check_links_reason, dir_name, bdstoken)
if transfer_files_reason == 0:
filepath = "/"+dir_name+"/"+check_links_reason[3]
print(f'转存成功:{filepath} {url_code}')
return filepath
except Exception as e:
print(e)
return None

# 单链接转存
url = "https://pan.baidu.com/s/*******************?pwd=****"
savebp("test",url)

# 批量链接转存
urls = [
"https://pan.baidu.com/s/*******************?pwd=****",
"https://pan.baidu.com/s/*******************?pwd=****",
"https://pan.baidu.com/s/*******************?pwd=****"
]
for url in urls:
savebp("test",url)

二. 使用方法

  1. 首先需要使用浏览器登陆百度网盘,打开浏览器开发者模式,并打开网络选项

    pptrOpR.md.png

  2. 重新刷新网页后找到pan.baidu.com的请求,并复制Cookie

    pptsCAe.md.png

  3. 将拿到的Cookie填入headers中,并将需要转存的链接添加到 url 或 urls 中,注意链接格式

    1
    2
    3
    4
    5
    6
    7
    8
    9
    10
    11
    12
    13
    14
    15
    16
    17
    18
    19
    # cookie
    headers = {
    "Cookie": r'Your Cookie',
    "User-Agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/96.0.4664.110 Safari/537.36"
    }

    # 单链接转存
    url = "https://pan.baidu.com/s/*******************?pwd=****"
    savebp("test",url)

    # 批量链接转存
    urls = [
    "https://pan.baidu.com/s/*******************?pwd=****",
    "https://pan.baidu.com/s/*******************?pwd=****",
    "https://pan.baidu.com/s/*******************?pwd=****"
    ]
    for url in urls:
    # 参数:转存目录,分享链接
    savebp("test",url)

注:链接格式确保一致

三. 注意事项

需要将以下程序保存为retrying.py,并放在同目录

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
import random
import six
import sys
import time
import traceback

# sys.maxint / 2, since Python 3.2 doesn't have a sys.maxint...
MAX_WAIT = 1073741823

def retry(*dargs, **dkw):
"""
Decorator function that instantiates the Retrying object
@param *dargs: positional arguments passed to Retrying object
@param **dkw: keyword arguments passed to the Retrying object
"""
# support both @retry and @retry() as valid syntax
if len(dargs) == 1 and callable(dargs[0]):
def wrap_simple(f):
@six.wraps(f)
def wrapped_f(*args, **kw):
return Retrying().call(f, *args, **kw)
return wrapped_f
return wrap_simple(dargs[0])
else:
def wrap(f):
@six.wraps(f)
def wrapped_f(*args, **kw):
return Retrying(*dargs, **dkw).call(f, *args, **kw)
return wrapped_f
return wrap

class Retrying(object):
def __init__(self,
stop=None, wait=None,
stop_max_attempt_number=None,
stop_max_delay=None,
wait_fixed=None,
wait_random_min=None, wait_random_max=None,
wait_incrementing_start=None, wait_incrementing_increment=None,
wait_exponential_multiplier=None, wait_exponential_max=None,
retry_on_exception=None,
retry_on_result=None,
wrap_exception=False,
stop_func=None,
wait_func=None,
wait_jitter_max=None):
self._stop_max_attempt_number = 5 if stop_max_attempt_number is None else stop_max_attempt_number
self._stop_max_delay = 100 if stop_max_delay is None else stop_max_delay
self._wait_fixed = 1000 if wait_fixed is None else wait_fixed
self._wait_random_min = 0 if wait_random_min is None else wait_random_min
self._wait_random_max = 1000 if wait_random_max is None else wait_random_max
self._wait_incrementing_start = 0 if wait_incrementing_start is None else wait_incrementing_start
self._wait_incrementing_increment = 100 if wait_incrementing_increment is None else wait_incrementing_increment
self._wait_exponential_multiplier = 1 if wait_exponential_multiplier is None else wait_exponential_multiplier
self._wait_exponential_max = MAX_WAIT if wait_exponential_max is None else wait_exponential_max
self._wait_jitter_max = 0 if wait_jitter_max is None else wait_jitter_max
# TODO add chaining of stop behaviors
# stop behavior
stop_funcs = []
if stop_max_attempt_number is not None:
stop_funcs.append(self.stop_after_attempt)
if stop_max_delay is not None:
stop_funcs.append(self.stop_after_delay)
if stop_func is not None:
self.stop = stop_func
elif stop is None:
self.stop = lambda attempts, delay: any(f(attempts, delay) for f in stop_funcs)
else:
self.stop = getattr(self, stop)
# TODO add chaining of wait behaviors
# wait behavior
wait_funcs = [lambda *args, **kwargs: 0]
if wait_fixed is not None:
wait_funcs.append(self.fixed_sleep)
if wait_random_min is not None or wait_random_max is not None:
wait_funcs.append(self.random_sleep)
if wait_incrementing_start is not None or wait_incrementing_increment is not None:
wait_funcs.append(self.incrementing_sleep)
if wait_exponential_multiplier is not None or wait_exponential_max is not None:
wait_funcs.append(self.exponential_sleep)
if wait_func is not None:
self.wait = wait_func
elif wait is None:
self.wait = lambda attempts, delay: max(f(attempts, delay) for f in wait_funcs)
else:
self.wait = getattr(self, wait)
# retry on exception filter
if retry_on_exception is None:
self._retry_on_exception = self.always_reject
else:
self._retry_on_exception = retry_on_exception
# TODO simplify retrying by Exception types
# retry on result filter
if retry_on_result is None:
self._retry_on_result = self.never_reject
else:
self._retry_on_result = retry_on_result
self._wrap_exception = wrap_exception
def stop_after_attempt(self, previous_attempt_number, delay_since_first_attempt_ms):
"""Stop after the previous attempt >= stop_max_attempt_number."""
return previous_attempt_number >= self._stop_max_attempt_number
def stop_after_delay(self, previous_attempt_number, delay_since_first_attempt_ms):
"""Stop after the time from the first attempt >= stop_max_delay."""
return delay_since_first_attempt_ms >= self._stop_max_delay
def no_sleep(self, previous_attempt_number, delay_since_first_attempt_ms):
"""Don't sleep at all before retrying."""
return 0
def fixed_sleep(self, previous_attempt_number, delay_since_first_attempt_ms):
"""Sleep a fixed amount of time between each retry."""
return self._wait_fixed
def random_sleep(self, previous_attempt_number, delay_since_first_attempt_ms):
"""Sleep a random amount of time between wait_random_min and wait_random_max"""
return random.randint(self._wait_random_min, self._wait_random_max)
def incrementing_sleep(self, previous_attempt_number, delay_since_first_attempt_ms):
"""
Sleep an incremental amount of time after each attempt, starting at
wait_incrementing_start and incrementing by wait_incrementing_increment
"""
result = self._wait_incrementing_start + (self._wait_incrementing_increment * (previous_attempt_number - 1))
if result < 0:
result = 0
return result
def exponential_sleep(self, previous_attempt_number, delay_since_first_attempt_ms):
exp = 2 ** previous_attempt_number
result = self._wait_exponential_multiplier * exp
if result > self._wait_exponential_max:
result = self._wait_exponential_max
if result < 0:
result = 0
return result
def never_reject(self, result):
return False
def always_reject(self, result):
return True
def should_reject(self, attempt):
reject = False
if attempt.has_exception:
reject |= self._retry_on_exception(attempt.value[1])
else:
reject |= self._retry_on_result(attempt.value)
return reject
def call(self, fn, *args, **kwargs):
start_time = int(round(time.time() * 1000))
attempt_number = 1
while True:
try:
attempt = Attempt(fn(*args, **kwargs), attempt_number, False)
except:
tb = sys.exc_info()
attempt = Attempt(tb, attempt_number, True)
if not self.should_reject(attempt):
return attempt.get(self._wrap_exception)
delay_since_first_attempt_ms = int(round(time.time() * 1000)) - start_time
if self.stop(attempt_number, delay_since_first_attempt_ms):
if not self._wrap_exception and attempt.has_exception:
# get() on an attempt with an exception should cause it to be raised, but raise just in case
raise attempt.get()
else:
raise RetryError(attempt)
else:
sleep = self.wait(attempt_number, delay_since_first_attempt_ms)
if self._wait_jitter_max:
jitter = random.random() * self._wait_jitter_max
sleep = sleep + max(0, jitter)
time.sleep(sleep / 1000.0)
attempt_number += 1

class Attempt(object):
"""
An Attempt encapsulates a call to a target function that may end as a
normal return value from the function or an Exception depending on what
occurred during the execution.
"""
def __init__(self, value, attempt_number, has_exception):
self.value = value
self.attempt_number = attempt_number
self.has_exception = has_exception
def get(self, wrap_exception=False):
"""
Return the return value of this Attempt instance or raise an Exception.
If wrap_exception is true, this Attempt is wrapped inside of a
RetryError before being raised.
"""
if self.has_exception:
if wrap_exception:
raise RetryError(self)
else:
six.reraise(self.value[0], self.value[1], self.value[2])
else:
return self.value
def __repr__(self):
if self.has_exception:
return "Attempts: {0}, Error:\n{1}".format(self.attempt_number, "".join(traceback.format_tb(self.value[2])))
else:
return "Attempts: {0}, Value: {1}".format(self.attempt_number, self.value)
class RetryError(Exception):
"""
A RetryError encapsulates the last Attempt instance right before giving up.
"""
def __init__(self, last_attempt):
self.last_attempt = last_attempt
def __str__(self):
return "RetryError[{0}]".format(self.last_attempt)