-
Notifications
You must be signed in to change notification settings - Fork 2
/
Copy pathserver_multi.py
260 lines (206 loc) · 7.87 KB
/
server_multi.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
# -*- coding: utf-8 -*-
import threading
import requests
import json
import config
from time import sleep
import parser_torrent
from parser_origin import byr, tjupt, npupt
import shutil
import re
import sys
from urllib.parse import unquote
import os
class Task(threading.Thread):
    """Thread subclass that runs ``main`` for a single detail-page URL."""

    def __init__(self, origin_url):
        """Store the URL that ``run`` will later pass to ``main``."""
        super().__init__()
        self.origin_url = origin_url

    def run(self):
        """Thread body: process the stored URL."""
        main(self.origin_url)
def load_pt_sites():
    """Load the PT site table from ``pt_sites.json`` in the working directory.

    Returns:
        The object decoded from the JSON file. Callers in this file index it
        as a dict keyed by site name.

    Raises:
        SystemExit: if the file cannot be opened or is not valid JSON. The
            failure reason is printed first.
    """
    try:
        with open('pt_sites.json', 'r') as pt_file:
            return json.load(pt_file)
    except (OSError, ValueError) as exc:
        # ValueError covers json.JSONDecodeError and UnicodeDecodeError.
        # NOTE: there must be no ``return`` in a ``finally`` clause here; it
        # would discard the SystemExit below and hand callers an empty dict.
        print("Pt_sites.Json load failed: %s" % exc)
        sys.exit(0)
def find_origin_site(url):
    """Return the site entry whose ``domain`` occurs in ``url``.

    Spaces are stripped from ``url`` before matching. The first matching
    entry (in the iteration order of the loaded site table) wins and its
    ``abbr`` is printed. If nothing matches, a message is printed and the
    process exits via ``sys.exit(0)``.
    """
    sites = load_pt_sites()
    compact_url = url.replace(' ', '')
    matched_key = ''
    for key, info in sites.items():
        if info['domain'] in compact_url:
            print("该种子来自于%s!" % info['abbr'])
            matched_key = key
            break
    if not matched_key:
        print('不支持的网站')
        sys.exit(0)
    return sites[matched_key]
def get_id(url):
    """Extract the torrent id from a URL containing ``id=<digits>``.

    Args:
        url: URL (or any string) expected to contain ``id=`` followed by
            one or more decimal digits.

    Returns:
        The id as a string of digits, or the integer ``0`` when the URL has
        no such parameter. A failure message is printed in that case, and
        callers compare the result against ``0`` to detect it.
    """
    # Accept ids of any length: a fixed six-digit pattern would truncate
    # longer ids and fail to match shorter ones.
    match = re.search(r'id=(\d+)', url)
    if match is None:
        print('获取种子id失败!')
        return 0
    return match.group(1)
def get_response(url, cookie):
    """GET ``url`` with a browser User-Agent and the given cookies.

    Kept separate from HTML fetching because the response may be either a
    web page or a torrent file.

    Args:
        url: Address to request.
        cookie: Cookies forwarded to ``session.get`` as ``cookies=``.

    Returns:
        The ``requests`` response object. The request is not streamed, so
        the body has been read by the time the session is closed.
    """
    headers = {
        'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/71.0.3578.98 Safari/537.36'
    }
    # Use the session as a context manager so its connection pool is
    # released even if the request raises.
    with requests.session() as session:
        session.headers = headers
        return session.get(url, cookies=cookie)
def get_html(url, cookie):
    """Fetch ``url`` via ``get_response`` and return the response text.

    Any exception during the fetch is reported on stdout and the process
    exits via ``sys.exit(0)``.
    """
    try:
        page_source = get_response(url, cookie).text
        print('获取原始网页解析!')
        return page_source
    except Exception as exc:
        print('原始网页获取失败: %s' % exc)
        sys.exit(0)
def parser_choose(abbr, html, torrent_path):
    """Dispatch to the HTML parser that matches the origin site.

    Args:
        abbr: Site abbreviation; ``'byr'``, ``'tjupt'`` and ``'npupt'`` are
            supported.
        html: Detail-page HTML passed through to the parser.
        torrent_path: Torrent file path passed through to the parser.

    Returns:
        Whatever the selected module's ``parser_html`` returns.

    Raises:
        ValueError: if ``abbr`` is not one of the supported sites. Without
            this check the function would fail with an UnboundLocalError.
    """
    if abbr == 'byr':
        return byr.parser_html(html, torrent_path)
    if abbr == 'tjupt':
        return tjupt.parser_html(html, torrent_path)
    if abbr == 'npupt':
        return npupt.parser_html(html, torrent_path)
    raise ValueError('no HTML parser available for site %r' % (abbr,))
def download_torrent(host, tid, cookie, abbr):
    """Download a torrent by id and store it under two names.

    The torrent is fetched from ``{host}/download.php?id={tid}``. It is
    written to ``config.backup_path`` under a sanitised name and then copied
    to ``config.save_path`` under the name the server reported.

    Args:
        host: Base URL of the site (scheme included).
        tid: Torrent id, as a string.
        cookie: Cookies for the site, forwarded to ``get_response``.
        abbr: Site abbreviation, used to build a fallback name.

    Returns:
        The sanitised file name (without the ``.torrent`` extension).

    Raises:
        SystemExit: if the file name cannot be determined from the response
            headers, or if the download or save fails.
    """
    download_url = "{host}/download.php?id={tid}".format(host=host, tid=tid)
    response = get_response(download_url, cookie)
    # Take the torrent name from the Content-Disposition header. A response
    # without that header (for example an error page) is reported the same
    # way as an unparsable one instead of escaping as a bare KeyError.
    try:
        content = response.headers['Content-Disposition'].replace('"', '')
        if host == 'https://npupt.com':
            # npupt sends the name percent-encoded.
            content = unquote(content, 'utf-8')
        # The dot before "torrent" is escaped so only a literal ".torrent"
        # suffix terminates the name.
        origin_filename = re.search(
            r'filename=(.*?)\.torrent', content).group(1)
    except (KeyError, AttributeError) as exc:
        print('获取下载种子的文件名失败: %s' % exc)
        sys.exit(0)
    file_path = config.save_path + '\\%s.torrent' % origin_filename
    # Name handed to the publishing site: strip a leading [tag], video
    # suffixes, brackets, Chinese and other unsupported characters. If
    # nothing is left (e.g. an all-Chinese name), fall back to
    # "<site abbr> <id>".
    filename = ' '.join(
        re.sub(
            r'^\[.{3,10}?\]|.mp4$|.mkv$|\[|\]|[^-(a-zA-Z0-9)]|[\u4e00-\u9fff]',
            ' ',
            origin_filename).split('.')).lstrip()
    if filename == '':
        filename = abbr+' '+tid
    back_file_path = config.backup_path + '\\%s.torrent' % filename
    try:
        response.raise_for_status()
        # ``with`` closes the file even if a write fails part-way.
        with open(back_file_path, 'wb') as torrent_file:
            for chunk in response.iter_content(100000):
                torrent_file.write(chunk)
        shutil.copyfile(back_file_path, file_path)
        print('种子下载保存成功!')
    except Exception as exc:
        print('种子下载失败: %s' % exc)
        sys.exit(0)
    return filename
def upload_torrent(raw_info, params=None, data=None, files=None):
    """Publish a backed-up torrent to the ``hudbt`` site, then re-download it.

    The upload form is built from ``raw_info`` and posted to
    ``{domain}/takeupload.php`` of the ``hudbt`` entry in the site table.
    The new torrent's id is read from the final response URL, and that
    torrent is downloaded again via ``download_torrent``.

    Args:
        raw_info: Mapping with the keys ``filename``, ``small_descr``,
            ``descr``, ``type_`` and ``standard_sel``.
        params: Optional query parameters forwarded to ``requests.post``.
        data: Ignored; always rebuilt from ``raw_info``.
        files: Ignored; always rebuilt from the backed-up torrent file.

    Raises:
        SystemExit: if the torrent file cannot be opened, the POST fails, or
            ``get_id`` reports failure (returns 0) for the response URL.
    """
    pt_sites = load_pt_sites()
    hudbt = pt_sites['hudbt']
    des_url = "{host}/takeupload.php".format(host=hudbt['domain'])
    des_cookie = hudbt['cookie']
    abs_file_path = config.backup_path + \
        '\\%s' % raw_info['filename'] + '.torrent'
    try:
        torrent_file = open(abs_file_path, "rb")
    except OSError as exc:
        print('待上传文件寻找失败: %s' % exc)
        sys.exit(0)

    # Keep the handle open only for the duration of the upload, so it is
    # closed on every path, including the sys.exit below.
    with torrent_file:
        files = [("file", (raw_info['filename'], torrent_file, "application/x-bittorrent")),
                 ("nfo", ("", "", "application/octet-stream"))]
        data = {
            "dl-url": "",
            "name": raw_info['filename'],
            "small_descr": raw_info["small_descr"],
            "url": "",
            "descr": raw_info["descr"],
            "type": str(raw_info["type_"]),
            "data[Tcategory][Tcategory][]": "",
            "standard_sel": str(raw_info["standard_sel"]),
            "uplver": 'yes',
        }
        print('开始准备发布蝴蝶种子!')
        try:
            # The response's final URL carries the id of the new torrent.
            des_post = requests.post(
                url=des_url, params=params, data=data, files=files,
                cookies=des_cookie)
        except Exception as exc:
            print('发布种子失败: %s' % exc)
            sys.exit(0)

    print('获取上传种子下载链接……')
    seed_torrent_download_id = get_id(des_post.url)
    short_name = hudbt['abbr']
    if seed_torrent_download_id == 0:
        sys.exit(0)
    # Re-download the published torrent into the configured directories so
    # it can be seeded. Whether seeding then completes is not checked here.
    print('准备下载蝴蝶种子! id = %s' % seed_torrent_download_id)
    download_torrent(hudbt['domain'], seed_torrent_download_id,
                     des_cookie, short_name)
def check(direction):
    """Return True if ``direction`` is the path of an existing regular file.

    ``main`` polls this with the path of the marker file that signals a
    finished download.
    """
    return os.path.isfile(direction)
def main(origin_url):
    """Run the whole flow for one torrent detail-page URL.

    Steps: identify the origin site, download its torrent, parse the
    torrent, wait for a marker file to appear under ``config.check_path``,
    parse the detail page and upload the result.

    NOTE: the wait loop has no timeout. If the marker file never appears,
    this function never returns.
    """
    # Resolve the origin site's settings from the detail-page link.
    site = find_origin_site(origin_url)
    if not site:
        sys.exit(0)
    site_cookie = site['cookie']
    site_host = site['domain']
    torrent_id = get_id(origin_url)
    site_abbr = site['abbr']

    print('下载原始网站种子……')
    # download_torrent returns the sanitised torrent name, not a path.
    filename = download_torrent(site_host, torrent_id, site_cookie, site_abbr)

    print('正在解析种子……')
    try:
        # Only the first value from the torrent parser is used below; it
        # names the marker file.
        torrent_path = config.backup_path + '\\%s.torrent' % filename
        file_dir, _ = parser_torrent.get_info_from_torrent(torrent_path)
    except Exception as exc:
        print('种子解析失败: %s' % exc)
        sys.exit(0)
    print('种子解析成功!')

    # Marker file: "<check_path>\<file_dir>.txt". Poll every 10 seconds
    # until it exists.
    direction = config.check_path + '\\' + file_dir + '.txt'
    print('开始监听下载状态!')
    while not check(direction):
        sleep(10)

    # Marker file found: parse the origin page and publish.
    html = get_html(origin_url, site_cookie)
    raw_info = parser_choose(site['abbr'], html, torrent_path)
    print('网页解析成功!')
    raw_info['filename'] = filename
    upload_torrent(raw_info)
if __name__ == '__main__':
    # Script entry point: read one detail-page link from stdin and process it.
    main(input('请输入种子详情界面对应链接:'))