def ExtractID(url):  # Extract the torrent id from a URL's query string
    """Return the value of the ``id`` query parameter of *url*.

    Args:
        url: An absolute or relative URL such as ``details.php?id=123&hit=1``.

    Returns:
        The first ``id`` value as a string, or ``None`` when the query string
        has no ``id`` parameter. ``parse_qs`` drops blank values by default,
        so ``?id=`` also yields ``None``.
    """
    # Explicit, function-scoped import: the block does not rely on a
    # module-level wildcard import of urllib.parse being present.
    from urllib.parse import parse_qs, urlparse

    # parse_qs maps every key to a non-empty list of values; a missing key is
    # the only expected failure, so use .get() instead of a bare except.
    id_values = parse_qs(urlparse(url).query).get("id")
    return id_values[0] if id_values else None