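# 删种小助手 (torrent-pruning helper): deletes tjupt.org torrents whose last-activity date matches a target month.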
import requests
from urllib.parse import urljoin
from lxml import etree
import time
import re
# Header values sent with every request below: a browser cookie string and a
# desktop Chrome user agent.
# NOTE(review): the cookie looks like an authenticated session credential
# (c_secure_uid / c_secure_pass) hard-coded in source — consider loading it
# from the environment or a local config file and rotating this value.
session_cookie = '_ga=GA1.2.286413587.1547475887; c_secure_ssl=eWVhaA%3D%3D; __cfduid=dddfa4fdd9060f1d5a337e3d5c87994231571281870; c_secure_uid=NTAxMDU%3D; c_secure_pass=97fc05ad9da6b047fd227bcd6bd68262; c_secure_tracker_ssl=eWVhaA%3D%3D; c_secure_login=bm9wZQ%3D%3D; _gid=GA1.2.37242126.1580051094'
browser_agent = 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/80.0.3987.132 Safari/537.36'
headers = {
    "cookie": session_cookie,
    "user-agent": browser_agent,
}

# One shared session so all requests reuse the same connection pool.
s = requests.Session()
# Build the list of category listing pages to scan: cat=409, pages 7 through 33
# inclusive. The page bounds are named so the scanned range is easy to adjust.
print("构建列表...")
first_page, last_page = 7, 33
cat_li = [
    "https://www.tjupt.org/torrents.php?inclbookmarked=0&incldead=0&picktype=0&spstate=0&cat=409&page=%d" % page
    for page in range(first_page, last_page + 1)
]
print("构建完成...")
# Fetch every listing page and collect the absolute URLs of the torrent detail
# pages it links to (hrefs inside table.torrentname that start with "detail").
print("请求种子列表...")
to_li = []
for cat_item in cat_li:
    print(cat_item)
    # requests has no default timeout; without one a stalled connection would
    # block the script forever.
    content = s.get(cat_item, headers=headers, timeout=30).text
    html = etree.HTML(content)
    if html is None:
        # lxml can return None when the body contains no parseable markup
        # (e.g. an empty response); skip the page instead of crashing on .xpath.
        print("Skip (empty page): %s" % cat_item)
        continue
    to_li.extend(
        urljoin("https://www.tjupt.org", str(href))
        for href in html.xpath("//table[@class='torrentname']//a/@href")
        if str(href).startswith("detail")
    )
    # NOTE: a throttle (time.sleep(2)) was left disabled here in the original;
    # re-enable it if the site rate-limits.
print("种子列表获取成功...")
# Visit each torrent detail page, read its "最近活动种子" (last activity) value
# and delete the torrent when that value falls in the target month.
print("获取种子详情...")
# Torrents whose last-activity text starts with this prefix are deleted.
target_prefix = "2020-01-"
length = len(to_li)
for i, url in enumerate(to_li, start=1):
    print("Task %d/%d: " % (i, length) + url)

    # Anchor on the query-string separator so "uid=" etc. cannot match, and do
    # not require a trailing "&" so an id at the end of the URL still works.
    id_match = re.search(r'[?&]id=(\d+)', url)
    if id_match is None:
        print("Skip: no torrent id in %s" % url)
        continue
    torrent_id = id_match.group(1)

    content = s.get(url, headers=headers, timeout=30).text
    html = etree.HTML(content)
    # Text nodes of the element that contains the bold "最近活动种子:" label.
    html_data = (
        html.xpath("//b[text()='最近活动种子:']/../text()")
        if html is not None
        else []
    )
    if not html_data:
        # Label missing (e.g. a login or error page was returned): never
        # delete when the last-activity value cannot be read.
        print("Torrent:%s last-activity field not found, skipped" % torrent_id)
        continue
    last_active = str(html_data[0])

    if last_active.startswith(target_prefix):
        data = {
            'id': torrent_id,
            # NOTE(review): reason code '1' is whatever the site's delete form
            # defines for it — confirm against the form before reuse.
            'reasontype': '1',
            'reason[]': '',
        }
        response = s.post(
            'https://www.tjupt.org/delete.php',
            headers=headers,
            data=data,
            timeout=30,
        )
        # Only report success when the server did not answer with an HTTP error.
        if response.ok:
            print("Torrent:%s delete done!" % torrent_id)
        else:
            print("Torrent:%s delete failed (HTTP %d)" % (torrent_id, response.status_code))
    else:
        print("Torrent:%s last active at %s" % (torrent_id, last_active))
    # NOTE: throttles (time.sleep(2)) were left disabled in both branches of
    # the original; re-enable one here if the site rate-limits.