# Recovered from a git format-patch e-mail whose line breaks had been lost.
# Original patch header, kept for provenance:
#   From d81717feb7348bfd7085f8903c2fd2573c59d47a Mon Sep 17 00:00:00 2001
#   From: psjyva5l8 <1523334128@qq.com>
#   Date: Thu, 10 Mar 2022 11:28:29 +0800
#   Subject: [PATCH] ADD file via upload
#   spider2.py | 76 insertions(+), create mode 100644, index 0000000..0ecabc7
import os
import datetime
import time
# NOTE(review): this binds the ``asyncio.futures`` submodule. If the rest of
# the file drives a thread pool, ``concurrent.futures`` was probably the
# intended module -- confirm against the code that uses ``futures``.
from asyncio import futures

import requests
import re

Max_Workers = 24  # maximum number of worker threads


# Open the target website.
def work(index, timeout=10):
    """Download one listing page of pic.netbian.com and return its HTML.

    Args:
        index: Page number substituted into ``index_<index>.html``.
        timeout: Seconds to wait for the server before giving up. Without a
            timeout ``requests`` waits indefinitely, so a single stalled
            connection would block the calling worker forever.

    Returns:
        The response body as text (``Response.text``).

    Raises:
        requests.exceptions.RequestException: If the connection fails or the
            timeout expires.
    """
    url = 'https://pic.netbian.com/index_{}.html'.format(index)
    response = requests.get(url, timeout=timeout)
    return response.text


# Use a regular expression to match the image links.
# NOTE: the definition below is cut off in the recovered text (it stops in the
# middle of a string literal), so the visible fragment is preserved verbatim
# as a comment instead of guessing at the missing part.
# def matchPicUrl(html):
#     # regexp = r'src="(/uploads.*?\.jpg)"'
#     regexp = r'