diff --git a/zy3.py b/zy3.py new file mode 100644 index 0000000..9ca5dd2 --- /dev/null +++ b/zy3.py @@ -0,0 +1,27 @@ +import requests + +import re +header = {"User-Agent": "Mozilla/5.0 (Linux; Android 6.0; Nexus 5 Build/MRA58N) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/122.0.0.0 Mobile Safari/537.36 Edg/122.0.0.0"} +urls=['https://www.jxxdxy.edu.cn/news-list-xiaoyuanyaowen-{}.html'.format(number) for number in range(1,21)] +all_url=[] +for url in urls: + #print(url) + all_url.append(url) + response = requests.get(url, headers=header,stream=True) + source=response.text + #print(source) + my_article1 = '