parent
7d70637177
commit
117aa4abbc
@ -0,0 +1,35 @@
|
|||||||
|
#!/usr/bin/env python
|
||||||
|
# coding: utf-8
|
||||||
|
|
||||||
|
# In[ ]:
|
||||||
|
|
||||||
|
|
||||||
|
import requests
|
||||||
|
import bs4
|
||||||
|
import pandas as pd
|
||||||
|
# Scrape up to 11 listing pages and export the collected entries to a CSV file.
#
# `result` is a column-oriented accumulator: one list per CSV column. The five
# lists are always appended to together, so index k in every list describes
# the same listing.
result = {
    "jobname": [],  # stripped text of the entry's target="_blank" link
    "area": [],     # text of the entry's "area" link
    "salary": [],   # text of the entry's "text-warning" span
    "url": [],      # href of the entry's "area" link
    "edu": [],      # text of the entry's "edu" span
}

# Seconds to wait for each page; without a timeout a stalled server would
# block the script forever.
REQUEST_TIMEOUT = 10

for i in range(11):
    # NOTE(review): this literal carries leading/trailing spaces and the page
    # index is appended directly after the trailing space. It is kept
    # byte-for-byte because the intended address cannot be determined from
    # this file -- confirm the real paginated listing URL.
    page_url = " https://mp.weixin.qq.com/s/K0u_qPFQtWuH4hk5K2xWfQ " + str(i)
    print(page_url)

    try:
        r = requests.get(page_url, timeout=REQUEST_TIMEOUT)
        r.raise_for_status()
    except requests.RequestException as exc:
        # One unreachable page should not discard the rows already collected.
        print("skipping page {}: {}".format(i, exc))
        continue

    html = bs4.BeautifulSoup(r.text, "html.parser")
    job_list = html.find("ul", class_="sojob-list")
    if job_list is None:
        # find() returns None when nothing matches; calling find_all on it
        # would raise AttributeError and abort the whole run.
        print("skipping page {}: no 'sojob-list' element found".format(i))
        continue

    for item in job_list.find_all("li"):
        title_link = item.find("a", target="_blank")
        area_link = item.find("a", class_="area")
        salary_tag = item.find("span", class_="text-warning")
        edu_tag = item.find("span", class_="edu")

        required = (title_link, area_link, salary_tag, edu_tag)
        if any(tag is None for tag in required):
            # Entry lacks one of the expected fields; skip it as a whole so
            # the columns stay aligned.
            continue

        link = area_link.get("href")
        if link is None:
            continue

        result["jobname"].append(title_link.text.strip())
        result["area"].append(area_link.text)
        result["salary"].append(salary_tag.text)
        result["url"].append(link)
        result["edu"].append(edu_tag.text)

df = pd.DataFrame(result)
# utf_8_sig writes a BOM so spreadsheet tools detect the encoding of non-ASCII text.
df.to_csv("shenzhen_Zhaopin.csv", encoding="utf_8_sig")
|
||||||
|
|
Loading…
Reference in new issue