You can not select more than 25 topics Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.

94 lines
2.9 KiB

3 years ago
# -*- coding: utf-8 -*-
import json
3 years ago
from selenium import webdriver
from selenium.webdriver.chrome.options import Options
from lxml import etree
import random
import settings
import time
3 years ago
headers = {
'User-Agent': random.choice(settings.USER_AGENT)
3 years ago
}
def getsource(url):
initChrome = Options()
3 years ago
initChrome.add_argument('--no-sandbox')
initChrome.add_argument('--headless')
initChrome.add_argument('--disable-gpu')
initChrome.add_argument("disable-cache")
initChrome.add_argument('disable-infobars')
initChrome.add_argument('log-level=3') # INFO = 0 WARNING = 1 LOG_ERROR = 2 LOG_FATAL = 3 default is 0
initChrome.add_experimental_option("excludeSwitches",['enable-automation','enable-logging'])
3 years ago
driver = webdriver.Chrome(chrome_options = initChrome, executable_path = './chromedriver.exe')
3 years ago
driver.implicitly_wait(10)
driver.get(url)
response = etree.HTML(driver.page_source)
response = etree.tostring(response, encoding = "utf-8", pretty_print = True, method = "html")
response = response.decode('utf-8')
driver.close()
3 years ago
return response
def manmanbuy(url):
initChrome = Options()
'''
3 years ago
initChrome.add_argument('--no-sandbox')
initChrome.add_argument('--headless')
initChrome.add_argument('--disable-gpu')
initChrome.add_argument("disable-cache")
initChrome.add_argument('disable-infobars')
initChrome.add_argument('log-level=3') # INFO = 0 WARNING = 1 LOG_ERROR = 2 LOG_FATAL = 3 default is 0
initChrome.add_experimental_option("excludeSwitches",['enable-automation','enable-logging'])
'''
3 years ago
# driver = webdriver.Chrome(chrome_options = initChrome, executable_path = './chromedriver.exe')
driver = webdriver.Chrome(executable_path = './chromedriver.exe')
# driver.get(url)
# time.sleep(10)
with open('cookies.json', 'r', encoding='utf-8') as fd:
listCookies = json.loads(fd.read())
for cookie in listCookies:
cookies = {
'domain': cookie['domain'],
'httpOnly': cookie['httpOnly'],
'name':cookie['name'],
'path':'/',
'secure': cookie['secure'],
'value':cookie['value'],
}
print(cookies)
driver.add_cookie(cookies)
driver.get(url)
time.sleep(10)
exit()
3 years ago
driver.implicitly_wait(10)
driver.get(url)
response = etree.HTML(driver.page_source)
response = etree.tostring(response, encoding = "utf-8", pretty_print = True, method = "html")
response = response.decode('utf-8')
driver.close()
return response
def saveCookies(driver):
jsonCookies = json.dumps(driver.get_cookies())
with open('cookies.json', 'w', encoding='utf-8') as fd:
fd.write(jsonCookies)
fd.close()
3 years ago
def buy():
jdurl = "https://item.jd.com/10047511027349.html"
url = "https://tool.manmanbuy.com/HistoryLowest.aspx?url=" + jdurl
# print(url)
response = manmanbuy(url)
3 years ago
print(response)
if __name__ == "__main__":
buy()