线索数据同步自动化代码主程序
# -*- coding: utf-8 -*-
#author : JoJo
from get_data import getData
from login import logIn
from readExcel import getIDList
from selenium import webdriver
from writeData import writeData
def main():
    """Collect one value per main ID from the web console and write them out.

    Steps, in order:
      1. Prompt on stdin for the cut-off month and cut-off day.
      2. Start a headless Chrome session and log in with ``logIn``.
      3. Read the main and competitive ID lists from the workbook at
         ``filePath`` with ``getIDList``.
      4. For every main ID, open ``baseurl + ID`` through ``getData`` and
         convert the returned value to ``int``.
      5. Hand the IDs and the collected values to ``writeData``.

    The browser is always shut down, even if a step fails.

    Raises:
        ValueError: if a value returned by ``getData`` is not an integer
            literal (raised by ``int``).
    """
    # Headless Chrome: no visible window, GPU acceleration disabled.
    chrome_options = webdriver.ChromeOptions()
    chrome_options.add_argument('--headless')
    chrome_options.add_argument('--disable-gpu')

    # Basic settings.
    baseurl = "https://vr.autohome.com.cn/om/#/*****************************/"
    filePath = ".\\818************明细.xlsx"
    dataMonth = input("输入截止月:\n")
    dataDate = input("输入截止日:\n")

    # Create the browser object. ``options=`` replaces the deprecated
    # ``chrome_options=`` keyword, which newer Selenium releases reject.
    bro = webdriver.Chrome(options=chrome_options)
    try:
        # Log in to the site.
        logIn(bro)
        print("Login finished\n")

        # Fetch the ID lists used to build the full page URLs.
        print("Getting ID list... ...")
        # Only the main list is processed here; the competitive list is
        # returned by getIDList but not used by this function.
        IDListMain, _competitive_ids = getIDList(filePath)
        print("ID list achieved\n")

        dataListMain = []
        for raw_id in IDListMain:
            ID = str(raw_id)
            print("ID is ", ID)
            url = baseurl + ID
            print("URL is ", url)
            # Visit the URL and fetch the data.
            data = getData(url, bro, dataMonth, dataDate)
            # NOTE(review): the concatenation below requires getData to
            # return a str -- confirm against getData.
            print(data + "\n")
            dataListMain.append(int(data))

        # NOTE(review): the meaning of the trailing ``1`` is defined by
        # writeData, which is not visible here -- confirm.
        writeData(IDListMain, dataListMain, filePath, 1)
        print("mission accomplished!")
    finally:
        # Without this the headless Chrome process outlives the script.
        bro.quit()
# Run the sync only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()
本文地址:https://blog.csdn.net/qq_43317541/article/details/107451064
推荐阅读
-
线索数据同步自动化代码主程序
-
AngularJs使用ng-model-options设置数据同步时机提高网站性能(代码教程)
-
vue axios 异步改同步请求(获得数据后再执行下面的代码)
-
线索数据同步自动化代码主程序
-
基于数据库的自动化生成工具,自动生成JavaBean、数据库文档、框架代码等(v5.8.8版)
-
自动生成mysql触发器代码,实现数据同步_MySQL
-
自动生成mysql触发器代码,实现数据同步_MySQL
-
使用react实现手机号的数据同步显示功能的示例代码
-
同步数据库自动化脚本_MySQL
-
AngularJs使用ng-model-options设置数据同步时机提高网站性能(代码教程)