欢迎您访问程序员文章站,本站旨在为大家提供、分享程序员计算机编程知识!
您现在的位置是: 首页  >  IT编程

线索数据同步自动化代码主程序

程序员文章站 2023-11-17 20:03:04
#coding = utf-8 #author : JoJo from get_data import getData from login import logIn from readExcel import getIDList from selenium import webdriver from writeData import writeData def main(): chrome_options = webdriver.ChromeOptions() chrome_optio......

# coding=utf-8
#author : JoJo

from get_data import getData
from login import logIn
from readExcel import getIDList
from selenium import webdriver
from writeData import writeData

def main():
    """Log in, fetch one value per main ID, and write the results to Excel.

    Steps, in order:
      1. Prompt on stdin for the cutoff month and cutoff day.
      2. Start a headless Chrome session and pass it to ``logIn``.
      3. Read the ID lists from the workbook with ``getIDList``.
      4. For every main ID, build ``baseurl + ID`` and call ``getData``.
      5. Hand the IDs and the collected integers to ``writeData``.

    The browser is always shut down, even when a step raises.

    Raises:
        ValueError: propagated from ``int()`` when a value returned by
            ``getData`` is not a valid integer literal.
    """
    chrome_options = webdriver.ChromeOptions()
    chrome_options.add_argument('--headless')
    chrome_options.add_argument('--disable-gpu')

    # Basic settings.
    baseurl = "https://vr.autohome.com.cn/om/#/*****************************/"
    filePath = ".\\818************明细.xlsx"
    dataMonth = input("输入截止月:\n")
    dataDate = input("输入截止日:\n")

    # Create the browser object. ``options=`` replaces the deprecated
    # ``chrome_options=`` keyword, which newer Selenium releases reject.
    bro = webdriver.Chrome(options=chrome_options)
    try:
        # Log in to the site.
        logIn(bro)
        print("Login finished\n")

        # Get the ID lists used to build the full page URLs.
        print("Getting ID list... ...")
        # Only the main list is processed here; the second list is unused.
        IDListMain, _ = getIDList(filePath)
        print("ID list achieved\n")

        dataListMain = []
        for rawID in IDListMain:
            ID = str(rawID)
            print("ID is ", ID)
            url = baseurl + ID
            print("URL is ", url)
            # Visit the URL and fetch the data.
            data = getData(url, bro, dataMonth, dataDate)
            # str() keeps the output identical for string results while not
            # failing if getData ever returns a non-string value.
            print(str(data) + "\n")
            dataListMain.append(int(data))

        # NOTE(review): the trailing 1 presumably selects the "main" list
        # inside writeData -- confirm against its definition.
        writeData(IDListMain, dataListMain, filePath, 1)
    finally:
        # Always release the Chrome/chromedriver processes.
        bro.quit()

    print("mission accomplished!")

# Run the sync only when this file is executed as a script, not on import.
if __name__ == "__main__":
    main()

本文地址:https://blog.csdn.net/qq_43317541/article/details/107451064

相关标签: python 数据挖掘