方客户奶

# -*- coding: utf-8 -*-

import datetime
import os.path, configparser
import time
import random
from selenium import webdriver

# Base name shared by the CSV output file and its run log.
# NOTE(review): the pasted source also showed a timestamped base name
# (strftime '%Y%m%d_%H%M%S') that this fixed name immediately overrode.
w_time1 = "context0"
# Current working directory with forward slashes and a trailing separator.
pathfilename = os.getcwd().replace('\\', '/') + '/'
filename_list = pathfilename + w_time1 + '.txt'
filename_log = pathfilename + w_time1 + 'log.txt'
config_fileName = pathfilename + "load_db0.ini"
# Input list of pages to scrape: one "index,id,district,url" record per line.
log_link1 = r"D:\PythonScript\log_link.txt"
# Records whose page could not be scraped are appended here.
error_link1 = r"D:\PythonScript\errorContext0.txt"
# The scan walks backwards and stops just above this line index.
STOP_INDEX = 8000


def load_mark(config, path):
    """Load the resume mark from the ini file at *path* into *config*.

    A missing file, a missing ``[Mark]`` section or a missing ``load_mark``
    option is initialised to ``'0'`` and written back, so later calls to
    ``save_mark`` always find the section.

    Returns the mark as an int, or 0 when the stored value is not an integer.
    """
    config.read(path)
    if not config.has_section("Mark"):
        config.add_section("Mark")
    if not config.has_option("Mark", "load_mark"):
        config.set("Mark", "load_mark", '0')
        with open(path, "w") as handle:
            config.write(handle)
    try:
        return int(config.get("Mark", "load_mark"), 10)
    except ValueError:
        print("异常")
        return 0


def save_mark(config, path, sindex):
    """Store *sindex* as the resume mark and rewrite the ini file at *path*."""
    config.set("Mark", "load_mark", str(sindex))
    with open(path, "w") as handle:
        config.write(handle)


def pending_indices(mark, line_count, stop=STOP_INDEX):
    """Return the link-file line indices to process, in descending order.

    Iteration starts at ``mark - 1`` (clamped to the last existing line so a
    short link file cannot cause an IndexError) and ends just above *stop*.
    """
    # NOTE(review): the pasted source showed three alternative loop headers;
    # this descending one is assumed to be the live one. The others were
    # range(mark + 1, line_count) and range(mark - 1, 5) -- confirm.
    start = min(mark - 1, line_count - 1)
    return range(start, stop, -1)


def parse_link_line(raw_line):
    """Split one link-file record into ``(index, id, district, url)``.

    Raises ValueError when the record has fewer than four comma-separated
    fields. The URL is stripped so a trailing newline is not sent to the
    browser.
    """
    fields = raw_line.split(",")
    if len(fields) < 4:
        raise ValueError("malformed link record: %r" % raw_line)
    return fields[0], fields[1], fields[2], fields[3].strip()


def format_rows(sindex, record_id, district, source, table):
    """Build the CSV output lines for one scraped page.

    *table* is a list of rows, each a list of cell texts. Rows whose first
    cell is the "序号" header label are skipped; for the rest, cells 1, 3 and
    4 are emitted after the record's own identifying fields. A row with too
    few cells raises IndexError, so the whole page is reported as failed
    rather than partially written.
    """
    lines = []
    for cells in table:
        if cells[0] == "序号":
            continue
        lines.append(
            str(sindex) + ',' + str(record_id) + ',' + district + ',' + source + ','
            + cells[1] + ',' + cells[3] + ',' + cells[4] + '\n'
        )
    return lines


def scrape_page(url):
    """Open *url* in headless Chrome and return ``(source, table)``.

    *source* is the text of the first span in the page's "detail-info"
    header block with the '来源:' label removed; *table* holds the cell
    texts of every row of the "form-panel-input-cls" table. The browser is
    always shut down, even when a lookup fails.
    """
    # Imported here so the locator constants are in scope without touching
    # the file's import block.
    from selenium.webdriver.common.by import By

    option = webdriver.ChromeOptions()
    option.add_argument('headless')
    browser = webdriver.Chrome(options=option)
    try:
        browser.implicitly_wait(30)
        browser.get(url)
        # The page content is looked up inside the frame named 'iframe'.
        browser.switch_to.frame('iframe')
        header = browser.find_element(By.TAG_NAME, "body").find_element(By.TAG_NAME, "header")
        spans = header.find_element(By.CLASS_NAME, "detail-info").find_elements(By.TAG_NAME, "span")
        source = spans[0].text.replace('来源:', '')
        rows = browser.find_element(By.CLASS_NAME, "form-panel-input-cls").find_element(
            By.TAG_NAME, "tbody").find_elements(By.TAG_NAME, "tr")
        table = [[cell.text for cell in row.find_elements(By.TAG_NAME, "td")] for row in rows]
        return source, table
    finally:
        # quit() also ends the driver process, so failed pages do not leave
        # headless browsers running.
        browser.quit()


def main():
    """Scrape every pending page of the link file into the CSV output.

    Progress is persisted in the ini file after each page that produced
    rows, so an interrupted run can resume. Records that fail for any
    reason are appended to the error file and the run continues.
    """
    config = configparser.ConfigParser()
    s_dateTime_mark = load_mark(config, config_fileName)

    with open(filename_list, 'a', encoding='utf-8') as file_object, \
            open(filename_log, 'a', encoding='utf-8') as file_object_log:
        print(s_dateTime_mark)
        # A mark of 0 means nothing has been scraped yet: emit the header.
        if s_dateTime_mark == 0:
            file_object.write('序号,原ID,地区,单位名称,项目名称,金额(元),时间' + '\n')

        file_object_log.write('開始時間:' + str(datetime.datetime.now()) + '\n')

        with open(log_link1, 'r', encoding='utf-8') as read_file:
            date_line = read_file.readlines()

        for line in pending_indices(s_dateTime_mark, len(date_line)):
            date_line1 = date_line[line]
            try:
                _sindex, _id, _districtName, _url = parse_link_line(date_line1)
                laiyuan, allContext = scrape_page(_url)
                output_lines = format_rows(_sindex, _id, _districtName, laiyuan, allContext)
                for value_input in output_lines:
                    file_object.write(value_input)
                    print(value_input)
                if output_lines:
                    save_mark(config, config_fileName, _sindex)
                file_object_log.write(
                    '序号:' + str(_sindex) + ' 開始時間:' + str(datetime.datetime.now()) + '\n')
                file_object.flush()
                file_object_log.flush()
                # Random pause between pages.
                time.sleep(random.uniform(2, 6))
            except Exception as e:
                # Best effort: keep the failed record for a later retry and
                # move on to the next page.
                with open(error_link1, 'a', encoding='utf-8') as errorFile:
                    errorFile.write(date_line1 + '\n')
                print(e)


if __name__ == "__main__":
    main()

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值