import os import time import psutil from selenium.webdriver.chrome.options import Options from selenium import webdriver from selenium.webdriver.common.by import By import openpyxl import urllib.request

检查是否已经存在浏览器实例,如果存在则不再创建

for proc in psutil.process_iter(): try: if 'chrome' in proc.name() and '--remote-debugging-port=9224' in proc.cmdline(): options = Options() options.add_experimental_option('debuggerAddress', '127.0.0.1:9224') break except: pass else: # 创建浏览器实例 os.system(r'start chrome --remote-debugging-port=9224 --user-data-dir="D:\评阅用"') options = Options() options.add_experimental_option('debuggerAddress', '127.0.0.1:9224')

在已有的浏览器实例中查找标签页

driver = webdriver.Chrome(options=options) tabs = driver.window_handles for tab in tabs: driver.switch_to.window(tab) if driver.title == '考后核验': print('登陆成功') break

打开Excel表格

wb = openpyxl.load_workbook(r'C:\Users\Administrator\Desktop\考后核验.xlsx') sheet = wb.active

创建照片文件夹

if not os.path.exists(r'C:\Users\Administrator\Desktop\照片'): os.mkdir(r'C:\Users\Administrator\Desktop\照片')

遍历时间单元K列

for row in sheet.iter_rows(min_row=2, max_row=sheet.max_row, min_col=11, max_col=11): for cell in row: # 获取时间单元内的数据 data = cell.value if data: # 创建子文件夹 folder_name = time.strftime('%Y-%m-%d %H-%M-%S', time.strptime(data, '%Y-%m-%d %H:%M:%S')) folder_path = os.path.join(r'C:\Users\Administrator\Desktop\照片', folder_name) if not os.path.exists(folder_path): os.mkdir(folder_path)

遍历表格内'A'列数据

for row in sheet.iter_rows(min_row=2, max_row=sheet.max_row, min_col=1, max_col=1): for cell in row: # 获取学号 student_id = cell.value if student_id: # 在网页内查找考生信息 search_input = driver.find_element(By.XPATH, '//input[@placeholder='姓名/考生号']') search_input.clear() search_input.send_keys(student_id) time.sleep(1) # 等待页面加载完成 search_button = driver.find_element(By.XPATH, '//button[@class='ant-btn ant-btn-primary']') driver.execute_script('arguments[0].click();', search_button) time.sleep(1) # 等待页面加载完成

        # 获取考生信息
        student_info = driver.find_element(By.XPATH, '//td[@class=\'ant-table-column-has-actions ant-table-column-has-sorters\' and text()=\'{}\']'.format(student_id))
        # 提取学号和姓名
        student_number = student_info.text
        student_name = student_info.find_element(By.XPATH, './following-sibling::td').text
        
        # 遍历时间单元K列和考场编号H列数据
        for k_row, h_row in zip(sheet.iter_rows(min_row=2, max_row=sheet.max_row, min_col=11, max_col=11), sheet.iter_rows(min_row=2, max_row=sheet.max_row, min_col=8, max_col=8)):
            k_cell = k_row[0]
            h_cell = h_row[0]
            k_data = k_cell.value
            h_data = h_cell.value
            if k_data and h_data:
                # 提取时间和考场编号
                k_time = time.strftime('%Y-%m-%d %H:%M:%S', time.strptime(k_data, '%Y-%m-%d %H:%M:%S'))
                h_number = str(h_data)
                
                # 在网页内查找所有时间单元和考场编号元素
                time_elements = driver.find_elements(By.XPATH, '//td[@class=\'ant-table-column-has-actions ant-table-column-has-sorters\' and text()=\'{}\']'.format(k_time))
                number_elements = driver.find_elements(By.XPATH, '//td[@class=\'ant-table-column-has-actions ant-table-column-has-sorters\' and text()=\'{}\']'.format(h_number))
                
                for time_element, number_element in zip(time_elements, number_elements):
                    # 获取时间和考场编号所在行的学号和姓名
                    row_student_number = time_element.find_element(By.XPATH, './preceding-sibling::td').text
                    row_student_name = time_element.find_element(By.XPATH, './preceding-sibling::td[2]').text
                    
                    # 如果学号和姓名匹配,则保存照片
                    if row_student_number == student_number and row_student_name == student_name:
                        # 创建考场编号文件夹
                        folder_path = os.path.join(r'C:\Users\Administrator\Desktop\照片', k_time, h_number)
                        if not os.path.exists(folder_path):
                            os.mkdir(folder_path)
                        
                        # 保存照片
                        photo_element = number_element.find_element(By.XPATH, './following-sibling::td/img')
                        photo_url = photo_element.get_attribute('src')
                        photo_name = '{}_{}.jpg'.format(student_number, student_name)
                        photo_path = os.path.join(folder_path, photo_name)
                        urllib.request.urlretrieve(photo_url, photo_path)
                        break

driver.quit()

Python Selenium 自动化下载考生照片

原文地址: https://www.cveoy.top/t/topic/fI38 著作权归作者所有。请勿转载和采集!

免费AI点我,无需注册和登录