You can not select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
40 lines
1.3 KiB
40 lines
1.3 KiB
import time
|
|
|
|
from selenium import webdriver # 用来驱动浏览器的
|
|
from selenium.webdriver.chrome.options import Options
|
|
from selenium.webdriver.support.wait import WebDriverWait # 等待页面加载某些元素
|
|
|
|
|
|
def getZhiYe(code):
    """Open the career detail page for ``code`` and click through its tab links.

    Uses the module-level ``driver`` (a Selenium WebDriver), which must have
    been created before this function is called. The text of every link that
    gets clicked is printed to stdout; nothing is returned.

    Args:
        code: Career code string appended to the detail URL's ``code`` query
            parameter (e.g. ``'02090400'``).

    Raises:
        selenium.common.exceptions.NoSuchElementException: If one of the
            hard-coded XPath locations is not present on the page.
    """
    # Imported here so this function does not depend on a module-level import.
    # The generic find_element(By..., ...) API is used because the
    # find_element_by_* helpers were removed in Selenium 4.3.
    from selenium.webdriver.common.by import By

    url = 'https://pv4y-pc-tob.youzy.cn/careers/detail/index?code=' + code
    driver.get(url)

    # Simulate a click on the second link of the page's link row. The click is
    # dispatched through JavaScript rather than WebElement.click().
    tab_link = driver.find_element(
        By.XPATH, "/html/body/div/div[1]/section/div/div[2]/div[2]/a[2]"
    )
    driver.execute_script("arguments[0].click();", tab_link)
    time.sleep(1)  # fixed pause before looking up the next elements

    # Locate the first sub-link, step up to its parent, and collect every
    # <a> element underneath that parent.
    first_link = driver.find_element(
        By.XPATH,
        "/html/body/div/div[1]/section/div/div[2]/div[3]/div/div[1]/a[1]",
    )
    link_container = first_link.find_element(By.XPATH, "..")
    links = link_container.find_elements(By.TAG_NAME, "a")

    for link in links:
        print(link.text)
        driver.execute_script("arguments[0].click();", link)
        time.sleep(1)  # fixed pause after each click
|
|
|
|
|
|
if __name__ == '__main__':
    # Start Chrome through webdriver with an (empty) Options object.
    option = Options()
    # NOTE: `driver` is intentionally a module-level name; getZhiYe() reads it
    # as a global.
    driver = webdriver.Chrome(options=option)
    try:
        # Let element lookups poll for up to 2 seconds before failing.
        driver.implicitly_wait(2)
        driver.maximize_window()

        # Load the main site first, before visiting the detail page.
        authPage = 'https://www.youzy.cn/tzy/search/colleges/collegeList'
        driver.get(authPage)

        # Scrape
        getZhiYe('02090400')
    finally:
        # Always shut the browser session down, even if scraping raised, so
        # the browser/driver processes are not left running.
        driver.quit()
|