Commit d7796167 authored by liyang

fix:ptt debug

parent ad694283
...@@ -39,8 +39,9 @@ def reptile(browser=None, search_word=""): ...@@ -39,8 +39,9 @@ def reptile(browser=None, search_word=""):
# 打开网页 # 打开网页
browser.get(url) browser.get(url)
# log.debug("已打开浏览器") # log.debug("已打开浏览器")
classify_item_list = browser.find_elements('xpath', "//div[@class='board-class']") item_list = browser.find_elements('xpath', "//div[@class='board-class']")
# log.debug(classify_item_list) # log.debug(classify_item_list)
classify_item_list = item_list.copy()
length = len(classify_item_list) length = len(classify_item_list)
for index in range(length): for index in range(length):
# 暂时先爬取 第2个 分类 # 暂时先爬取 第2个 分类
...@@ -209,7 +210,7 @@ def reptile(browser=None, search_word=""): ...@@ -209,7 +210,7 @@ def reptile(browser=None, search_word=""):
browser.back() browser.back()
time.sleep(0.1) time.sleep(0.1)
# 重新获取 # 重新获取
classify_item_list = browser.find_elements('xpath', "//div[@class='board-class']") # classify_item_list = browser.find_elements('xpath', "//div[@class='board-class']")
# 发送爬取数据到java服务 # 发送爬取数据到java服务
# print('----------------------') # print('----------------------')
......
# set options to be headless, .. classify_item_list = browser.find_elements('xpath', "//div[@class='board-class']")
from selenium import webdriver # log.debug(classify_item_list)
options = webdriver.ChromeOptions() length = len(classify_item_list)
options.add_argument('--headless') for index in range(length):
options.add_argument('--no-sandbox') # 暂时先爬取 第2个 分类
options.add_argument('--disable-dev-shm-usage') if 0 <= index < 4:
type_title = classify_item_list[index].text
# open it, go to a website, and get results classify_item_list[index].click()
wd = webdriver.Chrome(options=options) time.sleep(0.1)
wd.get("https://www.youtube.com/results?search_query=俄乌战争") for index_two in range(length_two):
print(element_list[index_two].text)
print(wd.page_source) # results # 浏览器返回上一页
\ No newline at end of file browser.back()
if index == 0:
browser.back()
time.sleep(0.1)
classify_item_list = browser.find_elements('xpath', "//div[@class='board-class']")
\ No newline at end of file
Markdown is supported
0% or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or sign in to comment