# Scrape the Ctrip (携程) sight page for Mount Tai (泰山).

from selenium import webdriver
from selenium.webdriver.common.by import By
import time
from selenium.webdriver.support.ui import WebDriverWait
from selenium.webdriver.support import expected_conditions as EC
# Page whose comments are printed.
TARGET_URL = "https://you.ctrip.com/sight/taian746/136014.html"

# Absolute XPath of the element whose text is printed for each comment;
# "{index}" is the 1-based position of the comment in the list.
# NOTE(review): an absolute path like this breaks whenever the page layout
# changes -- confirm it still matches before relying on the output.
COMMENT_XPATH_TEMPLATE = (
    "/html/body/div[2]/div[2]/div[1]/div[3]/div/div[4]/div[1]/div[4]"
    "/div/div[5]/div[{index}]/div[2]/div[2]"
)

MAX_COMMENTS = 10  # maximum number of comments to print; adjust as needed
INITIAL_WAIT_SECONDS = 30  # pause after opening the page, before scraping
SCROLL_PAUSE_SECONDS = 2  # pause after each scroll
ELEMENT_TIMEOUT_SECONDS = 10  # how long to wait for one comment to appear


def comment_xpath(index):
    """Return the absolute XPath of the comment at 1-based position *index*."""
    return COMMENT_XPATH_TEMPLATE.format(index=index)


def wait_for_comment(driver, index, timeout=ELEMENT_TIMEOUT_SECONDS):
    """Wait for comment *index* to be present in the DOM and return it.

    Can also be called on its own (e.g. with ``index=1``) to check that the
    XPath still matches the page.

    Args:
        driver: The Selenium WebDriver showing the target page.
        index: 1-based position of the comment.
        timeout: Maximum number of seconds to wait for the element.

    Returns:
        The located WebElement.

    Raises:
        selenium.common.exceptions.TimeoutException: If the element is not
            present within *timeout* seconds.
    """
    return WebDriverWait(driver, timeout).until(
        EC.presence_of_element_located((By.XPATH, comment_xpath(index)))
    )


def scroll_to_bottom(driver):
    """Scroll the current page to the bottom of the document body."""
    driver.execute_script("window.scrollTo(0, document.body.scrollHeight)")


def main():
    """Open the target page in Edge and print up to MAX_COMMENTS comments."""
    # Local import: the file's import header does not provide this name.
    from selenium.common.exceptions import TimeoutException

    driver = webdriver.Edge()
    try:
        driver.get(TARGET_URL)

        # NOTE(review): the previous revision ran a standalone XPath check
        # here that used the loop counter before it was assigned (NameError),
        # and then called driver.get() with a page title instead of a URL,
        # which Selenium rejects and which would have left the target page.
        # Both are dropped; use wait_for_comment(driver, 1) to check the
        # XPath by hand.

        # Presumably gives the page time to finish loading (or the user time
        # to dismiss dialogs / log in) -- TODO confirm the intent.
        time.sleep(INITIAL_WAIT_SECONDS)
        scroll_to_bottom(driver)

        for index in range(1, MAX_COMMENTS + 1):
            # Scroll again before each lookup, as the original loop did;
            # presumably this triggers loading of further comments.
            scroll_to_bottom(driver)
            time.sleep(SCROLL_PAUSE_SECONDS)
            try:
                element = wait_for_comment(driver, index)
            except TimeoutException:
                # Fewer comments than requested (or the XPath no longer
                # matches): stop cleanly instead of crashing.
                print(f"No comment found at position {index}; stopping.")
                break
            print(f"结果 {index}: {element.text}")
    finally:
        # Always close the browser so the driver process is not leaked.
        driver.quit()


if __name__ == "__main__":
    main()