【spider】selenium模擬點擊斗魚示例

from selenium import webdriver
from selenium.common.exceptions import WebDriverException
from selenium.webdriver.common.by import By
import time

# Douyu directory page that lists every live room.
url = 'https://www.douyu.com/directory/all'

# Known problem with dynamically loaded HTML pages:
# "element is not attached to the page document".
# Elements may not have been loaded and rendered in time; if the wait is too short, lookups can raise errors.
# The page is rendered dynamically, so lookups and clicks can fail while it is
# still loading; such interactions are wrapped in try/except below.
class Douyu(object):
    """Scrape live-room titles and viewer counts from the Douyu directory.

    Drives a Chrome browser through the paginated listing at ``url``,
    printing each room and appending it to ``douyu.txt``.  The HTML of the
    first page is saved to ``douyu.html``.
    """

    def __init__(self):
        """Launch the Chrome browser used for the crawl."""
        self.driver = webdriver.Chrome()

    @staticmethod
    def _format_room(title, viewers):
        """Return the output line for one room, with whitespace trimmed."""
        return '標題是：%s，觀戰人數：%s' % (title.strip(), viewers.strip())

    def _dump_current_page(self, fp):
        """Print every room on the current page and append it to *fp*."""
        titles = self.driver.find_elements(By.CSS_SELECTOR, 'h3.ellipsis')
        nums = self.driver.find_elements(By.XPATH, '//span[@class="dy-num fr"]')
        print(len(titles), len(nums))
        # The first ten 'h3.ellipsis' matches are skipped before pairing with
        # the viewer counts -- presumably they are not room cards; verify
        # against the live page.
        for title, num in zip(titles[10:], nums):
            line = self._format_room(title.text, num.text)
            print(line)
            fp.write(line + '\n')

    def start(self):
        """Crawl the directory page by page, then close the browser.

        ``douyu.txt`` is closed and the browser is quit even when the crawl
        fails part-way through.
        """
        driver = self.driver
        try:
            driver.get(url)
            time.sleep(2)  # fixed wait for the dynamic page to render
            driver.find_element(By.CLASS_NAME, 'pop-zoom-close').click()
            with open('douyu.txt', 'w', encoding='utf-8') as fp:
                with open('douyu.html', 'w', encoding='utf-8') as file:
                    file.write(driver.page_source)
                while True:
                    self._dump_current_page(fp)
                    # On the last page the "next" link is disabled:
                    #   <a href="#" class="shark-pager-next shark-pager-disable
                    #      shark-pager-disable-next">下一頁</a>
                    # On every other page it is:
                    #   <a href="#" class="shark-pager-next">下一頁</a>
                    if 'shark-pager-disable-next' in driver.page_source:
                        break
                    # The currently selected page number looks like:
                    #   <a href="#" class="shark-pager-item current">1</a>
                    current_page = driver.find_element(
                        By.XPATH, '//a[@class="shark-pager-item current"]'
                    ).text
                    print('當前頁碼是：', current_page)
                    try:
                        driver.find_element(By.CLASS_NAME, 'shark-pager-next').click()
                        time.sleep(2)
                    except WebDriverException:
                        time.sleep(2)
                        # Fall back to clicking the last pager item.  An XPath
                        # step can carry several predicates by chaining [][].
                        # NOTE(review): the original indentation was lost; this
                        # click is assumed to belong to the except branch.
                        driver.find_element(
                            By.XPATH,
                            '//a[contains(@class,"shark-pager-item")][last()]',
                        ).click()
            time.sleep(10)  # keep the browser open briefly before quitting
        finally:
            driver.quit()


if __name__ == '__main__':
    douyu = Douyu()
    douyu.start()

本文來自互聯網用戶投稿，該文觀點僅代表作者本人，不代表本站立場。本站僅提供信息存儲空間服務，不擁有所有權，不承擔相關法律責任。
如若轉載，請注明出處：http://www.pswp.cn/news/456231.shtml
繁體地址，請注明出處：http://hk.pswp.cn/news/456231.shtml
英文地址，請注明出處：http://en.pswp.cn/news/456231.shtml

如若內容造成侵權/違法違規/事實不符，請聯系多彩編程網進行投訴反饋email:809451989@qq.com，一經查實，立即刪除！