Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
#!/usr/bin/env python3
"""Collect monster names from https://www.pokedex.org/ with headless Chrome.

The script sends PAGE_DOWN to the page a fixed number of times, re-parses
the page source after every scroll step, and gathers the text of the first
<span> of every <li> inside <ul id="monsters-list">.  Each name is printed
whenever it is seen; the unique names are kept in `results` in first-seen
order and their count is printed at the end.
"""
import time

import bs4
import selenium.webdriver.common

option = selenium.webdriver.ChromeOptions()
option.add_argument('headless')

# NOTE(review): newer Selenium releases expect `service=` / `options=` instead
# of a positional driver path and `chrome_options=` -- confirm against the
# installed Selenium version before changing this call.
driver = selenium.webdriver.Chrome('C:/Users/Asus/Downloads/Compressed/chromedriver.exe', chrome_options=option)
# Alternative driver location (Linux):
#driver = selenium.webdriver.Chrome('/home/furas/bin/chromedriver', chrome_options=option)

results = []   # unique names, in the order they were first seen
seen = set()   # same names, for O(1) membership tests

try:
    driver.get('https://www.pokedex.org/')

    # --- scroll down ---
    for x in range(30):  # TODO: different method to get "end of page"
        selenium.webdriver.ActionChains(driver).send_keys(
            selenium.webdriver.common.keys.Keys.PAGE_DOWN
        ).perform()
        time.sleep(0.3)  # it needs time to load new data

        soup = bs4.BeautifulSoup(driver.page_source, 'lxml')
        monsters = soup.find('ul', id='monsters-list')
        if monsters is None:
            # The list element is not in the page source (yet); try again
            # after the next scroll step instead of crashing on None.
            continue

        for li in monsters.find_all('li'):
            name = li.find('span')
            if name is None:
                continue
            text = name.text
            print(text)
            # Compare the text, not the Tag object: `results` holds strings,
            # so testing the Tag itself would never match and every pass
            # would append duplicates.
            if text not in seen:
                seen.add(text)
                results.append(text)
finally:
    # Always shut the browser down so no headless Chrome process is left
    # running, even when scraping fails part-way.
    driver.quit()

print('len:', len(results))
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement