Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
import json
import re
import time
from urllib.parse import quote

import bs4
from bs4 import BeautifulSoup as soup
from selenium import webdriver
# Script: prompt for a search phrase, open the matching DOAJ search page in
# Firefox, and print the text of every abstract block found on that page.

# Abstract blocks whose text is not longer than this many characters are
# skipped (same threshold the script has always used).
MIN_ABSTRACT_LENGTH = 20

driver = webdriver.Firefox()
try:
    search_text = input("enter text \n")
    print("\n\n")

    # Build the search payload as real JSON and percent-encode it as a whole,
    # so quotes, backslashes, '&', '#', non-ASCII text, etc. in the user's
    # input can no longer corrupt the JSON or the URL.
    search_query = {
        "query": {
            "query_string": {
                "query": search_text,
                "default_operator": "AND",
            }
        },
        "from": 0,
        "size": 10,
    }
    url = "https://doaj.org/search?source=" + quote(
        json.dumps(search_query, separators=(",", ":")), safe=""
    )

    driver.get(url)
    # Fixed pause before reading the page source -- presumably to let the
    # page's scripts render the results; TODO confirm whether an explicit
    # wait on the result elements would be more reliable.
    time.sleep(2)
    pagesoup = soup(driver.page_source, "html.parser")

    for container in pagesoup.find_all("div", {"class": "abstract_text"}):
        abstract = container.text
        if len(abstract) <= MIN_ABSTRACT_LENGTH:
            continue
        try:
            print(abstract)
            print("\n")
        except UnicodeEncodeError:
            # Best effort: the console encoding cannot represent this
            # abstract, so skip it and keep going with the rest.
            continue
finally:
    # Always shut the browser session down, even if something above failed.
    driver.quit()
Add Comment
Please, Sign In to add comment