Source code for veryscrape.scrapers.google
from ..process import extract_urls
from ..scrape import SearchEngineScraper, ItemGenerator
from ..session import Session
class GoogleSession(Session):
    """Session subclass that overrides two failure-handling settings.

    How these settings are interpreted is defined by ``Session``, which is
    not part of this module.
    """

    # NOTE(review): presumably the number of retries tolerated before a
    # request counts as an error -- confirm against Session.
    retries_to_error = 2
    # NOTE(review): presumably tells Session not to raise when a request
    # ultimately fails -- confirm against Session.
    error_on_failure = False
class ArticleGen(ItemGenerator):
    """Item generator that reads its fields positionally from an item."""

    def process_text(self, text):
        """Return the element at index 0 of ``text``.

        NOTE(review): ``text`` is presumably a (content, timestamp) pair
        supplied by ``ItemGenerator`` -- confirm against the base class.
        """
        content = text[0]
        return content

    def process_time(self, text):
        """Return the element at index 1 of ``text``.

        NOTE(review): presumably the time component of the same pair that
        ``process_text`` reads -- confirm against the base class.
        """
        timestamp = text[1]
        return timestamp
class Google(SearchEngineScraper):
    """Search-engine scraper configured for Google News article search."""

    # Label attached to items produced by this scraper.
    source = 'article'
    # Generator class used to turn raw results into items.
    item_gen = ArticleGen
    # Session class used for requests made by this scraper.
    session_class = GoogleSession

    def query_string(self, query):
        """Build the Google News search URL for ``query``.

        The query is percent-encoded before being placed in the URL path, so
        spaces and reserved characters (``/``, ``?``, ``#``, ``&``, ``%``)
        cannot alter the structure of the resulting URL.

        :param query: search term; converted with ``str()`` before encoding
        :return: the search URL as a string
        """
        # Function-scope import keeps this block self-contained.
        from urllib.parse import quote

        # safe='' also escapes '/', which would otherwise split the path
        # segment that carries the query.
        encoded = quote(str(query), safe='')
        return ('https://news.google.com/news/search/section/q/'
                '{0}/{0}?hl=en&gl=US&ned=us'.format(encoded))