## Google (News)
#
# @website     https://www.google.com
# @provide-api yes (https://developers.google.com/web-search/docs/),
#              deprecated!
#
# @using-api   yes
# @results     JSON
# @stable      yes (but deprecated)
# @parse       url, title, content, publishedDate

try:
    # Python 3 location of urlencode
    from urllib.parse import urlencode
except ImportError:
    # Python 2 fallback (the location this module originally imported from)
    from urllib import urlencode
from json import loads
from dateutil import parser

# engine dependent config
categories = ['news']
paging = True
language_support = True

# search-url
url = 'https://ajax.googleapis.com/'
search_url = url + 'ajax/services/search/news?v=2.0&start={offset}&rsz=large&safe=off&filter=off&{query}&hl={lang}'


# do search-request
def request(query, params):
    """Fill in ``params['url']`` for a Google News query and return ``params``.

    ``params`` is read for:
      * ``'pageno'``   -- 1-based page number; each page advances the
                          ``start`` offset by 8 results.
      * ``'language'`` -- ``'all'`` selects the default ``en-US``; any other
                          value is used as-is with ``_`` replaced by ``-``.

    The same ``params`` dict is mutated and returned.
    """
    # the URL asks for rsz=large; the original code pages in steps of 8
    offset = (params['pageno'] - 1) * 8

    language = 'en-US'
    if params['language'] != 'all':
        language = params['language'].replace('_', '-')

    params['url'] = search_url.format(offset=offset,
                                      query=urlencode({'q': query}),
                                      lang=language)

    return params


# get response from search-request
def response(resp):
    """Parse the JSON body in ``resp.text`` into a list of result dicts.

    Each returned dict has the keys ``'url'``, ``'title'``,
    ``'publishedDate'`` (parsed with ``dateutil.parser.parse``) and
    ``'content'``.  An empty list is returned when the payload carries no
    results, including when ``responseData`` is missing or ``null``.

    Entries lacking ``'url'`` or ``'unescapedUrl'`` are skipped.
    """
    search_res = loads(resp.text)

    # ``responseData`` may be present but null, so ``.get(key, {})`` alone is
    # not enough: fall back to an empty dict for any falsy value.
    response_data = search_res.get('responseData') or {}
    raw_results = response_data.get('results')

    # return empty array if there are no results
    if not raw_results:
        return []

    results = []

    # parse results
    for result in raw_results:
        # Skip incomplete entries *before* touching any other field, and
        # check the key that is actually read below ('unescapedUrl') in
        # addition to the originally checked 'url'.
        if 'url' not in result or 'unescapedUrl' not in result:
            continue

        # parse publishedDate
        publishedDate = parser.parse(result['publishedDate'])

        # append result
        results.append({'url': result['unescapedUrl'],
                        'title': result['titleNoFormatting'],
                        'publishedDate': publishedDate,
                        'content': result['content']})

    # return results
    return results