137 search_results = resp.json()
140 if not search_results.get(
'query', {}).get(
'search'):
143 for result
in search_results[
'query'][
'search']:
145 if result.get(
'snippet',
'').startswith(
'#REDIRECT'):
148 title = result[
'title']
149 sectiontitle = result.get(
'sectiontitle')
150 content = html_to_text(result.get(
'snippet',
''))
151 metadata = html_to_text(result.get(
'categorysnippet',
''))
152 timestamp = result.get(
'timestamp')
155 base_url.format(language=resp.search_params[
'language']) +
'wiki/' + quote(title.replace(
' ',
'_').encode())
159 url +=
'#' + quote(sectiontitle.replace(
' ',
'_').encode())
160 title +=
' / ' + sectiontitle
162 item = {
'url': url,
'title': title,
'content': content,
'metadata': metadata}
165 item[
'publishedDate'] = datetime.strptime(timestamp, timestamp_format)