.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
ask.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
2"""Ask.com"""
3
4from urllib.parse import urlencode
5import dateutil
6from lxml import html
7from searx import utils
8
9# Metadata
10about = {
11 "website": "https://www.ask.com/",
12 "wikidata_id": 'Q847564',
13 "official_api_documentation": None,
14 "use_official_api": False,
15 "require_api_key": False,
16 "results": "HTML",
17}
18
19# Engine Configuration
20categories = ['general']
21paging = True
22max_page = 5
23"""Ask.com has at max 5 pages."""
24
25# Base URL
26base_url = "https://www.ask.com/web"
27
28
29def request(query, params):
30
31 query_params = {
32 "q": query,
33 "page": params["pageno"],
34 }
35
36 params["url"] = f"{base_url}?{urlencode(query_params)}"
37 return params
38
39
40def response(resp):
41
42 start_tag = 'window.MESON.initialState = {'
43 end_tag = '}};'
44
45 dom = html.fromstring(resp.text)
46 script = utils.eval_xpath_getindex(dom, '//script', 0, default=None).text
47
48 pos = script.index(start_tag) + len(start_tag) - 1
49 script = script[pos:]
50 pos = script.index(end_tag) + len(end_tag) - 1
51 script = script[:pos]
52
53 json_resp = utils.js_variable_to_python(script)
54
55 results = []
56
57 for item in json_resp['search']['webResults']['results']:
58
59 pubdate_original = item.get('pubdate_original')
60 if pubdate_original:
61 pubdate_original = dateutil.parser.parse(pubdate_original)
62 metadata = [item.get(field) for field in ['category_l1', 'catsy'] if item.get(field)]
63
64 results.append(
65 {
66 "url": item['url'].split('&ueid')[0],
67 "title": item['title'],
68 "content": item['abstract'],
69 "publishedDate": pubdate_original,
70 # "thumbnail": item.get('image_url') or None, # these are not thumbs / to large
71 "metadata": ' | '.join(metadata),
72 }
73 )
74
75 return results
request(query, params)
Definition ask.py:29
response(resp)
Definition ask.py:40