205 params[
'headers'][
'Accept-Encoding'] =
'gzip, deflate'
212 args[
'spellcheck'] =
'1'
214 if brave_category
in (
'search',
'goggles'):
215 if params.get(
'pageno', 1) - 1:
216 args[
'offset'] = params.get(
'pageno', 1) - 1
217 if time_range_map.get(params[
'time_range']):
218 args[
'tf'] = time_range_map.get(params[
'time_range'])
220 if brave_category ==
'goggles':
221 args[
'goggles_id'] = Goggles
223 params[
"url"] = f
"{base_url}{brave_category}?{urlencode(args)}"
227 params[
'cookies'][
'safesearch'] = safesearch_map.get(params[
'safesearch'],
'off')
229 params[
'cookies'][
'useLocation'] =
'0'
230 params[
'cookies'][
'summarizer'] =
'0'
232 engine_region = traits.get_region(params[
'searxng_locale'],
'all')
233 params[
'cookies'][
'country'] = engine_region.split(
'-')[-1].lower()
235 ui_lang = locales.get_engine_locale(params[
'searxng_locale'], traits.custom[
"ui_lang"],
'en-us')
236 params[
'cookies'][
'ui_lang'] = ui_lang
238 logger.debug(
"cookies %s", params[
'cookies'])
240 params[
'headers'][
'Sec-Fetch-Dest'] =
"document"
241 params[
'headers'][
'Sec-Fetch-Mode'] =
"navigate"
242 params[
'headers'][
'Sec-Fetch-Site'] =
"same-origin"
243 params[
'headers'][
'Sec-Fetch-User'] =
"?1"
306 dom = html.fromstring(resp.text)
310 answer_tag = eval_xpath_getindex(dom,
'//div[@class="answer"]', 0, default=
None)
312 url = eval_xpath_getindex(dom,
'//div[@id="featured_snippet"]/a[@class="result-header"]/@href', 0, default=
None)
313 answer = extract_text(answer_tag)
314 if answer
is not None:
315 result_list.add(result_list.types.Answer(answer=answer, url=url))
318 xpath_results =
'//div[contains(@class, "snippet ")]'
320 for result
in eval_xpath_list(dom, xpath_results):
322 url = eval_xpath_getindex(result,
'.//a[contains(@class, "h")]/@href', 0, default=
None)
323 title_tag = eval_xpath_getindex(
324 result,
'.//a[contains(@class, "h")]//div[contains(@class, "title")]', 0, default=
None
326 if url
is None or title_tag
is None or not urlparse(url).netloc:
329 content: str = extract_text(
330 eval_xpath_getindex(result,
'.//div[contains(@class, "snippet-description")]', 0, default=
'')
332 pub_date_raw = eval_xpath(result,
'substring-before(.//div[contains(@class, "snippet-description")], "-")')
334 if pub_date
and content.startswith(pub_date_raw):
335 content = content.lstrip(pub_date_raw).strip(
"- \n\t")
337 thumbnail = eval_xpath_getindex(result,
'.//img[contains(@class, "thumb")]/@src', 0, default=
'')
341 'title': extract_text(title_tag),
343 'publishedDate': pub_date,
344 'thumbnail': thumbnail,
347 video_tag = eval_xpath_getindex(
348 result,
'.//div[contains(@class, "video-snippet") and @data-macro="video"]', 0, default=
None
350 if video_tag
is not None:
355 iframe_src = get_embeded_stream_url(url)
357 item[
'iframe_src'] = iframe_src
358 item[
'template'] =
'videos.html'
359 item[
'thumbnail'] = eval_xpath_getindex(video_tag,
'.//img/@src', 0, default=
'')
360 pub_date_raw = extract_text(
361 eval_xpath(video_tag,
'.//div[contains(@class, "snippet-attributes")]/div/text()')
365 item[
'thumbnail'] = eval_xpath_getindex(video_tag,
'.//img/@src', 0, default=
'')
367 result_list.append(item)
375 dom = html.fromstring(resp.text)
377 for result
in eval_xpath_list(dom,
'//div[contains(@class, "results")]//div[@data-type="news"]'):
382 url = eval_xpath_getindex(result,
'.//a[contains(@class, "result-header")]/@href', 0, default=
None)
386 title = extract_text(eval_xpath_list(result,
'.//span[contains(@class, "snippet-title")]'))
387 content = extract_text(eval_xpath_list(result,
'.//p[contains(@class, "desc")]'))
388 thumbnail = eval_xpath_getindex(result,
'.//div[contains(@class, "image-wrapper")]//img/@src', 0, default=
'')
394 "thumbnail": thumbnail,
397 result_list.append(item)
450 """Fetch :ref:`languages <brave languages>` and :ref:`regions <brave
451 regions>` from Brave."""
455 import babel.languages
459 engine_traits.custom[
"ui_lang"] = {}
462 'Accept-Encoding':
'gzip, deflate',
464 lang_map = {
'no':
'nb'}
468 resp = get(
'https://search.brave.com/settings', headers=headers)
471 print(
"ERROR: response from Brave is not OK.")
472 dom = html.fromstring(resp.text)
474 for option
in dom.xpath(
'//section//option[@value="en-us"]/../option'):
476 ui_lang = option.get(
'value')
478 l = babel.Locale.parse(ui_lang, sep=
'-')
480 sxng_tag = region_tag(babel.Locale.parse(ui_lang, sep=
'-'))
482 sxng_tag = language_tag(babel.Locale.parse(ui_lang, sep=
'-'))
484 except babel.UnknownLocaleError:
485 print(
"ERROR: can't determine babel locale of Brave's (UI) language %s" % ui_lang)
488 conflict = engine_traits.custom[
"ui_lang"].get(sxng_tag)
490 if conflict != ui_lang:
491 print(
"CONFLICT: babel %s --> %s, %s" % (sxng_tag, conflict, ui_lang))
493 engine_traits.custom[
"ui_lang"][sxng_tag] = ui_lang
497 resp = get(
'https://cdn.search.brave.com/serp/v2/_app/immutable/chunks/parameters.734c106a.js', headers=headers)
500 print(
"ERROR: response from Brave is not OK.")
502 country_js = resp.text[resp.text.index(
"options:{all") + len(
'options:') :]
503 country_js = country_js[: country_js.index(
"},k={default")]
504 country_tags = js_variable_to_python(country_js)
506 for k, v
in country_tags.items():
508 engine_traits.all_locale =
'all'
510 country_tag = v[
'value']
513 for lang_tag
in babel.languages.get_official_languages(country_tag, de_facto=
True):
514 lang_tag = lang_map.get(lang_tag, lang_tag)
515 sxng_tag = region_tag(babel.Locale.parse(
'%s_%s' % (lang_tag, country_tag.upper())))
518 conflict = engine_traits.regions.get(sxng_tag)
520 if conflict != country_tag:
521 print(
"CONFLICT: babel %s --> %s, %s" % (sxng_tag, conflict, country_tag))
523 engine_traits.regions[sxng_tag] = country_tag