.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
niconico.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
2"""Niconico search engine for searxng"""
3
4from urllib.parse import urlencode
5from datetime import datetime, timedelta
6from lxml import html
7
8from searx.utils import eval_xpath_getindex, eval_xpath_list, eval_xpath, extract_text
9
10about = {
11 "website": "https://www.nicovideo.jp/",
12 "wikidata_id": "Q697233",
13 "use_official_api": False,
14 "require_api_key": False,
15 "results": "HTML",
16 "language": "ja",
17}
18
19categories = ["videos"]
20paging = True
21
22time_range_support = True
23time_range_dict = {"day": 1, "week": 7, "month": 30, "year": 365}
24
25base_url = "https://www.nicovideo.jp"
26embed_url = "https://embed.nicovideo.jp"
27
28results_xpath = '//li[@data-video-item]'
29url_xpath = './/a[@class="itemThumbWrap"]/@href'
30video_length_xpath = './/span[@class="videoLength"]'
31upload_time_xpath = './/p[@class="itemTime"]//span[@class="time"]/text()'
32title_xpath = './/p[@class="itemTitle"]/a'
33content_xpath = './/p[@class="itemDescription"]/@title'
34thumbnail_xpath = './/img[@class="thumb"]/@src'
35
36
37def request(query, params):
38 query_params = {"page": params['pageno']}
39
40 if time_range_dict.get(params['time_range']):
41 time_diff_days = time_range_dict[params['time_range']]
42 start_date = datetime.now() - timedelta(days=time_diff_days)
43 query_params['start'] = start_date.strftime('%Y-%m-%d')
44
45 params['url'] = f"{base_url}/search/{query}?{urlencode(query_params)}"
46 return params
47
48
49def response(resp):
50 results = []
51 dom = html.fromstring(resp.text)
52
53 for item in eval_xpath_list(dom, results_xpath):
54 relative_url = eval_xpath_getindex(item, url_xpath, 0)
55 video_id = relative_url.rsplit('?', maxsplit=1)[0].split('/')[-1]
56
57 url = f"{base_url}/watch/{video_id}"
58 iframe_src = f"{embed_url}/watch/{video_id}"
59
60 length = None
61 video_length = eval_xpath_getindex(item, video_length_xpath, 0)
62 if len(video_length) > 0:
63 try:
64 timediff = datetime.strptime(video_length, "%M:%S")
65 length = timedelta(minutes=timediff.minute, seconds=timediff.second)
66 except ValueError:
67 pass
68
69 published_date = None
70 upload_time = eval_xpath_getindex(item, upload_time_xpath, 0)
71 if len(upload_time) > 0:
72 try:
73 published_date = datetime.strptime(upload_time, "%Y/%m/%d %H:%M")
74 except ValueError:
75 pass
76
77 results.append(
78 {
79 'template': 'videos.html',
80 'title': extract_text(eval_xpath(item, title_xpath)),
81 'content': eval_xpath_getindex(item, content_xpath, 0),
82 'url': url,
83 "iframe_src": iframe_src,
84 'thumbnail': eval_xpath_getindex(item, thumbnail_xpath, 0),
85 'length': length,
86 "publishedDate": published_date,
87 }
88 )
89
90 return results
request(query, params)
Definition niconico.py:37