.oO SearXNG Developer Documentation Oo.
Loading...
Searching...
No Matches
torznab.py
Go to the documentation of this file.
1# SPDX-License-Identifier: AGPL-3.0-or-later
"""Torznab_ is an API specification that provides a standardized way to query
torrent sites for content. It is used by a number of torrent applications,
including Prowlarr_ and Jackett_.
5
6Using this engine together with Prowlarr_ or Jackett_ allows you to search
7a huge number of torrent sites which are not directly supported.
8
9Configuration
10=============
11
12The engine has the following settings:
13
14``base_url``:
15 Torznab endpoint URL.
16
17``api_key``:
18 The API key to use for authentication.
19
20``torznab_categories``:
21 The categories to use for searching. This is a list of category IDs. See
22 Prowlarr-categories_ or Jackett-categories_ for more information.
23
24``show_torrent_files``:
25 Whether to show the torrent file in the search results. Be careful as using
26 this with Prowlarr_ or Jackett_ leaks the API key. This should be used only
27 if you are querying a Torznab endpoint without authentication or if the
28 instance is private. Be aware that private trackers may ban you if you share
29 the torrent file. Defaults to ``false``.
30
31``show_magnet_links``:
32 Whether to show the magnet link in the search results. Be aware that private
33 trackers may ban you if you share the magnet link. Defaults to ``true``.
34
35.. _Torznab:
36 https://torznab.github.io/spec-1.3-draft/index.html
37.. _Prowlarr:
38 https://github.com/Prowlarr/Prowlarr
39.. _Jackett:
40 https://github.com/Jackett/Jackett
41.. _Prowlarr-categories:
42 https://wiki.servarr.com/en/prowlarr/cardigann-yml-definition#categories
43.. _Jackett-categories:
44 https://github.com/Jackett/Jackett/wiki/Jackett-Categories
45
46Implementations
47===============
48
49"""
50from __future__ import annotations
51from typing import TYPE_CHECKING
52
53from typing import List, Dict, Any
54from datetime import datetime
55from urllib.parse import quote
56from lxml import etree # type: ignore
57
58from searx.exceptions import SearxEngineAPIException
59from searx.utils import humanize_bytes
60
61if TYPE_CHECKING:
62 import httpx
63 import logging
64
65 logger: logging.Logger
66
# Engine metadata and capabilities.
about: Dict[str, Any] = {
    'website': None,
    'wikidata_id': None,
    'official_api_documentation': 'https://torznab.github.io/spec-1.3-draft',
    'use_official_api': True,
    'require_api_key': False,
    'results': "XML",
}
categories: List[str] = ["files"]
paging: bool = False
time_range_support: bool = False

# The values below are defaults; they are meant to be set in settings.yml.

# Torznab endpoint URL, for example (Jackett):
# "http://localhost:9117/api/v2.0/indexers/all/results/torznab"
base_url: str = ""
# API key sent with every request when it is not empty.
api_key: str = ""
# Category IDs to restrict the search to, see
# https://newznab.readthedocs.io/en/latest/misc/api/#predefined-categories
torznab_categories: List[str] = []
# Whether results carry a torrent file link / a magnet link.
show_torrent_files: bool = False
show_magnet_links: bool = True
88
89
def init(engine_settings=None):  # pylint: disable=unused-argument
    """Initialize the engine.

    Checks that the module-level ``base_url`` setting has been configured.
    ``engine_settings`` is accepted but not used.

    :raises ValueError: if ``base_url`` is empty or ``None``.
    """
    # A truth test also covers ``None``, for which ``len()`` would raise a
    # TypeError instead of the intended ValueError.
    if not base_url:
        raise ValueError('missing torznab base_url')
94
95
def request(query: str, params: Dict[str, Any]) -> Dict[str, Any]:
    """Build the request params.

    Stores the Torznab search URL in ``params['url']`` and returns ``params``.
    The URL is ``base_url`` followed by ``t=search`` and the percent-encoded
    query; ``apikey`` and ``cat`` are appended only when the corresponding
    settings are not empty.

    :param query: the search terms.
    :param params: the request parameters; updated in place.
    :returns: the same ``params`` dict.
    """
    # Assemble the query string piece by piece rather than running
    # ``str.format`` over a template that contains ``base_url``: a literal
    # ``{`` or ``}`` in the configured URL would be read as a replacement field.
    query_args: List[str] = ['t=search', 'q=' + quote(query)]

    if api_key:
        # Percent-encode the key so reserved characters cannot break the URL;
        # ``str()`` tolerates a key that was configured as a number.
        query_args.append('apikey=' + quote(str(api_key), safe=''))
    if torznab_categories:
        query_args.append('cat=' + ",".join(str(x) for x in torznab_categories))

    params['url'] = base_url + '?' + '&'.join(query_args)

    return params
110
111
def response(resp: httpx.Response) -> List[Dict[str, Any]]:
    """Parse the XML response and return a list of results.

    The first child of the document root is treated as the channel; every
    ``item`` element directly below it is converted with ``build_result``.

    :raises SearxEngineAPIException: if the document root is an ``error``
        element; its ``description`` attribute becomes the message.
    """
    root = etree.XML(resp.content)

    # handle errors: https://newznab.readthedocs.io/en/latest/misc/api/#newznab-error-codes
    if root.tag == "error":
        raise SearxEngineAPIException(root.get("description"))

    channel: etree.Element = root[0]
    return [build_result(entry) for entry in channel.iterfind('item')]
129
130
def build_result(item: etree.Element) -> Dict[str, Any]:
    """Build a result from a XML item.

    Reads the plain child elements and the ``torznab:attr`` attributes of
    ``item`` and maps them to the keys of a ``torrent.html`` result.
    ``torrentfile`` and ``magnetlink`` are filled in only when
    ``show_torrent_files`` / ``show_magnet_links`` are enabled; otherwise they
    stay ``None``.
    """

    # extract attributes from XML
    # see https://torznab.github.io/spec-1.3-draft/torznab/Specification-v1.3.html#predefined-attributes
    enclosure: etree.Element | None = item.find('enclosure')
    enclosure_url: str | None = None
    if enclosure is not None:
        enclosure_url = enclosure.get('url')

    filesize = get_attribute(item, 'size')
    # Compare with None explicitly: an lxml element without child nodes is
    # falsy, and <enclosure> typically carries only attributes, so a plain
    # truth test would skip this fallback.
    if not filesize and enclosure is not None:
        filesize = enclosure.get('length')

    guid = get_attribute(item, 'guid')
    comments = get_attribute(item, 'comments')
    pubDate = get_attribute(item, 'pubDate')
    seeders = get_torznab_attribute(item, 'seeders')
    leechers = get_torznab_attribute(item, 'leechers')
    peers = get_torznab_attribute(item, 'peers')

    # map attributes to searx result
    result: Dict[str, Any] = {
        'template': 'torrent.html',
        'title': get_attribute(item, 'title'),
        'filesize': humanize_bytes(int(filesize)) if filesize else None,
        'files': get_attribute(item, 'files'),
        'seed': seeders,
        'leech': _map_leechers(leechers, seeders, peers),
        'url': _map_result_url(guid, comments),
        'publishedDate': _map_published_date(pubDate),
        'torrentfile': None,
        'magnetlink': None,
    }

    link = get_attribute(item, 'link')
    if show_torrent_files:
        result['torrentfile'] = _map_torrent_file(link, enclosure_url)
    if show_magnet_links:
        magneturl = get_torznab_attribute(item, 'magneturl')
        result['magnetlink'] = _map_magnet_link(magneturl, guid, enclosure_url, link)
    return result
173
174
175def _map_result_url(guid: str | None, comments: str | None) -> str | None:
176 if guid and guid.startswith('http'):
177 return guid
178 if comments and comments.startswith('http'):
179 return comments
180 return None
181
182
183def _map_leechers(leechers: str | None, seeders: str | None, peers: str | None) -> str | None:
184 if leechers:
185 return leechers
186 if seeders and peers:
187 return str(int(peers) - int(seeders))
188 return None
189
190
191def _map_published_date(pubDate: str | None) -> datetime | None:
192 if pubDate is not None:
193 try:
194 return datetime.strptime(pubDate, '%a, %d %b %Y %H:%M:%S %z')
195 except (ValueError, TypeError) as e:
196 logger.debug("ignore exception (publishedDate): %s", e)
197 return None
198
199
200def _map_torrent_file(link: str | None, enclosure_url: str | None) -> str | None:
201 if link and link.startswith('http'):
202 return link
203 if enclosure_url and enclosure_url.startswith('http'):
204 return enclosure_url
205 return None
206
207
209 magneturl: str | None,
210 guid: str | None,
211 enclosure_url: str | None,
212 link: str | None,
213) -> str | None:
214 if magneturl and magneturl.startswith('magnet'):
215 return magneturl
216 if guid and guid.startswith('magnet'):
217 return guid
218 if enclosure_url and enclosure_url.startswith('magnet'):
219 return enclosure_url
220 if link and link.startswith('magnet'):
221 return link
222 return None
223
224
def get_attribute(item: etree.Element, property_name: str) -> str | None:
    """Get attribute from item.

    Looks up the first sub-element of ``item`` matching ``property_name`` and
    returns its text, or ``None`` when there is no such sub-element.
    """
    node: etree.Element | None = item.find(property_name)
    return None if node is None else node.text
231
232
def get_torznab_attribute(item: etree.Element, attribute_name: str) -> str | None:
    """Get torznab special attribute from item.

    Searches below ``item`` for a ``torznab:attr`` element whose ``name``
    attribute equals ``attribute_name`` and returns its ``value`` attribute,
    or ``None`` when no such element exists.
    """
    namespaces = {'torznab': 'http://torznab.com/schemas/2015/feed'}
    xpath = f'.//torznab:attr[@name="{attribute_name}"]'
    match: etree.Element | None = item.find(xpath, namespaces)
    return None if match is None else match.get("value")
datetime|None _map_published_date(str|None pubDate)
Definition torznab.py:191
str|None _map_result_url(str|None guid, str|None comments)
Definition torznab.py:175
List[Dict[str, Any]] response(httpx.Response resp)
Definition torznab.py:112
str|None _map_torrent_file(str|None link, str|None enclosure_url)
Definition torznab.py:200
str|None get_torznab_attribute(etree.Element item, str attribute_name)
Definition torznab.py:233
str|None _map_leechers(str|None leechers, str|None seeders, str|None peers)
Definition torznab.py:183
init(engine_settings=None)
Definition torznab.py:90
str|None _map_magnet_link(str|None magneturl, str|None guid, str|None enclosure_url, str|None link)
Definition torznab.py:213
Dict[str, Any] request(str query, Dict[str, Any] params)
Definition torznab.py:96
str|None get_attribute(etree.Element item, str property_name)
Definition torznab.py:225
Dict[str, Any] build_result(etree.Element item)
Definition torznab.py:131