1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556575859606162636465666768697071727374757677787980818283848586878889909192939495969798 |
- """
- Torrentz2.eu (BitTorrent meta-search engine)
-
- @website https://torrentz2.eu/
- @provide-api no
-
- @using-api no
- @results HTML
- @stable no (HTML can change, although unlikely,
- see https://torrentz.eu/torrentz.btsearch)
- @parse url, title, publishedDate, seed, leech, filesize, magnetlink
- """
-
- import re
- from lxml import html
- from datetime import datetime
- from searx.engines.xpath import extract_text
- from searx.url_utils import urlencode
- from searx.utils import get_torrent_size
-
# engine settings: result categories this engine is listed under, and
# whether more than one result page can be requested
paging = True
categories = ['files', 'videos', 'music']

# root of the site; result links are appended to it
base_url = 'https://torrentz2.eu/'
# search endpoint template, e.g. https://torrentz2.eu/search?f=EXAMPLE&p=6
# ({query} receives the already url-encoded query string)
search_url = ''.join((base_url, 'search?{query}'))
-
-
- # do search-request
def request(query, params):
    """Build the search URL for the requested page and store it in ``params``.

    The search terms are sent as the ``f`` argument and
    ``params['pageno'] - 1`` as the ``p`` argument.  The same ``params``
    dict is returned with its ``'url'`` entry set.
    """
    query_args = {'f': query, 'p': params['pageno'] - 1}
    params['url'] = search_url.format(query=urlencode(query_args))
    return params
-
-
- # get response from search-request
def response(resp):
    """Parse a search result page into a list of torrent result dicts.

    Every ``<dl>`` below ``<div class="results">`` is treated as one
    candidate row.  A row is skipped when it has no ``<dt>`` cell, when that
    cell does not contain exactly one link, or when the link has no ``href``.

    Each returned dict always has ``url``, ``title``, ``seed``, ``leech`` and
    ``template``.  ``filesize``, ``magnetlink`` and ``publishedDate`` are
    added only when they can be extracted from the row; a failure to extract
    one of them never discards the row.

    :param resp: response object whose ``text`` attribute holds the HTML
    :returns: list of result dicts, in page order
    """
    results = []

    # Compiled once per page instead of once per row.  Anchored at the end so
    # that only a link consisting of exactly 40 hex digits is used as an
    # info-hash (a plain ``match`` would also accept longer links and append
    # the trailing part to the magnet URI).
    sha1_re = re.compile(r'[0-9a-fA-F]{40}\Z')

    dom = html.fromstring(resp.text)

    for result in dom.xpath('//div[@class="results"]/dl'):
        name_cells = result.xpath('./dt')
        if not name_cells:
            # malformed row without a name cell
            continue
        name_cell = name_cells[0]

        # skip rows that do not contain a link to a torrent
        links = name_cell.xpath('./a')
        if len(links) != 1:
            continue

        href = links[0].attrib.get('href')
        if href is None:
            # an anchor without a target cannot be turned into a result
            continue

        # remove the leading slash(es); base_url already ends with one
        link = href.lstrip('/')
        title = extract_text(name_cell)

        # seed/leech counts are best effort; a count that cannot be read
        # keeps its default of 0
        seed = 0
        leech = 0
        try:
            seed = int(result.xpath('./dd/span[4]/text()')[0].replace(',', ''))
            leech = int(result.xpath('./dd/span[5]/text()')[0].replace(',', ''))
        except (IndexError, ValueError):
            pass

        params = {
            'url': base_url + link,
            'title': title,
            'seed': seed,
            'leech': leech,
            'template': 'torrent.html'
        }

        # let's try to calculate the torrent size
        try:
            filesize_info = result.xpath('./dd/span[3]/text()')[0]
            filesize, filesize_multiplier = filesize_info.split()
            params['filesize'] = get_torrent_size(filesize, filesize_multiplier)
        except Exception:
            # get_torrent_size is defined elsewhere and the errors it may
            # raise are not visible here, so stay best effort -- but no
            # longer swallow KeyboardInterrupt/SystemExit like a bare except
            pass

        # is our link a valid SHA1 sum?
        if sha1_re.match(link):
            # add a magnet link to the result
            params['magnetlink'] = 'magnet:?xt=urn:btih:' + link

        # extract and convert creation date (read from the span's title
        # attribute and interpreted as a timestamp)
        try:
            date_ts = result.xpath('./dd/span[2]')[0].attrib.get('title')
            params['publishedDate'] = datetime.fromtimestamp(float(date_ts))
        except (IndexError, TypeError, ValueError, OverflowError, OSError):
            # span missing, no title attribute, not a number, or a timestamp
            # outside the range the platform can convert
            pass

        results.append(params)

    return results
|