# engines/linuxtracker.py

# -*- coding: utf-8 -*-
#VERSION: 1.1
#AUTHORS: Joost Bremmer (toost.b@gmail.com)
#
#  This program is free software: you can redistribute it and/or modify
#  it under the terms of the GNU General Public License as published by
#  the Free Software Foundation, either version 3 of the License, or
#  (at your option) any later version.
#
#  This program is distributed in the hope that it will be useful,
#  but WITHOUT ANY WARRANTY; without even the implied warranty of
#  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
#  GNU General Public License for more details.
#
#  You should have received a copy of the GNU General Public License
#  along with this program.  If not, see <https://www.gnu.org/licenses/>.


try:
    from HTMLParser import HTMLParser
except ImportError:
    from html.parser import HTMLParser
import re

# import qBT modules
try:
    from novaprinter import prettyPrinter
    from helpers import retrieve_url
except:
    pass


class linuxtracker(object):
    """Search engine plugin used by qBittorrent to query Linux Tracker."""

    url = 'http://linuxtracker.org'
    name = 'Linux Tracker'
    # defines which search categories are supported by this search engine
    # and their corresponding id. Possible categories are:
    # 'all', 'movies', 'tv', 'music', 'games', 'anime', 'software', 'pictures',
    # 'books'
    supported_categories = {'all': 0, 'software': 0}

    class LinuxSearchParser(HTMLParser):
        """Parse a Linux Tracker result page and collect the hits it lists.

        The parser is a small state machine driven by two kinds of tags:

        * ``<a>`` tags open a hit (torrent-details link), close a hit
          (magnet link) or merely re-arm data capture (peers link).
        * ``</strong>`` tags are counted; the text that follows the 3rd,
          4th and 5th closing tag of a hit is taken as its size, seeds and
          leechers respectively.  The text following the 6th one resets
          the counter.

        Finished hits are appended to the list passed in as ``res``.
        """

        def __init__(self, res, url):
            """Set up the parser state.

            :param res: list that receives one dict per finished hit.
            :param url: base url of the engine, used to build absolute
                        description links.
            """
            # Calling the base initializer explicitly works for both the
            # Python 2 (old-style class) and Python 3 HTMLParser, so no
            # try/except around super() is needed.
            HTMLParser.__init__(self)
            self.results = res
            self.engine_url = url
            # Hit currently being assembled, or None when outside a hit.
            self.curr = None
            # Number of </strong> tags seen since the last reset.
            self.strong_count = 0
            # When True, the next text node is inspected by handle_data().
            self.wait_for_data = True

        def handle_starttag(self, tag, attr):
            """Dispatch anchor tags to start_a(); ignore everything else."""
            if tag == 'a':
                self.start_a(attr)

        def handle_endtag(self, tag):
            """Dispatch closing strong tags to end_strong()."""
            if tag == 'strong':
                self.end_strong()

        def start_a(self, attr):
            """Open, finish or re-arm a hit depending on the anchor's href.

            :param attr: list of (name, value) pairs as given by HTMLParser.
            """
            params = dict(attr)
            href = params.get('href')
            if not href:
                # No href, or a valueless one (HTMLParser reports None):
                # nothing to match against.
                return

            if 'title' in params and "torrent-details" in href:
                # Link to the description page: a new hit starts here and
                # the anchor text that follows is its name.
                self.curr = {'desc_link': self.engine_url + '/' + href}
                self.wait_for_data = True
            elif "magnet:?" in href:
                if self.curr is None:
                    # Magnet link without a preceding details link; there
                    # is no hit to attach it to, so skip it rather than
                    # failing on a None item assignment.
                    return
                self.curr['link'] = href
                self.curr['engine_url'] = self.engine_url
                self.results.append(self.curr)
                self.curr = None
            elif "peers" in href:
                self.wait_for_data = True

        def end_strong(self):
            """Count a closing strong tag and capture the text after it."""
            self.strong_count += 1
            self.wait_for_data = True

        def handle_data(self, data):
            """Store a text node in the current hit when one is awaited.

            Which field is filled depends on how many ``</strong>`` tags
            have been seen: 0 -> name, 3 -> size, 4 -> seeds, 5 -> leechers.
            At 6 the counter is reset.  Any other count consumes the text
            without storing it.
            """
            if not self.wait_for_data:
                return
            # Every awaited text node is consumed exactly once.
            self.wait_for_data = False

            count = self.strong_count
            if count == 6:
                # Reset strong counter
                self.strong_count = 0
                return
            if not self.curr:
                return

            if count == 0:
                # Get title
                self.curr['name'] = data.strip()
            elif count == 3:
                # Get size; strip all commas since they screw with
                # prettyPrinter
                self.curr["size"] = data.replace(",", "").strip()
            elif count == 4 or count == 5:
                # Get seeds / leechers; text that is not a plain integer
                # is deliberately ignored (best effort).
                key = "seeds" if count == 4 else "leech"
                try:
                    self.curr[key] = int(data.strip())
                except ValueError:
                    pass

    def __init__(self):
        """class initialization"""

    def download_torrent(self, info):
        """Placeholder download hook; currently performs no action.

        NOTE(review): the hits produced by LinuxSearchParser carry magnet
        links, which presumably need no temporary file -- confirm against
        how nova2dl treats engines that define this method.

        :param info: the download url handed over by the caller (unused).
        """

    # DO NOT CHANGE the name and parameters of this function
    # This function will be the one called by nova2.py
    def search(self, what, cat='all'):
        """
        Retrieve and parse engine search results by category and query.

        Result pages are fetched one after another; every hit found is
        passed to prettyPrinter.  Paging stops at the first page that
        yields fewer than 15 hits.

        Parameters:
        :param what: a string with the search tokens, already escaped
                     (e.g. "Ubuntu+Linux")
        :param cat:  the name of a search category, see supported_categories.
                     Currently not used to build the query.
        """

        url = str("{0}/index.php?page=torrents"
                  "&active=1&order=5&by=2&search={1}").format(self.url, what)

        # The parser appends into this very list, so it is cleared in place
        # between pages instead of being rebound.
        hits = []
        page = 1
        parser = self.LinuxSearchParser(hits, self.url)
        while True:
            res = retrieve_url(url + "&pages={}".format(page))
            parser.feed(res)
            for each in hits:
                prettyPrinter(each)

            if len(hits) < 15:
                break
            del hits[:]
            page += 1

        parser.close()