Merge pull request #51 from ngosang/feature/limetorrents

Add limetorrents search plugin
2018-09-24 18:01:31 +02:00 · 2018-09-24 18:01:31 +02:00 · 4a21503f78
parent 47ee0b91de f8896bdbc5
commit 4a21503f78
4 changed files with 248 additions and 0 deletions
--- a/nova/engines/limetorrents.py
+++ b/nova/engines/limetorrents.py
@ -0,0 +1,123 @@
+#VERSION: 4.00
+# AUTHORS: Lima66
+# CONTRIBUTORS: Diego de las Heras (ngosang@hotmail.es)
+
+import re
+try:
+    # python3
+    from html.parser import HTMLParser
+except ImportError:
+    # python2
+    from HTMLParser import HTMLParser
+
+# qBt
+from novaprinter import prettyPrinter
+from helpers import retrieve_url
+
+
+class limetorrents(object):
+    """ qBittorrent search engine plugin for LimeTorrents """
+
+    url = "https://www.limetorrents.info"
+    name = "LimeTorrents"
+    # category key accepted by search() -> category segment of the search URL
+    supported_categories = {'all': 'all',
+                            'anime': 'anime',
+                            'software': 'applications',
+                            'games': 'games',
+                            'movies': 'movies',
+                            'music': 'music',
+                            'tv': 'tv'}
+    # upper bound on the number of result pages requested per search
+    max_pages = 6
+
+    class MyHtmlParser(HTMLParser):
+        """ Sub-class for parsing results
+
+        Every completed result row is handed to prettyPrinter() as a dict.
+        """
+
+        A, TD, TR, HREF = ('a', 'td', 'tr', 'href')
+        # bgcolor values of the <tr> elements that are treated as result rows
+        ROW_COLORS = ('#F4F4F4', '#FFFFFF')
+        # only cell texts ending with one of these units are kept as a size
+        SIZE_UNITS = ('MB', 'GB')
+
+        def error(self, message):
+            """ Discard the error message: nothing is raised or reported """
+            pass
+
+        def __init__(self, url):
+            HTMLParser.__init__(self)
+            self.url = url
+            self.current_item = {}  # dict for found item
+            self.item_name = None  # key's name in current_item dict
+            # search() treats pages of at most this many characters as empty
+            self.page_empty = 22000
+            self.inside_tr = False  # True while inside a result row
+            self.findTable = False  # True once the results table was seen
+            self.parser_class = {"tdnormal": "size",  # td class -> item key
+                                 "tdseed": "seeds",
+                                 "tdleech": "leech"}
+
+        def handle_starttag(self, tag, attrs):
+            """ Track the results table / rows and pick up cell kinds and links """
+            params = dict(attrs)
+            if params.get('class') == 'table2':
+                self.findTable = True
+
+            if (tag == self.TR and self.findTable
+                    and params.get('bgcolor') in self.ROW_COLORS):
+                self.inside_tr = True
+                self.current_item = {}
+            if not self.inside_tr:
+                return
+
+            if tag == self.TD:
+                if "class" in params:
+                    self.item_name = self.parser_class.get(params["class"])
+                    if self.item_name:
+                        # placeholder until handle_data() sees the cell text
+                        self.current_item[self.item_name] = -1
+            elif tag == self.A:
+                # an href without a value is parsed as None; skip it
+                link = params.get(self.HREF)
+                if not link:
+                    return
+                if link.startswith("http://itorrents.org/torrent/"):
+                    self.current_item["engine_url"] = self.url
+                    # the next text chunk of this row is stored as the name
+                    self.item_name = "name"
+                elif link.endswith(".html"):
+                    self.current_item["link"] = self.url + link
+                    self.current_item["desc_link"] = self.url + link
+
+        def handle_data(self, data):
+            """ Store the text of the cell/link announced by handle_starttag() """
+            if not (self.inside_tr and self.item_name):
+                return
+
+            # strip before testing the unit so trailing whitespace cannot
+            # hide it; presumably other columns share the size cell class,
+            # hence the unit filter -- confirm against the site markup
+            value = data.strip()
+            if self.item_name != 'size' or value.endswith(self.SIZE_UNITS):
+                self.current_item[self.item_name] = value.replace(',', '')
+
+            # only the first text chunk after the start tag is considered
+            self.item_name = None
+
+        def handle_endtag(self, tag):
+            """ Emit the collected item when its row ends """
+            if tag == 'table':
+                self.findTable = False
+
+            if self.inside_tr and tag == self.TR:
+                self.inside_tr = False
+                self.item_name = None
+                if self.current_item:
+                    prettyPrinter(self.current_item)
+                    self.current_item = {}
+
+    def download_torrent(self, info):
+        """ Prints "<magnet link> <info>" for the given description page
+
+        Raises Exception when the page contains no magnet link.
+        """
+        # since limetorrents provides torrent links in itorrent (cloudflare protected),
+        # we have to fetch the info page and extract the magnet link
+        info_page = retrieve_url(info)
+        magnet_match = re.search(r"href\s*\=\s*\"(magnet[^\"]+)\"", info_page)
+        if not magnet_match:
+            raise Exception('Error, please fill a bug report!')
+        print(magnet_match.group(1) + " " + info)
+
+    def search(self, query, cat='all'):
+        """ Performs search
+
+        Requests up to max_pages result pages, sorted by seeds, and feeds
+        them to the parser; stops early at the first page considered empty.
+        """
+        query = query.replace("%20", "-")
+        category = self.supported_categories[cat]
+
+        parser = self.MyHtmlParser(self.url)
+        # bounding the loop up front avoids downloading a page that would
+        # only be thrown away once the page limit is exceeded
+        for page in range(1, self.max_pages + 1):
+            page_url = "{0}/search/{1}/{2}/seeds/{3}".format(
+                self.url, category, query, page)
+            html = retrieve_url(page_url)
+            if len(html) <= parser.page_empty:
+                break
+            parser.feed(html)
+        # leave the loop with break (not return) so the parser is closed
+        parser.close()
--- a/nova/engines/versions.txt
+++ b/nova/engines/versions.txt
@ -2,6 +2,7 @@ btdb: 1.04
 eztv: 1.01
 leetx: 2.00
 legittorrents: 2.03
+limetorrents: 4.00
 piratebay: 2.16
 rarbg: 2.00
 torlock: 2.1
--- a/nova3/engines/limetorrents.py
+++ b/nova3/engines/limetorrents.py
@ -0,0 +1,123 @@
+#VERSION: 4.00
+# AUTHORS: Lima66
+# CONTRIBUTORS: Diego de las Heras (ngosang@hotmail.es)
+
+import re
+try:
+    # python3
+    from html.parser import HTMLParser
+except ImportError:
+    # python2
+    from HTMLParser import HTMLParser
+
+# qBt
+from novaprinter import prettyPrinter
+from helpers import retrieve_url
+
+
+class limetorrents(object):
+    """ qBittorrent search engine plugin for LimeTorrents """
+
+    url = "https://www.limetorrents.info"
+    name = "LimeTorrents"
+    # category key accepted by search() -> category segment of the search URL
+    supported_categories = {'all': 'all',
+                            'anime': 'anime',
+                            'software': 'applications',
+                            'games': 'games',
+                            'movies': 'movies',
+                            'music': 'music',
+                            'tv': 'tv'}
+    # upper bound on the number of result pages requested per search
+    max_pages = 6
+
+    class MyHtmlParser(HTMLParser):
+        """ Sub-class for parsing results
+
+        Every completed result row is handed to prettyPrinter() as a dict.
+        """
+
+        A, TD, TR, HREF = ('a', 'td', 'tr', 'href')
+        # bgcolor values of the <tr> elements that are treated as result rows
+        ROW_COLORS = ('#F4F4F4', '#FFFFFF')
+        # only cell texts ending with one of these units are kept as a size
+        SIZE_UNITS = ('MB', 'GB')
+
+        def error(self, message):
+            """ Discard the error message: nothing is raised or reported """
+            pass
+
+        def __init__(self, url):
+            HTMLParser.__init__(self)
+            self.url = url
+            self.current_item = {}  # dict for found item
+            self.item_name = None  # key's name in current_item dict
+            # search() treats pages of at most this many characters as empty
+            self.page_empty = 22000
+            self.inside_tr = False  # True while inside a result row
+            self.findTable = False  # True once the results table was seen
+            self.parser_class = {"tdnormal": "size",  # td class -> item key
+                                 "tdseed": "seeds",
+                                 "tdleech": "leech"}
+
+        def handle_starttag(self, tag, attrs):
+            """ Track the results table / rows and pick up cell kinds and links """
+            params = dict(attrs)
+            if params.get('class') == 'table2':
+                self.findTable = True
+
+            if (tag == self.TR and self.findTable
+                    and params.get('bgcolor') in self.ROW_COLORS):
+                self.inside_tr = True
+                self.current_item = {}
+            if not self.inside_tr:
+                return
+
+            if tag == self.TD:
+                if "class" in params:
+                    self.item_name = self.parser_class.get(params["class"])
+                    if self.item_name:
+                        # placeholder until handle_data() sees the cell text
+                        self.current_item[self.item_name] = -1
+            elif tag == self.A:
+                # an href without a value is parsed as None; skip it
+                link = params.get(self.HREF)
+                if not link:
+                    return
+                if link.startswith("http://itorrents.org/torrent/"):
+                    self.current_item["engine_url"] = self.url
+                    # the next text chunk of this row is stored as the name
+                    self.item_name = "name"
+                elif link.endswith(".html"):
+                    self.current_item["link"] = self.url + link
+                    self.current_item["desc_link"] = self.url + link
+
+        def handle_data(self, data):
+            """ Store the text of the cell/link announced by handle_starttag() """
+            if not (self.inside_tr and self.item_name):
+                return
+
+            # strip before testing the unit so trailing whitespace cannot
+            # hide it; presumably other columns share the size cell class,
+            # hence the unit filter -- confirm against the site markup
+            value = data.strip()
+            if self.item_name != 'size' or value.endswith(self.SIZE_UNITS):
+                self.current_item[self.item_name] = value.replace(',', '')
+
+            # only the first text chunk after the start tag is considered
+            self.item_name = None
+
+        def handle_endtag(self, tag):
+            """ Emit the collected item when its row ends """
+            if tag == 'table':
+                self.findTable = False
+
+            if self.inside_tr and tag == self.TR:
+                self.inside_tr = False
+                self.item_name = None
+                if self.current_item:
+                    prettyPrinter(self.current_item)
+                    self.current_item = {}
+
+    def download_torrent(self, info):
+        """ Prints "<magnet link> <info>" for the given description page
+
+        Raises Exception when the page contains no magnet link.
+        """
+        # since limetorrents provides torrent links in itorrent (cloudflare protected),
+        # we have to fetch the info page and extract the magnet link
+        info_page = retrieve_url(info)
+        magnet_match = re.search(r"href\s*\=\s*\"(magnet[^\"]+)\"", info_page)
+        if not magnet_match:
+            raise Exception('Error, please fill a bug report!')
+        print(magnet_match.group(1) + " " + info)
+
+    def search(self, query, cat='all'):
+        """ Performs search
+
+        Requests up to max_pages result pages, sorted by seeds, and feeds
+        them to the parser; stops early at the first page considered empty.
+        """
+        query = query.replace("%20", "-")
+        category = self.supported_categories[cat]
+
+        parser = self.MyHtmlParser(self.url)
+        # bounding the loop up front avoids downloading a page that would
+        # only be thrown away once the page limit is exceeded
+        for page in range(1, self.max_pages + 1):
+            page_url = "{0}/search/{1}/{2}/seeds/{3}".format(
+                self.url, category, query, page)
+            html = retrieve_url(page_url)
+            if len(html) <= parser.page_empty:
+                break
+            parser.feed(html)
+        # leave the loop with break (not return) so the parser is closed
+        parser.close()
--- a/nova3/engines/versions.txt
+++ b/nova3/engines/versions.txt
@ -2,6 +2,7 @@ btdb: 1.04
 eztv: 1.01
 leetx: 2.00
 legittorrents: 2.03
+limetorrents: 4.00
 piratebay: 2.16
 rarbg: 2.00
 torlock: 2.1