Merge pull request #51 from ngosang/feature/limetorrents
Add limetorrents search plugin
This commit is contained in:
commit
4a21503f78
|
|
@ -0,0 +1,123 @@
|
|||
#VERSION: 4.00
|
||||
# AUTHORS: Lima66
|
||||
# CONTRIBUTORS: Diego de las Heras (ngosang@hotmail.es)
|
||||
|
||||
import re
|
||||
try:
|
||||
# python3
|
||||
from html.parser import HTMLParser
|
||||
except ImportError:
|
||||
# python2
|
||||
from HTMLParser import HTMLParser
|
||||
|
||||
# qBt
|
||||
from novaprinter import prettyPrinter
|
||||
from helpers import retrieve_url
|
||||
|
||||
|
||||
class limetorrents(object):
    """Search-engine plugin that scrapes LimeTorrents result pages.

    Results are emitted through ``prettyPrinter`` one table row at a time;
    ``download_torrent`` resolves a description page to its magnet link.
    """

    url = "https://www.limetorrents.info"
    name = "LimeTorrents"
    supported_categories = {'all': 'all',
                            'anime': 'anime',
                            'software': 'applications',
                            'games': 'games',
                            'movies': 'movies',
                            'music': 'music',
                            'tv': 'tv'}
    # Highest result page requested by a single search.
    max_pages = 6

    class MyHtmlParser(HTMLParser):
        """ Sub-class for parsing results """

        A, TD, TR, HREF = ('a', 'td', 'tr', 'href')
        # Background colours carried by the result rows of the table.
        ROW_COLORS = ('#F4F4F4', '#FFFFFF')
        # Suffixes that identify a "tdnormal" cell as the size column; other
        # cells sharing that class carry different text and are skipped.
        SIZE_UNITS = ('KB', 'MB', 'GB', 'TB')
        # Prefixes of the direct .torrent link that precedes the name anchor.
        TORRENT_PREFIXES = ("http://itorrents.org/torrent/",
                            "https://itorrents.org/torrent/")

        def error(self, message):
            """Ignore parser errors instead of aborting the whole search."""
            pass

        def __init__(self, url):
            """Create a parser that prefixes relative links with *url*."""
            HTMLParser.__init__(self)
            self.url = url
            self.current_item = {}  # dict for found item
            self.item_name = None  # key's name in current_item dict
            # Pages whose length is at or below this are treated by search()
            # as containing no results.
            self.page_empty = 22000
            self.inside_tr = False
            self.findTable = False
            self.parser_class = {"tdnormal": "size",  # class
                                 "tdseed": "seeds",
                                 "tdleech": "leech"}

        def handle_starttag(self, tag, attrs):
            """Track table/row state and pick up links and cell kinds."""
            params = dict(attrs)
            if params.get('class') == 'table2':
                self.findTable = True

            if (tag == self.TR and self.findTable
                    and params.get('bgcolor') in self.ROW_COLORS):
                self.inside_tr = True
                self.current_item = {}
            if not self.inside_tr:
                return

            if tag == self.TD:
                if "class" in params:
                    self.item_name = self.parser_class.get(params["class"], None)
                    if self.item_name:
                        # Placeholder until the cell text arrives.
                        self.current_item[self.item_name] = -1
            elif tag == self.A and self.HREF in params:
                # A valueless href attribute is parsed as None.
                link = params[self.HREF] or ""
                if link.startswith(self.TORRENT_PREFIXES):
                    self.current_item["engine_url"] = self.url
                    # The next text node seen in this row is stored as the name.
                    self.item_name = "name"
                elif link.endswith(".html"):
                    self.current_item["link"] = self.url + link
                    self.current_item["desc_link"] = self.url + link

        def handle_data(self, data):
            """Store the text of the cell currently being collected."""
            if not (self.inside_tr and self.item_name):
                return
            # Strip before testing the suffix so trailing whitespace in the
            # cell does not hide the unit.
            text = data.strip()
            if self.item_name != 'size' or text.endswith(self.SIZE_UNITS):
                self.current_item[self.item_name] = text.replace(',', '')
            self.item_name = None

        def handle_endtag(self, tag):
            """Emit the collected item when its row closes."""
            if tag == 'table':
                self.findTable = False

            if self.inside_tr and tag == self.TR:
                self.inside_tr = False
                self.item_name = None
                if not self.current_item:
                    return
                prettyPrinter(self.current_item)
                self.current_item = {}

    def download_torrent(self, info):
        """Print the magnet link found on the description page *info*.

        Raises Exception when the page contains no magnet link.
        """
        # since limetorrents provides torrent links in itorrent (cloudflare protected),
        # we have to fetch the info page and extract the magnet link
        info_page = retrieve_url(info)
        magnet_match = re.search(r"href\s*\=\s*\"(magnet[^\"]+)\"", info_page)
        if magnet_match:
            print(magnet_match.group(1) + " " + info)
        else:
            raise Exception('Error, please fill a bug report!')

    def search(self, query, cat='all'):
        """ Performs search """
        query = query.replace("%20", "-")
        category = self.supported_categories[cat]

        parser = self.MyHtmlParser(self.url)
        for page in range(1, self.max_pages + 1):
            page_url = "{0}/search/{1}/{2}/seeds/{3}".format(self.url, category, query, page)
            html = retrieve_url(page_url)
            if len(html) <= parser.page_empty:
                # Short page: treated as having no (more) results.
                break
            parser.feed(html)
        # Reached on every exit path so buffered input is always flushed.
        parser.close()
|
||||
|
|
@ -2,6 +2,7 @@ btdb: 1.04
|
|||
eztv: 1.01
|
||||
leetx: 2.00
|
||||
legittorrents: 2.03
|
||||
limetorrents: 4.00
|
||||
piratebay: 2.16
|
||||
rarbg: 2.00
|
||||
torlock: 2.1
|
||||
|
|
|
|||
|
|
@ -0,0 +1,123 @@
|
|||
#VERSION: 4.00
|
||||
# AUTHORS: Lima66
|
||||
# CONTRIBUTORS: Diego de las Heras (ngosang@hotmail.es)
|
||||
|
||||
import re
|
||||
try:
|
||||
# python3
|
||||
from html.parser import HTMLParser
|
||||
except ImportError:
|
||||
# python2
|
||||
from HTMLParser import HTMLParser
|
||||
|
||||
# qBt
|
||||
from novaprinter import prettyPrinter
|
||||
from helpers import retrieve_url
|
||||
|
||||
|
||||
class limetorrents(object):
    """Search-engine plugin that scrapes LimeTorrents result pages.

    Results are emitted through ``prettyPrinter`` one table row at a time;
    ``download_torrent`` resolves a description page to its magnet link.
    """

    url = "https://www.limetorrents.info"
    name = "LimeTorrents"
    supported_categories = {'all': 'all',
                            'anime': 'anime',
                            'software': 'applications',
                            'games': 'games',
                            'movies': 'movies',
                            'music': 'music',
                            'tv': 'tv'}
    # Highest result page requested by a single search.
    max_pages = 6

    class MyHtmlParser(HTMLParser):
        """ Sub-class for parsing results """

        A, TD, TR, HREF = ('a', 'td', 'tr', 'href')
        # Background colours carried by the result rows of the table.
        ROW_COLORS = ('#F4F4F4', '#FFFFFF')
        # Suffixes that identify a "tdnormal" cell as the size column; other
        # cells sharing that class carry different text and are skipped.
        SIZE_UNITS = ('KB', 'MB', 'GB', 'TB')
        # Prefixes of the direct .torrent link that precedes the name anchor.
        TORRENT_PREFIXES = ("http://itorrents.org/torrent/",
                            "https://itorrents.org/torrent/")

        def error(self, message):
            """Ignore parser errors instead of aborting the whole search."""
            pass

        def __init__(self, url):
            """Create a parser that prefixes relative links with *url*."""
            HTMLParser.__init__(self)
            self.url = url
            self.current_item = {}  # dict for found item
            self.item_name = None  # key's name in current_item dict
            # Pages whose length is at or below this are treated by search()
            # as containing no results.
            self.page_empty = 22000
            self.inside_tr = False
            self.findTable = False
            self.parser_class = {"tdnormal": "size",  # class
                                 "tdseed": "seeds",
                                 "tdleech": "leech"}

        def handle_starttag(self, tag, attrs):
            """Track table/row state and pick up links and cell kinds."""
            params = dict(attrs)
            if params.get('class') == 'table2':
                self.findTable = True

            if (tag == self.TR and self.findTable
                    and params.get('bgcolor') in self.ROW_COLORS):
                self.inside_tr = True
                self.current_item = {}
            if not self.inside_tr:
                return

            if tag == self.TD:
                if "class" in params:
                    self.item_name = self.parser_class.get(params["class"], None)
                    if self.item_name:
                        # Placeholder until the cell text arrives.
                        self.current_item[self.item_name] = -1
            elif tag == self.A and self.HREF in params:
                # A valueless href attribute is parsed as None.
                link = params[self.HREF] or ""
                if link.startswith(self.TORRENT_PREFIXES):
                    self.current_item["engine_url"] = self.url
                    # The next text node seen in this row is stored as the name.
                    self.item_name = "name"
                elif link.endswith(".html"):
                    self.current_item["link"] = self.url + link
                    self.current_item["desc_link"] = self.url + link

        def handle_data(self, data):
            """Store the text of the cell currently being collected."""
            if not (self.inside_tr and self.item_name):
                return
            # Strip before testing the suffix so trailing whitespace in the
            # cell does not hide the unit.
            text = data.strip()
            if self.item_name != 'size' or text.endswith(self.SIZE_UNITS):
                self.current_item[self.item_name] = text.replace(',', '')
            self.item_name = None

        def handle_endtag(self, tag):
            """Emit the collected item when its row closes."""
            if tag == 'table':
                self.findTable = False

            if self.inside_tr and tag == self.TR:
                self.inside_tr = False
                self.item_name = None
                if not self.current_item:
                    return
                prettyPrinter(self.current_item)
                self.current_item = {}

    def download_torrent(self, info):
        """Print the magnet link found on the description page *info*.

        Raises Exception when the page contains no magnet link.
        """
        # since limetorrents provides torrent links in itorrent (cloudflare protected),
        # we have to fetch the info page and extract the magnet link
        info_page = retrieve_url(info)
        magnet_match = re.search(r"href\s*\=\s*\"(magnet[^\"]+)\"", info_page)
        if magnet_match:
            print(magnet_match.group(1) + " " + info)
        else:
            raise Exception('Error, please fill a bug report!')

    def search(self, query, cat='all'):
        """ Performs search """
        query = query.replace("%20", "-")
        category = self.supported_categories[cat]

        parser = self.MyHtmlParser(self.url)
        for page in range(1, self.max_pages + 1):
            page_url = "{0}/search/{1}/{2}/seeds/{3}".format(self.url, category, query, page)
            html = retrieve_url(page_url)
            if len(html) <= parser.page_empty:
                # Short page: treated as having no (more) results.
                break
            parser.feed(html)
        # Reached on every exit path so buffered input is always flushed.
        parser.close()
|
||||
|
|
@ -2,6 +2,7 @@ btdb: 1.04
|
|||
eztv: 1.01
|
||||
leetx: 2.00
|
||||
legittorrents: 2.03
|
||||
limetorrents: 4.00
|
||||
piratebay: 2.16
|
||||
rarbg: 2.00
|
||||
torlock: 2.1
|
||||
|
|
|
|||
Loading…
Reference in New Issue