summary | refs | log | tree | commit | diff | stats
path: root/module
diff options
context:
space:
mode:
Diffstat (limited to 'module')
-rw-r--r-- module/network/Browser.py 22
-rw-r--r-- module/network/HTTPChunk.py 2
-rw-r--r-- module/network/HTTPRequest.py 10
-rw-r--r-- module/network/RequestFactory.py 6
-rw-r--r-- module/plugins/hooks/ExtractArchive.py 20
-rw-r--r-- module/plugins/hoster/BasePlugin.py 78
-rw-r--r-- module/plugins/hoster/DepositfilesCom.py 46
-rw-r--r-- module/plugins/hoster/HellshareCz.py 4
-rw-r--r-- module/plugins/hoster/HotfileCom.py 9
-rw-r--r-- module/plugins/internal/UnRar.py 6
-rwxr-xr-x module/remote/thriftbackend/thriftgen/pyload/Pyload-remote 2
-rw-r--r-- module/remote/thriftbackend/thriftgen/pyload/Pyload.py 17
12 files changed, 153 insertions, 69 deletions
diff --git a/module/network/Browser.py b/module/network/Browser.py
index 822e2ed6d..23cf7666b 100644
--- a/module/network/Browser.py
+++ b/module/network/Browser.py
@@ -8,7 +8,6 @@ from HTTPDownload import HTTPDownload
class Browser(object):
-
__slots__ = ("log", "options", "bucket", "cj", "_size", "http", "dl")
def __init__(self, bucket=None, options={}):
@@ -20,9 +19,14 @@ class Browser(object):
self.cj = None # needs to be setted later
self._size = 0
- self.http = HTTPRequest(self.cj, options)
+ self.renewHTTPRequest()
self.dl = None
+
+ def renewHTTPRequest(self):
+ if hasattr(self, "http"): self.http.close()
+ self.http = HTTPRequest(self.cj, self.options)
+
def setLastURL(self, val):
self.http.lastURL = val
@@ -80,7 +84,7 @@ class Browser(object):
""" this can also download ftp """
self._size = 0
self.dl = HTTPDownload(url, filename, get, post, self.lastEffectiveURL if ref else None,
- self.cj if cookies else None, self.bucket, self.options, progressNotify, disposition)
+ self.cj if cookies else None, self.bucket, self.options, progressNotify, disposition)
name = self.dl.download(chunks, resume)
self._size = self.dl.size
@@ -96,6 +100,18 @@ class Browser(object):
""" add a header to the request """
self.http.putHeader(name, value)
+ def addAuth(self, pwd):
+ """Adds user and pw for http auth
+
+ :param pwd: string, user:password
+ """
+ self.options["auth"] = pwd
+ self.renewHTTPRequest() #we need a new request
+
+ def removeAuth(self):
+ if "auth" in self.options: del self.options["auth"]
+ self.renewHTTPRequest()
+
def clearHeaders(self):
self.http.clearHeaders()
diff --git a/module/network/HTTPChunk.py b/module/network/HTTPChunk.py
index 680b982d3..69eedb19c 100644
--- a/module/network/HTTPChunk.py
+++ b/module/network/HTTPChunk.py
@@ -137,7 +137,7 @@ class HTTPChunk(HTTPRequest):
self.fp = None #file handle
self.initHandle()
- self.setInterface(self.p.options["interface"], self.p.options["proxies"], self.p.options["ipv6"])
+ self.setInterface(self.p.options)
self.BOMChecked = False # check and remove byte order mark
diff --git a/module/network/HTTPRequest.py b/module/network/HTTPRequest.py
index ffe5d1873..6672a58e6 100644
--- a/module/network/HTTPRequest.py
+++ b/module/network/HTTPRequest.py
@@ -55,7 +55,7 @@ class HTTPRequest():
self.headers = [] #temporary request header
self.initHandle()
- self.setInterface(options["interface"], options["proxies"], options["ipv6"])
+ self.setInterface(options)
self.c.setopt(pycurl.WRITEFUNCTION, self.write)
self.c.setopt(pycurl.HEADERFUNCTION, self.writeHeader)
@@ -89,7 +89,10 @@ class HTTPRequest():
"Keep-Alive: 300",
"Expect:"])
- def setInterface(self, interface, proxy, ipv6=False):
+ def setInterface(self, options):
+
+ interface, proxy, ipv6 = options["interface"], options["proxies"], options["ipv6"]
+
if interface and interface.lower() != "none":
self.c.setopt(pycurl.INTERFACE, str(interface))
@@ -112,6 +115,9 @@ class HTTPRequest():
else:
self.c.setopt(pycurl.IPRESOLVE, pycurl.IPRESOLVE_V4)
+ if "auth" in options:
+ self.c.setopt(pycurl.USERPWD, str(options["auth"]))
+
def addCookies(self):
""" put cookies from curl handle to cj """
if self.cj:
diff --git a/module/network/RequestFactory.py b/module/network/RequestFactory.py
index 774249a70..5b1528281 100644
--- a/module/network/RequestFactory.py
+++ b/module/network/RequestFactory.py
@@ -54,9 +54,11 @@ class RequestFactory():
self.lock.release()
return req
- def getHTTPRequest(self):
+ def getHTTPRequest(self, **kwargs):
""" returns a http request, dont forget to close it ! """
- return HTTPRequest(CookieJar(None), self.getOptions())
+ options = self.getOptions()
+ options.update(kwargs) # submit kwargs as additional options
+ return HTTPRequest(CookieJar(None), options)
def getURL(self, *args, **kwargs):
""" see HTTPRequest for argument list """
diff --git a/module/plugins/hooks/ExtractArchive.py b/module/plugins/hooks/ExtractArchive.py
index 54dd6ff2d..0a70da417 100644
--- a/module/plugins/hooks/ExtractArchive.py
+++ b/module/plugins/hooks/ExtractArchive.py
@@ -3,8 +3,8 @@
import sys
import os
-from os import remove, chmod
-from os.path import exists, basename, isfile, isdir
+from os import remove, chmod, makedirs
+from os.path import exists, basename, isfile, isdir, join
from traceback import print_exc
from copy import copy
@@ -50,7 +50,7 @@ if os.name != "nt":
from grp import getgrnam
from module.plugins.Hook import Hook, threaded, Expose
-from module.utils import save_join
+from module.utils import save_join, fs_encode
class ArchiveError(Exception):
@@ -77,6 +77,7 @@ class ExtractArchive(Hook):
("overwrite", "bool", "Overwrite files", True),
("passwordfile", "file", "password file", "unrar_passwords.txt"),
("deletearchive", "bool", "Delete archives when done", False),
+ ("subfolder", "bool", "Create subfolder for each package", False),
("destination", "folder", "Extract files to", ""),
("queue", "bool", "Wait for all downloads to be fninished", True),
("renice", "int", "CPU Priority", 0), ]
@@ -151,7 +152,7 @@ class ExtractArchive(Hook):
#iterate packages -> plugins -> targets
for pid in ids:
p = self.core.files.getPackage(pid)
- self.logInfo(_("Extract package %s") % p.name)
+ self.logInfo(_("Check package %s") % p.name)
if not p: continue
# determine output folder
@@ -159,8 +160,15 @@ class ExtractArchive(Hook):
# force trailing slash
if self.getConfig("destination") and self.getConfig("destination").lower() != "none":
- if exists(self.getConfig("destination")):
- out = save_join(self.getConfig("destination"), "")
+
+ out = save_join(dl, p.folder, self.getConfig("destination"), "")
+ #relative to package folder if destination is relative, otherwise absolute path overwrites them
+
+ if self.getConf("subfolder"):
+ out = join(out, fs_encode(p.folder))
+
+ if not exists(out):
+ makedirs(out)
files_ids = [(save_join(dl, p.folder, x["name"]), x["id"]) for x in p.getChildren().itervalues()]
diff --git a/module/plugins/hoster/BasePlugin.py b/module/plugins/hoster/BasePlugin.py
index ed11c378b..15e35ce24 100644
--- a/module/plugins/hoster/BasePlugin.py
+++ b/module/plugins/hoster/BasePlugin.py
@@ -1,13 +1,13 @@
#!/usr/bin/env python
# -*- coding: utf-8 -*-
-
-from module.plugins.Hoster import Hoster
-from module.utils import html_unescape
-
from urlparse import urlparse
from re import search
from urllib import unquote
+from module.network.HTTPRequest import BadHeader
+from module.plugins.Hoster import Hoster
+from module.utils import html_unescape, removeChars
+
class BasePlugin(Hoster):
__name__ = "BasePlugin"
__type__ = "hoster"
@@ -41,31 +41,49 @@ class BasePlugin(Hoster):
#
# return
if pyfile.url.startswith("http"):
- header = self.load(pyfile.url, just_header = True)
- #self.logDebug(header)
-
- if 'location' in header:
- self.logDebug("Location: " + header['location'])
- url = unquote(header['location'])
- else:
- url = pyfile.url
-
- name = html_unescape(urlparse(url).path.split("/")[-1])
-
- if 'content-disposition' in header:
- self.logDebug("Content-Disposition: " + header['content-disposition'])
- m = search("filename(?P<type>=|\*=(?P<enc>.+)'')(?P<name>.*)", header['content-disposition'])
- if m:
- disp = m.groupdict()
- self.logDebug(disp)
- if not disp['enc']: disp['enc'] = 'utf-8'
- name = disp['name'].replace('"', "").replace("'", "").replace(";", "").strip()
- name = unicode(unquote(name), disp['enc'])
-
- if not name: self.offline()
- pyfile.name = name
- self.logDebug("Filename: %s" % pyfile.name)
- self.download(url, disposition=True)
+
+ try:
+ self.downloadFile(pyfile)
+ except BadHeader, e:
+ if e.code in (401, 403):
+ self.logDebug("Auth required")
+
+ pwd = pyfile.package().password.strip()
+ if ":" not in pwd:
+ self.fail(_("Authorization required (username:password)"))
+
+ self.req.addAuth(pwd)
+ self.downloadFile(pyfile)
+ else:
+ raise
else:
- self.fail("No Plugin matched and not a downloadable url.")
\ No newline at end of file
+ self.fail("No Plugin matched and not a downloadable url.")
+
+
+ def downloadFile(self, pyfile):
+ header = self.load(pyfile.url, just_header = True)
+ #self.logDebug(header)
+
+ if 'location' in header:
+ self.logDebug("Location: " + header['location'])
+ url = unquote(header['location'])
+ else:
+ url = pyfile.url
+
+ name = html_unescape(urlparse(url).path.split("/")[-1])
+
+ if 'content-disposition' in header:
+ self.logDebug("Content-Disposition: " + header['content-disposition'])
+ m = search("filename(?P<type>=|\*=(?P<enc>.+)'')(?P<name>.*)", header['content-disposition'])
+ if m:
+ disp = m.groupdict()
+ self.logDebug(disp)
+ if not disp['enc']: disp['enc'] = 'utf-8'
+ name = removeChars(disp['name'], "\"';").strip()
+ name = unicode(unquote(name), disp['enc'])
+
+ if not name: name = url
+ pyfile.name = name
+ self.logDebug("Filename: %s" % pyfile.name)
+ self.download(url, disposition=True)
\ No newline at end of file
diff --git a/module/plugins/hoster/DepositfilesCom.py b/module/plugins/hoster/DepositfilesCom.py
index 1fba3bad5..81e6aa4d6 100644
--- a/module/plugins/hoster/DepositfilesCom.py
+++ b/module/plugins/hoster/DepositfilesCom.py
@@ -5,6 +5,7 @@ import re
import urllib
from module.plugins.Hoster import Hoster
from module.network.RequestFactory import getURL
+from module.plugins.ReCaptcha import ReCaptcha
def getInfo(urls):
result = []
@@ -29,13 +30,15 @@ class DepositfilesCom(Hoster):
__name__ = "DepositfilesCom"
__type__ = "hoster"
__pattern__ = r"http://[\w\.]*?depositfiles\.com(/\w{1,3})?/files/[\w]+"
- __version__ = "0.33"
+ __version__ = "0.34"
__description__ = """Depositfiles.com Download Hoster"""
__author_name__ = ("spoob", "zoidberg")
__author_mail__ = ("spoob@pyload.org", "zoidberg@mujmail.cz")
FILE_INFO_PATTERN = r'File name: <b title="([^"]+)">.*\s*<span class="nowrap">File size: <b>([0-9.]+)&nbsp;(KB|MB|GB)</b>'
FILE_OFFLINE_PATTERN = r'<span class="html_download_api-not_exists"></span>'
+ RECAPTCHA_PATTERN = r"Recaptcha.create\('([^']+)', this\);"
+ DOWNLOAD_LINK_PATTERN = r'<form action="(http://.+?\.depositfiles.com/.+?)" method="get"'
def setup(self):
self.resumeDownload = self.multiDL = True if self.account else False
@@ -96,27 +99,42 @@ class DepositfilesCom(Hoster):
found = re.search(r"var fid = '(\w+)';", self.html)
if not found: self.retry(wait_time=5)
- fid = found.group(1)
- self.logDebug ("FID: %s" % fid)
+ params = {'fid' : found.group(1)}
+ self.logDebug ("FID: %s" % params['fid'])
- self.wait()
-
- #form = re.search(r"\$\('#download_container'\)\.load\('([^']+)", self.html)
+ captcha_key = None
+ found = re.search(self.RECAPTCHA_PATTERN, self.html)
+ if found: captcha_key = found.group(1)
+ self.logDebug ("CAPTCHA_KEY: %s" % captcha_key)
- #self.html = self.load("http://depositfiles.com/"+ form.group(1))
+ self.wait()
+ recaptcha = ReCaptcha(self)
+
+ for i in range(5):
+ self.html = self.load("http://depositfiles.com/get_file.php", get = params)
+ if '<input type=button value="Continue" onclick="check_recaptcha' in self.html:
+ if not captcha_key: self.fail('Parse error (Captcha key)')
+ if 'response' in params: self.invalidCaptcha()
+ params['challenge'], params['response'] = recaptcha.challenge(captcha_key)
+ self.logDebug(params)
+ continue
+
+ found = re.search(self.DOWNLOAD_LINK_PATTERN, self.html)
+ if found:
+ if 'response' in params: self.correctCaptcha()
+ link = urllib.unquote(found.group(1))
+ self.logDebug ("LINK: %s" % link)
+ break
+ else:
+ self.fail('Parse error (Download link)')
+ else:
+ self.fail('No valid captcha response received')
- self.html = self.load("http://depositfiles.com/get_file.php?fid=" + fid)
- link = urllib.unquote(re.search('<form action="(http://.+?\.depositfiles.com/.+?)" method="get"', self.html).group(1))
- self.logDebug ("LINK: %s" % link)
try:
self.download(link)
except:
self.retry(wait_time = 60)
- #wait_time = int(re.search(r'<span id="download_waiter_remain">(.*?)</span>', self.html).group(1))
- #self.setWait(wait_time)
- #self.log.debug("DepositFiles.com: Waiting %d seconds." % wait_time)
-
def handlePremium(self):
link = urllib.unquote(re.search('<div id="download_url">\s*<a href="(http://.+?\.depositfiles.com/.+?)"', self.html).group(1))
self.download(link)
\ No newline at end of file
diff --git a/module/plugins/hoster/HellshareCz.py b/module/plugins/hoster/HellshareCz.py
index 7986ecf11..8c90e8099 100644
--- a/module/plugins/hoster/HellshareCz.py
+++ b/module/plugins/hoster/HellshareCz.py
@@ -48,7 +48,7 @@ class HellshareCz(Hoster):
__name__ = "HellshareCz"
__type__ = "hoster"
__pattern__ = r"http://(.*\.)*hellshare\.(cz|com|sk|hu)/.*"
- __version__ = "0.70"
+ __version__ = "0.71"
__description__ = """Hellshare.cz"""
__author_name__ = ("zoidberg")
@@ -97,7 +97,7 @@ class HellshareCz(Hoster):
def handleFree(self):
# hellshare is very generous
- if 'You exceeded your today's limit for free download. You can download only 1 files per 24 hours.' in self.html:
+ if "You exceeded your today's limit for free download. You can download only 1 files per 24 hours." in self.html:
t = datetime.datetime.today().replace(hour=1, minute=0, second=0) + datetime.timedelta(
days=1) - datetime.datetime.today()
self.setWait(t.seconds, True)
diff --git a/module/plugins/hoster/HotfileCom.py b/module/plugins/hoster/HotfileCom.py
index 96927a9fc..9c056d899 100644
--- a/module/plugins/hoster/HotfileCom.py
+++ b/module/plugins/hoster/HotfileCom.py
@@ -37,6 +37,8 @@ class HotfileCom(Hoster):
__author_name__ = ("sitacuisses","spoob","mkaay")
__author_mail__ = ("sitacuisses@yhoo.de","spoob@pyload.org","mkaay@mkaay.de")
+ FILE_OFFLINE_PATTERN = r'File is removed'
+
def setup(self):
self.html = [None, None]
self.wantReconnect = False
@@ -73,7 +75,10 @@ class HotfileCom(Hoster):
if not self.account:
self.downloadHTML()
-
+
+ if self.FILE_OFFLINE_PATTERN in self.html[0]:
+ self.offline()
+
self.setWait(self.getWaitTime())
self.wait()
@@ -131,3 +136,5 @@ class HotfileCom(Hoster):
self.wantReconnect = True
return waittime
return 65
+ else:
+ self.fail("Don't know how long to wait. Cannot proceed.")
diff --git a/module/plugins/internal/UnRar.py b/module/plugins/internal/UnRar.py
index 7ba1d01ba..1943f69e0 100644
--- a/module/plugins/internal/UnRar.py
+++ b/module/plugins/internal/UnRar.py
@@ -18,16 +18,14 @@
"""
import os
+import re
from os.path import join
from glob import glob
from subprocess import Popen, PIPE
-
from module.plugins.hooks.ExtractArchive import AbtractExtractor
from module.utils import save_join, decode
-import re
-
class UnRar(AbtractExtractor):
__name__ = "UnRar"
__version__ = "0.1"
@@ -138,7 +136,7 @@ class UnRar(AbtractExtractor):
def getDeleteFiles(self):
if ".part" in self.file:
- return glob(self.file.replace("0", "*").replace("1", "*"))
+ return glob(re.sub("(?<=\.part)([01]+)", "*", self.file, re.IGNORECASE))
return [self.file]
def listContent(self):
diff --git a/module/remote/thriftbackend/thriftgen/pyload/Pyload-remote b/module/remote/thriftbackend/thriftgen/pyload/Pyload-remote
index e2e56d5ca..854b1589e 100755
--- a/module/remote/thriftbackend/thriftgen/pyload/Pyload-remote
+++ b/module/remote/thriftbackend/thriftgen/pyload/Pyload-remote
@@ -74,7 +74,7 @@ if len(sys.argv) <= 1 or sys.argv[1] == '--help':
print ' void orderPackage(PackageID pid, i16 position)'
print ' void orderFile(FileID fid, i16 position)'
print ' void setPackageData(PackageID pid, data)'
- print ' void deleteFinished()'
+ print ' deleteFinished()'
print ' void restartFailed()'
print ' bool isCaptchaWaiting()'
print ' CaptchaTask getCaptchaTask(bool exclusive)'
diff --git a/module/remote/thriftbackend/thriftgen/pyload/Pyload.py b/module/remote/thriftbackend/thriftgen/pyload/Pyload.py
index 677e4afe2..a1bc63f75 100644
--- a/module/remote/thriftbackend/thriftgen/pyload/Pyload.py
+++ b/module/remote/thriftbackend/thriftgen/pyload/Pyload.py
@@ -1873,7 +1873,7 @@ class Client(Iface):
def deleteFinished(self, ):
self.send_deleteFinished()
- self.recv_deleteFinished()
+ return self.recv_deleteFinished()
def send_deleteFinished(self, ):
self._oprot.writeMessageBegin('deleteFinished', TMessageType.CALL, self._seqid)
@@ -1892,7 +1892,9 @@ class Client(Iface):
result = deleteFinished_result()
result.read(self._iprot)
self._iprot.readMessageEnd()
- return
+ if result.success is not None:
+ return result.success
+ raise TApplicationException(TApplicationException.MISSING_RESULT, "deleteFinished failed: unknown result");
def restartFailed(self, ):
self.send_restartFailed()
@@ -3085,7 +3087,7 @@ class Processor(Iface, TProcessor):
args.read(iprot)
iprot.readMessageEnd()
result = deleteFinished_result()
- self._handler.deleteFinished()
+ result.success = self._handler.deleteFinished()
oprot.writeMessageBegin("deleteFinished", TMessageType.REPLY, seqid)
result.write(oprot)
oprot.writeMessageEnd()
@@ -4904,13 +4906,22 @@ class deleteFinished_args(TBase):
class deleteFinished_result(TBase):
+ """
+ Attributes:
+ - success
+ """
__slots__ = [
+ 'success',
]
thrift_spec = (
+ (0, TType.LIST, 'success', (TType.I32,None), None, ), # 0
)
+ def __init__(self, success=None,):
+ self.success = success
+
class restartFailed_args(TBase):