summary refs log tree commit diff stats
path: root/module/plugins/hoster/CzshareCom.py
diff options
context:
space:
mode:
Diffstat (limited to 'module/plugins/hoster/CzshareCom.py')
-rw-r--r-- module/plugins/hoster/CzshareCom.py 144
1 files changed, 111 insertions, 33 deletions
diff --git a/module/plugins/hoster/CzshareCom.py b/module/plugins/hoster/CzshareCom.py
index 74c582dae..f6cbb200a 100644
--- a/module/plugins/hoster/CzshareCom.py
+++ b/module/plugins/hoster/CzshareCom.py
@@ -20,84 +20,160 @@ import re
from module.plugins.Hoster import Hoster
from module.network.RequestFactory import getURL
def toInfoPage(url):
    """Map a CZshare link to the URL of its file info page.

    Links containing "/download.php?" are rewritten to
    "http://czshare.com/<id>/<code>/" using the numeric ``id=`` value and
    the ``code=`` value found in the link.  Any other URL is returned
    unchanged.

    Returns None when a download.php link lacks either value.
    """
    if "/download.php?" not in url:
        return url

    # Test the matches explicitly instead of catching the AttributeError
    # that calling .group() on a failed search would raise.
    id_match = re.search(r"id=(\d+)", url)
    code_match = re.search(r"code=(\w+)", url)
    if id_match is None or code_match is None:
        return None

    return "http://czshare.com/%s/%s/" % (id_match.group(1), code_match.group(1))
+
def getInfo(urls):
    """Look up name, size and availability for a batch of CZshare links.

    Yields one list of ``(name, size, status, url)`` tuples.  A link whose
    info page matches ``CzshareCom.FILE_OFFLINE_PATTERN`` is reported as
    ``(url, 0, 1, url)``.  A link for which a name or a non-zero size could
    be parsed is reported with status 2.  Links that ``toInfoPage`` rejects,
    or whose page yields neither a name nor a size, are left out of the list.
    """
    # Power of 1024 for each unit that FILE_SIZE_PATTERN can capture.
    unit_exponent = {'KiB': 1, 'MiB': 2, 'GiB': 3}
    result = []

    for url in urls:
        info_url = toInfoPage(url)
        if not info_url:
            continue

        html = getURL(info_url, decode=True)
        if re.search(CzshareCom.FILE_OFFLINE_PATTERN, html):
            # File offline
            result.append((url, 0, 1, url))
            continue

        # Get file info; the URL and 0 are the fallbacks for name and size
        name, size = url, 0

        size_match = re.search(CzshareCom.FILE_SIZE_PATTERN, html)
        if size_match is not None:
            # Normalise "1 234,5"-style numbers before converting
            number = float(size_match.group(1).replace(',', '.').replace(' ', ''))
            size = int(number * 1024 ** unit_exponent[size_match.group(2)])

        name_match = re.search(CzshareCom.FILE_NAME_PATTERN, html)
        if name_match is not None:
            name = name_match.group(1)

        if name_match or size > 0:
            result.append((name, size, 2, url))

    yield result
class CzshareCom(Hoster):
__name__ = "CzshareCom"
__type__ = "hoster"
- __pattern__ = r"http://(\w*\.)*czshare\.(com|cz)/.*"
- __version__ = "0.7"
+ __pattern__ = r"http://(\w*\.)*czshare\.(com|cz)/(\d+/|download.php\?).*"
+ __version__ = "0.8"
__description__ = """CZshare.com"""
__author_name__ = ("zoidberg")
- __author_mail__ = ("zoidberg@mujmail.cz")
- FILE_URL_PATTERN = r'<a href="([^"]+)" class="page-download">[^>]*alt="([^"]+)" /></a>'
- FORM_PATTERN = r'<form action="download.php" method="post">\s*<img src="captcha.php" id="captcha" />(.*?)</form>'
+ FREE_URL_PATTERN = r'<a href="([^"]+)" class="page-download">[^>]*alt="([^"]+)" /></a>'
+ FREE_FORM_PATTERN = r'<form action="download.php" method="post">\s*<img src="captcha.php" id="captcha" />(.*?)</form>'
+ PREMIUM_FORM_PATTERN = r'<form action="/profi_down.php" method="post">(.*?)</form>'
FORM_INPUT_PATTERN = r'<input[^>]* name="([^"]+)" value="([^"]+)"[^>]*/>'
- FILE_OFFLINE_PATTERN = r'<h2 class="red">[^<]*[Ss]oubor (nenalezen|expiroval|je po.kozen)[^<]*<span>&nbsp;</span></h2>'
+ FILE_OFFLINE_PATTERN = r'<h2 class="red">[^<]*[Ss]oubor (nenalezen|expiroval|je po.kozen|byl smaz.n)[^<]*<span>&nbsp;</span></h2>'
MULTIDL_PATTERN = r"<p><font color='red'>Z[^<]*PROFI.</font></p>"
- FILE_NAME_PATTERN = r'<h1>([^<]+)<span>&nbsp;</span></h1>'
- FILE_SIZE_PATTERN = r'<div class="tab" id="category">\s*Velikost:\s*([0-9.,]+)(KiB|MiB|GiB)\s*</div>'
+ #FILE_NAME_PATTERN = r'<h1>([^<]+)<span>&nbsp;</span></h1>'
+ FILE_NAME_PATTERN = r'<div class="tab" id="parameters">\s*<p>\s*Cel. n.zev: <a href=[^>]*>([^<]+)</a>'
+ FILE_SIZE_PATTERN = r'<div class="tab" id="category">(?:\s*<p>[^\n]*</p>)*\s*Velikost:\s*([0-9., ]+)(KiB|MiB|GiB)\s*</div>'
+ USER_CREDIT_PATTERN = r'<div class="credit">\s*kredit: <strong>([0-9., ]+)(KB|MB|GB)</strong>\s*</div><!-- .credit -->'
def setup(self):
- self.multiDL = False
+ self.resumeDownload = self.multiDL = True if self.premium else False
+ self.chunkLimit = 1
def process(self, pyfile):
    """Fetch the file info, download via the premium or free path, then
    check the downloaded file.

    The premium path is used when ``self.premium`` is truthy and an account
    is set.  ``handlePremium`` is tried up to two times, and
    ``resetAccount`` is called if neither attempt returns a true value.
    """
    self.getFileInfo(pyfile)

    if not self.premium or self.account is None:
        self.handleFree(pyfile)
    else:
        for _attempt in range(2):
            if self.handlePremium(pyfile):
                break
        else:
            # Both premium attempts returned a false value
            self.resetAccount()

    self.checkDownloadedFile()
+
def getFileInfo(self, pyfile):
    """Load the file info page and fill in ``pyfile.name`` and ``pyfile.size``.

    The page HTML is stored in ``self.html`` for the later download steps.
    Calls ``self.fail`` when the URL cannot be mapped to an info page or
    the name cannot be parsed, and ``self.offline`` when the page matches
    ``FILE_OFFLINE_PATTERN``.  A missing size is only logged.
    """
    url = toInfoPage(pyfile.url)
    if not url:
        # No exception is in scope here, so log the offending URL itself.
        self.logError("Invalid URL: %s" % pyfile.url)
        self.fail("Invalid URL")

    self.html = self.load(url, cookies=True, decode=True)

    # marks the file as "offline" when the pattern was found on the html-page
    if re.search(self.FILE_OFFLINE_PATTERN, self.html) is not None:
        self.offline()

    # parse the name from the site and set attribute in pyfile
    found = re.search(self.FILE_NAME_PATTERN, self.html)
    if found is None:
        self.fail("Parse error (NAME)")
    pyfile.name = found.group(1)
    self.logDebug("NAME:" + pyfile.name)

    # parse the size; the number may use a decimal comma and spaces
    found = re.search(self.FILE_SIZE_PATTERN, self.html)
    if found is None:
        self.logError("Parse error (SIZE)")
    else:
        size = float(found.group(1).replace(',', '.').replace(' ', ''))
        pyfile.size = size * 1024 ** {'KiB': 1, 'MiB': 2, 'GiB': 3}[found.group(2)]
+
+ def handlePremium(self, pyfile):
+ # check user credit
+ found = re.search(self.USER_CREDIT_PATTERN, self.html)
+ if found is None:
+ self.account.relogin(self.user)
+ return False
+
+ try:
+ credit = float(found.group(1).replace(',','.').replace(' ',''))
+ credit = credit * 1024 ** {'KB': 0, 'MB': 1, 'GB': 2}[found.group(2)]
+ self.logInfo("Premium download for %i KiB of Credit" % (pyfile.size / 1024))
+ self.logInfo("User %s has %i KiB left" % (self.user, credit))
+ if credit * 1024 < pyfile.size:
+ self.logInfo("Not enough credit to download file %s" % pyfile.name)
+ self.resetAccount()
+ except Exception, e:
+ # let's continue and see what happens...
+ self.logError('Parse error (CREDIT): %s' % e)
+
+ # parse download link
+ try:
+ form = re.search(self.PREMIUM_FORM_PATTERN, self.html, re.DOTALL).group(1)
+ inputs = dict(re.findall(self.FORM_INPUT_PATTERN, form))
+ except Exception, e:
+ self.logError("Parse error (FORM): %s" % e)
+ self.resetAccount()
+
+ # download the file, destination is determined by pyLoad
+ self.download("http://czshare.com/profi_down.php", cookies=True, post=inputs)
+ return True
+
+ def handleFree(self, pyfile):
+ # get free url
+ found = re.search(self.FREE_URL_PATTERN, self.html)
+ if found is None:
+ self.fail("Parse error (URL)")
parsed_url = "http://czshare.com" + found.group(1)
+ self.logDebug("PARSED_URL:" + parsed_url)
# get download ticket and parse html
- self.logDebug("PARSED_URL:" + parsed_url)
- self.logDebug("NAME:" + pyfile.name)
self.html = self.load(parsed_url, cookies=True)
- #if not re.search(self.FORM_PATTERN, self.html):
+ #if not re.search(self.FREE_FORM_PATTERN, self.html):
if re.search(self.MULTIDL_PATTERN, self.html):
self.waitForFreeSlot()
try:
- form = re.search(self.FORM_PATTERN, self.html, re.DOTALL).group(1)
+ form = re.search(self.FREE_FORM_PATTERN, self.html, re.DOTALL).group(1)
inputs = dict(re.findall(self.FORM_INPUT_PATTERN, form))
- pyfile.size = float(inputs['size'])/1024
+ pyfile.size = int(inputs['size'])
except Exception, e:
self.logError(e)
self.fail("Parse error (FORM)")
-
+
# get and decrypt captcha
captcha_url = 'http://czshare.com/captcha.php'
inputs['captchastring2'] = self.decryptCaptcha(captcha_url)
@@ -106,11 +182,13 @@ class CzshareCom(Hoster):
# download the file, destination is determined by pyLoad
self.download(parsed_url, cookies=True, post=inputs)
+
+ def checkDownloadedFile(self):
# check download
check = self.checkDownload({
"tempoffline": re.compile(r"^Soubor je do.asn. nedostupn.$"),
"multi_dl": re.compile(self.MULTIDL_PATTERN),
- "captcha_err": re.compile(self.FORM_PATTERN)
+ "captcha_err": re.compile(self.FREE_FORM_PATTERN)
})
if check == "tempoffline":