diff options
| author | 2014-09-08 01:08:03 +0200 | |
|---|---|---|
| committer | 2014-09-14 11:03:20 +0200 | |
| commit | 91115fd577f20704ef7f2e74c4527ffbb0730a09 (patch) | |
| tree | 198fc68f1eb6f42e220d0f1c68499f48ae70543c /pyload/common/packagetools.py | |
| parent | Project __init__ with info (diff) | |
| download | pyload-91115fd577f20704ef7f2e74c4527ffbb0730a09.tar.xz | |
Restructure pyload file tree (1)
Diffstat (limited to 'pyload/common/packagetools.py')
| -rw-r--r-- | pyload/common/packagetools.py | 136 | 
1 files changed, 0 insertions, 136 deletions
| diff --git a/pyload/common/packagetools.py b/pyload/common/packagetools.py deleted file mode 100644 index d5ab4d182..000000000 --- a/pyload/common/packagetools.py +++ /dev/null @@ -1,136 +0,0 @@ -# JDownloader/src/jd/controlling/LinkGrabberPackager.java - -import re -from urlparse import urlparse - -def matchFirst(string, *args): -    """ matches against list of regexp and returns first match""" -    for patternlist in args: -        for pattern in patternlist: -            r = pattern.search(string) -            if r is not None: -                name = r.group(1) -                return name - -    return string - - -def parseNames(files): -    """ Generates packages names from name, data lists - -    :param files: list of (name, data) -    :return: packagenames mapt to data lists (eg. urls) -    """ -    packs = {} - -    endings = "\\.(3gp|7zip|7z|abr|ac3|aiff|aifc|aif|ai|au|avi|bin|bz2|cbr|cbz|ccf|cue|cvd|chm|dta|deb|divx|djvu|dlc|dmg|doc|docx|dot|eps|exe|ff|flv|f4v|gsd|gif|gz|iwd|iso|ipsw|java|jar|jpg|jpeg|jdeatme|load|mws|mw|m4v|m4a|mkv|mp2|mp3|mp4|mov|movie|mpeg|mpe|mpg|msi|msu|msp|nfo|npk|oga|ogg|ogv|otrkey|pkg|png|pdf|pptx|ppt|pps|ppz|pot|psd|qt|rmvb|rm|rar|ram|ra|rev|rnd|r\\d+|rpm|run|rsdf|rtf|sh(!?tml)|srt|snd|sfv|swf|tar|tif|tiff|ts|txt|viv|vivo|vob|wav|wmv|xla|xls|xpi|zeno|zip|z\\d+|_[_a-z]{2}|\\d+$)" - -    rarPats = [re.compile("(.*)(\\.|_|-)pa?r?t?\\.?[0-9]+.(rar|exe)$", re.I), -               re.compile("(.*)(\\.|_|-)part\\.?[0]*[1].(rar|exe)$", re.I), -               re.compile("(.*)\\.rar$", re.I), -               re.compile("(.*)\\.r\\d+$", re.I), -               re.compile("(.*)(\\.|_|-)\\d+$", re.I)] - -    zipPats = [re.compile("(.*)\\.zip$", re.I), -               re.compile("(.*)\\.z\\d+$", re.I), -               re.compile("(?is).*\\.7z\\.[\\d]+$", re.I), -               re.compile("(.*)\\.a.$", re.I)] - -    ffsjPats = [re.compile("(.*)\\._((_[a-z])|([a-z]{2}))(\\.|$)"), -                re.compile("(.*)(\\.|_|-)[\\d]+(" + endings + "$)", re.I)] - -    iszPats = [re.compile("(.*)\\.isz$", re.I), -               re.compile("(.*)\\.i\\d{2}$", re.I)] - -    pat1 = re.compile("(\\.?CD\\d+)", re.I) -    pat2 = re.compile("(\\.?part\\d+)", re.I) - -    pat3 = re.compile("(.+)[\\.\\-_]+$") -    pat4 = re.compile("(.+)\\.\\d+\\.xtm$") - -    for file, url in files: -        patternMatch = False - -        if file is None: -            continue - -        # remove trailing / -        name = file.rstrip('/') - -        # extract last path part .. if there is a path -        split = name.rsplit("/", 1) -        if len(split) > 1: -            name = split.pop(1) - -            #check if a already existing package may be ok for this file -        #        found = False -        #        for pack in packs: -        #            if pack in file: -        #                packs[pack].append(url) -        #                found = True -        #                break -        # -        #        if found: continue - -        # unrar pattern, 7zip/zip and hjmerge pattern, isz pattern, FFSJ pattern -        before = name -        name = matchFirst(name, rarPats, zipPats, iszPats, ffsjPats) -        if before != name: -            patternMatch = True - -        # xtremsplit pattern -        r = pat4.search(name) -        if r is not None: -            name = r.group(1) - -        # remove part and cd pattern -        r = pat1.search(name) -        if r is not None: -            name = name.replace(r.group(0), "") -            patternMatch = True - -        r = pat2.search(name) -        if r is not None: -            name = name.replace(r.group(0), "") -            patternMatch = True - -        # additional checks if extension pattern matched -        if patternMatch: -            # remove extension -            index = name.rfind(".") -            if index <= 0: -                index = name.rfind("_") -            if index > 0: -                length = len(name) - index -                if length <= 4: -                    name = name[:-length] - -            # remove endings like . _ - -            r = pat3.search(name) -            if r is not None: -                name = r.group(1) - -            # replace . and _ with space -            name = name.replace(".", " ") -            name = name.replace("_", " ") - -            name = name.strip() -        else: -            name = "" - -        # fallback: package by hoster -        if not name: -            name = urlparse(file).hostname -            if name: name = name.replace("www.", "") - -        # fallback : default name -        if not name: -            name = "unknown" - -        # build mapping -        if name in packs: -            packs[name].append(url) -        else: -            packs[name] = [url] - -    return packs | 
