new experimental backend, new gui status (unfinished)

author: mkaay <mkaay@mkaay.de> 2010-12-19 14:12:03 +0100
committer: mkaay <mkaay@mkaay.de> 2010-12-19 14:12:03 +0100
commit: 5120d1a26cac79ab283f38db8d7f18c9c010e786 (patch)
tree: 219f8874869ac6f9c1656fea9df8db17b55ce034 /module/network/HTTPDownload.py
parent: acc manager fix (diff)
download: pyload-5120d1a26cac79ab283f38db8d7f18c9c010e786.tar.xz
1 files changed, 305 insertions, 0 deletions
diff --git a/module/network/HTTPDownload.py b/module/network/HTTPDownload.py
new file mode 100644
index 000000000..78dc00d72
--- /dev/null
+++ b/module/network/HTTPDownload.py
@@ -0,0 +1,305 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+"""
+    This program is free software; you can redistribute it and/or modify
+    it under the terms of the GNU General Public License as published by
+    the Free Software Foundation; either version 3 of the License,
+    or (at your option) any later version.
+
+    This program is distributed in the hope that it will be useful,
+    but WITHOUT ANY WARRANTY; without even the implied warranty of
+    MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
+    See the GNU General Public License for more details.
+
+    You should have received a copy of the GNU General Public License
+    along with this program; if not, see <http://www.gnu.org/licenses/>.
+    
+    @author: mkaay
+"""
+
+from HTTPChunk import HTTPChunk
+from helper import *
+from os.path import exists, getsize
+from os import remove
+from shutil import move, copyfileobj
+
+from cookielib import CookieJar
+
+class WrongFormat(Exception):
+    """Raised when a ".chunks" info file does not have the expected layout."""
+
+class ChunkInfo():
+    """Bookkeeping for the chunk files that make up one download.
+
+    The information is persisted as plain text in "<name>.chunks":
+
+        name:<name>
+        size:<size>
+        #<index>:
+        <TAB>name:<chunk file name>
+        <TAB>encoding:<encoding>
+        <TAB>range:<start>-<end>
+
+    with one "#<index>:" record per chunk. Encodings are written with "%s",
+    so they are always read back as strings.
+    """
+
+    def __init__(self, name):
+        """Create an empty, not-yet-loaded info object for the file `name`."""
+        self.name = name
+        self.size = None       # total size, set through setSize()
+        self.loaded = False    # True only when built by load()
+        self.chunks = []       # list of (name, range, encoding) tuples
+
+    def setSize(self, size):
+        """Store the total size; `size` may be a number or a numeric string."""
+        self.size = int(size)
+
+    def addChunk(self, name, range, encoding):
+        """Append one chunk record; `range` is a (start, end) pair."""
+        self.chunks.append((name, range, encoding))
+
+    def clear(self):
+        """Forget all chunk records and mark the info as not loaded."""
+        self.chunks = []
+        self.loaded = False
+
+    def save(self):
+        """Write the current state to "<name>.chunks", replacing any old file."""
+        fh = open("%s.chunks" % self.name, "w")
+        try:
+            fh.write("name:%s\n" % self.name)
+            fh.write("size:%s\n" % self.size)
+            for i, c in enumerate(self.chunks):
+                fh.write("#%d:\n" % i)
+                fh.write("\tname:%s\n" % c[0])
+                fh.write("\tencoding:%s\n" % c[2])
+                # tuple() so that a range given as a list formats as well
+                fh.write("\trange:%i-%i\n" % tuple(c[1]))
+        finally:
+            # always release the handle so the data is flushed to disk
+            fh.close()
+
+    @staticmethod
+    def load(name):
+        """Read "<name>.chunks" and return a ChunkInfo with `loaded` set.
+
+        Raises IOError when the file does not exist and WrongFormat when a
+        line does not carry the expected "key:" prefix. Non-numeric size or
+        range values surface as ValueError from int().
+        """
+        path = "%s.chunks" % name
+        if not exists(path):
+            raise IOError("chunk info file not found: %s" % path)
+        fh = open(path, "r")
+        try:
+            # rstrip("\n") instead of [:-1]: a last line without a trailing
+            # newline must not lose its final character
+            name = fh.readline().rstrip("\n")
+            size = fh.readline().rstrip("\n")
+            if not (name.startswith("name:") and size.startswith("size:")):
+                raise WrongFormat()
+            ci = ChunkInfo(name[5:])
+            ci.loaded = True
+            ci.setSize(size[5:])
+            while True:
+                if not fh.readline(): #skip the "#<index>:" line, stop at EOF
+                    break
+                # [1:] drops the leading tab of each record line
+                cname = fh.readline()[1:].rstrip("\n")
+                encoding = fh.readline()[1:].rstrip("\n")
+                rng = fh.readline()[1:].rstrip("\n")
+                if not (cname.startswith("name:")
+                        and encoding.startswith("encoding:")
+                        and rng.startswith("range:")):
+                    raise WrongFormat()
+                bounds = rng[6:].split("-")
+                # int() promotes to long automatically on Python 2
+                ci.addChunk(cname[5:], (int(bounds[0]), int(bounds[1])), encoding[9:])
+            return ci
+        finally:
+            fh.close()
+
+    def removeInfo(self):
+        """Delete the "<name>.chunks" file."""
+        remove("%s.chunks" % self.name)
+
+    def getCount(self):
+        """Return the number of chunk records."""
+        return len(self.chunks)
+
+    def getChunkName(self, index):
+        """Return the file name recorded for chunk `index`."""
+        return self.chunks[index][0]
+
+    def getChunkRange(self, index):
+        """Return the (start, end) pair recorded for chunk `index`."""
+        return self.chunks[index][1]
+
+    def getChunkEncoding(self, index):
+        """Return the encoding recorded for chunk `index`."""
+        return self.chunks[index][2]
+
+class HTTPDownload():
+    """Download `url` into `filename` through one or more HTTPChunk objects.
+
+    Every chunk writes to its own "<filename>.chunk<N>" file. The layout is
+    tracked in a ChunkInfo so that a later run can resume. _copyChunks is
+    registered as callback of the DeferredGroup collecting the chunk
+    deferreds; it joins the chunk files into `filename` and then fires
+    `self.deferred`.
+    """
+
+    def __init__(self, url, filename, get=None, post=None, referer=None, cookies=True, customHeaders=None, bucket=None, interface=None, proxies=None):
+        """Store the request settings and load existing chunk info, if any.
+
+        get, post, referer, cookies, customHeaders, bucket, interface and
+        proxies are handed unchanged to every HTTPChunk (see _createChunk).
+        Omitted dict arguments get a fresh dict per instance instead of one
+        default dict shared by all instances.
+        """
+        if get is None:
+            get = {}
+        if post is None:
+            post = {}
+        if customHeaders is None:
+            customHeaders = {}
+        if proxies is None:
+            proxies = {}
+
+        self.url = url
+        self.filename = filename
+        self.interface = interface
+        self.proxies = proxies
+
+        self.get = get
+        self.post = post
+
+        self.referer = referer
+        self.cookies = cookies
+
+        self.customHeaders = customHeaders
+
+        self.bucket = bucket
+
+        self.deferred = Deferred()
+
+        self.finished = False
+        self.size = None
+
+        # one jar shared by all chunks of this download
+        self.cookieJar = CookieJar()
+
+        self.chunks = []
+        try:
+            self.info = ChunkInfo.load(filename)
+        except IOError:
+            # no "<filename>.chunks" file: start with empty info
+            self.info = ChunkInfo(filename)
+        self.noChunkSupport = False
+
+    @property
+    def arrived(self):
+        """Sum of the on-disk sizes of all chunk files recorded in the info."""
+        arrived = 0
+        for i in range(self.info.getCount()):
+            #ugly, but difficult to calc otherwise due chunk resume
+            name = self.info.getChunkName(i)
+            if exists(name): # a recorded chunk may not have been created yet
+                arrived += getsize(name)
+        return arrived
+
+    def abort(self):
+        """Set the abort flag on every chunk created so far."""
+        for chunk in self.chunks:
+            chunk.abort = True
+
+    def getSpeed(self):
+        """Return the sum of getSpeed() over all chunks."""
+        speed = 0
+        for chunk in self.chunks:
+            speed += chunk.getSpeed()
+        return speed
+
+    @property
+    def speed(self):
+        """Property alias for getSpeed()."""
+        return self.getSpeed()
+
+    def _copyChunks(self):
+        """Join all chunk files into `self.filename`, then clean up.
+
+        Chunks recorded with encoding "gzip" or "deflate" are decompressed
+        while copying. Each chunk file is removed after it has been copied;
+        finally the ".chunks" info file is removed and `self.deferred` fired.
+        """
+        # imported here because zlib is not among this module's visible imports
+        import zlib
+
+        fo = open(self.filename, "wb")
+        try:
+            for i in range(self.info.getCount()):
+                encoding = self.info.getChunkEncoding(i)
+
+                decoder = None
+                if encoding == "gzip":
+                    # 16+MAX_WBITS: expect a gzip header and trailer
+                    decoder = zlib.decompressobj(16+zlib.MAX_WBITS)
+                elif encoding == "deflate":
+                    # negative wbits: raw deflate stream without zlib header
+                    decoder = zlib.decompressobj(-zlib.MAX_WBITS)
+
+                fname = "%s.chunk%d" % (self.filename, i)
+                fi = open(fname, "rb")
+                try:
+                    while True:
+                        data = fi.read(512*1024)
+                        if not data:
+                            break
+                        if decoder is not None:
+                            data = decoder.decompress(data)
+                        fo.write(data)
+                    if decoder is not None:
+                        # emit whatever the decompressor still buffers
+                        fo.write(decoder.flush())
+                finally:
+                    fi.close()
+                remove(fname)
+        finally:
+            fo.close()
+        self.info.removeInfo()
+        self.deferred.callback()
+
+    def _createChunk(self, fh, range=None):
+        """Build an HTTPChunk writing to `fh` with this download's settings."""
+        chunk = HTTPChunk(self.url, fh, get=self.get, post=self.post,
+                          referer=self.referer, cookies=self.cookies,
+                          customHeaders=self.customHeaders,
+                          bucket=self.bucket, range=range,
+                          interface=self.interface, proxies=self.proxies)
+        chunk.cookieJar = self.cookieJar
+        return chunk
+
+    def download(self, chunks=1, resume=False):
+        """Start the download split into `chunks` parts.
+
+        chunks -- number of chunk files; must be greater than 0
+        resume -- continue existing chunk files when the stored chunk info
+                  matches `chunks`
+
+        Returns `self.deferred`. Raises Exception("no chunks") when `chunks`
+        is not greater than 0.
+        """
+        if not chunks > 0:
+            raise Exception("no chunks")
+
+        dg = DeferredGroup()
+        # stored info for a different chunk count cannot be reused
+        if self.info.loaded and not self.info.getCount() == chunks:
+            self.info.clear()
+        if self.info.loaded:
+            # known from the info file even when chunk 0 is already complete
+            self.size = self.info.size
+
+        firstname = "%s.chunk0" % (self.filename, )
+        crange = None
+        if resume:
+            if self.info.getCount() == chunks and exists(firstname):
+                crange = self.info.getChunkRange(0)
+                crange = (crange[0]+getsize(firstname), crange[1])
+
+        # NOTE(review): non-last chunks get an inclusive end
+        # ((i+1)*chunksize-1) while the last chunk's end is one past the final
+        # byte, and the "done" checks below treat the end as exclusive.
+        # Confirm the intended semantics against HTTPChunk.
+        if crange is None or crange[1]-crange[0] > 0:
+            fh = open(firstname, "ab" if crange else "wb")
+            chunk = self._createChunk(fh, range=crange)
+            self.chunks.append(chunk)
+            d = chunk.download()
+            dg.addDeferred(d)
+
+            if not self.info.loaded:
+                # first run: derive the chunk layout from the reported size
+                size = chunk.size
+                chunksize = size//chunks
+
+                chunk.range = (0, chunksize-1)
+                chunk.noRangeHeader = True
+                self.size = chunk.size
+                self.info.setSize(self.size)
+                chunk.size = chunksize
+                self.info.addChunk(firstname, chunk.range, chunk.getEncoding())
+
+                # the last chunk also takes the division remainder
+                lastchunk = size - chunksize*(chunks-1)
+            self.firstchunk = chunk
+
+        for i in range(1, chunks):
+            cname = "%s.chunk%d" % (self.filename, i)
+            cont = False
+            if not self.info.loaded: #first time load
+                if i+1 == chunks:
+                    rng = (i*chunksize, i*chunksize+lastchunk)
+                else:
+                    rng = (i*chunksize, (i+1)*chunksize-1)
+            else: #not finished
+                rng = self.info.getChunkRange(i)
+                if resume and exists(cname): #continue chunk
+                    rng = (rng[0]+getsize(cname), rng[1])
+                    cont = True
+
+            if rng[1]-rng[0] <= 0: #chunk done
+                continue
+
+            fh = open(cname, "ab" if cont else "wb")
+            chunk = self._createChunk(fh, range=rng)
+            self.chunks.append(chunk)
+            d = chunk.download()
+            if not chunk.resp.getcode() == 206 and i == 1: #no range supported, tell chunk0 to download everything
+                # NOTE(review): self.firstchunk only exists when chunk 0 was
+                # started above; a resumed, already complete chunk 0 would
+                # fail here.
+                chunk.abort = True
+                self.noChunkSupport = True
+                self.firstchunk.size = self.size
+                self.firstchunk.range = None
+                self.info.clear()
+                self.info.addChunk(firstname, (0, self.firstchunk.size), chunk.getEncoding())
+                break
+            dg.addDeferred(d)
+
+            if not self.info.loaded:
+                self.info.addChunk(cname, chunk.range, chunk.getEncoding())
+
+        self.info.save()
+        dg.addCallback(self._copyChunks)
+        if len(self.chunks) == 0:
+            # nothing left to fetch: fire the group by hand
+            dg.callback()
+        return self.deferred
+
+if __name__ == "__main__":
+    # Manual test: download an Ubuntu ISO to "ubuntu.iso" and print the
+    # progress of every chunk once per second until the deferred fires.
+    import sys
+    # explicit import: no visible line of this module provides sleep
+    # NOTE(review): if "from helper import *" exports its own sleep, this
+    # rebinds it for the script only - confirm that is acceptable
+    from time import sleep
+    from Bucket import Bucket
+    bucket = Bucket()
+    #bucket.setRate(200*1000)
+    bucket = None # rate limiting disabled for this test
+
+    url = "http://mirror.sov.uk.goscomb.net/ubuntu-releases/maverick/ubuntu-10.10-desktop-i386.iso"
+
+    finished = False
+    def err(*a, **b):
+        print a, b
+    def callb(*a, **b):
+        global finished
+        finished = True
+        print a, b
+
+    def percent(done, total):
+        # report 0 instead of failing while the size is unknown (None) or 0
+        if not total:
+            return 0
+        return int(float(done)/total*100)
+
+    print "starting"
+
+    dwnld = HTTPDownload(url, "ubuntu.iso", bucket=bucket)
+    d = dwnld.download(chunks=1, resume=True)
+    d.addCallback(callb)
+    d.addErrback(err)
+
+    try:
+        while True:
+            for a, chunk in enumerate(dwnld.chunks):
+                if not chunk.finished:
+                    print "#%d" % a, chunk.getSpeed()/1024, "kb/s", "size", percent(chunk.arrived, chunk.size), "%"
+                else:
+                    print "#%d" % a, "finished"
+            print "sum", dwnld.speed/1024, dwnld.arrived, "/", dwnld.size, percent(dwnld.arrived, dwnld.size), "%"
+            if finished:
+                print "- finished"
+                break
+            sleep(1)
+    except KeyboardInterrupt:
+        # stop all chunks before leaving
+        dwnld.abort()
+        sys.exit()
author	mkaay <mkaay@mkaay.de>	2010-12-19 14:12:03 +0100
committer	mkaay <mkaay@mkaay.de>	2010-12-19 14:12:03 +0100
commit	5120d1a26cac79ab283f38db8d7f18c9c010e786 (patch)
tree	219f8874869ac6f9c1656fea9df8db17b55ce034 /module/network/HTTPDownload.py
parent	acc manager fix (diff)
download	pyload-5120d1a26cac79ab283f38db8d7f18c9c010e786.tar.xz