diff options
| author | 2009-09-04 22:54:33 +0200 | |
|---|---|---|
| committer | 2009-09-04 22:54:33 +0200 | |
| commit | 5a7d201ab8a07184cb38e0b5022441da899b4ad4 (patch) | |
| tree | 0a6862e584a775ce64a67846623404d3f17bf320 /module/captcha/ShareonlineBiz.py | |
| parent | Removed tag v0.2 (diff) | |
| download | pyload-5a7d201ab8a07184cb38e0b5022441da899b4ad4.tar.xz | |
pyLoad 0.2.1 (tag: v0.2.1)
Diffstat (limited to 'module/captcha/ShareonlineBiz.py')
| -rw-r--r-- | module/captcha/ShareonlineBiz.py | 61 | 
1 files changed, 61 insertions, 0 deletions
#!/usr/bin/env python
# -*- coding: utf-8 -*-
#
#Copyright (C) 2009 kingzero, RaNaN
#
#This program is free software; you can redistribute it and/or modify
#it under the terms of the GNU General Public License as published by
#the Free Software Foundation; either version 3 of the License,
#or (at your option) any later version.
#
#This program is distributed in the hope that it will be useful,
#but WITHOUT ANY WARRANTY; without even the implied warranty of
#MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.
#See the GNU General Public License for more details.
#
#You should have received a copy of the GNU General Public License
# along with this program; if not, see <http://www.gnu.org/licenses/>.
#
###
# Origin: module/captcha/ShareonlineBiz.py (new file, mode 100644,
# blob 91124f181), reconstructed from the commit diff.
from captcha import OCR


class ShareonlineBiz(OCR):
    """Captcha reader for share-online.biz built on the shared ``OCR`` base.

    All image handling (loading, thresholding, letter splitting, running
    tesseract, result correction) is delegated to methods inherited from
    ``OCR``; this class only fixes the sequence of steps and the table of
    replacements applied to the raw OCR output.

    Original author note: "tesseract at 60%" (presumably the observed
    recognition rate -- not verifiable from this file).
    """

    def __init__(self):
        OCR.__init__(self)

    def get_captcha(self, image):
        """Run the OCR pipeline on *image* and return the recognised text.

        image -- handed straight to ``self.load_image``; the script at the
                 bottom of this file passes a file name.

        Returns the per-letter OCR results joined in order, after
        ``self.correct`` has applied the replacement table below.

        Side effect: ``self.image`` ends up bound to the last letter image
        that was processed (or to the resized captcha if no letters were
        found).
        """
        self.load_image(image)
        self.to_greyscale()
        self.image = self.image.resize((160, 50))
        # Refresh the pixel accessor, since ``self.image`` is now a new object.
        self.pixels = self.image.load()
        self.threshold(1.85)
        # Preprocessing steps that are disabled in the original:
        #self.eval_black_white(240)
        #self.derotate_by_average()

        # Recognise each letter separately. run_tesser() works on
        # ``self.image`` and leaves its output in ``self.result_captcha``.
        recognised = []
        for letter in self.split_captcha_letters():
            self.image = letter
            self.run_tesser()
            recognised.append(self.result_captcha)
        final = "".join(recognised)

        # Replace common errors. Tuple keys presumably list several
        # misreadings that map to the same character -- see OCR.correct.
        final = self.correct({
            "A": "4",
            "‘5": "3",
            ("‘1", "T"): "7",
            ("‘L", "B", "'L"): "2",
            "b": "6",
            ("I", "X"): "1",
        }, final)

        return final


if __name__ == '__main__':
    # Manual smoke test: download one captcha and print what was recognised.
    try:
        from urllib.request import urlretrieve  # Python 3
    except ImportError:
        from urllib import urlretrieve  # Python 2

    ocr = ShareonlineBiz()
    urlretrieve("http://www.share-online.biz/captcha.php", "captcha.jpeg")
    print(ocr.get_captcha('captcha.jpeg'))
