summary | refs | log | tree | commit | diff | stats
path: root/module/plugins/ocr/NetloadIn.py
diff options
context:
space:
mode:
author Walter Purcaro <vuolter@gmail.com> 2014-07-10 03:26:45 +0200
committer Walter Purcaro <vuolter@gmail.com> 2014-07-10 03:26:45 +0200
commit c1abc13d4dccb20f3845594c28952667573b7d0b (patch)
tree da8a8678bd804bec77ef16e864bfe2bf2e561eaf /module/plugins/ocr/NetloadIn.py
parent Improved filename sanitation removing non-ascii chars. (diff)
download pyload-c1abc13d4dccb20f3845594c28952667573b7d0b.tar.xz
Move captcha to ocr
Diffstat (limited to 'module/plugins/ocr/NetloadIn.py')
-rw-r--r-- module/plugins/ocr/NetloadIn.py 26
1 files changed, 26 insertions, 0 deletions
diff --git a/module/plugins/ocr/NetloadIn.py b/module/plugins/ocr/NetloadIn.py
new file mode 100644
index 000000000..9fc2f0725
--- /dev/null
+++ b/module/plugins/ocr/NetloadIn.py
@@ -0,0 +1,26 @@
+# -*- coding: utf-8 -*-
+
+from module.plugins.OCR import OCR
+
+class NetloadIn(OCR):
+    __name__ = "NetloadIn"
+    def __init__(self):
+        OCR.__init__(self)
+
+    def get_captcha(self, image):
+        self.load_image(image)
+        self.to_greyscale()
+        self.clean(3)
+        self.clean(3)
+        self.run_tesser(True, True, False, False)
+
+        self.result_captcha = self.result_captcha.replace(" ", "")[:4] # cut to 4 numbers
+
+        return self.result_captcha
+
+if __name__ == '__main__':
+    import urllib
+    ocr = NetloadIn()
+    urllib.urlretrieve("http://netload.in/share/includes/captcha.php", "captcha.png")
+
+    print ocr.get_captcha('captcha.png')