summaryrefslogtreecommitdiffhomepage
path: root/libs/deathbycaptcha.py
diff options
context:
space:
mode:
authorLouis Vézina <[email protected]>2019-09-16 22:04:27 -0400
committerLouis Vézina <[email protected]>2019-09-16 22:04:27 -0400
commit3ca2c98cd42f24299ac08daa26ed8a21a44c60de (patch)
tree225f3a4bdf7a8276299f71b49e3c37ba1e420a8d /libs/deathbycaptcha.py
parentc5fa0f56e41ee03fd7b02f6474cbb4fd1bdf08e6 (diff)
downloadbazarr-3ca2c98cd42f24299ac08daa26ed8a21a44c60de.tar.gz
bazarr-3ca2c98cd42f24299ac08daa26ed8a21a44c60de.zip
WIP
Diffstat (limited to 'libs/deathbycaptcha.py')
-rw-r--r--libs/deathbycaptcha.py436
1 files changed, 274 insertions, 162 deletions
diff --git a/libs/deathbycaptcha.py b/libs/deathbycaptcha.py
index 8bc04ab93..05aa8f68d 100644
--- a/libs/deathbycaptcha.py
+++ b/libs/deathbycaptcha.py
@@ -1,6 +1,73 @@
#!/usr/bin/env python
# -*- coding: UTF-8 -*-
+"""Death by Captcha HTTP and socket API clients.
+
+There are two types of Death by Captcha (DBC hereinafter) API: HTTP and
+socket ones. Both offer the same functionality, with the socket API
+sporting faster responses and using far fewer connections.
+
+To access the socket API, use SocketClient class; for the HTTP API, use
+HttpClient class. Both are thread-safe. SocketClient keeps a persistent
+connection opened and serializes all API requests sent through it, thus
+it is advised to keep a pool of them if your script is heavily
+multithreaded.
+
+Both SocketClient and HttpClient give you the following methods:
+
+get_user()
+ Returns your DBC account details as a dict with the following keys:
+
+ "user": your account numeric ID; if login fails, it will be the only
+ item with the value of 0;
+ "rate": your CAPTCHA rate, i.e. how much you will be charged for one
+ solved CAPTCHA in US cents;
+ "balance": your DBC account balance in US cents;
+ "is_banned": flag indicating whether your account is suspended or not.
+
+get_balance()
+ Returns your DBC account balance in US cents.
+
+get_captcha(cid)
+ Returns an uploaded CAPTCHA's details as a dict with the following keys:
+
+ "captcha": the CAPTCHA numeric ID; if no such CAPTCHA is found, it will
+ be the only item with the value of 0;
+ "text": the CAPTCHA text, if solved, otherwise None;
+ "is_correct": flag indicating whether the CAPTCHA was solved correctly
+ (DBC can detect that in rare cases).
+
+ The only argument `cid` is the CAPTCHA numeric ID.
+
+get_text(cid)
+ Returns an uploaded CAPTCHA's text (None if not solved). The only argument
+ `cid` is the CAPTCHA numeric ID.
+
+report(cid)
+ Reports an incorrectly solved CAPTCHA. The only argument `cid` is the
+ CAPTCHA numeric ID. Returns True on success, False otherwise.
+
+upload(captcha)
+ Uploads a CAPTCHA. The only argument `captcha` can be either a file-like
+ object (any object with `read` method defined, actually, so StringIO
+ will do), or a CAPTCHA image file name. On successful upload you'll get
+ the CAPTCHA details dict (see get_captcha() method).
+
+ NOTE: AT THIS POINT THE UPLOADED CAPTCHA IS NOT SOLVED YET! You have
+ to poll for its status periodically using get_captcha() or get_text()
+ method until the CAPTCHA is solved and you get the text.
+
+decode(captcha=None, timeout=None, **kwargs)
+ A convenient method that uploads a CAPTCHA and polls for its status
+ periodically, but no longer than `timeout` (defaults to 60 seconds,
+ or 120 seconds when no `captcha` is given). If solved, you'll get the
+ CAPTCHA details dict (see get_captcha() method for details). See
+ upload() method for details on `captcha` argument.
+
+Visit http://www.deathbycaptcha.com/user/api for updates.
+
+"""
+
import base64
import binascii
import errno
@@ -12,7 +79,7 @@ import socket
import sys
import threading
import time
-
+import urllib
try:
from json import read as json_decode, write as json_encode
except ImportError:
@@ -21,67 +88,60 @@ except ImportError:
except ImportError:
from simplejson import loads as json_decode, dumps as json_encode
-try:
- from urllib2 import build_opener, HTTPRedirectHandler, Request, HTTPError
- from urllib import urlencode, urlopen
-except ImportError:
- from urllib.request import build_opener, HTTPRedirectHandler, Request, urlopen
- from urllib.error import HTTPError
- from urllib.parse import urlencode
# API version and unique software ID
-API_VERSION = 'DBC/Python v4.0.11'
-SOFTWARE_VENDOR_ID = 0
+API_VERSION = 'DBC/Python v4.6'
# Default CAPTCHA timeout and decode() polling interval
DEFAULT_TIMEOUT = 60
-POLLS_INTERVAL = 5
+DEFAULT_TOKEN_TIMEOUT = 120
+POLLS_INTERVAL = [1, 1, 2, 3, 2, 2, 3, 2, 2]
+DFLT_POLL_INTERVAL = 3
# Base HTTP API url
-HTTP_BASE_URL = 'http://api.deathbycaptcha.com/api'
+HTTP_BASE_URL = 'http://api.dbcapi.me/api'
# Preferred HTTP API server's response content type, do not change
HTTP_RESPONSE_TYPE = 'application/json'
# Socket API server's host & ports range
-SOCKET_HOST = 'api.deathbycaptcha.com'
+SOCKET_HOST = 'api.dbcapi.me'
SOCKET_PORTS = range(8123, 8131)
+
+def _load_image(captcha):
+ if hasattr(captcha, 'read'):
+ img = captcha.read()
+ elif type(captcha) == bytearray:
+ img = captcha
+ else:
+ img = ''
+ try:
+ captcha_file = open(captcha, 'rb')
+ except Exception:
+ raise
+ else:
+ img = captcha_file.read()
+ captcha_file.close()
+ if not len(img):
+ raise ValueError('CAPTCHA image is empty')
+ elif imghdr.what(None, img) is None:
+ raise TypeError('Unknown CAPTCHA image type')
+ else:
+ return img
+
+
class AccessDeniedException(Exception):
pass
+
class Client(object):
- """Death by Captcha API Client"""
+
+ """Death by Captcha API Client."""
def __init__(self, username, password):
self.is_verbose = False
- self.userpwd = {'username': username,
- 'password': password}
-
- def _load_file(self, captcha):
- if hasattr(captcha, 'read'):
- raw_captcha = captcha.read()
- elif isinstance(captcha, bytearray):
- raw_captcha = captcha
- elif os.path.isfile(captcha):
- raw_captcha = ''
- try:
- f = open(captcha, 'rb')
- except Exception as e:
- raise e
- else:
- raw_captcha = f.read()
- f.close()
- else:
- f_stream = urlopen(captcha)
- raw_captcha = f_stream.read()
-
- if not len(raw_captcha):
- raise ValueError('CAPTCHA image is empty')
- elif imghdr.what(None, raw_captcha) is None:
- raise TypeError('Unknown CAPTCHA image type')
- else:
- return raw_captcha
+ self.userpwd = {'username': username, 'password': password}
def _log(self, cmd, msg=''):
if self.is_verbose:
@@ -95,16 +155,16 @@ class Client(object):
pass
def get_user(self):
- """Fetch the user's details dict -- balance, rate and banned status."""
- raise NotImplemented()
+ """Fetch user details -- ID, balance, rate and banned status."""
+ raise NotImplementedError()
def get_balance(self):
- """Fetch the user's balance (in US cents)."""
+ """Fetch user balance (in US cents)."""
return self.get_user().get('balance')
def get_captcha(self, cid):
- """Fetch a CAPTCHA details dict -- its ID, text and correctness."""
- raise NotImplemented()
+ """Fetch a CAPTCHA details -- ID, text and correctness flag."""
+ raise NotImplementedError()
def get_text(self, cid):
"""Fetch a CAPTCHA text."""
@@ -112,11 +172,7 @@ class Client(object):
def report(self, cid):
"""Report a CAPTCHA as incorrectly solved."""
- raise NotImplemented()
-
- def remove(self, cid):
- """Remove an unsolved CAPTCHA."""
- raise NotImplemented()
+ raise NotImplementedError()
def upload(self, captcha):
"""Upload a CAPTCHA.
@@ -125,32 +181,56 @@ class Client(object):
dict on success.
"""
- raise NotImplemented()
+ raise NotImplementedError()
- def decode(self, captcha, timeout=DEFAULT_TIMEOUT):
- """Try to solve a CAPTCHA.
+ def decode(self, captcha=None, timeout=None, **kwargs):
+ """
+ Try to solve a CAPTCHA.
See Client.upload() for arguments details.
Uploads a CAPTCHA, polls for its status periodically with arbitrary
timeout (in seconds), returns CAPTCHA details if (correctly) solved.
-
"""
+ if not timeout:
+ if not captcha:
+ timeout = DEFAULT_TOKEN_TIMEOUT
+ else:
+ timeout = DEFAULT_TIMEOUT
+
deadline = time.time() + (max(0, timeout) or DEFAULT_TIMEOUT)
- c = self.upload(captcha)
- if c:
- while deadline > time.time() and not c.get('text'):
- time.sleep(POLLS_INTERVAL)
- c = self.get_captcha(c['captcha'])
- if c.get('text') and c.get('is_correct'):
- return c
+ uploaded_captcha = self.upload(captcha, **kwargs)
+ if uploaded_captcha:
+ intvl_idx = 0 # POLL_INTERVAL index
+ while deadline > time.time() and not uploaded_captcha.get('text'):
+ intvl, intvl_idx = self._get_poll_interval(intvl_idx)
+ time.sleep(intvl)
+ pulled = self.get_captcha(uploaded_captcha['captcha'])
+ if pulled['captcha'] == uploaded_captcha['captcha']:
+ uploaded_captcha = pulled
+ if uploaded_captcha.get('text') and \
+ uploaded_captcha.get('is_correct'):
+ return uploaded_captcha
+
+ def _get_poll_interval(self, idx):
+ """Returns poll interval and next index depending on index provided"""
+
+ if len(POLLS_INTERVAL) > idx:
+ intvl = POLLS_INTERVAL[idx]
+ else:
+ intvl = DFLT_POLL_INTERVAL
+ idx += 1
+
+ return intvl, idx
+
class HttpClient(Client):
+
"""Death by Captcha HTTP API client."""
def __init__(self, *args):
Client.__init__(self, *args)
- self.opener = build_opener(HTTPRedirectHandler())
+ self.opener = urllib2.build_opener(urllib2.HTTPRedirectHandler())
def _call(self, cmd, payload=None, headers=None):
if headers is None:
@@ -158,22 +238,30 @@ class HttpClient(Client):
headers['Accept'] = HTTP_RESPONSE_TYPE
headers['User-Agent'] = API_VERSION
if hasattr(payload, 'items'):
- payload = urlencode(payload)
+ payload = urllib.urlencode(payload)
self._log('SEND', '%s %d %s' % (cmd, len(payload), payload))
+ else:
+ self._log('SEND', '%s' % cmd)
if payload is not None:
headers['Content-Length'] = len(payload)
try:
- response = self.opener.open(Request(
+ response = self.opener.open(urllib2.Request(
HTTP_BASE_URL + '/' + cmd.strip('/'),
data=payload,
headers=headers
)).read()
- except HTTPError as e:
- if 403 == e.code:
- raise AccessDeniedException(
- 'Access denied, please check your credentials and/or balance')
- elif 400 == e.code or 413 == e.code:
- raise ValueError("CAPTCHA was rejected by the service, check if it's a valid image")
+ except urllib2.HTTPError as err:
+ if 403 == err.code:
+ raise AccessDeniedException('Access denied, please check'
+ ' your credentials and/or balance')
+ elif 400 == err.code or 413 == err.code:
+ raise ValueError("CAPTCHA was rejected by the service, check"
+ " if it's a valid image")
+ elif 503 == err.code:
+ raise OverflowError("CAPTCHA was rejected due to service"
+ " overload, try again later")
+ else:
+ raise err
else:
self._log('RECV', '%d %s' % (len(response), response))
try:
@@ -192,38 +280,53 @@ class HttpClient(Client):
return not self._call('captcha/%d/report' % cid,
self.userpwd.copy()).get('is_correct')
- def remove(self, cid):
- return not self._call('captcha/%d/remove' % cid,
- self.userpwd.copy()).get('captcha')
-
- def upload(self, captcha):
+ def upload(self, captcha=None, **kwargs):
boundary = binascii.hexlify(os.urandom(16))
- data = self.userpwd.copy()
- data['swid'] = SOFTWARE_VENDOR_ID
- body = '\r\n'.join(('\r\n'.join(('--%s' % boundary,
- 'Content-Disposition: form-data; name="%s"' % k,
- 'Content-Type: text/plain',
- 'Content-Length: %d' % len(str(v)),
- '',
- str(v))))
- for k, v in data.items())
- captcha = self._load_file(captcha)
- body += '\r\n'.join(('',
- '--%s' % boundary,
- 'Content-Disposition: form-data; name="captchafile"; filename="captcha"',
- 'Content-Type: application/octet-stream',
- 'Content-Length: %d' % len(captcha),
- '',
- captcha,
- '--%s--' % boundary,
- ''))
+ banner = kwargs.get('banner', '')
+ if banner:
+ kwargs['banner'] = 'base64:' + base64.b64encode(_load_image(banner))
+ body = '\r\n'.join(('\r\n'.join((
+ '--%s' % boundary,
+ 'Content-Disposition: form-data; name="%s"' % k,
+ 'Content-Type: text/plain',
+ 'Content-Length: %d' % len(str(v)),
+ '',
+ str(v)
+ ))) for k, v in self.userpwd.items())
+
+ body += '\r\n'.join(('\r\n'.join((
+ '--%s' % boundary,
+ 'Content-Disposition: form-data; name="%s"' % k,
+ 'Content-Type: text/plain',
+ 'Content-Length: %d' % len(str(v)),
+ '',
+ str(v)
+ ))) for k, v in kwargs.items())
+
+ if captcha:
+ img = _load_image(captcha)
+ body += '\r\n'.join((
+ '',
+ '--%s' % boundary,
+ 'Content-Disposition: form-data; name="captchafile"; '
+ 'filename="captcha"',
+ 'Content-Type: application/octet-stream',
+ 'Content-Length: %d' % len(img),
+ '',
+ img,
+ '--%s--' % boundary,
+ ''
+ ))
+
response = self._call('captcha', body, {
'Content-Type': 'multipart/form-data; boundary="%s"' % boundary
}) or {}
if response.get('captcha'):
return response
+
class SocketClient(Client):
+
"""Death by Captcha socket API client."""
TERMINATOR = '\r\n'
@@ -253,12 +356,11 @@ class SocketClient(Client):
self.socket.settimeout(0)
try:
self.socket.connect(host)
- except socket.error as e:
- if errno.EINPROGRESS == e[0]:
- pass
- else:
+ except socket.error as err:
+ if (err.args[0] not in
+ (errno.EAGAIN, errno.EWOULDBLOCK, errno.EINPROGRESS)):
self.close()
- raise e
+ raise err
return self.socket
def __del__(self):
@@ -269,27 +371,30 @@ class SocketClient(Client):
fds = [sock]
buf += self.TERMINATOR
response = ''
+ intvl_idx = 0
while True:
- rd, wr, ex = select.select((not buf and fds) or [],
- (buf and fds) or [],
- fds,
- POLLS_INTERVAL)
- if ex:
+ intvl, intvl_idx = self._get_poll_interval(intvl_idx)
+ rds, wrs, exs = select.select((not buf and fds) or [],
+ (buf and fds) or [],
+ fds,
+ intvl)
+ if exs:
raise IOError('select() failed')
try:
- if wr:
+ if wrs:
while buf:
- buf = buf[wr[0].send(buf):]
- elif rd:
+ buf = buf[wrs[0].send(buf):]
+ elif rds:
while True:
- s = rd[0].recv(256)
+ s = rds[0].recv(256)
if not s:
raise IOError('recv(): connection lost')
else:
response += s
- except socket.error as e:
- if e[0] not in (errno.EAGAIN, errno.EINPROGRESS):
- raise e
+ except socket.error as err:
+ if (err.args[0] not in
+ (errno.EAGAIN, errno.EWOULDBLOCK, errno.EINPROGRESS)):
+ raise err
if response.endswith(self.TERMINATOR):
self._log('RECV', response)
return response.rstrip(self.TERMINATOR)
@@ -303,16 +408,18 @@ class SocketClient(Client):
request = json_encode(data)
response = None
- for i in range(2):
+ for _ in range(2):
+ if not self.socket and cmd != 'login':
+ self._call('login', self.userpwd.copy())
self.socket_lock.acquire()
try:
sock = self.connect()
response = self._sendrecv(sock, request)
- except IOError as e:
- sys.stderr.write(str(e) + "\n")
+ except IOError as err:
+ sys.stderr.write(str(err) + "\n")
self.close()
- except socket.error as e:
- sys.stderr.write(str(e) + "\n")
+ except socket.error as err:
+ sys.stderr.write(str(err) + "\n")
self.close()
raise IOError('Connection refused')
else:
@@ -320,64 +427,68 @@ class SocketClient(Client):
finally:
self.socket_lock.release()
+ if response is None:
+ raise IOError('Connection lost or timed out during API request')
+
try:
- if response is None:
- raise IOError('Connection lost timed out during API request')
- try:
- response = json_decode(response)
- except Exception:
- raise RuntimeError('Invalid API response')
- if 'error' in response:
- error = response['error']
- if 'not-logged-in' == error:
- raise AccessDeniedException('Access denied, check your credentials')
- elif 'banned' == error:
- raise AccessDeniedException('Access denied, account is suspended')
- elif 'insufficient-funds' == error:
- raise AccessDeniedException('CAPTCHA was rejected due to low balance')
- elif 'invalid-captcha' == error:
- raise ValueError('CAPTCHA is not a valid image')
- elif 'service-overload' == error:
- raise ValueError(
- 'CAPTCHA was rejected due to service overload, try again later')
- else:
- raise RuntimeError('API server error occured: %s' % error)
- except Exception as e:
+ response = json_decode(response)
+ except Exception:
+ raise RuntimeError('Invalid API response')
+
+ if not response.get('error'):
+ return response
+
+ error = response['error']
+ if error in ('not-logged-in', 'invalid-credentials'):
+ raise AccessDeniedException('Access denied, check your credentials')
+ elif 'banned' == error:
+ raise AccessDeniedException('Access denied, account is suspended')
+ elif 'insufficient-funds' == error:
+ raise AccessDeniedException(
+ 'CAPTCHA was rejected due to low balance')
+ elif 'invalid-captcha' == error:
+ raise ValueError('CAPTCHA is not a valid image')
+ elif 'service-overload' == error:
+ raise OverflowError(
+ 'CAPTCHA was rejected due to service overload, try again later')
+ else:
self.socket_lock.acquire()
self.close()
self.socket_lock.release()
- raise e
- else:
- return response
+ raise RuntimeError('API server error occured: %s' % error)
def get_user(self):
- return self._call('user', self.userpwd.copy()) or {'user': 0}
+ return self._call('user') or {'user': 0}
def get_captcha(self, cid):
return self._call('captcha', {'captcha': cid}) or {'captcha': 0}
- def upload(self, captcha):
- data = self.userpwd.copy()
- data['captcha'] = base64.b64encode(self._load_file(captcha))
+ def upload(self, captcha=None, **kwargs):
+ data = {}
+ if captcha:
+ data['captcha'] = base64.b64encode(_load_image(captcha))
+ if kwargs:
+ banner = kwargs.get('banner', '')
+ if banner:
+ kwargs['banner'] = base64.b64encode(_load_image(banner))
+ data.update(kwargs)
response = self._call('upload', data)
if response.get('captcha'):
- return dict((k, response.get(k)) for k in ('captcha', 'text', 'is_correct'))
+ uploaded_captcha = dict(
+ (k, response.get(k))
+ for k in ('captcha', 'text', 'is_correct')
+ )
+ if not uploaded_captcha['text']:
+ uploaded_captcha['text'] = None
+ return uploaded_captcha
def report(self, cid):
- data = self.userpwd.copy()
- data['captcha'] = cid
- return not self._call('report', data).get('is_correct')
+ return not self._call('report', {'captcha': cid}).get('is_correct')
- def remove(self, cid):
- data = self.userpwd.copy()
- data['captcha'] = cid
- return not self._call('remove', data).get('captcha')
if '__main__' == __name__:
- import sys
-
# Put your DBC username & password here:
- #client = HttpClient(sys.argv[1], sys.argv[2])
+ # client = HttpClient(sys.argv[1], sys.argv[2])
client = SocketClient(sys.argv[1], sys.argv[2])
client.is_verbose = True
@@ -393,11 +504,12 @@ if '__main__' == __name__:
captcha = None
if captcha:
- print('CAPTCHA %d solved: %s' % (captcha['captcha'], captcha['text']))
+ print('CAPTCHA %d solved: %s' % \
+ (captcha['captcha'], captcha['text']))
# Report as incorrectly solved if needed. Make sure the CAPTCHA was
# in fact incorrectly solved!
- try:
- client.report(captcha['captcha'])
- except Exception as e:
- sys.stderr.write('Failed reporting CAPTCHA: %s\n' % (e, ))
+ # try:
+ # client.report(captcha['captcha'])
+ # except Exception, e:
+ # sys.stderr.write('Failed reporting CAPTCHA: %s\n' % (e, ))