forked from guitarmind/tesseract-web-service
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathtesseractclient.py
43 lines (36 loc) · 1.34 KB
/
tesseractclient.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
#!/usr/bin/env python
import sys
import optparse
import tornado.httpclient
import simplejson, json
import urllib
"""
Get result string from tesseract API
"""
def ocrAPI(apiUrl, imageUrl):
request = { 'url': imageUrl }
post_data = json.dumps(request)
headers = { 'Content-Type': 'application/json; charset=UTF-8' }
http_client = tornado.httpclient.AsyncHTTPClient()
http_client.fetch(apiUrl, handle_request, method = 'POST', headers = headers, body = post_data)
print "Sending request: " + post_data
tornado.ioloop.IOLoop.instance().start()
def handle_request(response):
if response.error:
print "Error: ", response.error
else:
print "Got response: " + response.body
tornado.ioloop.IOLoop.instance().stop()
def main():
parser = optparse.OptionParser()
parser.add_option('-a', '--api-url', dest='apiUrl', help='the URL of RESTful tesseract web service.')
parser.add_option('-i', '--image-url', dest='imageUrl', help='the URL of image to do OCR.')
(options, args) = parser.parse_args()
if not options.apiUrl: # if apiUrl is not given
parser.error('api-url not given')
if not options.imageUrl: # if imageUrl is not given
parser.error('image-url not given')
# call tesseract API
ocrAPI(options.apiUrl, options.imageUrl)
if __name__ == '__main__':
main()