"""Simple python demo script of tesseract-ocr 3.02 c-api.

Loads the tesseract shared library through ctypes, checks that the library
is at least version 3.02, initializes the base API and runs OCR on
``filename``.  The recognized text ends up in ``result_text``.

Exit codes: 1 = library could not be loaded, 2 = library too old,
3 = API initialization failed, 4 = OCR returned no text.
"""

import ctypes
import os
import re
import sys

# Demo variables
# NOTE(review): the language code is not defined in the visible part of the
# script; "eng" is assumed here -- confirm against the intended traineddata.
lang = "eng"
filename = "../phototest.tif"
libpath = "/usr/local/lib64/"
libpath_w = "../vs2008/DLL_Release/"


def _to_bytes(value):
    """Return *value* as bytes so it can be passed to a C ``char*`` argument."""
    if isinstance(value, bytes):
        return value
    return value.encode("utf-8")


def _to_text(value):
    """Return *value* (bytes, str or None) as text suitable for printing."""
    if value is None:
        return ""
    if isinstance(value, bytes):
        return value.decode("ascii", "replace")
    return value


def _parse_version(raw):
    """Return the leading dotted number of *raw* as a tuple of ints.

    "3.02" -> (3, 2) and "3.02.02" -> (3, 2, 2).  An empty tuple is returned
    when no leading version number can be found.
    """
    match = re.match(r"\s*(\d+(?:\.\d+)*)", _to_text(raw))
    if match is None:
        return ()
    return tuple(int(part) for part in match.group(1).split("."))


if sys.platform == "win32":
    libname = libpath_w + "libtesseract302.dll"
    libname_alt = "libtesseract302.dll"
    # Let the Windows loader find the DLLs that libtesseract itself needs.
    os.environ["PATH"] = os.environ.get("PATH", "") + os.pathsep + libpath_w
else:
    libname = libpath + "libtesseract.so.3.0.2"
    libname_alt = "libtesseract.so.3"

# ctypes reports a failed load as OSError on every platform (WindowsError is
# only a Windows-specific subclass/alias of it).
try:
    tesseract = ctypes.cdll.LoadLibrary(libname)
except OSError:
    try:
        tesseract = ctypes.cdll.LoadLibrary(libname_alt)
    except OSError as err:
        print("Trying to load '%s'..." % libname)
        print("Trying to load '%s'..." % libname_alt)
        print(err)
        sys.exit(1)

tesseract.TessVersion.restype = ctypes.c_char_p
tesseract_version = tesseract.TessVersion()

# The alternative library name may resolve to a different release, so the
# version has to be checked.  Compare numeric components instead of using
# float(), which fails on three-part versions such as "3.02.02".
if _parse_version(tesseract_version) < (3, 2):
    print("Found tesseract-ocr library version %s." % _to_text(tesseract_version))
    print("C-API is present only in version 3.02!")
    sys.exit(2)

# Declare the C signatures: without them ctypes assumes an int return value
# and truncates pointers on 64-bit platforms.
tesseract.TessBaseAPICreate.restype = ctypes.c_void_p
tesseract.TessBaseAPIDelete.argtypes = [ctypes.c_void_p]
tesseract.TessBaseAPIDelete.restype = None
tesseract.TessBaseAPIInit3.argtypes = [
    ctypes.c_void_p,
    ctypes.c_char_p,
    ctypes.c_char_p,
]
tesseract.TessBaseAPIInit3.restype = ctypes.c_int
tesseract.TessBaseAPIProcessPages.argtypes = [
    ctypes.c_void_p,
    ctypes.c_char_p,
    ctypes.c_char_p,
    ctypes.c_int,
]
# c_void_p (not c_char_p) keeps the raw address so the buffer can be freed.
tesseract.TessBaseAPIProcessPages.restype = ctypes.c_void_p
tesseract.TessDeleteText.argtypes = [ctypes.c_void_p]
tesseract.TessDeleteText.restype = None

api = tesseract.TessBaseAPICreate()
rc = tesseract.TessBaseAPIInit3(api, _to_bytes(""), _to_bytes(lang))
if rc:
    tesseract.TessBaseAPIDelete(api)
    print("Could not initialize tesseract.\n")
    sys.exit(3)

text_out = tesseract.TessBaseAPIProcessPages(api, _to_bytes(filename), None, 0)
if not text_out:
    # A NULL result must not reach ctypes.string_at().
    tesseract.TessBaseAPIDelete(api)
    print("Could not process '%s'." % filename)
    sys.exit(4)

# Copy the C string into a Python bytes object, then release the C buffer;
# text_out must not be dereferenced after this point.
result_text = ctypes.string_at(text_out)
tesseract.TessDeleteText(text_out)