summaryrefslogtreecommitdiff
blob: a59128537ce9b88d748fe11d4b4ee6e86dbd4d58 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE pkgmetadata SYSTEM "https://www.gentoo.org/dtd/metadata.dtd">
<pkgmetadata>
	<maintainer type="person">
		<email>tupone@gentoo.org</email>
		<name>Tupone Alfredo</name>
	</maintainer>
	<longdescription lang="en">
		Python-tesseract is an optical character recognition (OCR) tool for
		Python. That is, it will recognize and "read" the text embedded in
		images.

		Python-tesseract is a wrapper for Google's Tesseract-OCR Engine.
		It is also useful as a stand-alone invocation script to tesseract, as
		it can read all image types supported by the Pillow and Leptonica
		imaging libraries, including jpeg, png, gif, bmp, tiff, and others.
		Additionally, if used as a script, Python-tesseract will print the
		recognized text instead of writing it to a file.
	</longdescription>
	<upstream>
		<remote-id type="github">madmaze/pytesseract</remote-id>
		<remote-id type="pypi">pytesseract</remote-id>
	</upstream>
</pkgmetadata>