mirror of
https://codeberg.org/guix/guix.git
synced 2025-10-02 02:15:12 +00:00
gnu: Add tesseract-ocr.
* gnu/packages/ocr.scm (tesseract-ocr): New variable.
This commit is contained in:
parent
9e617a5419
commit
d814be32d5
1 changed files with 51 additions and 4 deletions
|
@ -17,12 +17,14 @@
|
||||||
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
||||||
|
|
||||||
(define-module (gnu packages ocr)
|
(define-module (gnu packages ocr)
|
||||||
#:use-module (guix licenses)
|
#:use-module ((guix licenses) #:prefix license:)
|
||||||
#:use-module (guix packages)
|
#:use-module (guix packages)
|
||||||
#:use-module (guix download)
|
#:use-module (guix download)
|
||||||
#:use-module (guix build-system gnu)
|
#:use-module (guix build-system gnu)
|
||||||
#:use-module ((gnu packages compression)
|
#:use-module (gnu packages autotools)
|
||||||
#:select (lzip)))
|
#:use-module (gnu packages compression)
|
||||||
|
#:use-module (gnu packages image)
|
||||||
|
#:use-module (gnu packages pkg-config))
|
||||||
|
|
||||||
(define-public ocrad
|
(define-public ocrad
|
||||||
(package
|
(package
|
||||||
|
@ -43,4 +45,49 @@
|
||||||
"GNU Ocrad is an optical character recognition program based on a
|
"GNU Ocrad is an optical character recognition program based on a
|
||||||
feature extraction method. It can read images in PBM, PGM or PPM formats and
|
feature extraction method. It can read images in PBM, PGM or PPM formats and
|
||||||
it produces text in 8-bit or UTF-8 formats.")
|
it produces text in 8-bit or UTF-8 formats.")
|
||||||
(license gpl3+)))
|
(license license:gpl3+)))
|
||||||
|
|
||||||
|
(define-public tesseract-ocr
|
||||||
|
(package
|
||||||
|
(name "tesseract-ocr")
|
||||||
|
(version "3.02.02")
|
||||||
|
(source
|
||||||
|
(origin
|
||||||
|
(method url-fetch)
|
||||||
|
(uri (string-append
|
||||||
|
"https://tesseract-ocr.googlecode.com/files/tesseract-ocr-"
|
||||||
|
version ".tar.gz"))
|
||||||
|
(sha256
|
||||||
|
(base32 "0g81m9y4iydp7kgr56mlkvjdwpp3mb01q385yhdnyvra7z5kkk96"))
|
||||||
|
(modules '((guix build utils)))
|
||||||
|
;; Leptonica added a pkg-config file in the meanwhile.
|
||||||
|
(snippet
|
||||||
|
'(substitute* "tesseract.pc.in"
|
||||||
|
(("^# Requires: lept ## .*")
|
||||||
|
"Requires: lept\n")))))
|
||||||
|
(build-system gnu-build-system)
|
||||||
|
(native-inputs
|
||||||
|
`(("autoconf" ,autoconf)
|
||||||
|
("automake" ,automake)
|
||||||
|
("libtool" ,libtool)))
|
||||||
|
(propagated-inputs
|
||||||
|
`(("leptonica" ,leptonica)))
|
||||||
|
(arguments
|
||||||
|
'(#:phases
|
||||||
|
(modify-phases %standard-phases
|
||||||
|
(add-after
|
||||||
|
unpack autogen
|
||||||
|
(lambda _
|
||||||
|
(zero? (system* "sh" "autogen.sh")))))
|
||||||
|
#:configure-flags
|
||||||
|
(let ((leptonica (assoc-ref %build-inputs "leptonica")))
|
||||||
|
(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))))
|
||||||
|
(home-page "https://code.google.com/p/tesseract-ocr/")
|
||||||
|
(synopsis "Optical character recognition engine")
|
||||||
|
(description
|
||||||
|
"Tesseract is an optical character recognition (OCR) engine with very
|
||||||
|
high accuracy. It supports many languages, output text formatting, hOCR
|
||||||
|
positional information and page layout analysis. Several image formats are
|
||||||
|
supported through the Leptonica library. It can also detect whether text is
|
||||||
|
monospaced or proportional.")
|
||||||
|
(license license:asl2.0)))
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue