guix/gnu/packages/ocr.scm

;;; GNU Guix --- Functional package management for GNU
;;; Copyright © 2013 Ludovic Courtès <ludo@gnu.org>
;;;
;;; This file is part of GNU Guix.
;;;
;;; GNU Guix is free software; you can redistribute it and/or modify it
;;; under the terms of the GNU General Public License as published by
;;; the Free Software Foundation; either version 3 of the License, or (at
;;; your option) any later version.
;;;
;;; GNU Guix is distributed in the hope that it will be useful, but
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
;;; GNU General Public License for more details.
;;;
;;; You should have received a copy of the GNU General Public License
;;; along with GNU Guix.  If not, see <http://www.gnu.org/licenses/>.

(define-module (gnu packages ocr)
  #:use-module ((guix licenses) #:prefix license:)
  #:use-module (guix packages)
  #:use-module (guix download)
  #:use-module (guix build-system gnu)
  #:use-module (gnu packages autotools)
  #:use-module (gnu packages compression)
  #:use-module (gnu packages image)
  #:use-module (gnu packages pkg-config))

;; GNU Ocrad, an optical character recognition program.  It is fetched from
;; the GNU mirrors as an lzip-compressed tarball and built with the GNU
;; build system using its default phases.
(define-public ocrad
  (package
    (name "ocrad")
    (version "0.25")
    (source
     (origin
       (method url-fetch)
       ;; The tarball name embeds VERSION, e.g. "ocrad-0.25.tar.lz".
       (uri (string-append "mirror://gnu/ocrad/ocrad-"
                           version ".tar.lz"))
       (sha256
        (base32
         "1m2dblgvvjs48rsglfdwq0ib9zk8h9n34xsh67ibrg0g0ffbw477"))))
    (build-system gnu-build-system)
    ;; The release is distributed as ".tar.lz", so lzip is provided as a
    ;; build-time (native) input.
    (native-inputs `(("lzip" ,lzip)))
    ;; Use the HTTPS form of the project page rather than plain HTTP.
    (home-page "https://www.gnu.org/software/ocrad/")
    (synopsis "Optical character recognition based on feature extraction")
    (description
     "GNU Ocrad is an optical character recognition program based on a
feature extraction method.  It can read images in PBM, PGM or PPM formats and
it produces text in 8-bit or UTF-8 formats.")
    (license license:gpl3+)))

;; Tesseract OCR engine.  The release tarball is patched so that its
;; pkg-config template requires Leptonica, the build scripts are regenerated
;; with autogen.sh after unpacking, and Leptonica is propagated to users.
(define-public tesseract-ocr
  (package
    (name "tesseract-ocr")
    (version "3.02.02")
    ;; VERSION must be bound before SOURCE, which splices it into the URL.
    (source
     (origin
       (method url-fetch)
       ;; NOTE(review): this URL points at Google Code hosting -- confirm it
       ;; still resolves, or that the tarball is reachable by its hash.
       (uri (string-append
             "https://tesseract-ocr.googlecode.com/files/tesseract-ocr-"
             version ".tar.gz"))
       (sha256
        (base32 "0g81m9y4iydp7kgr56mlkvjdwpp3mb01q385yhdnyvra7z5kkk96"))
       (modules '((guix build utils)))
       ;; Leptonica ships a pkg-config file nowadays, so replace the
       ;; commented-out "Requires" line of tesseract.pc.in with a real one.
       (snippet
        '(substitute* "tesseract.pc.in"
           (("^# Requires: lept  ## .*")
            "Requires: lept\n")))))
    (build-system gnu-build-system)
    (arguments
     ;; This list is quoted: it is build-side code, evaluated where
     ;; %build-inputs and %standard-phases are in scope.
     '(#:phases
       (modify-phases %standard-phases
         ;; Run autogen.sh right after the sources are unpacked; the phase
         ;; succeeds exactly when the script exits with status 0.
         (add-after
          'unpack 'autogen
          (lambda _
            (zero? (system* "sh" "autogen.sh")))))
       #:configure-flags
       ;; Point configure at the "include" directory of the leptonica input.
       (let ((leptonica (assoc-ref %build-inputs "leptonica")))
         (list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))))
    ;; Propagated so that users of this package also get Leptonica.
    (propagated-inputs
     (list (list "leptonica" leptonica)))
    ;; Build-time tools; presumably required by autogen.sh -- TODO confirm.
    (native-inputs
     (list (list "autoconf" autoconf)
           (list "automake" automake)
           (list "libtool" libtool)))
    (synopsis "Optical character recognition engine")
    (description
     "Tesseract is an optical character recognition (OCR) engine with very
high accuracy.  It supports many languages, output text formatting, hOCR
positional information and page layout analysis.  Several image formats are
supported through the Leptonica library.  It can also detect whether text is
monospaced or proportional.")
    (home-page "https://code.google.com/p/tesseract-ocr/")
    (license license:asl2.0)))
gnu: Add GNU Ocrad. * gnu/packages/ocrad.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. 2013-08-18 22:52:49 +00:00			`;;; GNU Guix --- Functional package management for GNU`
			`;;; Copyright © 2013 Ludovic Courtès <ludo@gnu.org>`
			`;;;`
			`;;; This file is part of GNU Guix.`
			`;;;`
			`;;; GNU Guix is free software; you can redistribute it and/or modify it`
			`;;; under the terms of the GNU General Public License as published by`
			`;;; the Free Software Foundation; either version 3 of the License, or (at`
			`;;; your option) any later version.`
			`;;;`
			`;;; GNU Guix is distributed in the hope that it will be useful, but`
			`;;; WITHOUT ANY WARRANTY; without even the implied warranty of`
			`;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the`
			`;;; GNU General Public License for more details.`
			`;;;`
			`;;; You should have received a copy of the GNU General Public License`
			`;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.`

gnu: Rename (gnu packages ocrad) to (gnu packages ocr). * gnu/packages/ocrad.scm: Deleted. * gnu/packages/ocr.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Change ocrad.scm to ocr.scm. 2015-03-20 15:22:34 +00:00			`(define-module (gnu packages ocr)`
gnu: Add tesseract-ocr. * gnu/packages/ocr.scm (tesseract-ocr): New variable. 2015-03-21 19:11:56 +00:00			`#:use-module ((guix licenses) #:prefix license:)`
gnu: Add GNU Ocrad. * gnu/packages/ocrad.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. 2013-08-18 22:52:49 +00:00			`#:use-module (guix packages)`
			`#:use-module (guix download)`
			`#:use-module (guix build-system gnu)`
gnu: Add tesseract-ocr. * gnu/packages/ocr.scm (tesseract-ocr): New variable. 2015-03-21 19:11:56 +00:00			`#:use-module (gnu packages autotools)`
			`#:use-module (gnu packages compression)`
			`#:use-module (gnu packages image)`
			`#:use-module (gnu packages pkg-config))`
gnu: Add GNU Ocrad. * gnu/packages/ocrad.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. 2013-08-18 22:52:49 +00:00
			`(define-public ocrad`
			`(package`
			`(name "ocrad")`
gnu: ocrad: Update to 0.25. * gnu/packages/ocr.scm (ocrad): Update to 0.25. 2015-04-21 20:57:29 +00:00			`(version "0.25")`
gnu: Add GNU Ocrad. * gnu/packages/ocrad.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. 2013-08-18 22:52:49 +00:00			`(source (origin`
			`(method url-fetch)`
			`(uri (string-append "mirror://gnu/ocrad/ocrad-"`
			`version ".tar.lz"))`
			`(sha256`
			`(base32`
gnu: ocrad: Update to 0.25. * gnu/packages/ocr.scm (ocrad): Update to 0.25. 2015-04-21 20:57:29 +00:00			`"1m2dblgvvjs48rsglfdwq0ib9zk8h9n34xsh67ibrg0g0ffbw477"))))`
gnu: Add GNU Ocrad. * gnu/packages/ocrad.scm: New file. * gnu-system.am (GNU_SYSTEM_MODULES): Add it. 2013-08-18 22:52:49 +00:00			`(build-system gnu-build-system)`
			(native-inputs `(("lzip" ,lzip)))
			`(home-page "http://www.gnu.org/software/ocrad/")`
			`(synopsis "Optical character recognition based on feature extraction")`
			`(description`
gnu: Synchronize descriptions with 'gnumaint'. 2013-12-01 21:33:23 +00:00			`"GNU Ocrad is an optical character recognition program based on a`
			`feature extraction method. It can read images in PBM, PGM or PPM formats and`
			`it produces text in 8-bit or UTF-8 formats.")`
gnu: Add tesseract-ocr. * gnu/packages/ocr.scm (tesseract-ocr): New variable. 2015-03-21 19:11:56 +00:00			`(license license:gpl3+)))`

			`(define-public tesseract-ocr`
			`(package`
			`(name "tesseract-ocr")`
			`(version "3.02.02")`
			`(source`
			`(origin`
			`(method url-fetch)`
			`(uri (string-append`
			`"https://tesseract-ocr.googlecode.com/files/tesseract-ocr-"`
			`version ".tar.gz"))`
			`(sha256`
			`(base32 "0g81m9y4iydp7kgr56mlkvjdwpp3mb01q385yhdnyvra7z5kkk96"))`
			`(modules '((guix build utils)))`
			`;; Leptonica added a pkg-config file in the meanwhile.`
			`(snippet`
			`'(substitute* "tesseract.pc.in"`
			`(("^# Requires: lept ## .*")`
			`"Requires: lept\n")))))`
			`(build-system gnu-build-system)`
			`(native-inputs`
			`(("autoconf" ,autoconf)
			`("automake" ,automake)`
			`("libtool" ,libtool)))`
			`(propagated-inputs`
			`(("leptonica" ,leptonica)))
			`(arguments`
			`'(#:phases`
			`(modify-phases %standard-phases`
			`(add-after`
utils: 'modify-phases' no longer introduces quotes. Suggested by Taylan Ulrich Bayırlı/Kammer <taylanbayirli@gmail.com>. * guix/build/utils.scm (%modify-phases): Remove quotes. * guix/build/cmake-build-system.scm (%standard-phases): Adjust accordingly. * guix/build/glib-or-gtk-build-system.scm (%standard-phases): Likewise. * guix/build/gnu-dist.scm (%dist-phases): Likewise. * guix/build/perl-build-system.scm (%standard-phases): Likewise. * guix/build/python-build-system.scm (%standard-phases): Likewise. * guix/build/ruby-build-system.scm (%standard-phases): Likewise. * guix/build/waf-build-system.scm (%standard-phases): Likewise. * gnu/packages/bash.scm, gnu/packages/code.scm, gnu/packages/gl.scm, gnu/packages/gnome.scm, gnu/packages/graphics.scm, gnu/packages/image.scm, gnu/packages/key-mon.scm, gnu/packages/ocr.scm, gnu/packages/plotutils.scm, gnu/packages/search.scm, gnu/packages/video.scm: Likewise. 2015-03-31 20:43:01 +00:00			`'unpack 'autogen`
gnu: Add tesseract-ocr. * gnu/packages/ocr.scm (tesseract-ocr): New variable. 2015-03-21 19:11:56 +00:00			`(lambda _`
			`(zero? (system* "sh" "autogen.sh")))))`
			`#:configure-flags`
			`(let ((leptonica (assoc-ref %build-inputs "leptonica")))`
			`(list (string-append "LIBLEPT_HEADERSDIR=" leptonica "/include")))))`
			`(home-page "https://code.google.com/p/tesseract-ocr/")`
			`(synopsis "Optical character recognition engine")`
			`(description`
			`"Tesseract is an optical character recognition (OCR) engine with very`
			`high accuracy. It supports many languages, output text formatting, hOCR`
			`positional information and page layout analysis. Several image formats are`
			`supported through the Leptonica library. It can also detect whether text is`
			`monospaced or proportional.")`
			`(license license:asl2.0)))`