summary refs log tree commit diff
path: root/app-text/pdfsandwich
diff options
context:
space:
mode:
author V3n3RiX <venerix@redcorelinux.org> 2017-10-09 18:53:29 +0100
committer V3n3RiX <venerix@redcorelinux.org> 2017-10-09 18:53:29 +0100
commit 4f2d7949f03e1c198bc888f2d05f421d35c57e21 (patch)
tree ba5f07bf3f9d22d82e54a462313f5d244036c768 /app-text/pdfsandwich
reinit the tree, so we can have metadata
Diffstat (limited to 'app-text/pdfsandwich')
-rw-r--r-- app-text/pdfsandwich/Manifest 5
-rw-r--r-- app-text/pdfsandwich/metadata.xml 23
-rw-r--r-- app-text/pdfsandwich/pdfsandwich-0.1.4-r1.ebuild 37
3 files changed, 65 insertions, 0 deletions
diff --git a/app-text/pdfsandwich/Manifest b/app-text/pdfsandwich/Manifest
new file mode 100644
index 000000000000..24a21d1f2596
--- /dev/null
+++ b/app-text/pdfsandwich/Manifest
@@ -0,0 +1,5 @@
+DIST pdfsandwich-0.1.4.tar.bz2 16401 SHA256 8b82f3ae08000c5cae1ff5a0f6537b0b563befef928e5198255b743a46714af3 SHA512 ee03aea13c72cc5a02136b5d16d2425f685f0b7a9d6fa6cff6c792bd24e6316720dff321b5e8237b949c98c713f39cb8b08b855b76e2a77350927b1ee7943171 WHIRLPOOL d8eb5fd281b1eb3f9e371ee71c486b8e839048f3ab569f8b62644e21ad921692283b2d35dfeb07111f86cf52eeb926da4152fcf58124cca2f96aa05116e8e115
+EBUILD pdfsandwich-0.1.4-r1.ebuild 970 SHA256 31e52d93880ab0f86aec47a27b2abd5362b6c7a85ae9a575103b6ec7743ae5ef SHA512 3505739fec5f3d76a7d51c0c9f4f4cf992faa59e23779dfd0ebf677246da0a794ca18af304a5631e7fc0984bd698bfe69f6c3a012389cdc943a543ac0fe4b263 WHIRLPOOL 293f1bbd0ef56e30dc2dc30809dcee8cbbd106a20ac3562dfb77c865f302386ff180d4d9b19156c1fdafd5433904c7e71ff5657e1ce69a86779ee6009407394b
+MISC ChangeLog 2188 SHA256 465634736809ae641d29b66eb22cf8399c51e75d89fe413b05588b34e8d5b3df SHA512 7b3c12835c3517cb6a4f3f8639e06142f5761bf59665ddea8a9159f7b2eb23b49bd845dcae2cbe3394d515aba47c295a600eef28dc1a459b6dc546fd902b9997 WHIRLPOOL 71bcd50831b6902f27910c9a71c74a54d8c7bc56d650b607598aabc29b27320b8c2be9063ae69e6019e718ac4e093cb6ac32676decdf753f5f8bfb8cad9ff44b
+MISC ChangeLog-2015 1879 SHA256 8dc86c03230b063d2eb0d87006c6b0d263fe12e7583b4b810a61abb9d855dc04 SHA512 2badcf204953484ae85ba0ede7dd65008c95d8e1279ccf75260aa0550819213beeb00787709604e38fae4ccba4188f46009670fe3340c16e74aeca881b187ff8 WHIRLPOOL 0e4519e1c97c056c118bc05b683641da069cd8bf32b53e60ef5118a1383fb06b271e3dccc0fef11abd555abe404e74113b2ec0e3db69e7bb93953bfa0f1a3bff
+MISC metadata.xml 937 SHA256 a001b3d2fe61a29e09b9d64972ddd43758ea78195c154993e132a79ca0aeae25 SHA512 595e3fdd841667046ae3064ee12aa288586cb1db3f8cd902aaf5c7c1bfb1c1776c641c400593b273dad83bf4f3a4c98f1f031125b8d65af3e836d6c2abdbc531 WHIRLPOOL bdffa2c49b734e8b72b4070ebceafdc336df67b0e9cf1a21bf82bc5f2d4720a574340044182faf00e8aecf894ce17e8810ebd72bf8d621d43f5daf758f46464a
diff --git a/app-text/pdfsandwich/metadata.xml b/app-text/pdfsandwich/metadata.xml
new file mode 100644
index 000000000000..0fb15c19e847
--- /dev/null
+++ b/app-text/pdfsandwich/metadata.xml
@@ -0,0 +1,23 @@
+<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE pkgmetadata SYSTEM "http://www.gentoo.org/dtd/metadata.dtd">
+<pkgmetadata>
+ <!-- maintainer-needed -->
+ <longdescription>
+pdfsandwich generates "sandwich" OCR pdf files, i.e. pdf files which
+contain only images (no text) will be processed by optical character
+recognition (OCR) and the text will be added to each page invisibly
+"behind" the images.
+
+pdfsandwich is a command line tool which is supposed to be useful to
+OCR scanned books or journals. It is able to recognize the page layout
+even for multicolumn text.
+
+Essentially, pdfsandwich is a wrapper script which calls the following
+binaries: convert, cuneiform, gs, and hocr2pdf. It is known to run on
+Unix systems and has been tested on Linux and MacOS X. It supports
+parallel processing on multiprocessor systems.
+</longdescription>
+ <upstream>
+ <remote-id type="sourceforge">pdfsandwich</remote-id>
+ </upstream>
+</pkgmetadata>
diff --git a/app-text/pdfsandwich/pdfsandwich-0.1.4-r1.ebuild b/app-text/pdfsandwich/pdfsandwich-0.1.4-r1.ebuild
new file mode 100644
index 000000000000..21bf32dcc96f
--- /dev/null
+++ b/app-text/pdfsandwich/pdfsandwich-0.1.4-r1.ebuild
@@ -0,0 +1,37 @@
+# Copyright 1999-2017 Gentoo Foundation
+# Distributed under the terms of the GNU General Public License v2
+
+EAPI=5
+
+DESCRIPTION="generator of sandwich OCR pdf files"
+HOMEPAGE="http://www.tobias-elze.de/pdfsandwich"
+SRC_URI="mirror://sourceforge/pdfsandwich/${P}.tar.bz2"
+
+LICENSE="GPL-2"
+KEYWORDS="~amd64 ~x86"
+SLOT="0"
+IUSE="png"
+
+RDEPEND=">=app-text/tesseract-3.00
+ media-gfx/exact-image
+ app-text/unpaper
+ app-text/ghostscript-gpl
+ virtual/imagemagick-tools[png?]"
+DEPEND="sys-apps/gawk
+ >=dev-lang/ocaml-3.10[ocamlopt]"
+
+src_prepare() {
+ sed -i "/^OCAMLOPTFLAGS/s/$/ -ccopt \"\$(CFLAGS) \$(LDFLAGS)\"/" Makefile || die
+ sed -i "s/install -s/install/" Makefile || die
+}
+
+src_install() {
+ emake DESTDIR="${D}" install
+}
+
+pkg_postinst() {
+ elog "pdfsandwich relies on the tesseract library for OCR."
+ elog "Consequently language support is determined by tesseract's"
+ elog "language support which in turn is controlled via the LINGUAS"
+ elog "variable in make.conf."
+}