From cd5bd94991327a12715431e75e0c19f68ad48183 Mon Sep 17 00:00:00 2001
From: Zheng Junjie <873216071@qq.com>
Date: Fri, 25 Dec 2020 13:56:16 +0800
Subject: [PATCH] gnu: Add python-pdftotext.

* gnu/packages/python-xyz.scm (python-pdftotext): New variable.
---
 gnu/packages/python-xyz.scm | 21 +++++++++++++++++++++
 1 file changed, 21 insertions(+)

diff --git a/gnu/packages/python-xyz.scm b/gnu/packages/python-xyz.scm
index acde5a5e5e..9d9c298076 100644
--- a/gnu/packages/python-xyz.scm
+++ b/gnu/packages/python-xyz.scm
@@ -93,6 +93,7 @@
 ;;; Copyright © 2020 Diego N. Barbato
 ;;; Copyright © 2020 Leo Prikler
 ;;; Copyright © 2019 Kristian Trandem
+;;; Copyright © 2020 Zheng Junjie <873216071@qq.com>
 ;;;
 ;;; This file is part of GNU Guix.
 ;;;
@@ -158,6 +159,7 @@
   #:use-module (gnu packages ncurses)
   #:use-module (gnu packages openstack)
   #:use-module (gnu packages pcre)
+  #:use-module (gnu packages pdf)
   #:use-module (gnu packages perl)
   #:use-module (gnu packages photo)
   #:use-module (gnu packages pkg-config)
@@ -4861,6 +4863,25 @@ algorithm.  Patiencediff provides a good balance of performance, nice output for
 humans, and implementation simplicity.")
     (license license:gpl2)))
 
+(define-public python-pdftotext
+  (package
+    (name "python-pdftotext")
+    (version "2.1.5")
+    (source
+     (origin
+       (method url-fetch)
+       (uri (pypi-uri "pdftotext" version))
+       (sha256
+        (base32
+         "19la1cw1hmkcr8big04gm2dd5fw0y0z97g930aiy29s1gaqbiblq"))))
+    (build-system python-build-system)
+    (inputs
+     `(("poppler" ,poppler)))
+    (home-page "https://github.com/jalan/pdftotext")
+    (synopsis "Simple PDF text extraction")
+    (description "Pdftotext is a Python library of PDF text extraction.")
+    (license license:expat)))
+
 (define-public python-pyparsing
   (package
     (name "python-pyparsing")
-- 
2.29.2