2015-03-04 22:34:13 +01:00
|
|
|
|
;;; GNU Guix --- Functional package management for GNU
|
|
|
|
|
;;; Copyright © 2015 Taylan Ulrich Bayırlı/Kammer <taylanbayirli@gmail.com>
|
2016-01-03 06:41:49 +01:00
|
|
|
|
;;; Copyright © 2015, 2016 Ricardo Wurmus <rekado@elephly.net>
|
2015-09-29 14:10:33 +02:00
|
|
|
|
;;; Copyright © 2015 Ben Woodcroft <donttrustben@gmail.com>
|
2015-12-10 16:15:04 +01:00
|
|
|
|
;;; Copyright © 2015 Roel Janssen <roel@gnu.org>
|
2015-03-04 22:34:13 +01:00
|
|
|
|
;;;
|
|
|
|
|
;;; This file is part of GNU Guix.
|
|
|
|
|
;;;
|
|
|
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
|
|
|
;;; under the terms of the GNU General Public License as published by
|
|
|
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
|
|
|
;;; your option) any later version.
|
|
|
|
|
;;;
|
|
|
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
|
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
|
;;; GNU General Public License for more details.
|
|
|
|
|
;;;
|
|
|
|
|
;;; You should have received a copy of the GNU General Public License
|
|
|
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
|
|
(define-module (gnu packages textutils)
|
|
|
|
|
#:use-module ((guix licenses) #:prefix license:)
|
|
|
|
|
#:use-module (guix packages)
|
|
|
|
|
#:use-module (guix download)
|
|
|
|
|
#:use-module (guix git-download)
|
|
|
|
|
#:use-module (guix build-system gnu)
|
2016-01-03 06:41:49 +01:00
|
|
|
|
#:use-module (guix build-system cmake)
|
2015-04-14 16:35:30 +02:00
|
|
|
|
#:use-module (gnu packages autotools)
|
2015-07-27 20:19:55 +02:00
|
|
|
|
#:use-module (gnu packages python))
|
2015-03-04 22:34:13 +01:00
|
|
|
|
|
|
|
|
|
;; Recode: character-set conversion library plus its command-line front-end,
;; built from a Git snapshot of the upstream repository.
(define-public recode
  (package
    (name "recode")
    ;; Last beta release (3.7-beta2) is from 2008; last commit from Feb 2014.
    ;; So we use that commit instead.
    (version "3.7.0.201402")
    (source
     (origin
       (method git-fetch)
       (uri (git-reference
             (url "https://github.com/pinard/Recode.git")
             (commit "2d7092a9999194fc0e9449717a8048c8d8e26c18")))
       (sha256
        (base32 "1wssv8z6g3ryrw33sksz4rjhlnhgvvdqszw1ggl4rcwks34n86zm"))
       ;; A Git checkout is a directory, hence the "-checkout" suffix.
       (file-name (string-append name "-" version "-checkout"))))
    (build-system gnu-build-system)
    ;; NOTE(review): Python 2 is presumably needed only by the test suite
    ;; (see the 'pre-check phase touching tests/setup.py) -- confirm.
    (native-inputs `(("python" ,python-2)))
    (arguments
     '(#:phases
       (modify-phases %standard-phases
         (add-before 'check 'pre-check
           (lambda _
             ;; Add a 'library_dirs' entry right after the 'include_dirs'
             ;; line of the test extension's setup script, pointing at the
             ;; freshly built library directory.
             (substitute* "tests/setup.py"
               (("([[:space:]]*)include_dirs=.*" all space)
                (string-append all space "library_dirs=['../src/.libs'],\n")))
             ;; The test extension 'Recode.so' lacks RUNPATH for 'librecode.so'.
             (setenv "LD_LIBRARY_PATH" (string-append (getcwd) "/src/.libs"))
             ;; Phases must return a true value to signal success.
             #t)))))
    (home-page "https://github.com/pinard/Recode")
    (synopsis "Text encoding converter")
    (description "The Recode library converts files between character sets and
usages. It recognises or produces over 200 different character sets (or about
300 if combined with an iconv library) and transliterates files between almost
any pair. When exact transliteration is not possible, it gets rid of
offending characters or falls back on approximations. The recode program is a
handy front-end to the library.")
    (license license:gpl2+)))
|
2015-03-04 22:35:15 +01:00
|
|
|
|
|
|
|
|
|
;; Enca: charset detection library (libenca) and its command-line front-end.
(define-public enca
  (package
    (name "enca")
    (version "1.16")
    (source
     (origin
       (method url-fetch)
       (uri (string-append "https://github.com/nijel/enca/archive/"
                           version ".tar.gz"))
       ;; The upstream archive is named after the bare version, so give the
       ;; downloaded file a name that includes the package name.
       (file-name (string-append name "-" version ".tar.gz"))
       (sha256
        (base32 "1xik00x0yvhswsw2isnclabhv536xk1s42cf5z54gfbpbhc7ni8l"))))
    (build-system gnu-build-system)
    (inputs
     (list (list "recode" recode)))
    (arguments
     ;; Both 'test-convert-64.sh' and 'test-convert-filter.sh' manipulate a
     ;; 'test.tmp' file, so they have to run in sequence.
     (list #:parallel-tests? #f))
    (home-page "https://github.com/nijel/enca")
    (synopsis "Text encoding detection tool")
    (description "Enca (Extremely Naive Charset Analyser) consists of libenca,
an encoding detection library, and enca, a command line frontend, integrating
libenca and several charset conversion libraries and tools.")
    (license license:gpl2)))
|
2015-03-19 17:06:06 +01:00
|
|
|
|
|
|
|
|
|
;; utf8proc: small C library for Unicode normalization and case-folding of
;; UTF-8 data.  Built with plain 'make'; the 'configure phase is removed.
(define-public utf8proc
  (package
    (name "utf8proc")
    (version "1.3.1")
    (source
     (origin
       (method url-fetch)
       (uri (string-append
             "https://github.com/JuliaLang/utf8proc/archive/v"
             version ".tar.gz"))
       ;; The upstream archive is named after the bare tag, so give the
       ;; downloaded file a name that includes the package name.
       (file-name (string-append name "-" version ".tar.gz"))
       (sha256
        (base32 "1k48as5kjkar4yj3dwxyll8ykj4k723ib5a6mnw1g86q3zi0zdl3"))))
    (build-system gnu-build-system)
    (arguments
     '(#:tests? #f                      ;no "check" target
       ;; With the 'configure phase deleted below, the compiler and the
       ;; installation prefix are passed directly to 'make'.
       #:make-flags (list "CC=gcc"
                          (string-append "prefix=" (assoc-ref %outputs "out")))
       #:phases
       (modify-phases %standard-phases
         (delete 'configure))))
    (home-page "http://julialang.org/utf8proc/")
    (synopsis "C library for processing UTF-8 Unicode data")
    ;; Keep the Unicode version below in sync with the packaged release:
    ;; the 1.3 series tracks Unicode 8.0.
    (description "utf8proc is a small C library that provides Unicode
normalization, case-folding, and other operations for data in the UTF-8
encoding, supporting Unicode version 8.0.")
    (license license:expat)))
|
2015-04-14 16:35:30 +02:00
|
|
|
|
|
|
|
|
|
;; libgtextutils: text utilities library used by the fastx toolkit.  The
;; build system is regenerated with 'autoreconf' right after unpacking.
(define-public libgtextutils
  (package
    (name "libgtextutils")
    (version "0.7")
    (source
     (origin
       (method url-fetch)
       (uri (string-append
             "https://github.com/agordon/libgtextutils/releases/download/"
             version "/libgtextutils-" version ".tar.gz"))
       (sha256
        (base32 "0jiybkb2z58wa2msvllnphr4js2hvjvh988pavb3mzkgr6ihwbkr"))))
    (build-system gnu-build-system)
    (arguments
     '(#:phases
       (modify-phases %standard-phases
         (add-after 'unpack 'autoreconf
           ;; The phase succeeds only when 'autoreconf' exits with status 0.
           (lambda _ (zero? (system* "autoreconf" "-vif")))))))
    ;; Tools required by the 'autoreconf phase above.
    (native-inputs
     `(("autoconf" ,autoconf)
       ("automake" ,automake)
       ("libtool" ,libtool)))
    (home-page "https://github.com/agordon/libgtextutils")
    (synopsis "Gordon's text utils library")
    (description
     "libgtextutils is a text utilities library used by the fastx toolkit from
the Hannon Lab.")
    (license license:agpl3+)))
|
2015-09-29 14:10:33 +02:00
|
|
|
|
|
|
|
|
|
;; CityHash: non-cryptographic string hash functions, built from a Git
;; snapshot identified by COMMIT; REVISION is folded into the version string.
(define-public cityhash
  (let ((commit "8af9b8c")
        (revision "1"))
    (package
      (name "cityhash")
      (version (string-append "1.1." revision "." commit))
      (source (origin
                (method git-fetch)
                (uri (git-reference
                      (url "https://github.com/google/cityhash.git")
                      (commit commit)))
                ;; 'git-fetch' yields a directory checkout, not a tarball, so
                ;; use the same "-checkout" suffix as other Git-based origins
                ;; in this module rather than ".tar.gz".
                (file-name (string-append name "-" version "-checkout"))
                (sha256
                 (base32
                  "0n6skf5dv8yfl1ckax8dqhvsbslkwc9158zf2ims0xqdvzsahbi6"))))
      (build-system gnu-build-system)
      (home-page "https://github.com/google/cityhash")
      (synopsis "C++ hash functions for strings")
      (description
       "CityHash provides hash functions for strings. The functions mix the
input bits thoroughly but are not suitable for cryptography.")
      (license license:expat))))
|
2015-12-10 16:15:04 +01:00
|
|
|
|
|
|
|
|
|
;; libconfig: C/C++ library for reading and writing structured
;; configuration files.
(define-public libconfig
  (package
    (name "libconfig")
    (version "1.5")
    (source
     (origin
       (method url-fetch)
       (uri (string-append
             "http://www.hyperrealm.com/libconfig/libconfig-"
             version ".tar.gz"))
       (sha256
        (base32 "1xh3hzk63v4y8815lc5209m3s6ms2cpgw4h5hg462i4f1lwsl7g3"))))
    (build-system gnu-build-system)
    (home-page "http://www.hyperrealm.com/libconfig/")
    (synopsis "C/C++ configuration file library")
    (description
     "Libconfig is a simple library for manipulating structured configuration
files. This file format is more compact and more readable than XML. And
unlike XML, it is type-aware, so it is not necessary to do string parsing in
application code.")
    (license license:lgpl2.1+)))
|
2016-01-03 06:41:49 +01:00
|
|
|
|
|
|
|
|
|
;; pfff: probabilistic fast file fingerprinting tool, built with CMake.
(define-public pfff
  (package
    (name "pfff")
    (version "1.0")
    (source
     (origin
       (method url-fetch)
       (uri (string-append
             "https://github.com/pfff/pfff/archive/v" version ".tar.gz"))
       ;; The upstream archive is named after the bare tag, so give the
       ;; downloaded file a name that includes the package name.
       (file-name (string-append name "-" version ".tar.gz"))
       (sha256
        (base32 "00m553aa277iarxj6dalmklyb64r7ias49bfwzbacsfg8h3kar8m"))))
    (build-system cmake-build-system)
    (home-page "http://biit.cs.ut.ee/pfff/")
    (synopsis "Probabilistic fast file fingerprinting tool")
    (description
     "pfff is a tool for calculating a compact digital fingerprint of a file
by sampling randomly from the file instead of reading it in full.
Consequently, the computation has a flat performance characteristic,
correlated with data variation rather than file size. pfff can be as reliable
as existing hashing techniques, with provably negligible risk of collisions.")
    (license license:bsd-3)))
|