460 lines
20 KiB
Scheme
460 lines
20 KiB
Scheme
;;; GNU Guix --- Functional package management for GNU
|
|
;;; Copyright © 2016 David Thompson <davet@gnu.org>
|
|
;;; Copyright © 2016, 2019 Marius Bakke <mbakke@fastmail.com>
|
|
;;; Copyright © 2017 Leo Famulari <leo@famulari.name>
|
|
;;; Copyright © 2018 Tobias Geerinckx-Rice <me@tobias.gr>
|
|
;;; Copyright © 2016 Kei Kebreau <kkebreau@posteo.net>
|
|
;;; Copyright © 2019 Ricardo Wurmus <rekado@elephly.net>
|
|
;;;
|
|
;;; This file is part of GNU Guix.
|
|
;;;
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
;;; under the terms of the GNU General Public License as published by
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
;;; your option) any later version.
|
|
;;;
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
;;; GNU General Public License for more details.
|
|
;;;
|
|
;;; You should have received a copy of the GNU General Public License
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
(define-module (gnu packages speech)
|
|
#:use-module ((guix licenses) #:prefix license:)
|
|
#:use-module (guix packages)
|
|
#:use-module (guix download)
|
|
#:use-module (guix utils)
|
|
#:use-module (guix build-system gnu)
|
|
#:use-module (gnu packages)
|
|
#:use-module (gnu packages audio)
|
|
#:use-module (gnu packages autotools)
|
|
#:use-module (gnu packages compression)
|
|
#:use-module (gnu packages emacs)
|
|
#:use-module (gnu packages gcc)
|
|
#:use-module (gnu packages glib)
|
|
#:use-module (gnu packages linux)
|
|
#:use-module (gnu packages ncurses)
|
|
#:use-module (gnu packages pkg-config)
|
|
#:use-module (gnu packages pulseaudio)
|
|
#:use-module (gnu packages python)
|
|
#:use-module (gnu packages texinfo)
|
|
#:use-module (gnu packages textutils))
|
|
|
|
(define-public espeak
|
|
(package
|
|
(name "espeak")
|
|
(version "1.48.04")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "mirror://sourceforge/espeak/espeak/"
|
|
"espeak-" (version-major+minor version)
|
|
"/espeak-" version "-source.zip"))
|
|
(sha256
|
|
(base32
|
|
"0n86gwh9pw0jqqpdz7mxggllfr8k0r7pc67ayy7w5z6z79kig6mz"))
|
|
(modules '((guix build utils)))
|
|
(snippet
|
|
;; remove prebuilt binaries
|
|
'(begin
|
|
(delete-file-recursively "linux_32bit")
|
|
#t))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:make-flags (list (string-append "PREFIX=" (assoc-ref %outputs "out"))
|
|
(string-append "DATADIR="
|
|
(assoc-ref %outputs "out")
|
|
"/share/espeak-data")
|
|
(string-append "LDFLAGS=-Wl,-rpath="
|
|
(assoc-ref %outputs "out")
|
|
"/lib")
|
|
"AUDIO=pulseaudio")
|
|
#:tests? #f ; no check target
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(replace 'configure
|
|
(lambda _
|
|
(chdir "src")
|
|
;; We use version 19 of the PortAudio library, so we must copy the
|
|
;; corresponding file to be sure that espeak compiles correctly.
|
|
(copy-file "portaudio19.h" "portaudio.h")
|
|
(substitute* "Makefile"
|
|
(("/bin/ln") "ln"))
|
|
#t)))))
|
|
(inputs
|
|
`(("portaudio" ,portaudio)
|
|
("pulseaudio" ,pulseaudio)))
|
|
(native-inputs `(("unzip" ,unzip)))
|
|
(home-page "http://espeak.sourceforge.net/")
|
|
(synopsis "Software speech synthesizer")
|
|
(description "eSpeak is a software speech synthesizer for English and
|
|
other languages. eSpeak uses a \"formant synthesis\" method. This allows many
|
|
languages to be provided in a small size. The speech is clear, and can be used
|
|
at high speeds, but is not as natural or smooth as larger synthesizers which are
|
|
based on human speech recordings.")
|
|
(license license:gpl3+)))
|
|
|
|
(define-public espeak-ng
|
|
(package
|
|
(name "espeak-ng")
|
|
(version "1.49.2")
|
|
(home-page "https://github.com/espeak-ng/espeak-ng")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append home-page "/releases/download/" version
|
|
"/espeak-ng-" version ".tar.gz"))
|
|
(sha256
|
|
(base32 "1d10x9rbvqi2zwcz65fxh04k0x0scnk7732l37laz6xra1ldhzng"))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:configure-flags '("--disable-static")
|
|
;; Building in parallel triggers a race condition in 1.49.2.
|
|
#:parallel-build? #f
|
|
;; XXX: Some tests require an audio device.
|
|
#:tests? #f))
|
|
(inputs
|
|
`(("libcap" ,libcap)
|
|
("pcaudiolib" ,pcaudiolib)))
|
|
(synopsis "Software speech synthesizer")
|
|
(description
|
|
"eSpeak NG is a software speech synthesizer for more than 100 languages.
|
|
It is based on the eSpeak engine and supports spectral and Klatt formant
|
|
synthesis, and the ability to use MBROLA voices.")
|
|
(license license:gpl3+)))
|
|
|
|
(define-public mitlm
|
|
(package
|
|
(name "mitlm")
|
|
(version "0.4.2")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://github.com/mitlm/mitlm/releases/"
|
|
"download/v" version "/"
|
|
name "-" version ".tar.xz"))
|
|
(sha256
|
|
(base32
|
|
"09fv4fcpmw9g1j0zml0k5kk1lgjw2spr8gn51llbkaaph6v8d62a"))))
|
|
(build-system gnu-build-system)
|
|
(native-inputs
|
|
`(("gfortran" ,gfortran)))
|
|
(synopsis "The MIT Language Modeling toolkit")
|
|
(description "The MIT Language Modeling (MITLM) toolkit is a set of
|
|
tools designed for the efficient estimation of statistical n-gram language
|
|
models involving iterative parameter estimation. It achieves much of its
|
|
efficiency through the use of a compact vector representation of n-grams.")
|
|
(home-page "https://github.com/mitlm/mitlm")
|
|
(license license:expat)))
|
|
|
|
(define-public speech-dispatcher
|
|
(package
|
|
(name "speech-dispatcher")
|
|
(version "0.9.1")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://github.com/brailcom/speechd/releases"
|
|
"/download/" version "/speech-dispatcher-"
|
|
version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"16bg52hnkrsrs7kgbzanb34b9zb6fqxwj0a9bmsxmj1skkil1h1p"))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:configure-flags '("--disable-static"
|
|
|
|
;; Disable support for proprietary TTS engines.
|
|
"--with-ibmtts=no"
|
|
"--with-kali=no" "--with-baratinoo=no")))
|
|
(native-inputs
|
|
`(("intltool" ,intltool)
|
|
("pkg-config" ,pkg-config)))
|
|
(inputs
|
|
`(("dotconf" ,dotconf)
|
|
("espeak" ,espeak-ng)
|
|
("glib" ,glib)
|
|
("libltdl" ,libltdl)
|
|
("libsndfile" ,libsndfile)
|
|
("pulseaudio" ,pulseaudio)
|
|
("python" ,python)))
|
|
(synopsis "Common interface to speech synthesizers")
|
|
(description "The Speech Dispatcher project provides a high-level
|
|
device independent layer for access to speech synthesis through a simple,
|
|
stable and well documented interface.")
|
|
(home-page "https://devel.freebsoft.org/speechd")
|
|
;; The software is distributed under GPL2+, but includes a number
|
|
;; of files covered by other licenses. Note: in practice, this
|
|
;; is linked against dotconf, which is LGPL 2.1 only.
|
|
(license (list license:gpl2+
|
|
license:fdl1.2+ ; Most files in doc/ are dual gpl2+/fdl1.2+.
|
|
license:lgpl2.1+
|
|
(license:non-copyleft
|
|
;; festival_client.{c,h} carries an expat-style license.
|
|
"See src/modules/festival_client.c in the distribution.")
|
|
license:gpl3+)))) ; doc/texinfo.tex -- with TeX exception.
|
|
|
|
(define-public sonic
|
|
(package
|
|
(name "sonic")
|
|
(version "0.2.0")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "https://github.com/waywardgeek/sonic/archive/"
|
|
"release-" version ".tar.gz"))
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"11a0q9wkgbb9ymf52v7dvybfhj8hprgr67zs1xcng143fvjpr0n7"))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:tests? #f ; No test suite.
|
|
#:make-flags
|
|
(list (string-append "DESTDIR=" (assoc-ref %outputs "out")))
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(delete 'configure)))) ; No ./configure script.
|
|
(synopsis "Speed up or slow down speech")
|
|
(description "Sonic implements a simple algorithm for speeding up or slowing
|
|
down speech. However, it's optimized for speed ups of over 2X, unlike previous
|
|
algorithms for changing speech rate. Sonic is a C library designed to be easily
|
|
integrated into streaming voice applications such as text-to-speech (TTS) back
|
|
ends.
|
|
|
|
The primary motivation behind Sonic is to enable the blind and visually impaired
|
|
to improve their productivity with speech engines, like eSpeak. Sonic can also
|
|
be used by the sighted.")
|
|
(home-page "https://github.com/waywardgeek/sonic")
|
|
(license license:asl2.0)))
|
|
|
|
(define-public festival
|
|
(package
|
|
(name "festival")
|
|
(version "2.5.0")
|
|
(source (origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://festvox.org/packed/festival/"
|
|
(version-major+minor version)
|
|
"/festival-" version "-release.tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1d5415nckiv19adxisxfm1l1xxfyw88g87ckkmcr0lhjdd10g42c"))))
|
|
(build-system gnu-build-system)
|
|
(arguments
|
|
`(#:tests? #f ; there is no test target
|
|
#:make-flags
|
|
(list (string-append "RM="
|
|
(assoc-ref %build-inputs "coreutils")
|
|
"/bin/rm")
|
|
(string-append "ECHO_N="
|
|
(assoc-ref %build-inputs "coreutils")
|
|
"/bin/printf \"%s\""))
|
|
#:parallel-build? #f ; not supported
|
|
#:modules ((guix build gnu-build-system)
|
|
(guix build utils)
|
|
(guix build emacs-utils))
|
|
#:imported-modules (,@%gnu-build-system-modules
|
|
(guix build emacs-utils))
|
|
#:phases
|
|
(modify-phases %standard-phases
|
|
(add-after 'unpack 'unpack-and-patch-speech-tools
|
|
(lambda* (#:key inputs #:allow-other-keys)
|
|
(invoke "tar" "-C" ".."
|
|
"-xf" (assoc-ref inputs "speech-tools"))
|
|
(with-directory-excursion "../speech_tools"
|
|
(substitute* '("config/rules/modules.mak"
|
|
"config/rules/test_make_rules.mak"
|
|
"config/make_system.mak")
|
|
(("/bin/sh") (which "sh"))))
|
|
#t))
|
|
(add-after 'unpack 'patch-/bin/sh
|
|
(lambda _
|
|
(substitute* '("config/test_make_rules"
|
|
"config/make_system.mak")
|
|
(("/bin/sh") (which "sh")))
|
|
#t))
|
|
(add-before 'build 'build-speech-tools
|
|
(lambda* (#:key configure-flags make-flags #:allow-other-keys)
|
|
(with-directory-excursion "../speech_tools"
|
|
(apply invoke "sh" "configure"
|
|
(string-append "CONFIG_SHELL=" (which "sh"))
|
|
(string-append "SHELL=" (which "sh"))
|
|
configure-flags)
|
|
(apply invoke "make" make-flags))))
|
|
(add-after 'build 'build-documentation
|
|
(lambda _
|
|
(with-directory-excursion "doc"
|
|
(invoke "make" "festival.info"))))
|
|
(add-after 'unpack 'set-installation-directories
|
|
(lambda* (#:key outputs #:allow-other-keys)
|
|
(let ((out (assoc-ref outputs "out")))
|
|
(substitute* "config/project.mak"
|
|
(("^FTLIBDIR.*")
|
|
(string-append "FTLIBDIR=" out "/share/festival/lib")))
|
|
(substitute* "config/systems/default.mak"
|
|
(("^INSTALL_PREFIX.*")
|
|
(string-append "INSTALL_PREFIX=" out)))
|
|
#t)))
|
|
(add-after 'install 'actually-install
|
|
(lambda* (#:key inputs outputs #:allow-other-keys)
|
|
(let ((out (assoc-ref outputs "out")))
|
|
;; Install Speech Tools first
|
|
(with-directory-excursion "../speech_tools"
|
|
;; Target directories
|
|
(for-each (lambda (dir)
|
|
(mkdir-p (string-append out dir)))
|
|
'("/bin"
|
|
"/lib"
|
|
"/include/speech_tools/"
|
|
"/include/speech_tools/instantiate"
|
|
"/include/speech_tools/ling_class"
|
|
"/include/speech_tools/rxp"
|
|
"/include/speech_tools/sigpr"
|
|
"/include/speech_tools/unix"))
|
|
;; Install binaries
|
|
(for-each (lambda (file)
|
|
(install-file file (string-append out "/bin")))
|
|
(find-files "bin" ".*"))
|
|
(for-each (lambda (file)
|
|
(delete-file (string-append out "/bin/" file)))
|
|
'("est_gdb" "est_examples" "est_program"))
|
|
;; Install libraries
|
|
(for-each (lambda (file)
|
|
(install-file file (string-append out "/lib")))
|
|
(find-files "lib" "lib.*\\.so.*"))
|
|
|
|
;; Install headers
|
|
(for-each
|
|
(lambda (dir)
|
|
(for-each
|
|
(lambda (header)
|
|
(install-file header
|
|
(string-append out "/include/speech_tools/" dir)))
|
|
(find-files (string-append "include/" dir)
|
|
"\\.h$")))
|
|
'("." "instantiate" "ling_class" "rxp" "sigpr" "unix")))
|
|
|
|
;; Unpack files that will be installed together with the
|
|
;; Festival libraries.
|
|
(invoke "tar" "--strip-components=1"
|
|
"-xvf" (assoc-ref inputs "festvox-cmu"))
|
|
(invoke "tar" "--strip-components=1"
|
|
"-xvf" (assoc-ref inputs "festvox-poslex"))
|
|
(invoke "tar" "--strip-components=1"
|
|
"-xvf" (assoc-ref inputs "default-voice"))
|
|
|
|
;; Install Festival
|
|
(let ((bin (string-append out "/bin"))
|
|
(incdir (string-append out "/include/festival"))
|
|
(share (string-append out "/share/festival"))
|
|
(info (string-append out "/share/info")))
|
|
(for-each (lambda (executable)
|
|
(install-file executable bin))
|
|
'("src/main/festival"
|
|
"src/main/festival_client"
|
|
"examples/benchmark"))
|
|
(let ((scripts '("examples/dumpfeats"
|
|
"examples/durmeanstd"
|
|
"examples/latest"
|
|
"examples/make_utts"
|
|
"examples/powmeanstd"
|
|
"examples/run-festival-script"
|
|
"examples/saytime"
|
|
"examples/scfg_parse_text"
|
|
"examples/text2pos"
|
|
"examples/text2wave")))
|
|
(substitute* scripts
|
|
(("exec /tmp/guix-build.*/bin/festival")
|
|
(string-append "exec " bin "/festival")))
|
|
(for-each (lambda (script)
|
|
(install-file script bin))
|
|
scripts))
|
|
|
|
;; Documentation
|
|
(for-each (lambda (file)
|
|
(install-file file info))
|
|
(find-files "doc/info/" "festival.info.*"))
|
|
|
|
;; Headers
|
|
(mkdir-p incdir)
|
|
(for-each (lambda (header)
|
|
(install-file header
|
|
(string-append incdir "/"
|
|
(dirname header))))
|
|
(find-files "src/include" "\\.h$"))
|
|
|
|
;; Data
|
|
(mkdir-p share)
|
|
(for-each (lambda (file)
|
|
(install-file file
|
|
(string-append share "/"
|
|
(dirname file))))
|
|
(find-files "lib" ".*"))
|
|
(for-each delete-file
|
|
(append (find-files share "Makefile")
|
|
(find-files bin "Makefile")))))
|
|
#t))
|
|
(add-after 'actually-install 'install-emacs-mode
|
|
(lambda* (#:key outputs #:allow-other-keys)
|
|
(let ((emacs-dir (string-append (assoc-ref outputs "out")
|
|
"/share/emacs/site-lisp")))
|
|
(install-file "lib/festival.el" emacs-dir)
|
|
(emacs-generate-autoloads ,name emacs-dir)
|
|
#t)))
|
|
;; Rebuild the very old configure script that is confused by extra
|
|
;; arguments.
|
|
(add-before 'configure 'bootstrap
|
|
(lambda _ (invoke "autoreconf" "-vif"))))))
|
|
(inputs
|
|
`(("ncurses" ,ncurses)))
|
|
(native-inputs
|
|
`(("autoconf" ,autoconf)
|
|
("automake" ,automake)
|
|
("texinfo" ,texinfo)
|
|
("emacs" ,emacs-minimal)
|
|
("festvox-cmu"
|
|
,(origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://festvox.org/packed/festival/"
|
|
(version-major+minor version)
|
|
"/festlex_CMU.tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"01vwidqhhg2zifvk1gby91mckg1z2pv2mj6lihvdaifakf8k1561"))))
|
|
("festvox-poslex"
|
|
,(origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://festvox.org/packed/festival/"
|
|
(version-major+minor version)
|
|
"/festlex_POSLEX.tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"18wywilxaqwy63lc47p5g5529mpxhslibh1bjij0snxx5mjf7ip7"))))
|
|
("default-voice"
|
|
,(origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://festvox.org/packed/festival/"
|
|
(version-major+minor version)
|
|
"/voices/festvox_kallpc16k.tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"136hmsyiwnlg2qwa508dy0imf19mzrb5r3dmb2kg8kcyxnslm740"))))
|
|
("speech-tools"
|
|
,(origin
|
|
(method url-fetch)
|
|
(uri (string-append "http://festvox.org/packed/festival/"
|
|
(version-major+minor version)
|
|
"/speech_tools-" version "-release.tar.gz"))
|
|
(sha256
|
|
(base32
|
|
"1k2xh13miyv48gh06rgsq2vj25xwj7z6vwq9ilsn8i7ig3nrgzg4"))))))
|
|
(home-page "http://www.cstr.ed.ac.uk/projects/festival/")
|
|
(synopsis "Speech synthesis system")
|
|
(description "Festival offers a general framework for building speech
|
|
synthesis systems as well as including examples of various modules. As a
|
|
whole it offers full text to speech through a number APIs: from shell level,
|
|
though a Scheme command interpreter, as a C++ library, from Java, and an Emacs
|
|
interface. Festival is multi-lingual though English is the most advanced.
|
|
The system is written in C++ and uses the Edinburgh Speech Tools Library for
|
|
low level architecture and has a Scheme (SIOD) based command interpreter for
|
|
control.")
|
|
(license (license:non-copyleft "file://COPYING"))))
|