2016-05-24 18:53:18 +02:00
|
|
|
;;; GNU Guix --- Functional package management for GNU
|
|
|
|
;;; Copyright © 2016 David Thompson <davet@gnu.org>
|
2019-02-25 13:58:53 +01:00
|
|
|
;;; Copyright © 2016, 2019 Marius Bakke <mbakke@fastmail.com>
|
2017-01-02 03:20:08 +01:00
|
|
|
;;; Copyright © 2017 Leo Famulari <leo@famulari.name>
|
2018-01-18 00:56:39 +01:00
|
|
|
;;; Copyright © 2018 Tobias Geerinckx-Rice <me@tobias.gr>
|
2019-02-25 14:35:14 +01:00
|
|
|
;;; Copyright © 2016 Kei Kebreau <kkebreau@posteo.net>
|
2016-05-24 18:53:18 +02:00
|
|
|
;;;
|
|
|
|
;;; This file is part of GNU Guix.
|
|
|
|
;;;
|
|
|
|
;;; GNU Guix is free software; you can redistribute it and/or modify it
|
|
|
|
;;; under the terms of the GNU General Public License as published by
|
|
|
|
;;; the Free Software Foundation; either version 3 of the License, or (at
|
|
|
|
;;; your option) any later version.
|
|
|
|
;;;
|
|
|
|
;;; GNU Guix is distributed in the hope that it will be useful, but
|
|
|
|
;;; WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
;;; GNU General Public License for more details.
|
|
|
|
;;;
|
|
|
|
;;; You should have received a copy of the GNU General Public License
|
|
|
|
;;; along with GNU Guix. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
|
|
|
|
(define-module (gnu packages speech)
|
|
|
|
#:use-module ((guix licenses) #:prefix license:)
|
|
|
|
#:use-module (guix packages)
|
|
|
|
#:use-module (guix download)
|
2019-02-25 14:35:14 +01:00
|
|
|
#:use-module (guix utils)
|
2016-05-24 18:53:18 +02:00
|
|
|
#:use-module (guix build-system gnu)
|
|
|
|
#:use-module (gnu packages)
|
2017-04-09 11:42:47 +02:00
|
|
|
#:use-module (gnu packages audio)
|
2016-10-13 00:26:25 +02:00
|
|
|
#:use-module (gnu packages autotools)
|
2019-02-25 14:35:14 +01:00
|
|
|
#:use-module (gnu packages compression)
|
2016-10-13 00:26:25 +02:00
|
|
|
#:use-module (gnu packages gcc)
|
|
|
|
#:use-module (gnu packages glib)
|
2019-02-25 13:58:53 +01:00
|
|
|
#:use-module (gnu packages linux)
|
2016-10-13 00:26:25 +02:00
|
|
|
#:use-module (gnu packages pkg-config)
|
|
|
|
#:use-module (gnu packages pulseaudio)
|
2017-04-09 11:42:47 +02:00
|
|
|
#:use-module (gnu packages python)
|
2016-10-13 00:26:25 +02:00
|
|
|
#:use-module (gnu packages textutils))
|
2016-05-24 18:53:18 +02:00
|
|
|
|
2019-02-25 14:35:14 +01:00
|
|
|
(define-public espeak
|
|
|
|
(package
|
|
|
|
(name "espeak")
|
|
|
|
(version "1.48.04")
|
|
|
|
(source (origin
|
|
|
|
(method url-fetch)
|
|
|
|
(uri (string-append "mirror://sourceforge/espeak/espeak/"
|
|
|
|
"espeak-" (version-major+minor version)
|
|
|
|
"/espeak-" version "-source.zip"))
|
|
|
|
(sha256
|
|
|
|
(base32
|
|
|
|
"0n86gwh9pw0jqqpdz7mxggllfr8k0r7pc67ayy7w5z6z79kig6mz"))
|
|
|
|
(modules '((guix build utils)))
|
|
|
|
(snippet
|
|
|
|
;; remove prebuilt binaries
|
|
|
|
'(begin
|
|
|
|
(delete-file-recursively "linux_32bit")
|
|
|
|
#t))))
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
(arguments
|
|
|
|
`(#:make-flags (list (string-append "PREFIX=" (assoc-ref %outputs "out"))
|
|
|
|
(string-append "DATADIR="
|
|
|
|
(assoc-ref %outputs "out")
|
|
|
|
"/share/espeak-data")
|
|
|
|
(string-append "LDFLAGS=-Wl,-rpath="
|
|
|
|
(assoc-ref %outputs "out")
|
|
|
|
"/lib")
|
|
|
|
"AUDIO=pulseaudio")
|
|
|
|
#:tests? #f ; no check target
|
|
|
|
#:phases
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
(replace 'configure
|
|
|
|
(lambda _
|
|
|
|
(chdir "src")
|
|
|
|
;; We use version 19 of the PortAudio library, so we must copy the
|
|
|
|
;; corresponding file to be sure that espeak compiles correctly.
|
|
|
|
(copy-file "portaudio19.h" "portaudio.h")
|
|
|
|
(substitute* "Makefile"
|
|
|
|
(("/bin/ln") "ln"))
|
|
|
|
#t)))))
|
|
|
|
(inputs
|
|
|
|
`(("portaudio" ,portaudio)
|
|
|
|
("pulseaudio" ,pulseaudio)))
|
|
|
|
(native-inputs `(("unzip" ,unzip)))
|
|
|
|
(home-page "http://espeak.sourceforge.net/")
|
|
|
|
(synopsis "Software speech synthesizer")
|
|
|
|
(description "eSpeak is a software speech synthesizer for English and
|
|
|
|
other languages. eSpeak uses a \"formant synthesis\" method. This allows many
|
|
|
|
languages to be provided in a small size. The speech is clear, and can be used
|
|
|
|
at high speeds, but is not as natural or smooth as larger synthesizers which are
|
|
|
|
based on human speech recordings.")
|
|
|
|
(license license:gpl3+)))
|
|
|
|
|
2019-02-25 13:58:53 +01:00
|
|
|
(define-public espeak-ng
|
|
|
|
(package
|
|
|
|
(name "espeak-ng")
|
|
|
|
(version "1.49.2")
|
|
|
|
(home-page "https://github.com/espeak-ng/espeak-ng")
|
|
|
|
(source (origin
|
|
|
|
(method url-fetch)
|
|
|
|
(uri (string-append home-page "/releases/download/" version
|
|
|
|
"/espeak-ng-" version ".tar.gz"))
|
|
|
|
(sha256
|
|
|
|
(base32 "1d10x9rbvqi2zwcz65fxh04k0x0scnk7732l37laz6xra1ldhzng"))))
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
(arguments
|
|
|
|
`(#:configure-flags '("--disable-static")
|
|
|
|
;; Building in parallel triggers a race condition in 1.49.2.
|
|
|
|
#:parallel-build? #f
|
|
|
|
;; XXX: Some tests require an audio device.
|
|
|
|
#:tests? #f))
|
|
|
|
(inputs
|
|
|
|
`(("libcap" ,libcap)
|
|
|
|
("pcaudiolib" ,pcaudiolib)))
|
|
|
|
(synopsis "Software speech synthesizer")
|
|
|
|
(description
|
|
|
|
"eSpeak NG is a software speech synthesizer for more than 100 languages.
|
|
|
|
It is based on the eSpeak engine and supports spectral and Klatt formant
|
|
|
|
synthesis, and the ability to use MBROLA voices.")
|
|
|
|
(license license:gpl3+)))
|
|
|
|
|
2016-05-24 18:53:18 +02:00
|
|
|
(define-public mitlm
|
|
|
|
(package
|
|
|
|
(name "mitlm")
|
2018-01-18 00:56:39 +01:00
|
|
|
(version "0.4.2")
|
2016-05-24 18:53:18 +02:00
|
|
|
(source (origin
|
|
|
|
(method url-fetch)
|
2018-01-18 00:56:39 +01:00
|
|
|
(uri (string-append "https://github.com/mitlm/mitlm/releases/"
|
|
|
|
"download/v" version "/"
|
|
|
|
name "-" version ".tar.xz"))
|
2016-05-24 18:53:18 +02:00
|
|
|
(sha256
|
|
|
|
(base32
|
2018-01-18 00:56:39 +01:00
|
|
|
"09fv4fcpmw9g1j0zml0k5kk1lgjw2spr8gn51llbkaaph6v8d62a"))))
|
2016-05-24 18:53:18 +02:00
|
|
|
(build-system gnu-build-system)
|
|
|
|
(native-inputs
|
|
|
|
`(("gfortran" ,gfortran)))
|
|
|
|
(synopsis "The MIT Language Modeling toolkit")
|
|
|
|
(description "The MIT Language Modeling (MITLM) toolkit is a set of
|
|
|
|
tools designed for the efficient estimation of statistical n-gram language
|
|
|
|
models involving iterative parameter estimation. It achieves much of its
|
|
|
|
efficiency through the use of a compact vector representation of n-grams.")
|
|
|
|
(home-page "https://github.com/mitlm/mitlm")
|
|
|
|
(license license:expat)))
|
2016-10-13 00:26:25 +02:00
|
|
|
|
|
|
|
(define-public speech-dispatcher
|
|
|
|
(package
|
|
|
|
(name "speech-dispatcher")
|
2019-05-11 17:58:22 +02:00
|
|
|
(version "0.9.1")
|
2016-10-13 00:26:25 +02:00
|
|
|
(source (origin
|
|
|
|
(method url-fetch)
|
2019-02-25 13:28:35 +01:00
|
|
|
(uri (string-append "https://github.com/brailcom/speechd/releases"
|
|
|
|
"/download/" version "/speech-dispatcher-"
|
2016-10-13 00:26:25 +02:00
|
|
|
version ".tar.gz"))
|
|
|
|
(sha256
|
|
|
|
(base32
|
2019-05-11 17:58:22 +02:00
|
|
|
"16bg52hnkrsrs7kgbzanb34b9zb6fqxwj0a9bmsxmj1skkil1h1p"))))
|
2016-10-13 00:26:25 +02:00
|
|
|
(build-system gnu-build-system)
|
2019-02-25 13:27:58 +01:00
|
|
|
(arguments
|
2019-02-25 13:28:35 +01:00
|
|
|
`(#:configure-flags '("--disable-static"
|
2019-05-11 17:58:22 +02:00
|
|
|
|
2019-02-25 13:28:35 +01:00
|
|
|
;; Disable support for proprietary TTS engines.
|
2019-05-11 17:58:22 +02:00
|
|
|
"--with-ibmtts=no"
|
2019-02-25 13:28:35 +01:00
|
|
|
"--with-kali=no" "--with-baratinoo=no")))
|
2016-10-13 00:26:25 +02:00
|
|
|
(native-inputs
|
|
|
|
`(("intltool" ,intltool)
|
|
|
|
("pkg-config" ,pkg-config)))
|
|
|
|
(inputs
|
|
|
|
`(("dotconf" ,dotconf)
|
2019-02-25 14:03:06 +01:00
|
|
|
("espeak" ,espeak-ng)
|
2016-10-13 00:26:25 +02:00
|
|
|
("glib" ,glib)
|
|
|
|
("libltdl" ,libltdl)
|
2017-04-09 11:42:47 +02:00
|
|
|
("libsndfile" ,libsndfile)
|
|
|
|
("pulseaudio" ,pulseaudio)
|
|
|
|
("python" ,python)))
|
2016-10-13 00:26:25 +02:00
|
|
|
(synopsis "Common interface to speech synthesizers")
|
|
|
|
(description "The Speech Dispatcher project provides a high-level
|
|
|
|
device independent layer for access to speech synthesis through a simple,
|
|
|
|
stable and well documented interface.")
|
|
|
|
(home-page "https://devel.freebsoft.org/speechd")
|
|
|
|
;; The software is distributed under GPL2+, but includes a number
|
2019-05-11 17:58:22 +02:00
|
|
|
;; of files covered by other licenses. Note: in practice, this
|
|
|
|
;; is linked against dotconf, which is LGPL 2.1 only.
|
2016-10-13 00:26:25 +02:00
|
|
|
(license (list license:gpl2+
|
|
|
|
license:fdl1.2+ ; Most files in doc/ are dual gpl2+/fdl1.2+.
|
|
|
|
license:lgpl2.1+
|
|
|
|
(license:non-copyleft
|
|
|
|
;; festival_client.{c,h} carries an expat-style license.
|
|
|
|
"See src/modules/festival_client.c in the distribution.")
|
|
|
|
license:gpl3+)))) ; doc/texinfo.tex -- with TeX exception.
|
2017-01-02 03:20:08 +01:00
|
|
|
|
|
|
|
(define-public sonic
|
|
|
|
(package
|
|
|
|
(name "sonic")
|
|
|
|
(version "0.2.0")
|
|
|
|
(source (origin
|
|
|
|
(method url-fetch)
|
|
|
|
(uri (string-append "https://github.com/waywardgeek/sonic/archive/"
|
|
|
|
"release-" version ".tar.gz"))
|
|
|
|
(file-name (string-append name "-" version ".tar.gz"))
|
|
|
|
(sha256
|
|
|
|
(base32
|
|
|
|
"11a0q9wkgbb9ymf52v7dvybfhj8hprgr67zs1xcng143fvjpr0n7"))))
|
|
|
|
(build-system gnu-build-system)
|
|
|
|
(arguments
|
|
|
|
`(#:tests? #f ; No test suite.
|
|
|
|
#:make-flags
|
|
|
|
(list (string-append "DESTDIR=" (assoc-ref %outputs "out")))
|
|
|
|
#:phases
|
|
|
|
(modify-phases %standard-phases
|
|
|
|
(delete 'configure)))) ; No ./configure script.
|
|
|
|
(synopsis "Speed up or slow down speech")
|
|
|
|
(description "Sonic implements a simple algorithm for speeding up or slowing
|
|
|
|
down speech. However, it's optimized for speed ups of over 2X, unlike previous
|
|
|
|
algorithms for changing speech rate. Sonic is a C library designed to be easily
|
|
|
|
integrated into streaming voice applications such as text-to-speech (TTS) back
|
|
|
|
ends.
|
|
|
|
|
|
|
|
The primary motivation behind Sonic is to enable the blind and visually impaired
|
|
|
|
to improve their productivity with speech engines, like eSpeak. Sonic can also
|
|
|
|
be used by the sighted.")
|
|
|
|
(home-page "https://github.com/waywardgeek/sonic")
|
|
|
|
(license license:asl2.0)))
|