flightgear/3rdparty/flite_hts_engine/bin/flite_hts_engine.c
2022-10-20 20:29:11 +08:00

221 lines
9.2 KiB
C

/* ----------------------------------------------------------------- */
/* The English TTS System "Flite+hts_engine" */
/* developed by HTS Working Group */
/* http://hts-engine.sourceforge.net/ */
/* ----------------------------------------------------------------- */
/* */
/* Copyright (c) 2005-2013 Nagoya Institute of Technology */
/* Department of Computer Science */
/* */
/* 2005-2008 Tokyo Institute of Technology */
/* Interdisciplinary Graduate School of */
/* Science and Engineering */
/* */
/* All rights reserved. */
/* */
/* Redistribution and use in source and binary forms, with or */
/* without modification, are permitted provided that the following */
/* conditions are met: */
/* */
/* - Redistributions of source code must retain the above copyright */
/* notice, this list of conditions and the following disclaimer. */
/* - Redistributions in binary form must reproduce the above */
/* copyright notice, this list of conditions and the following */
/* disclaimer in the documentation and/or other materials provided */
/* with the distribution. */
/* - Neither the name of the HTS working group nor the names of its */
/* contributors may be used to endorse or promote products derived */
/* from this software without specific prior written permission. */
/* */
/* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND */
/* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, */
/* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */
/* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */
/* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS */
/* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, */
/* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED */
/* TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, */
/* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON */
/* ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, */
/* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY */
/* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */
/* POSSIBILITY OF SUCH DAMAGE. */
/* ----------------------------------------------------------------- */
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include <stdarg.h>
#include "flite_hts_engine.h"
#define INPUT_BUFF_SIZE 1024
/* usage: write the version banner, copyright notices and command-line help */
/*        to stderr, then terminate the process with exit status 0          */
static void usage(void)
{
   /* text emitted before the hts_engine copyright notice */
   static const char *const banner[] = {
      "The English TTS System \"Flite+hts_engine\"\n",
      "Version 1.05 (http://hts-engine.sourceforge.net/)\n",
      "Copyright (C) 2005-2013 Nagoya Institute of Technology\n",
      " 2005-2008 Tokyo Institute of Technology\n",
      "All rights reserved.\n"
   };
   /* text emitted after the hts_engine copyright notice */
   static const char *const help[] = {
      "CMU Flite\n",
      "Version 1.4 (http://www.speech.cs.cmu.edu/flite/)\n",
      "Copyright (C) 1999-2009 Carnegie Mellon University\n",
      "All rights reserved.\n",
      "\n",
      "flite_hts_engine - The English TTS system \"Flite+hts_engine\"\n",
      "\n",
      " usage:\n",
      " flite_hts_engine [ options ] [ infile ] \n",
      " options: [ def][ min-- max]\n",
      " -m htsvoice : HTS voice [ N/A]\n",
      " -o wav : filename of output wav audio (generated speech) [ N/A]\n",
      " -s i : sampling frequency [ auto][ 1-- ]\n",
      " -p i : frame period (point) [ auto][ 1-- ]\n",
      " -a f : all-pass constant [ auto][ 0.0-- 1.0]\n",
      " -b f : postfiltering coefficient [ 0.0][ 0.0-- 1.0]\n",
      " -r f : speech speed rate [ 1.0][ 0.0-- ]\n",
      " -fm : additional half-tone [ 0.0][ -- ]\n",
      " -u f : voiced/unvoiced threshold [ 0.5][ 0.0-- 1.0]\n",
      " -jm f : weight of GV for spectrum [ 1.0][ 0.0-- ]\n",
      " -jf f : weight of GV for Log F0 [ 1.0][ 0.0-- ]\n",
      " -z i : audio buffer size (if i==0, turn off) [ 0][ 0-- ]\n",
      " infile:\n",
      " text file [stdin]\n",
      "\n"
   };
   size_t line;

   for (line = 0; line < sizeof banner / sizeof banner[0]; line++)
      fputs(banner[line], stderr);

   /* HTS_COPYRIGHT comes from the engine headers, so it cannot live in the tables */
   fprintf(stderr, "\n%s\n", HTS_COPYRIGHT);

   for (line = 0; line < sizeof help / sizeof help[0]; line++)
      fputs(help[line], stderr);

   exit(0);
}
/* option_value: consume and return the argument that follows the option   */
/*               currently pointed to by *argv.                            */
/*   argc : in/out, number of arguments left INCLUDING the current option  */
/*   argv : in/out, cursor into the argument vector                        */
/* On success the cursor is advanced onto the value and *argc is           */
/* decremented. If the option is the last argument, an error is printed    */
/* and the process exits with status 1 instead of dereferencing the NULL   */
/* terminator of argv.                                                     */
static char *option_value(int *argc, char ***argv)
{
   const char *option = **argv;

   if (*argc < 2 || (*argv)[1] == NULL) {
      fprintf(stderr, "flite_hts_engine: Option '%s' requires an argument.\n", option);
      exit(1);
   }
   --*argc;
   ++*argv;
   return **argv;
}

/* main: command-line front end of Flite+hts_engine.                       */
/* Steps:                                                                  */
/*   1. scan the arguments for -m (voice file, mandatory) and -h (help)    */
/*   2. load the voice, then apply the remaining options to the engine     */
/*   3. read ONE line (at most INPUT_BUFF_SIZE-1 characters) from infile   */
/*      or stdin and synthesize it, writing a wav file if -o was given     */
/* Returns 0 on success; exits with status 1 on any usage or I/O error.    */
int main(int argc, char **argv)
{
   int i;
   int gv_stream;
   char buff[INPUT_BUFF_SIZE];
   FILE *fp_txt = stdin;
   char *fn_txt = NULL;
   char *fn_wav = NULL;
   char *fn_voice = NULL;

   /* Flite+hts_engine */
   Flite_HTS_Engine engine;

   /* no arguments at all: print help (usage() does not return) */
   if (argc == 1)
      usage();

   /* initialize engine */
   Flite_HTS_Engine_initialize(&engine);

   /* get HTS voice file name; the voice must be loaded before the other */
   /* options are applied, hence this separate first pass                */
   /* start at 1: argv[0] is the program name, not an option             */
   for (i = 1; i < argc; i++) {
      if (argv[i][0] != '-')
         continue;
      if (argv[i][1] == 'h')
         usage();
      if (argv[i][1] == 'm') {
         /* a trailing -m has no value; argv[argc] is NULL */
         if (i + 1 >= argc) {
            fprintf(stderr, "flite_hts_engine: Option '%s' requires an argument.\n", argv[i]);
            exit(1);
         }
         fn_voice = argv[++i];
      }
   }
   if (fn_voice == NULL) {
      fprintf(stderr, "flite_hts_engine: HTS voice must be specified.\n");
      exit(1);
   }

   /* load HTS voice */
   if (Flite_HTS_Engine_load(&engine, fn_voice) != TRUE) {
      fprintf(stderr, "flite_hts_engine: HTS voice cannot be loaded.\n");
      Flite_HTS_Engine_clear(&engine);
      exit(1);
   }

   /* read command: inside the loop argc counts the current argument plus */
   /* everything after it; "> 0" keeps the loop from running past zero    */
   while (--argc > 0) {
      ++argv;

      /* anything that is not an option is the input text file (last one wins) */
      if (**argv != '-') {
         fn_txt = *argv;
         continue;
      }

      switch ((*argv)[1]) {
      case 'm':                /* HTS voice was already loaded; just skip its value */
         (void) option_value(&argc, &argv);
         break;
      case 'o':
         fn_wav = option_value(&argc, &argv);
         break;
      case 'h':
         usage();
         break;
      case 's':
         Flite_HTS_Engine_set_sampling_frequency(&engine, (size_t) atoi(option_value(&argc, &argv)));
         break;
      case 'p':
         Flite_HTS_Engine_set_fperiod(&engine, (size_t) atoi(option_value(&argc, &argv)));
         break;
      case 'a':
         Flite_HTS_Engine_set_alpha(&engine, atof(option_value(&argc, &argv)));
         break;
      case 'b':
         Flite_HTS_Engine_set_beta(&engine, atof(option_value(&argc, &argv)));
         break;
      case 'r':
         Flite_HTS_Engine_set_speed(&engine, atof(option_value(&argc, &argv)));
         break;
      case 'f':
         /* only "-fm" exists; validate the sub-option before taking the value */
         if ((*argv)[2] != 'm') {
            fprintf(stderr, "flite_hts_engine: Invalid option '-f%c'.\n", (*argv)[2]);
            exit(1);
         }
         Flite_HTS_Engine_add_half_tone(&engine, atof(option_value(&argc, &argv)));
         break;
      case 'u':
         Flite_HTS_Engine_set_msd_threshold(&engine, 1, atof(option_value(&argc, &argv)));
         break;
      case 'j':
         /* "-jm" selects stream 0, "-jf" (alias "-jp") selects stream 1 */
         switch ((*argv)[2]) {
         case 'm':
            gv_stream = 0;
            break;
         case 'f':
         case 'p':
            gv_stream = 1;
            break;
         default:
            fprintf(stderr, "flite_hts_engine: Invalid option '-j%c'.\n", (*argv)[2]);
            exit(1);
         }
         Flite_HTS_Engine_set_gv_weight(&engine, gv_stream, atof(option_value(&argc, &argv)));
         break;
      case 'z':
         Flite_HTS_Engine_set_audio_buff_size(&engine, atoi(option_value(&argc, &argv)));
         break;
      default:
         fprintf(stderr, "flite_hts_engine: Invalid option '-%c'.\n", (*argv)[1]);
         exit(1);
      }
   }

   /* synthesis */
   if (fn_txt != NULL) {
      fp_txt = fopen(fn_txt, "r");
      /* fopen returns NULL on failure; fgets on a NULL stream would crash */
      if (fp_txt == NULL) {
         fprintf(stderr, "flite_hts_engine: Cannot open %s.\n", fn_txt);
         Flite_HTS_Engine_clear(&engine);
         exit(1);
      }
   }
   if (fgets(buff, INPUT_BUFF_SIZE, fp_txt) != NULL && buff[0] != '\0')
      Flite_HTS_Engine_synthesize(&engine, buff, fn_wav);
   if (fn_txt != NULL)
      fclose(fp_txt);

   /* free */
   Flite_HTS_Engine_clear(&engine);

   return 0;
}