3 # Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 # Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 # Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 # Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
10 # Copyright (C) 2007 Jonas Häggqvist
12 # All files in this archive are subject to the GNU General Public License.
13 # See the file COPYING in the source tree root for full license agreement.
15 # This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
16 # KIND, either express or implied.
23 use vars
qw($V $C $t $l $e $E $s $S $i $v);
26 use Digest::MD5 qw(md5_hex);
28 use open ':encoding(utf8)';
34 Usage: voice.pl [options] [path to dir]
36 Create voice file. You must also specify -t and -l.
42 Specify which target you want to build voicefile for. Must include
43 any features that target supports.
46 Numeric target id. Needed for voice building.
49 Specify which language you want to build. Without .lang extension.
52 Which encoder to use for voice strings
55 Which encoder options to use when compressing voice strings. Enclose
56 in double quotes if the options include spaces.
59 Which TTS engine to use.
61 -S=<TTS engine options>
62 Options to pass to the TTS engine. Enclose in double quotes if the
63 options include spaces.
71 # Initialize TTS engine. May return an object or value which will be passed
72 # to voicestring and shutdown_tts
75 my ($tts_engine, $tts_engine_opts, $language) = @_;
76 my %ret = ("name" => $tts_engine);
79 print("> festival $tts_engine_opts --server\n") if $verbose;
80 my $pid = open(FESTIVAL_SERVER
, "| festival $tts_engine_opts --server > /dev/null 2>&1");
81 my $dummy = *FESTIVAL_SERVER
; #suppress warning
82 $SIG{INT
} = sub { kill TERM
=> $pid; print("foo"); panic_cleanup
(); };
83 $SIG{KILL
} = sub { kill TERM
=> $pid; print("boo"); panic_cleanup
(); };
87 my $toolsdir = dirname
($0);
88 my $path = `cygpath $toolsdir -a -w`;
91 my $cmd = $path . "sapi_voice.vbs /language:$language $tts_engine_opts";
93 print("> cscript //nologo $cmd\n") if $verbose;
94 my $pid = open2
(*CMD_OUT
, *CMD_IN
, "cscript //nologo $cmd");
95 binmode(*CMD_IN
, ':encoding(utf16le)');
96 binmode(*CMD_OUT
, ':encoding(utf16le)');
97 $SIG{INT
} = sub { print(CMD_IN
"QUIT\r\n"); panic_cleanup
(); };
98 $SIG{KILL
} = sub { print(CMD_IN
"QUIT\r\n"); panic_cleanup
(); };
99 print(CMD_IN
"QUERY\tVENDOR\r\n");
100 my $vendor = readline(*CMD_OUT
);
104 "stdout" => *CMD_OUT
,
105 "vendor" => $vendor);
111 # Shutdown TTS engine if necessary.
113 my ($tts_object) = @_;
114 switch
($$tts_object{"name"}) {
116 # Send SIGTERM to festival server
117 kill TERM
=> $$tts_object{"pid"};
120 print({$$tts_object{"stdin"}} "QUIT\r\n");
121 close($$tts_object{"stdin"});
126 # Apply corrections to a voice-string to make it sound better
129 my ($string, $language, $tts_object) = @_;
131 my $corrections = $tts_object->{"corrections"};
133 foreach (@
$corrections) {
134 my $r = "s" . $_->{separator
} . $_->{search
} . $_->{separator
}
135 . $_->{replace
} . $_->{separator
} . $_->{modifier
};
136 eval ('$string =~' . "$r;");
138 if ($orig ne $string) {
139 printf("%s -> %s\n", $orig, $string) if $verbose;
144 # Produce a wav file of the text given
147 my ($string, $output, $tts_engine_opts, $tts_object) = @_;
149 printf("Generate \"%s\" with %s in file %s\n", $string, $$tts_object{"name"}, $output) if $verbose;
150 switch
($$tts_object{"name"}) {
152 # festival_client lies to us, so we have to do awful soul-eating
153 # work with IPC::open3()
154 $cmd = "festival_client --server localhost --otype riff --ttw --output \"$output\"";
155 # Use festival-prolog.scm if it's there (created by user of tools/configure)
156 if (-f
"festival-prolog.scm") {
157 $cmd .= " --prolog festival-prolog.scm";
159 print("> $cmd\n") if $verbose;
160 # Open command, and filehandles for STDIN, STDOUT, STDERR
161 my $pid = open3
(*CMD_IN
, *CMD_OUT
, *CMD_ERR
, $cmd);
162 # Put the string to speak into STDIN and close it
163 print(CMD_IN
$string);
165 # Read all output from festival_client (because it LIES TO US)
172 $cmd = "flite $tts_engine_opts -t \"$string\" \"$output\"";
173 print("> $cmd\n") if $verbose;
177 $cmd = "espeak $tts_engine_opts -w \"$output\"";
178 print("> $cmd\n") if $verbose;
179 open(ESPEAK
, "| $cmd");
180 print ESPEAK
$string . "\n";
184 print({$$tts_object{"stdin"}} "SPEAK\t$output\t$string\r\n");
187 $cmd = "swift $tts_engine_opts -o \"$output\" \"$string\"";
188 print("> $cmd\n") if $verbose;
194 # trim leading / trailing silence from the clip
197 my ($file, $threshold, $tts_object) = @_;
198 printf("Trim \"%s\"\n", $file) if $verbose;
199 my $cmd = "wavtrim \"$file\" $threshold";
200 if ($$tts_object{"name"} eq "sapi") {
201 print({$$tts_object{"stdin"}} "EXEC\t$cmd\r\n");
204 print("> $cmd\n") if $verbose;
209 # Encode a wav file into the given destination file
212 my ($input, $output, $encoder, $encoder_opts, $tts_object) = @_;
213 printf("Encode \"%s\" with %s in file %s\n", $input, $encoder, $output) if $verbose;
214 my $cmd = "$encoder $encoder_opts \"$input\" \"$output\"";
215 if ($$tts_object{"name"} eq "sapi") {
216 print({$$tts_object{"stdin"}} "EXEC\t$cmd\r\n");
219 print("> $cmd\n") if $verbose;
224 # synchronize the clip generation / processing if it's running in another process
226 my ($tts_object) = @_;
227 if ($$tts_object{"name"} eq "sapi") {
228 print({$$tts_object{"stdin"}} "SYNC\t42\r\n");
229 my $wait = readline($$tts_object{"stdout"});
230 #ignore what's actually returned
234 # Run genlang and create voice clips for each string
237 my ($language, $target, $encoder, $encoder_opts, $tts_engine, $tts_engine_opts) = @_;
238 my $english = dirname
($0) . '/../apps/lang/english.lang';
239 my $langfile = dirname
($0) . '/../apps/lang/' . $language . '.lang';
240 my $correctionsfile = dirname
($0) . '/voice-corrections.txt';
243 my $cmd = "genlang -o -t=$target -e=$english $langfile 2>/dev/null";
245 open(VOICEFONTIDS
, "> voicefontids");
247 local $| = 1; # make progress indicator work reliably
249 my $tts_object = init_tts
($tts_engine, $tts_engine_opts, $language);
250 # add string corrections to tts_object.
252 open(VOICEREGEXP
, "<$correctionsfile") or die "Can't open corrections file!\n";
253 while(<VOICEREGEXP
>) {
254 # get first character of line
256 my $separator = substr($_, 0, 1);
257 if($separator =~ m/\s+/) {
261 $line =~ s/^.//g; # remove separator at beginning
262 my ($lang, $engine, $vendor, $search, $replace, $modifier) = split(/$separator/, $line);
264 # does language match?
265 if($language !~ m/$lang/) {
268 if($$tts_object{"name"} !~ m/$engine/) {
271 my $v = $$tts_object{"vendor"} || ""; # vendor might be empty in $tts_object
272 if($v !~ m/$vendor/) {
275 push @corrects, {separator
=> $separator, search
=> $search, replace
=> $replace, modifier
=> $modifier};
279 $tts_object->{corrections
} = [@corrects];
281 print("Generating voice clips");
282 print("\n") if $verbose;
285 print(VOICEFONTIDS
$line);
286 if ($line =~ /^id: (.*)$/) {
289 elsif ($line =~ /^voice: "(.*)"$/) {
291 if ($id !~ /^NOT_USED_.*$/ && $voice ne "") {
292 my $wav = $id . '.wav';
293 my $mp3 = $id . '.mp3';
295 # Print some progress information
296 if (++$i % 10 == 0 and !$verbose) {
300 # Apply corrections to the string
301 $voice = correct_string
($voice, $language, $tts_object);
303 # If we have a pool of snippets, see if the string exists there first
304 if (defined($ENV{'POOL'})) {
305 $pool_file = sprintf("%s/%s-%s.mp3", $ENV{'POOL'},
306 md5_hex
("$voice $tts_engine $tts_engine_opts $encoder_opts"),
309 printf("Re-using %s (%s) from pool\n", $id, $voice) if $verbose;
310 copy
($pool_file, $mp3);
314 # Don't generate MP3 if it already exists (probably from the POOL)
316 if ($id eq "VOICE_PAUSE") {
317 print("Use distributed $wav\n") if $verbose;
318 copy
(dirname
($0)."/VOICE_PAUSE.wav", $wav);
321 voicestring
($voice, $wav, $tts_engine_opts, $tts_object);
322 wavtrim
($wav, 500, $tts_object);
323 # 500 seems to be a reasonable default for now
326 encodewav
($wav, $mp3, $encoder, $encoder_opts, $tts_object);
327 synchronize
($tts_object);
328 if (defined($ENV{'POOL'})) {
329 copy
($mp3, $pool_file);
340 shutdown_tts
($tts_object);
343 # Assemble the voicefile
346 my ($language, $target_id) = @_;
348 $outfile = sprintf("%s.voice", $language);
349 printf("Saving voice file to %s\n", $outfile) if $verbose;
350 my $cmd = "voicefont 'voicefontids' $target_id ./ $outfile";
351 print("> $cmd\n") if $verbose;
353 print($output) if $verbose;
357 for (glob('*.mp3')) {
360 for (glob('*.wav')) {
370 # Generate .talk clips
373 my ($dir, $tts_object, $encoder, $encoder_opts, $tts_engine_opts, $i) = @_;
374 my $d = new DirHandle
$dir;
375 while (my $file = $d->read) {
376 my ($voice, $wav, $mp3);
377 # Print some progress information
378 if (++$i % 10 == 0 and !$verbose) {
382 # Convert to a complete path
383 my $path = sprintf("%s/%s", $dir, $file);
386 $wav = sprintf("%s.talk.wav", $path);
388 # Ignore dot-dirs and talk files
389 if ($file eq '.' || $file eq '..' || $file =~ /\.talk$/) {
394 gentalkclips
($path, $tts_object, $encoder, $encoder_opts, $tts_engine_opts, $i);
395 $mp3 = sprintf("%s/_dirname.talk", $path);
399 $mp3 = sprintf("%s.talk", $path);
400 $voice =~ s/\.[^\.]*$//; # Trim extension
403 printf("Talkclip %s: %s", $mp3, $voice) if $verbose;
405 voicestring
($voice, $wav, $tts_engine_opts, $tts_object);
406 wavtrim
($wav, 500, $tts_object);
407 # 500 seems to be a reasonable default for now
408 encodewav
($wav, $mp3, $encoder, $encoder_opts, $tts_object);
409 synchronize
($tts_object);
417 unless (defined($V) or defined($C)) { print("Missing either -V or -C\n"); $printusage = 1; }
419 unless (defined($t)) { print("Missing -t argument\n"); $printusage = 1; }
420 unless (defined($l)) { print("Missing -l argument\n"); $printusage = 1; }
421 unless (defined($i)) { print("Missing -i argument\n"); $printusage = 1; }
423 elsif (defined($C)) {
424 unless (defined($ARGV[0])) { print "Missing path argument\n"; $printusage = 1; }
426 unless (defined($e)) { print("Missing -e argument\n"); $printusage = 1; }
427 unless (defined($E)) { print("Missing -E argument\n"); $printusage = 1; }
428 unless (defined($s)) { print("Missing -s argument\n"); $printusage = 1; }
429 unless (defined($S)) { print("Missing -S argument\n"); $printusage = 1; }
430 if ($printusage == 1) { printusage
(); exit 1; }
432 if (defined($v) or defined($ENV{'V'})) {
436 # add the tools dir to the path temporarily, for calling various tools
437 $ENV{'PATH'} = dirname
($0) . ':' . $ENV{'PATH'};
442 # Only do the panic cleanup for voicefiles
443 $SIG{INT
} = \
&panic_cleanup
;
444 $SIG{KILL
} = \
&panic_cleanup
;
446 printf("Generating voice\n Target: %s\n Language: %s\n Encoder (options): %s (%s)\n TTS Engine (options): %s (%s)\n",
447 $t, $l, $e, $E, $s, $S);
448 generateclips
($l, $t, $e, $E, $s, $S);
453 printf("Generating .talk clips\n Path: %s\n Language: %s\n Encoder (options): %s (%s)\n TTS Engine (options): %s (%s)\n", $ARGV[0], $l, $e, $E, $s, $S);
454 my $tts_object = init_tts
($s, $S, $l);
455 gentalkclips
($ARGV[0], $tts_object, $e, $E, $S, 0);
456 shutdown_tts
($tts_object);