1 /* ----------------------------------------------------------------- */
2 /*           The HMM-Based Speech Synthesis Engine "hts_engine API"  */
3 /*           developed by HTS Working Group                          */
4 /*           http://hts-engine.sourceforge.net/                      */
5 /* ----------------------------------------------------------------- */
6 /*                                                                   */
7 /*  Copyright (c) 2001-2015  Nagoya Institute of Technology          */
8 /*                           Department of Computer Science          */
9 /*                                                                   */
10 /*                2001-2008  Tokyo Institute of Technology           */
11 /*                           Interdisciplinary Graduate School of    */
12 /*                           Science and Engineering                 */
13 /*                                                                   */
14 /* All rights reserved.                                              */
15 /*                                                                   */
16 /* Redistribution and use in source and binary forms, with or        */
17 /* without modification, are permitted provided that the following   */
18 /* conditions are met:                                               */
19 /*                                                                   */
20 /* - Redistributions of source code must retain the above copyright  */
21 /*   notice, this list of conditions and the following disclaimer.   */
22 /* - Redistributions in binary form must reproduce the above         */
23 /*   copyright notice, this list of conditions and the following     */
24 /*   disclaimer in the documentation and/or other materials provided */
25 /*   with the distribution.                                          */
26 /* - Neither the name of the HTS working group nor the names of its  */
27 /*   contributors may be used to endorse or promote products derived */
28 /*   from this software without specific prior written permission.   */
29 /*                                                                   */
30 /* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND            */
31 /* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES,       */
32 /* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF          */
33 /* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE          */
34 /* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS */
35 /* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,          */
36 /* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED   */
37 /* TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,     */
38 /* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON */
39 /* ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,   */
40 /* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY    */
41 /* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE           */
42 /* POSSIBILITY OF SUCH DAMAGE.                                       */
43 /* ----------------------------------------------------------------- */
44 
45 #ifndef HTS_HIDDEN_H
46 #define HTS_HIDDEN_H
47 
/*
 * Linkage wrappers for this header.
 * When compiled as C++ the declarations below are placed inside an
 * extern "C" block; when compiled as C both macros expand to nothing.
 */
#ifdef __cplusplus
#define HTS_HIDDEN_H_START extern "C" {
#define HTS_HIDDEN_H_END   }
#else
#define HTS_HIDDEN_H_START
#define HTS_HIDDEN_H_END
#endif                          /* __cplusplus */

/* No trailing ';' here: in C the macro is empty, so a ';' would be a stray
   empty declaration at file scope, which ISO C does not allow. */
HTS_HIDDEN_H_START
57 
58 /* hts_engine libraries */
59 #include "HTS_engine.h"
60 
61 /* common ---------------------------------------------------------- */
62 
/* buffer length constant */
#define HTS_MAXBUFLEN 1024

/*
 * Byte-order selection: at most one of the two macros survives.
 *  - WORDS_LITTLEENDIAN defined (alone or together with WORDS_BIGENDIAN):
 *    WORDS_BIGENDIAN is removed, so little endian wins.
 *  - neither defined: WORDS_LITTLEENDIAN becomes the default.
 *  - only WORDS_BIGENDIAN defined: left untouched.
 */
#if defined(WORDS_LITTLEENDIAN)
#undef WORDS_BIGENDIAN
#elif !defined(WORDS_BIGENDIAN)
#define WORDS_LITTLEENDIAN
#endif                          /* WORDS_LITTLEENDIAN / !WORDS_BIGENDIAN */

/* F0 limits, linear and natural-log domain */
#define MAX_F0    20000.0
#define MIN_F0    20.0
#define MAX_LF0   9.9034875525361280454891979401956     /* log(20000.0) */
#define MIN_LF0   2.9957322735539909934352235761425     /* log(20.0) */

/* log-domain step constants */
#define HALF_TONE 0.05776226504666210911810267678818    /* log(2.0) / 12.0 */
#define DB        0.11512925464970228420089957273422    /* log(10.0) / 20.0 */
78 
79 /* misc ------------------------------------------------------------ */
80 
/* HTS_File: handle type taken and returned by the HTS_f* wrappers declared in this header */
typedef struct _HTS_File {
   unsigned char type;          /* tag byte; presumably selects how `pointer` is interpreted -- confirm in the implementation */
   void *pointer;               /* untyped pointer to the underlying object */
} HTS_File;
85 
86 /* HTS_fopen: wrapper for fopen */
87 HTS_File *HTS_fopen_from_fn(const char *name, const char *opt);
88 
89 /* HTS_fopen_from_fp: wrapper for fopen */
90 HTS_File *HTS_fopen_from_fp(HTS_File * fp, size_t size);
91 
92 /* HTS_fopen_from_data: wrapper for fopen */
93 HTS_File *HTS_fopen_from_data(void *data, size_t size);
94 
95 /* HTS_fclose: wrapper for fclose */
96 void HTS_fclose(HTS_File * fp);
97 
98 /* HTS_fgetc: wrapper for fgetc */
99 int HTS_fgetc(HTS_File * fp);
100 
101 /* HTS_feof: wrapper for feof */
102 int HTS_feof(HTS_File * fp);
103 
104 /* HTS_fseek: wrapper for fseek */
105 int HTS_fseek(HTS_File * fp, long offset, int origin);
106 
107 /* HTS_ftell: wrapper for ftell */
108 size_t HTS_ftell(HTS_File * fp);
109 
110 /* HTS_fread_big_endian: fread with byteswap */
111 size_t HTS_fread_big_endian(void *buf, size_t size, size_t n, HTS_File * fp);
112 
113 /* HTS_fread_little_endian: fread with byteswap */
114 size_t HTS_fread_little_endian(void *buf, size_t size, size_t n, HTS_File * fp);
115 
116 /* HTS_fwrite_little_endian: fwrite with byteswap */
117 size_t HTS_fwrite_little_endian(const void *buf, size_t size, size_t n, FILE * fp);
118 
119 /* HTS_get_pattern_token: get pattern token (single/double quote can be used) */
120 HTS_Boolean HTS_get_pattern_token(HTS_File * fp, char *buff);
121 
122 /* HTS_get_token: get token from file pointer (separators are space,tab,line break) */
123 HTS_Boolean HTS_get_token_from_fp(HTS_File * fp, char *buff);
124 
125 /* HTS_get_token: get token from file pointer with specified separator */
126 HTS_Boolean HTS_get_token_from_fp_with_separator(HTS_File * fp, char *buff, char separator);
127 
128 /* HTS_get_token_from_string: get token from string (separator are space,tab,line break) */
129 HTS_Boolean HTS_get_token_from_string(const char *string, size_t * index, char *buff);
130 
131 /* HTS_get_token_from_string_with_separator: get token from string with specified separator */
132 HTS_Boolean HTS_get_token_from_string_with_separator(const char *str, size_t * index, char *buff, char separator);
133 
/* HTS_calloc: wrapper for calloc */
void *HTS_calloc(const size_t num, const size_t size);

/* HTS_strdup: wrapper for strdup */
char *HTS_strdup(const char *string);

/* HTS_alloc_matrix: allocate double matrix */
double **HTS_alloc_matrix(size_t x, size_t y);

/* HTS_free_matrix: free double matrix */
void HTS_free_matrix(double **p, size_t x);

/* HTS_free: wrapper for free */
void HTS_free(void *p);

/* HTS_error: output error message (variadic; arguments follow `message`) */
void HTS_error(int error, const char *message, ...);
151 
152 /* audio ----------------------------------------------------------- */
153 
154 /* HTS_Audio_initialize: initialize audio */
155 void HTS_Audio_initialize(HTS_Audio * audio);
156 
157 /* HTS_Audio_set_parameter: set parameters for audio */
158 void HTS_Audio_set_parameter(HTS_Audio * audio, size_t sampling_frequency, size_t max_buff_size);
159 
160 /* HTS_Audio_write: send data to audio */
161 void HTS_Audio_write(HTS_Audio * audio, short data);
162 
163 /* HTS_Audio_flush: flush remain data */
164 void HTS_Audio_flush(HTS_Audio * audio);
165 
166 /* HTS_Audio_clear: free audio */
167 void HTS_Audio_clear(HTS_Audio * audio);
168 
169 /* model ----------------------------------------------------------- */
170 
171 /* HTS_ModelSet_initialize: initialize model set */
172 void HTS_ModelSet_initialize(HTS_ModelSet * ms);
173 
174 /* HTS_ModelSet_load: load HTS voices */
175 HTS_Boolean HTS_ModelSet_load(HTS_ModelSet * ms, char **voices, size_t num_voices);
176 
177 /* HTS_ModelSet_get_sampling_frequency: get sampling frequency of HTS voices */
178 size_t HTS_ModelSet_get_sampling_frequency(HTS_ModelSet * ms);
179 
180 /* HTS_ModelSet_get_fperiod: get frame period of HTS voices */
181 size_t HTS_ModelSet_get_fperiod(HTS_ModelSet * ms);
182 
183 /* HTS_ModelSet_get_fperiod: get stream option */
184 const char *HTS_ModelSet_get_option(HTS_ModelSet * ms, size_t stream_index);
185 
186 /* HTS_ModelSet_get_gv_flag: get GV flag */
187 HTS_Boolean HTS_ModelSet_get_gv_flag(HTS_ModelSet * ms, const char *string);
188 
189 /* HTS_ModelSet_get_nstate: get number of state */
190 size_t HTS_ModelSet_get_nstate(HTS_ModelSet * ms);
191 
192 /* HTS_Engine_get_fullcontext_label_format: get full-context label format */
193 const char *HTS_ModelSet_get_fullcontext_label_format(HTS_ModelSet * ms);
194 
195 /* HTS_Engine_get_fullcontext_label_version: get full-context label version */
196 const char *HTS_ModelSet_get_fullcontext_label_version(HTS_ModelSet * ms);
197 
198 /* HTS_ModelSet_get_nstream: get number of stream */
199 size_t HTS_ModelSet_get_nstream(HTS_ModelSet * ms);
200 
201 /* HTS_ModelSet_get_nvoices: get number of HTS voices */
202 size_t HTS_ModelSet_get_nvoices(HTS_ModelSet * ms);
203 
204 /* HTS_ModelSet_get_vector_length: get vector length */
205 size_t HTS_ModelSet_get_vector_length(HTS_ModelSet * ms, size_t stream_index);
206 
207 /* HTS_ModelSet_is_msd: get MSD flag */
208 HTS_Boolean HTS_ModelSet_is_msd(HTS_ModelSet * ms, size_t stream_index);
209 
210 /* HTS_ModelSet_get_window_size: get dynamic window size */
211 size_t HTS_ModelSet_get_window_size(HTS_ModelSet * ms, size_t stream_index);
212 
213 /* HTS_ModelSet_get_window_left_width: get left width of dynamic window */
214 int HTS_ModelSet_get_window_left_width(HTS_ModelSet * ms, size_t stream_index, size_t window_index);
215 
216 /* HTS_ModelSet_get_window_right_width: get right width of dynamic window */
217 int HTS_ModelSet_get_window_right_width(HTS_ModelSet * ms, size_t stream_index, size_t window_index);
218 
219 /* HTS_ModelSet_get_window_coefficient: get coefficient of dynamic window */
220 double HTS_ModelSet_get_window_coefficient(HTS_ModelSet * ms, size_t stream_index, size_t window_index, size_t coefficient_index);
221 
222 /* HTS_ModelSet_get_window_max_width: get max width of dynamic window */
223 size_t HTS_ModelSet_get_window_max_width(HTS_ModelSet * ms, size_t stream_index);
224 
225 /* HTS_ModelSet_use_gv: get GV flag */
226 HTS_Boolean HTS_ModelSet_use_gv(HTS_ModelSet * ms, size_t stream_index);
227 
228 /* HTS_ModelSet_get_duration_index: get index of duration tree and PDF */
229 void HTS_ModelSet_get_duration_index(HTS_ModelSet * ms, size_t voice_index, const char *string, size_t * tree_index, size_t * pdf_index);
230 
231 /* HTS_ModelSet_get_duration: get duration using interpolation weight */
232 void HTS_ModelSet_get_duration(HTS_ModelSet * ms, const char *string, const double *iw, double *mean, double *vari);
233 
234 /* HTS_ModelSet_get_parameter_index: get index of parameter tree and PDF */
235 void HTS_ModelSet_get_parameter_index(HTS_ModelSet * ms, size_t voice_index, size_t stream_index, size_t state_index, const char *string, size_t * tree_index, size_t * pdf_index);
236 
237 /* HTS_ModelSet_get_parameter: get parameter using interpolation weight */
238 void HTS_ModelSet_get_parameter(HTS_ModelSet * ms, size_t stream_index, size_t state_index, const char *string, const double *const *iw, double *mean, double *vari, double *msd);
239 
240 void HTS_ModelSet_get_gv_index(HTS_ModelSet * ms, size_t voice_index, size_t stream_index, const char *string, size_t * tree_index, size_t * pdf_index);
241 
242 /* HTS_ModelSet_get_gv: get GV using interpolation weight */
243 void HTS_ModelSet_get_gv(HTS_ModelSet * ms, size_t stream_index, const char *string, const double *const *iw, double *mean, double *vari);
244 
245 /* HTS_ModelSet_clear: free model set */
246 void HTS_ModelSet_clear(HTS_ModelSet * ms);
247 
248 /* label ----------------------------------------------------------- */
249 
250 /* HTS_Label_initialize: initialize label */
251 void HTS_Label_initialize(HTS_Label * label);
252 
253 /* HTS_Label_load_from_fn: load label from file name */
254 void HTS_Label_load_from_fn(HTS_Label * label, size_t sampling_rate, size_t fperiod, const char *fn);
255 
256 /* HTS_Label_load_from_strings: load label list from string list */
257 void HTS_Label_load_from_strings(HTS_Label * label, size_t sampling_rate, size_t fperiod, char **lines, size_t num_lines);
258 
259 /* HTS_Label_get_size: get number of label string */
260 size_t HTS_Label_get_size(HTS_Label * label);
261 
262 /* HTS_Label_get_string: get label string */
263 const char *HTS_Label_get_string(HTS_Label * label, size_t index);
264 
265 /* HTS_Label_get_start_frame: get start frame */
266 double HTS_Label_get_start_frame(HTS_Label * label, size_t index);
267 
268 /* HTS_Label_get_end_frame: get end frame */
269 double HTS_Label_get_end_frame(HTS_Label * label, size_t index);
270 
271 /* HTS_Label_clear: free label */
272 void HTS_Label_clear(HTS_Label * label);
273 
274 /* sstream --------------------------------------------------------- */
275 
276 /* HTS_SStreamSet_initialize: initialize state stream set */
277 void HTS_SStreamSet_initialize(HTS_SStreamSet * sss);
278 
279 /* HTS_SStreamSet_create: parse label and determine state duration */
280 HTS_Boolean HTS_SStreamSet_create(HTS_SStreamSet * sss, HTS_ModelSet * ms, HTS_Label * label, HTS_Boolean phoneme_alignment_flag, double speed, double *duration_iw, double **parameter_iw, double **gv_iw);
281 
282 /* HTS_SStreamSet_get_nstream: get number of stream */
283 size_t HTS_SStreamSet_get_nstream(HTS_SStreamSet * sss);
284 
285 /* HTS_SStreamSet_get_vector_length: get vector length */
286 size_t HTS_SStreamSet_get_vector_length(HTS_SStreamSet * sss, size_t stream_index);
287 
288 /* HTS_SStreamSet_is_msd: get MSD flag */
289 HTS_Boolean HTS_SStreamSet_is_msd(HTS_SStreamSet * sss, size_t stream_index);
290 
291 /* HTS_SStreamSet_get_total_state: get total number of state */
292 size_t HTS_SStreamSet_get_total_state(HTS_SStreamSet * sss);
293 
294 /* HTS_SStreamSet_get_total_frame: get total number of frame */
295 size_t HTS_SStreamSet_get_total_frame(HTS_SStreamSet * sss);
296 
297 /* HTS_SStreamSet_get_msd: get msd parameter */
298 double HTS_SStreamSet_get_msd(HTS_SStreamSet * sss, size_t stream_index, size_t state_index);
299 
300 /* HTS_SStreamSet_window_size: get dynamic window size */
301 size_t HTS_SStreamSet_get_window_size(HTS_SStreamSet * sss, size_t stream_index);
302 
303 /* HTS_SStreamSet_get_window_left_width: get left width of dynamic window */
304 int HTS_SStreamSet_get_window_left_width(HTS_SStreamSet * sss, size_t stream_index, size_t window_index);
305 
306 /* HTS_SStreamSet_get_window_right_width: get right width of dynamic window */
307 int HTS_SStreamSet_get_window_right_width(HTS_SStreamSet * sss, size_t stream_index, size_t window_index);
308 
309 /* HTS_SStreamSet_get_window_coefficient: get coefficient of dynamic window */
310 double HTS_SStreamSet_get_window_coefficient(HTS_SStreamSet * sss, size_t stream_index, size_t window_index, int coefficient_index);
311 
312 /* HTS_SStreamSet_get_window_max_width: get max width of dynamic window */
313 size_t HTS_SStreamSet_get_window_max_width(HTS_SStreamSet * sss, size_t stream_index);
314 
315 /* HTS_SStreamSet_use_gv: get GV flag */
316 HTS_Boolean HTS_SStreamSet_use_gv(HTS_SStreamSet * sss, size_t stream_index);
317 
318 /* HTS_SStreamSet_get_duration: get state duration */
319 size_t HTS_SStreamSet_get_duration(HTS_SStreamSet * sss, size_t state_index);
320 
321 /* HTS_SStreamSet_get_mean: get mean parameter */
322 double HTS_SStreamSet_get_mean(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index);
323 
324 /* HTS_SStreamSet_set_mean: set mean parameter */
325 void HTS_SStreamSet_set_mean(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index, double f);
326 
327 /* HTS_SStreamSet_get_vari: get variance parameter */
328 double HTS_SStreamSet_get_vari(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index);
329 
330 /* HTS_SStreamSet_set_vari: set variance parameter */
331 void HTS_SStreamSet_set_vari(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index, double f);
332 
333 /* HTS_SStreamSet_get_gv_mean: get GV mean parameter */
334 double HTS_SStreamSet_get_gv_mean(HTS_SStreamSet * sss, size_t stream_index, size_t vector_index);
335 
336 /* HTS_SStreamSet_get_gv_mean: get GV variance parameter */
337 double HTS_SStreamSet_get_gv_vari(HTS_SStreamSet * sss, size_t stream_index, size_t vector_index);
338 
339 /* HTS_SStreamSet_set_gv_switch: set GV switch */
340 void HTS_SStreamSet_set_gv_switch(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, HTS_Boolean i);
341 
342 /* HTS_SStreamSet_get_gv_switch: get GV switch */
343 HTS_Boolean HTS_SStreamSet_get_gv_switch(HTS_SStreamSet * sss, size_t stream_index, size_t state_index);
344 
345 /* HTS_SStreamSet_clear: free state stream set */
346 void HTS_SStreamSet_clear(HTS_SStreamSet * sss);
347 
348 /* pstream --------------------------------------------------------- */
349 
/* limits used to check variance in finv() (all of type double) */
#define INFTY   (1.0e+38)
#define INFTY2  (1.0e+19)
#define INVINF  (1.0e-38)
#define INVINF2 (1.0e-19)

/* GV: step sizes, weights and iteration cap */
#define STEPINIT 0.1
#define STEPDEC  0.5
#define STEPINC  1.2
#define W1       1.0
#define W2       1.0
#define GV_MAX_ITERATION 5
363 
364 /* HTS_PStreamSet_initialize: initialize parameter stream set */
365 void HTS_PStreamSet_initialize(HTS_PStreamSet * pss);
366 
367 /* HTS_PStreamSet_create: parameter generation using GV weight */
368 HTS_Boolean HTS_PStreamSet_create(HTS_PStreamSet * pss, HTS_SStreamSet * sss, double *msd_threshold, double *gv_weight);
369 
370 /* HTS_PStreamSet_get_nstream: get number of stream */
371 size_t HTS_PStreamSet_get_nstream(HTS_PStreamSet * pss);
372 
373 /* HTS_PStreamSet_get_static_length: get features length */
374 size_t HTS_PStreamSet_get_vector_length(HTS_PStreamSet * pss, size_t stream_index);
375 
376 /* HTS_PStreamSet_get_total_frame: get total number of frame */
377 size_t HTS_PStreamSet_get_total_frame(HTS_PStreamSet * pss);
378 
379 /* HTS_PStreamSet_get_parameter: get parameter */
380 double HTS_PStreamSet_get_parameter(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index, size_t vector_index);
381 
382 /* HTS_PStreamSet_get_parameter_vector: get parameter vector */
383 double *HTS_PStreamSet_get_parameter_vector(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index);
384 
385 /* HTS_PStreamSet_get_msd_flag: get generated MSD flag per frame */
386 HTS_Boolean HTS_PStreamSet_get_msd_flag(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index);
387 
388 /* HTS_PStreamSet_is_msd: get MSD flag */
389 HTS_Boolean HTS_PStreamSet_is_msd(HTS_PStreamSet * pss, size_t stream_index);
390 
391 /* HTS_PStreamSet_clear: free parameter stream set */
392 void HTS_PStreamSet_clear(HTS_PStreamSet * pss);
393 
394 /* gstream --------------------------------------------------------- */
395 
396 /* HTS_GStreamSet_initialize: initialize generated parameter stream set */
397 void HTS_GStreamSet_initialize(HTS_GStreamSet * gss);
398 
399 /* HTS_GStreamSet_create: generate speech */
400 HTS_Boolean HTS_GStreamSet_create(HTS_GStreamSet * gss, HTS_PStreamSet * pss, size_t stage, HTS_Boolean use_log_gain, size_t sampling_rate, size_t fperiod, double alpha, double beta, HTS_Boolean * stop, double volume, HTS_Audio * audio);
401 
402 /* HTS_GStreamSet_get_total_nsamples: get total number of sample */
403 size_t HTS_GStreamSet_get_total_nsamples(HTS_GStreamSet * gss);
404 
405 /* HTS_GStreamSet_get_total_frame: get total number of frame */
406 size_t HTS_GStreamSet_get_total_frame(HTS_GStreamSet * gss);
407 
408 /* HTS_GStreamSet_get_static_length: get features length */
409 size_t HTS_GStreamSet_get_vector_length(HTS_GStreamSet * gss, size_t stream_index);
410 
411 /* HTS_GStreamSet_get_speech: get synthesized speech parameter */
412 double HTS_GStreamSet_get_speech(HTS_GStreamSet * gss, size_t sample_index);
413 
414 /* HTS_GStreamSet_get_parameter: get generated parameter */
415 double HTS_GStreamSet_get_parameter(HTS_GStreamSet * gss, size_t stream_index, size_t frame_index, size_t vector_index);
416 
417 /* HTS_GStreamSet_clear: free generated parameter stream set */
418 void HTS_GStreamSet_clear(HTS_GStreamSet * gss);
419 
420 /* vocoder --------------------------------------------------------- */
421 
/* Numeric constants; each is defined only if not already provided elsewhere */
#if !defined(LZERO)
#define LZERO (-1.0e+10)        /* ~log(0) */
#endif                          /* !LZERO */

#if !defined(ZERO)
#define ZERO  (1.0e-10)         /* ~(0) */
#endif                          /* !ZERO */

#if !defined(PI)
#define PI  3.14159265358979323846
#endif                          /* !PI */

#if !defined(PI2)
#define PI2 6.28318530717958647692
#endif                          /* !PI2 */

#define RANDMAX 32767

/* seed and bit masks */
#define SEED    1
#define B0      0x00000001
#define B28     0x10000000
#define B31     0x80000000
#define B31_    0x7fffffff
#define Z       0x00000000

/* Build profile: HTS_EMBEDDED selects the smaller settings */
#ifndef HTS_EMBEDDED
#define GAUSS     TRUE
#define PADEORDER 5             /* pade order (for MLSA filter) */
#define IRLENG    576           /* length of impulse response */
#else
#define GAUSS     FALSE
#define PADEORDER 4             /* pade order (for MLSA filter) */
#define IRLENG    384           /* length of impulse response */
#endif                          /* !HTS_EMBEDDED */

#define CHECK_LSP_STABILITY_MIN 0.25
#define CHECK_LSP_STABILITY_NUM 4

/* for MGLSA filter */
#define NORMFLG1 TRUE
#define NORMFLG2 FALSE
#define MULGFLG1 TRUE
#define MULGFLG2 FALSE
#define NGAIN    FALSE
466 
467 /* HTS_Vocoder: structure for setting of vocoder */
468 typedef struct _HTS_Vocoder {
469    HTS_Boolean is_first;
470    size_t stage;                /* Gamma=-1/stage: if stage=0 then Gamma=0 */
471    double gamma;                /* Gamma */
472    HTS_Boolean use_log_gain;    /* log gain flag (for LSP) */
473    size_t fprd;                 /* frame shift */
474    unsigned long next;          /* temporary variable for random generator */
475    HTS_Boolean gauss;           /* flag to use Gaussian noise */
476    double rate;                 /* sampling rate */
477    double pitch_of_curr_point;  /* used in excitation generation */
478    double pitch_counter;        /* used in excitation generation */
479    double pitch_inc_per_point;  /* used in excitation generation */
480    double *excite_ring_buff;    /* used in excitation generation */
481    size_t excite_buff_size;     /* used in excitation generation */
482    size_t excite_buff_index;    /* used in excitation generation */
483    unsigned char sw;            /* switch used in random generator */
484    int x;                       /* excitation signal */
485    double *freqt_buff;          /* used in freqt */
486    size_t freqt_size;           /* buffer size for freqt */
487    double *spectrum2en_buff;    /* used in spectrum2en */
488    size_t spectrum2en_size;     /* buffer size for spectrum2en */
489    double r1, r2, s;            /* used in random generator */
490    double *postfilter_buff;     /* used in postfiltering */
491    size_t postfilter_size;      /* buffer size for postfiltering */
492    double *c, *cc, *cinc, *d1;  /* used in the MLSA/MGLSA filter */
493    double *lsp2lpc_buff;        /* used in lsp2lpc */
494    size_t lsp2lpc_size;         /* buffer size of lsp2lpc */
495    double *gc2gc_buff;          /* used in gc2gc */
496    size_t gc2gc_size;           /* buffer size for gc2gc */
497 } HTS_Vocoder;
498 
499 /* HTS_Vocoder_initialize: initialize vocoder */
500 void HTS_Vocoder_initialize(HTS_Vocoder * v, size_t m, size_t stage, HTS_Boolean use_log_gain, size_t rate, size_t fperiod);
501 
502 /* HTS_Vocoder_synthesize: pulse/noise excitation and MLSA/MGLSA filster based waveform synthesis */
503 void HTS_Vocoder_synthesize(HTS_Vocoder * v, size_t m, double lf0, double *spectrum, size_t nlpf, double *lpf, double alpha, double beta, double volume, double *rawdata, HTS_Audio * audio);
504 
505 /* HTS_Vocoder_clear: clear vocoder */
506 void HTS_Vocoder_clear(HTS_Vocoder * v);
507 
508 HTS_HIDDEN_H_END;
509 
510 #endif                          /* !HTS_HIDDEN_H */
511