1 /* ----------------------------------------------------------------- */ 2 /* The HMM-Based Speech Synthesis Engine "hts_engine API" */ 3 /* developed by HTS Working Group */ 4 /* http://hts-engine.sourceforge.net/ */ 5 /* ----------------------------------------------------------------- */ 6 /* */ 7 /* Copyright (c) 2001-2015 Nagoya Institute of Technology */ 8 /* Department of Computer Science */ 9 /* */ 10 /* 2001-2008 Tokyo Institute of Technology */ 11 /* Interdisciplinary Graduate School of */ 12 /* Science and Engineering */ 13 /* */ 14 /* All rights reserved. */ 15 /* */ 16 /* Redistribution and use in source and binary forms, with or */ 17 /* without modification, are permitted provided that the following */ 18 /* conditions are met: */ 19 /* */ 20 /* - Redistributions of source code must retain the above copyright */ 21 /* notice, this list of conditions and the following disclaimer. */ 22 /* - Redistributions in binary form must reproduce the above */ 23 /* copyright notice, this list of conditions and the following */ 24 /* disclaimer in the documentation and/or other materials provided */ 25 /* with the distribution. */ 26 /* - Neither the name of the HTS working group nor the names of its */ 27 /* contributors may be used to endorse or promote products derived */ 28 /* from this software without specific prior written permission. */ 29 /* */ 30 /* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND */ 31 /* CONTRIBUTORS "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, */ 32 /* INCLUDING, BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF */ 33 /* MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE */ 34 /* DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS */ 35 /* BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, */ 36 /* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED */ 37 /* TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, */ 38 /* DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON */ 39 /* ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, */ 40 /* OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY */ 41 /* OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE */ 42 /* POSSIBILITY OF SUCH DAMAGE. */ 43 /* ----------------------------------------------------------------- */ 44 45 #ifndef HTS_HIDDEN_H 46 #define HTS_HIDDEN_H 47 48 #ifdef __cplusplus 49 #define HTS_HIDDEN_H_START extern "C" { 50 #define HTS_HIDDEN_H_END } 51 #else 52 #define HTS_HIDDEN_H_START 53 #define HTS_HIDDEN_H_END 54 #endif /* __CPLUSPLUS */ 55 56 HTS_HIDDEN_H_START; 57 58 /* hts_engine libraries */ 59 #include "HTS_engine.h" 60 61 /* common ---------------------------------------------------------- */ 62 63 #define HTS_MAXBUFLEN 1024 64 65 #if !defined(WORDS_BIGENDIAN) && !defined(WORDS_LITTLEENDIAN) 66 #define WORDS_LITTLEENDIAN 67 #endif /* !WORDS_BIGENDIAN && !WORDS_LITTLEENDIAN */ 68 #if defined(WORDS_BIGENDIAN) && defined(WORDS_LITTLEENDIAN) 69 #undef WORDS_BIGENDIAN 70 #endif /* WORDS_BIGENDIAN && WORDS_LITTLEENDIAN */ 71 72 #define MAX_F0 20000.0 73 #define MIN_F0 20.0 74 #define MAX_LF0 9.9034875525361280454891979401956 /* log(20000.0) */ 75 #define MIN_LF0 2.9957322735539909934352235761425 /* log(20.0) */ 76 #define HALF_TONE 0.05776226504666210911810267678818 /* log(2.0) / 12.0 */ 77 #define DB 0.11512925464970228420089957273422 /* log(10.0) / 20.0 */ 78 79 /* misc ------------------------------------------------------------ */ 80 81 typedef struct _HTS_File { 82 unsigned char type; 83 void *pointer; 84 } HTS_File; 85 86 /* HTS_fopen: wrapper for fopen */ 87 HTS_File *HTS_fopen_from_fn(const char *name, const char *opt); 88 89 /* HTS_fopen_from_fp: wrapper for fopen */ 90 HTS_File *HTS_fopen_from_fp(HTS_File * fp, size_t size); 91 92 /* HTS_fopen_from_data: wrapper for fopen */ 93 HTS_File *HTS_fopen_from_data(void *data, size_t size); 94 95 /* HTS_fclose: wrapper for fclose */ 96 void HTS_fclose(HTS_File * fp); 97 98 /* HTS_fgetc: wrapper for fgetc */ 99 int HTS_fgetc(HTS_File * fp); 100 101 /* HTS_feof: wrapper for feof */ 102 int HTS_feof(HTS_File * fp); 103 104 /* HTS_fseek: wrapper for fseek */ 105 int HTS_fseek(HTS_File * fp, long offset, int origin); 106 107 /* HTS_ftell: wrapper for ftell */ 108 size_t HTS_ftell(HTS_File * fp); 109 110 /* HTS_fread_big_endian: fread with byteswap */ 111 size_t HTS_fread_big_endian(void *buf, size_t size, size_t n, HTS_File * fp); 112 113 /* HTS_fread_little_endian: fread with byteswap */ 114 size_t HTS_fread_little_endian(void *buf, size_t size, size_t n, HTS_File * fp); 115 116 /* HTS_fwrite_little_endian: fwrite with byteswap */ 117 size_t HTS_fwrite_little_endian(const void *buf, size_t size, size_t n, FILE * fp); 118 119 /* HTS_get_pattern_token: get pattern token (single/double quote can be used) */ 120 HTS_Boolean HTS_get_pattern_token(HTS_File * fp, char *buff); 121 122 /* HTS_get_token: get token from file pointer (separators are space,tab,line break) */ 123 HTS_Boolean HTS_get_token_from_fp(HTS_File * fp, char *buff); 124 125 /* HTS_get_token: get token from file pointer with specified separator */ 126 HTS_Boolean HTS_get_token_from_fp_with_separator(HTS_File * fp, char *buff, char separator); 127 128 /* HTS_get_token_from_string: get token from string (separator are space,tab,line break) */ 129 HTS_Boolean HTS_get_token_from_string(const char *string, size_t * index, char *buff); 130 131 /* HTS_get_token_from_string_with_separator: get token from string with specified separator */ 132 HTS_Boolean HTS_get_token_from_string_with_separator(const char *str, size_t * index, char *buff, char separator); 133 134 /* HTS_calloc: wrapper for calloc */ 135 void *HTS_calloc(const size_t num, const size_t size); 136 137 /* HTS_strdup: wrapper for strdup */ 138 char *HTS_strdup(const char *string); 139 140 /* HTS_calloc_matrix: allocate double matrix */ 141 double **HTS_alloc_matrix(size_t x, size_t y); 142 143 /* HTS_free_matrix: free double matrix */ 144 void HTS_free_matrix(double **p, size_t x); 145 146 /* HTS_Free: wrapper for free */ 147 void HTS_free(void *p); 148 149 /* HTS_error: output error message */ 150 void HTS_error(int error, const char *message, ...); 151 152 /* audio ----------------------------------------------------------- */ 153 154 /* HTS_Audio_initialize: initialize audio */ 155 void HTS_Audio_initialize(HTS_Audio * audio); 156 157 /* HTS_Audio_set_parameter: set parameters for audio */ 158 void HTS_Audio_set_parameter(HTS_Audio * audio, size_t sampling_frequency, size_t max_buff_size); 159 160 /* HTS_Audio_write: send data to audio */ 161 void HTS_Audio_write(HTS_Audio * audio, short data); 162 163 /* HTS_Audio_flush: flush remain data */ 164 void HTS_Audio_flush(HTS_Audio * audio); 165 166 /* HTS_Audio_clear: free audio */ 167 void HTS_Audio_clear(HTS_Audio * audio); 168 169 /* model ----------------------------------------------------------- */ 170 171 /* HTS_ModelSet_initialize: initialize model set */ 172 void HTS_ModelSet_initialize(HTS_ModelSet * ms); 173 174 /* HTS_ModelSet_load: load HTS voices */ 175 HTS_Boolean HTS_ModelSet_load(HTS_ModelSet * ms, char **voices, size_t num_voices); 176 177 /* HTS_ModelSet_get_sampling_frequency: get sampling frequency of HTS voices */ 178 size_t HTS_ModelSet_get_sampling_frequency(HTS_ModelSet * ms); 179 180 /* HTS_ModelSet_get_fperiod: get frame period of HTS voices */ 181 size_t HTS_ModelSet_get_fperiod(HTS_ModelSet * ms); 182 183 /* HTS_ModelSet_get_fperiod: get stream option */ 184 const char *HTS_ModelSet_get_option(HTS_ModelSet * ms, size_t stream_index); 185 186 /* HTS_ModelSet_get_gv_flag: get GV flag */ 187 HTS_Boolean HTS_ModelSet_get_gv_flag(HTS_ModelSet * ms, const char *string); 188 189 /* HTS_ModelSet_get_nstate: get number of state */ 190 size_t HTS_ModelSet_get_nstate(HTS_ModelSet * ms); 191 192 /* HTS_Engine_get_fullcontext_label_format: get full-context label format */ 193 const char *HTS_ModelSet_get_fullcontext_label_format(HTS_ModelSet * ms); 194 195 /* HTS_Engine_get_fullcontext_label_version: get full-context label version */ 196 const char *HTS_ModelSet_get_fullcontext_label_version(HTS_ModelSet * ms); 197 198 /* HTS_ModelSet_get_nstream: get number of stream */ 199 size_t HTS_ModelSet_get_nstream(HTS_ModelSet * ms); 200 201 /* HTS_ModelSet_get_nvoices: get number of HTS voices */ 202 size_t HTS_ModelSet_get_nvoices(HTS_ModelSet * ms); 203 204 /* HTS_ModelSet_get_vector_length: get vector length */ 205 size_t HTS_ModelSet_get_vector_length(HTS_ModelSet * ms, size_t stream_index); 206 207 /* HTS_ModelSet_is_msd: get MSD flag */ 208 HTS_Boolean HTS_ModelSet_is_msd(HTS_ModelSet * ms, size_t stream_index); 209 210 /* HTS_ModelSet_get_window_size: get dynamic window size */ 211 size_t HTS_ModelSet_get_window_size(HTS_ModelSet * ms, size_t stream_index); 212 213 /* HTS_ModelSet_get_window_left_width: get left width of dynamic window */ 214 int HTS_ModelSet_get_window_left_width(HTS_ModelSet * ms, size_t stream_index, size_t window_index); 215 216 /* HTS_ModelSet_get_window_right_width: get right width of dynamic window */ 217 int HTS_ModelSet_get_window_right_width(HTS_ModelSet * ms, size_t stream_index, size_t window_index); 218 219 /* HTS_ModelSet_get_window_coefficient: get coefficient of dynamic window */ 220 double HTS_ModelSet_get_window_coefficient(HTS_ModelSet * ms, size_t stream_index, size_t window_index, size_t coefficient_index); 221 222 /* HTS_ModelSet_get_window_max_width: get max width of dynamic window */ 223 size_t HTS_ModelSet_get_window_max_width(HTS_ModelSet * ms, size_t stream_index); 224 225 /* HTS_ModelSet_use_gv: get GV flag */ 226 HTS_Boolean HTS_ModelSet_use_gv(HTS_ModelSet * ms, size_t stream_index); 227 228 /* HTS_ModelSet_get_duration_index: get index of duration tree and PDF */ 229 void HTS_ModelSet_get_duration_index(HTS_ModelSet * ms, size_t voice_index, const char *string, size_t * tree_index, size_t * pdf_index); 230 231 /* HTS_ModelSet_get_duration: get duration using interpolation weight */ 232 void HTS_ModelSet_get_duration(HTS_ModelSet * ms, const char *string, const double *iw, double *mean, double *vari); 233 234 /* HTS_ModelSet_get_parameter_index: get index of parameter tree and PDF */ 235 void HTS_ModelSet_get_parameter_index(HTS_ModelSet * ms, size_t voice_index, size_t stream_index, size_t state_index, const char *string, size_t * tree_index, size_t * pdf_index); 236 237 /* HTS_ModelSet_get_parameter: get parameter using interpolation weight */ 238 void HTS_ModelSet_get_parameter(HTS_ModelSet * ms, size_t stream_index, size_t state_index, const char *string, const double *const *iw, double *mean, double *vari, double *msd); 239 240 void HTS_ModelSet_get_gv_index(HTS_ModelSet * ms, size_t voice_index, size_t stream_index, const char *string, size_t * tree_index, size_t * pdf_index); 241 242 /* HTS_ModelSet_get_gv: get GV using interpolation weight */ 243 void HTS_ModelSet_get_gv(HTS_ModelSet * ms, size_t stream_index, const char *string, const double *const *iw, double *mean, double *vari); 244 245 /* HTS_ModelSet_clear: free model set */ 246 void HTS_ModelSet_clear(HTS_ModelSet * ms); 247 248 /* label ----------------------------------------------------------- */ 249 250 /* HTS_Label_initialize: initialize label */ 251 void HTS_Label_initialize(HTS_Label * label); 252 253 /* HTS_Label_load_from_fn: load label from file name */ 254 void HTS_Label_load_from_fn(HTS_Label * label, size_t sampling_rate, size_t fperiod, const char *fn); 255 256 /* HTS_Label_load_from_strings: load label list from string list */ 257 void HTS_Label_load_from_strings(HTS_Label * label, size_t sampling_rate, size_t fperiod, char **lines, size_t num_lines); 258 259 /* HTS_Label_get_size: get number of label string */ 260 size_t HTS_Label_get_size(HTS_Label * label); 261 262 /* HTS_Label_get_string: get label string */ 263 const char *HTS_Label_get_string(HTS_Label * label, size_t index); 264 265 /* HTS_Label_get_start_frame: get start frame */ 266 double HTS_Label_get_start_frame(HTS_Label * label, size_t index); 267 268 /* HTS_Label_get_end_frame: get end frame */ 269 double HTS_Label_get_end_frame(HTS_Label * label, size_t index); 270 271 /* HTS_Label_clear: free label */ 272 void HTS_Label_clear(HTS_Label * label); 273 274 /* sstream --------------------------------------------------------- */ 275 276 /* HTS_SStreamSet_initialize: initialize state stream set */ 277 void HTS_SStreamSet_initialize(HTS_SStreamSet * sss); 278 279 /* HTS_SStreamSet_create: parse label and determine state duration */ 280 HTS_Boolean HTS_SStreamSet_create(HTS_SStreamSet * sss, HTS_ModelSet * ms, HTS_Label * label, HTS_Boolean phoneme_alignment_flag, double speed, double *duration_iw, double **parameter_iw, double **gv_iw); 281 282 /* HTS_SStreamSet_get_nstream: get number of stream */ 283 size_t HTS_SStreamSet_get_nstream(HTS_SStreamSet * sss); 284 285 /* HTS_SStreamSet_get_vector_length: get vector length */ 286 size_t HTS_SStreamSet_get_vector_length(HTS_SStreamSet * sss, size_t stream_index); 287 288 /* HTS_SStreamSet_is_msd: get MSD flag */ 289 HTS_Boolean HTS_SStreamSet_is_msd(HTS_SStreamSet * sss, size_t stream_index); 290 291 /* HTS_SStreamSet_get_total_state: get total number of state */ 292 size_t HTS_SStreamSet_get_total_state(HTS_SStreamSet * sss); 293 294 /* HTS_SStreamSet_get_total_frame: get total number of frame */ 295 size_t HTS_SStreamSet_get_total_frame(HTS_SStreamSet * sss); 296 297 /* HTS_SStreamSet_get_msd: get msd parameter */ 298 double HTS_SStreamSet_get_msd(HTS_SStreamSet * sss, size_t stream_index, size_t state_index); 299 300 /* HTS_SStreamSet_window_size: get dynamic window size */ 301 size_t HTS_SStreamSet_get_window_size(HTS_SStreamSet * sss, size_t stream_index); 302 303 /* HTS_SStreamSet_get_window_left_width: get left width of dynamic window */ 304 int HTS_SStreamSet_get_window_left_width(HTS_SStreamSet * sss, size_t stream_index, size_t window_index); 305 306 /* HTS_SStreamSet_get_window_right_width: get right width of dynamic window */ 307 int HTS_SStreamSet_get_window_right_width(HTS_SStreamSet * sss, size_t stream_index, size_t window_index); 308 309 /* HTS_SStreamSet_get_window_coefficient: get coefficient of dynamic window */ 310 double HTS_SStreamSet_get_window_coefficient(HTS_SStreamSet * sss, size_t stream_index, size_t window_index, int coefficient_index); 311 312 /* HTS_SStreamSet_get_window_max_width: get max width of dynamic window */ 313 size_t HTS_SStreamSet_get_window_max_width(HTS_SStreamSet * sss, size_t stream_index); 314 315 /* HTS_SStreamSet_use_gv: get GV flag */ 316 HTS_Boolean HTS_SStreamSet_use_gv(HTS_SStreamSet * sss, size_t stream_index); 317 318 /* HTS_SStreamSet_get_duration: get state duration */ 319 size_t HTS_SStreamSet_get_duration(HTS_SStreamSet * sss, size_t state_index); 320 321 /* HTS_SStreamSet_get_mean: get mean parameter */ 322 double HTS_SStreamSet_get_mean(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index); 323 324 /* HTS_SStreamSet_set_mean: set mean parameter */ 325 void HTS_SStreamSet_set_mean(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index, double f); 326 327 /* HTS_SStreamSet_get_vari: get variance parameter */ 328 double HTS_SStreamSet_get_vari(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index); 329 330 /* HTS_SStreamSet_set_vari: set variance parameter */ 331 void HTS_SStreamSet_set_vari(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, size_t vector_index, double f); 332 333 /* HTS_SStreamSet_get_gv_mean: get GV mean parameter */ 334 double HTS_SStreamSet_get_gv_mean(HTS_SStreamSet * sss, size_t stream_index, size_t vector_index); 335 336 /* HTS_SStreamSet_get_gv_mean: get GV variance parameter */ 337 double HTS_SStreamSet_get_gv_vari(HTS_SStreamSet * sss, size_t stream_index, size_t vector_index); 338 339 /* HTS_SStreamSet_set_gv_switch: set GV switch */ 340 void HTS_SStreamSet_set_gv_switch(HTS_SStreamSet * sss, size_t stream_index, size_t state_index, HTS_Boolean i); 341 342 /* HTS_SStreamSet_get_gv_switch: get GV switch */ 343 HTS_Boolean HTS_SStreamSet_get_gv_switch(HTS_SStreamSet * sss, size_t stream_index, size_t state_index); 344 345 /* HTS_SStreamSet_clear: free state stream set */ 346 void HTS_SStreamSet_clear(HTS_SStreamSet * sss); 347 348 /* pstream --------------------------------------------------------- */ 349 350 /* check variance in finv() */ 351 #define INFTY ((double) 1.0e+38) 352 #define INFTY2 ((double) 1.0e+19) 353 #define INVINF ((double) 1.0e-38) 354 #define INVINF2 ((double) 1.0e-19) 355 356 /* GV */ 357 #define STEPINIT 0.1 358 #define STEPDEC 0.5 359 #define STEPINC 1.2 360 #define W1 1.0 361 #define W2 1.0 362 #define GV_MAX_ITERATION 5 363 364 /* HTS_PStreamSet_initialize: initialize parameter stream set */ 365 void HTS_PStreamSet_initialize(HTS_PStreamSet * pss); 366 367 /* HTS_PStreamSet_create: parameter generation using GV weight */ 368 HTS_Boolean HTS_PStreamSet_create(HTS_PStreamSet * pss, HTS_SStreamSet * sss, double *msd_threshold, double *gv_weight); 369 370 /* HTS_PStreamSet_get_nstream: get number of stream */ 371 size_t HTS_PStreamSet_get_nstream(HTS_PStreamSet * pss); 372 373 /* HTS_PStreamSet_get_static_length: get features length */ 374 size_t HTS_PStreamSet_get_vector_length(HTS_PStreamSet * pss, size_t stream_index); 375 376 /* HTS_PStreamSet_get_total_frame: get total number of frame */ 377 size_t HTS_PStreamSet_get_total_frame(HTS_PStreamSet * pss); 378 379 /* HTS_PStreamSet_get_parameter: get parameter */ 380 double HTS_PStreamSet_get_parameter(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index, size_t vector_index); 381 382 /* HTS_PStreamSet_get_parameter_vector: get parameter vector */ 383 double *HTS_PStreamSet_get_parameter_vector(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index); 384 385 /* HTS_PStreamSet_get_msd_flag: get generated MSD flag per frame */ 386 HTS_Boolean HTS_PStreamSet_get_msd_flag(HTS_PStreamSet * pss, size_t stream_index, size_t frame_index); 387 388 /* HTS_PStreamSet_is_msd: get MSD flag */ 389 HTS_Boolean HTS_PStreamSet_is_msd(HTS_PStreamSet * pss, size_t stream_index); 390 391 /* HTS_PStreamSet_clear: free parameter stream set */ 392 void HTS_PStreamSet_clear(HTS_PStreamSet * pss); 393 394 /* gstream --------------------------------------------------------- */ 395 396 /* HTS_GStreamSet_initialize: initialize generated parameter stream set */ 397 void HTS_GStreamSet_initialize(HTS_GStreamSet * gss); 398 399 /* HTS_GStreamSet_create: generate speech */ 400 HTS_Boolean HTS_GStreamSet_create(HTS_GStreamSet * gss, HTS_PStreamSet * pss, size_t stage, HTS_Boolean use_log_gain, size_t sampling_rate, size_t fperiod, double alpha, double beta, HTS_Boolean * stop, double volume, HTS_Audio * audio); 401 402 /* HTS_GStreamSet_get_total_nsamples: get total number of sample */ 403 size_t HTS_GStreamSet_get_total_nsamples(HTS_GStreamSet * gss); 404 405 /* HTS_GStreamSet_get_total_frame: get total number of frame */ 406 size_t HTS_GStreamSet_get_total_frame(HTS_GStreamSet * gss); 407 408 /* HTS_GStreamSet_get_static_length: get features length */ 409 size_t HTS_GStreamSet_get_vector_length(HTS_GStreamSet * gss, size_t stream_index); 410 411 /* HTS_GStreamSet_get_speech: get synthesized speech parameter */ 412 double HTS_GStreamSet_get_speech(HTS_GStreamSet * gss, size_t sample_index); 413 414 /* HTS_GStreamSet_get_parameter: get generated parameter */ 415 double HTS_GStreamSet_get_parameter(HTS_GStreamSet * gss, size_t stream_index, size_t frame_index, size_t vector_index); 416 417 /* HTS_GStreamSet_clear: free generated parameter stream set */ 418 void HTS_GStreamSet_clear(HTS_GStreamSet * gss); 419 420 /* vocoder --------------------------------------------------------- */ 421 422 #ifndef LZERO 423 #define LZERO (-1.0e+10) /* ~log(0) */ 424 #endif /* !LZERO */ 425 426 #ifndef ZERO 427 #define ZERO (1.0e-10) /* ~(0) */ 428 #endif /* !ZERO */ 429 430 #ifndef PI 431 #define PI 3.14159265358979323846 432 #endif /* !PI */ 433 434 #ifndef PI2 435 #define PI2 6.28318530717958647692 436 #endif /* !PI2 */ 437 438 #define RANDMAX 32767 439 440 #define SEED 1 441 #define B0 0x00000001 442 #define B28 0x10000000 443 #define B31 0x80000000 444 #define B31_ 0x7fffffff 445 #define Z 0x00000000 446 447 #ifdef HTS_EMBEDDED 448 #define GAUSS FALSE 449 #define PADEORDER 4 /* pade order (for MLSA filter) */ 450 #define IRLENG 384 /* length of impulse response */ 451 #else 452 #define GAUSS TRUE 453 #define PADEORDER 5 454 #define IRLENG 576 455 #endif /* HTS_EMBEDDED */ 456 457 #define CHECK_LSP_STABILITY_MIN 0.25 458 #define CHECK_LSP_STABILITY_NUM 4 459 460 /* for MGLSA filter */ 461 #define NORMFLG1 TRUE 462 #define NORMFLG2 FALSE 463 #define MULGFLG1 TRUE 464 #define MULGFLG2 FALSE 465 #define NGAIN FALSE 466 467 /* HTS_Vocoder: structure for setting of vocoder */ 468 typedef struct _HTS_Vocoder { 469 HTS_Boolean is_first; 470 size_t stage; /* Gamma=-1/stage: if stage=0 then Gamma=0 */ 471 double gamma; /* Gamma */ 472 HTS_Boolean use_log_gain; /* log gain flag (for LSP) */ 473 size_t fprd; /* frame shift */ 474 unsigned long next; /* temporary variable for random generator */ 475 HTS_Boolean gauss; /* flag to use Gaussian noise */ 476 double rate; /* sampling rate */ 477 double pitch_of_curr_point; /* used in excitation generation */ 478 double pitch_counter; /* used in excitation generation */ 479 double pitch_inc_per_point; /* used in excitation generation */ 480 double *excite_ring_buff; /* used in excitation generation */ 481 size_t excite_buff_size; /* used in excitation generation */ 482 size_t excite_buff_index; /* used in excitation generation */ 483 unsigned char sw; /* switch used in random generator */ 484 int x; /* excitation signal */ 485 double *freqt_buff; /* used in freqt */ 486 size_t freqt_size; /* buffer size for freqt */ 487 double *spectrum2en_buff; /* used in spectrum2en */ 488 size_t spectrum2en_size; /* buffer size for spectrum2en */ 489 double r1, r2, s; /* used in random generator */ 490 double *postfilter_buff; /* used in postfiltering */ 491 size_t postfilter_size; /* buffer size for postfiltering */ 492 double *c, *cc, *cinc, *d1; /* used in the MLSA/MGLSA filter */ 493 double *lsp2lpc_buff; /* used in lsp2lpc */ 494 size_t lsp2lpc_size; /* buffer size of lsp2lpc */ 495 double *gc2gc_buff; /* used in gc2gc */ 496 size_t gc2gc_size; /* buffer size for gc2gc */ 497 } HTS_Vocoder; 498 499 /* HTS_Vocoder_initialize: initialize vocoder */ 500 void HTS_Vocoder_initialize(HTS_Vocoder * v, size_t m, size_t stage, HTS_Boolean use_log_gain, size_t rate, size_t fperiod); 501 502 /* HTS_Vocoder_synthesize: pulse/noise excitation and MLSA/MGLSA filster based waveform synthesis */ 503 void HTS_Vocoder_synthesize(HTS_Vocoder * v, size_t m, double lf0, double *spectrum, size_t nlpf, double *lpf, double alpha, double beta, double volume, double *rawdata, HTS_Audio * audio); 504 505 /* HTS_Vocoder_clear: clear vocoder */ 506 void HTS_Vocoder_clear(HTS_Vocoder * v); 507 508 HTS_HIDDEN_H_END; 509 510 #endif /* !HTS_HIDDEN_H */ 511