/*************************************************************************/ /* */ /* Language Technologies Institute */ /* Carnegie Mellon University */ /* Copyright (c) 2007 */ /* All Rights Reserved. */ /* */ /* Permission is hereby granted, free of charge, to use and distribute */ /* this software and its documentation without restriction, including */ /* without limitation the rights to use, copy, modify, merge, publish, */ /* distribute, sublicense, and/or sell copies of this work, and to */ /* permit persons to whom this work is furnished to do so, subject to */ /* the following conditions: */ /* 1. The code must retain the above copyright notice, this list of */ /* conditions and the following disclaimer. */ /* 2. Any modifications must be clearly marked as such. */ /* 3. Original authors' names are not deleted. */ /* 4. The authors' names are not used to endorse or promote products */ /* derived from this software without specific prior written */ /* permission. */ /* */ /* CARNEGIE MELLON UNIVERSITY AND THE CONTRIBUTORS TO THIS WORK */ /* DISCLAIM ALL WARRANTIES WITH REGARD TO THIS SOFTWARE, INCLUDING */ /* ALL IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS, IN NO EVENT */ /* SHALL CARNEGIE MELLON UNIVERSITY NOR THE CONTRIBUTORS BE LIABLE */ /* FOR ANY SPECIAL, INDIRECT OR CONSEQUENTIAL DAMAGES OR ANY DAMAGES */ /* WHATSOEVER RESULTING FROM LOSS OF USE, DATA OR PROFITS, WHETHER IN */ /* AN ACTION OF CONTRACT, NEGLIGENCE OR OTHER TORTIOUS ACTION, */ /* ARISING OUT OF OR IN CONNECTION WITH THE USE OR PERFORMANCE OF */ /* THIS SOFTWARE. */ /* */ /*************************************************************************/ /* Author: Alan W Black (awb@cs.cmu.edu) */ /* Date: November 2007 */ /*************************************************************************/ /* */ /* clustergen db */ /* */ /* A statistical corpus based synthesizer. */ /* See Black, A. (2006), CLUSTERGEN: A Statistical Parametric */ /* Synthesizer using Trajectory Modeling", Interspeech 2006 - ICSLP, */ /* Pittsburgh, PA. */ /* http://www.cs.cmu.edu/~awb/papers/is2006/IS061394.PDF */ /* */ /*************************************************************************/ #ifndef _CST_CG_H__ #define _CST_CG_H__ #include "cst_cart.h" #include "cst_track.h" #include "cst_wave.h" #include "cst_audio.h" #include "cst_synth.h" /* for dur_stat */ typedef struct cst_cg_db_struct { const char *name; const char * const *types; int num_types; const int sample_rate; float f0_mean, f0_stddev; /* Cluster trees */ const cst_cart * const *f0_trees; const cst_cart * const *param_trees0; /* single or static */ const cst_cart * const *param_trees1; /* deltas */ const cst_cart * const *param_trees2; /* me str */ /* Model params e.g. mceps, deltas intersliced with stddevs */ const int num_channels0; const int num_frames0; const unsigned short * const * model_vectors0; const int num_channels1; const int num_frames1; const unsigned short * const * model_vectors1; const int num_channels2; const int num_frames2; const unsigned short * const * model_vectors2; /* Currently shared between different models */ const float *model_min; /* for vector coeffs encoding */ const float *model_range; /* for vector coeffs encoding */ const float frame_advance; /* duration model (cart + phonedurs) */ const dur_stat * const *dur_stats; const cst_cart *dur_cart; /* phone to states map */ const char * const * const *phone_states; /* Other parameters */ const int do_mlpg; /* implies deltas are in the model_vectors */ const float *dynwin; const int dynwinsize; const float mlsa_alpha; const float mlsa_beta; const int multimodel; const int mixed_excitation; /* filters for Mixed Excitation */ const int ME_num; const int ME_order; const double * const *me_h; const float gain; } cst_cg_db; /* Access model parameters, unpacking them as required */ #define CG_MODEL_VECTOR(M,N,X,Y) \ (M->model_min[Y]+((float)(M->N[X][Y])/65535.0*M->model_range[Y])) CST_VAL_USER_TYPE_DCLS(cg_db,cst_cg_db) cst_utterance *cg_synth(cst_utterance *utt); cst_wave *mlsa_resynthesis(const cst_track *t, const cst_track *str, cst_cg_db *cg_db, cst_audio_streaming_info *asc); cst_track *mlpg(const cst_track *param_track, cst_cg_db *cg_db); #endif