00001
00036
00037
00038
00039
00040
00041
00042
00043 #ifndef __SENT_VOCA_H__
00044 #define __SENT_VOCA_H__
00045
00046 #include <sent/stddefs.h>
00047 #include <sent/htk_hmm.h>
00048
00050 #define MAXWSTEP 4000
00051
00053 typedef struct {
00054 WORD_ID maxnum;
00055 WORD_ID num;
00056 WORD_ID errnum;
00057 WORD_ID linenum;
00058 boolean do_conv;
00059 boolean ok_flag;
00060
00061 unsigned char *wlen;
00062
00063 char **wname;
00064 char **woutput;
00065 HMM_Logical ***wseq;
00066 WORD_ID *wton;
00067 #ifdef CLASS_NGRAM
00068 LOGPROB *cprob;
00069 WORD_ID cwnum;
00070 #endif
00071 WORD_ID head_silwid;
00072 WORD_ID tail_silwid;
00073 short maxwn;
00074 short maxwlen;
00075 int totalstatenum;
00076 int totalmodelnum;
00077 int totaltransnum;
00078 boolean *is_transparent;
00079 APATNODE *errph_root;
00080 BMALLOC_BASE *mroot;
00081 } WORD_INFO;
00082
00083 WORD_INFO *word_info_new();
00084 void word_info_free(WORD_INFO *winfo);
00085 void winfo_init(WORD_INFO *winfo);
00086 boolean winfo_expand(WORD_INFO *winfo);
00087 boolean init_voca(WORD_INFO *winfo, char *filename, HTK_HMM_INFO *hmminfo, boolean, boolean);
00088 boolean init_wordlist(WORD_INFO *winfo, char *filename, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone, boolean force_dict);
00089 void voca_set_stats(WORD_INFO *winfo);
00090 void voca_load_start(WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, boolean ignore_tri_conv);
00091 boolean voca_load_line(char *buf, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo);
00092 boolean voca_load_end(WORD_INFO *winfo);
00093 boolean voca_load_htkdict(FILE *, WORD_INFO *, HTK_HMM_INFO *, boolean);
00094 boolean voca_load_htkdict_fp(FILE *, WORD_INFO *, HTK_HMM_INFO *, boolean);
00095 boolean voca_append_htkdict(char *entry, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, boolean ignore_tri_conv);
00096 boolean voca_append(WORD_INFO *dstinfo, WORD_INFO *srcinfo, int coffset, int woffset);
00097 boolean voca_load_htkdict_line(char *buf, WORD_ID *vnum, int linenum, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, boolean do_conv, boolean *ok_flag);
00098
00099 boolean voca_load_word_line(char *buf, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailpohone, char *contextphone);
00100 boolean voca_load_wordlist(FILE *fp, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone);
00101 boolean voca_load_wordlist_fp(FILE *fp, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, char *headphone, char *tailphone, char *contextphone);
00102 boolean voca_load_wordlist_line(char *buf, WORD_ID *vnum, int linenum, WORD_INFO *winfo, HTK_HMM_INFO *hmminfo, boolean do_conv, boolean *ok_flag, char *headphone, char *tailphone, char *contextphone);
00103 boolean voca_mono2tri(WORD_INFO *winfo, HTK_HMM_INFO *hmminfo);
00104 WORD_ID voca_lookup_wid(char *, WORD_INFO *);
00105 WORD_ID *new_str2wordseq(WORD_INFO *, char *, int *);
00106 char *cycle_triphone(char *p);
00107 char *cycle_triphone_flush();
00108 void print_voca_info(FILE *fp, WORD_INFO *);
00109 void put_voca(FILE *fp, WORD_INFO *winfo, WORD_ID wid);
00110
00111
00112 boolean make_base_phone(HTK_HMM_INFO *hmminfo, WORD_INFO *winfo);
00113 void print_phone_info(FILE *fp, HTK_HMM_INFO *hmminfo);
00114 void print_all_basephone_detail(HMM_basephone *base);
00115 void print_all_basephone_name(HMM_basephone *base);
00116 void test_interword_triphone(HTK_HMM_INFO *hmminfo, WORD_INFO *winfo);
00117
00118 #endif