/*---------------------------------------------------------------------------* * run_seq_lts.c * * * * Copyright 2007, 2008 Nuance Communciations, Inc. * * * * Licensed under the Apache License, Version 2.0 (the 'License'); * * you may not use this file except in compliance with the License. * * * * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * * * Unless required by applicable law or agreed to in writing, software * * distributed under the License is distributed on an 'AS IS' BASIS, * * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * * See the License for the specific language governing permissions and * * limitations under the License. * * * *---------------------------------------------------------------------------*/ #include #include #include #include #ifndef NO_STDERR #include #else extern void PrintError(char *msg, unsigned long p1, unsigned long p2, unsigned long p3); #endif #include "passert.h" #include "pmemory.h" #include "plog.h" #include "phashtable.h" #include "lts_error.h" #include "lts.h" #include "lts_seq_internal.h" #include "port_fileio.h" #include "platform_utils.h" /* strdup, safe_strtok, etc */ #define ASSERT(x) passert(x) #ifdef TI_DSP #include "tidsp_defines.h" #endif #ifdef _DEBUG #define PRINT_LOAD_TREE_SUMMARY 0 #define PRINT_LOAD_TREE 0 #define PRINT_CONS_COMB 0 #define PRINT_DP_LETTER 0 #define PRINT_LTS_WORD 0 #define PRINT_DICT_LOOKUP 0 #endif #define LTS_MARKER_WORD_START "WS" #define LTS_MARKER_PRON_START "PS" #define LTS_MARKER_SYLL_START "SS" #define LTS_MARKER_SYLL_START_DD "SS%d" #define LTS_MARKER_PIPESEP "|" #define LTS_MARKER_PIPESEP_CHAR '|' static int load_int(PORT_FILE *fp); static SWIsltsResult load_lquestions(LQUESTION ***pquestions, int *pnum_questions, PORT_FILE *fp); static SWIsltsResult free_lquestions(LQUESTION ** questions, int num_questions); static SWIsltsResult load_letter_mapping(PORT_FILE *fp, LM **ppLetterMap); static SWIsltsResult free_letter_mapping(LM *lm); static SWIsltsResult load_phone_mapping(PORT_FILE *fp, PM **ppPhoneMap); static SWIsltsResult free_phone_mapping(PM *pm); static SWIsltsResult load_outputs(char ***poutputs, char ***pinputs, int *pnum, PORT_FILE *fp); static SWIsltsResult free_outputs(char **outputs, char **inputs, int num); static SWIsltsResult load_trees(RT_LTREE ***ptrees, int *num_letters, LQUESTION ***pquestions, int *num_questions, LM **plm, PORT_FILE *fp); static SWIsltsResult free_trees(RT_LTREE **trees, int num_letters, LQUESTION **questions, int num_questions, LM *lm); static SWIsltsResult load_allowable_cons_comb(LTS *lts, PORT_FILE *fp); static SWIsltsResult free_allowable_cons_comb(LTS *lts); static SWIsltsResult load_question_strings(LTS* lts, PORT_FILE* fp); static SWIsltsResult free_question_strings(LTS* lts); #define find_letter_index( myLet, myLM) (myLM->letter_index_for_letter[ toupper(myLet)]) int find_phone(const char *ph, PM *pm); int find_best_string(const char *str, LTS* lts); int find_best_prefix_string(const char *str, LTS* lts); int fill_up_dp_for_letter(LTS *lts, const char *input_word, int word_len, int index, int root_start, int root_end, int left_phone); #define in_list(myV, myQ) (bitarray_read_bit( myQ->membership, myV)) #define qmatches(myQ, myU) (in_list( myU->properties[ myQ->type], myQ)) int matches(LQUESTION *q1, LQUESTION *q2, int type, LDP *dp) ; int find_output_for_dp(LTS *lts, int *pbackoff_output); int add_output(char *output, char **output_phone_string, int out_len, int max_phone_length); int is_allowable_cons_comb(LTS *lts, const char *cons_string); void adjust_syllable_boundaries(LTS *lts, char **output_phone_string, int num_out, int max_phone_length); SWIsltsResult lts_for_word(LTS *lts, char *word, int word_len, char **output_phone_string, int max_phone_length, int *num_out); /*------------ * * bitarray * *-----------*/ #define bitarray_read_bit( biTs, iBiT) ( biTs[iBiT/16] & (1<<((iBiT)%16)) ) /* int bitarray_read_bit( unsigned short* bits, int iBit) { // ASSERT( iBit<256); return bits[iBit/16] & (1<<((iBit)%16)); } */ void bitarray_write_bit( unsigned short* bits, int iBit, int iVal) { unsigned short sect; ASSERT( iBit<256); sect = bits[iBit/16]; if(iVal) { sect |= (1<<(iBit%16)); } else { sect &= ~(1<<(iBit%16)); } bits[ iBit/16] = sect; } void bitarray_populate_from_list(unsigned short* bits, char* list, int listlen) { unsigned int i; for(i=0; itype), sizeof(char), 1, fp); PORT_FREAD_CHAR(&(questions[i]->num_list), sizeof(char), 1, fp); questions[i]->list = (unsigned char*) lts_alloc(questions[i]->num_list, sizeof(unsigned char)); if (questions[i]->list == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } PORT_FREAD_CHAR(questions[i]->list, sizeof(char), (questions[i]->num_list), fp); bitarray_populate_from_list( questions[i]->membership, (char*) questions[i]->list, questions[i]->num_list); } *pnum_questions = num_questions; return SWIsltsSuccess; CLEAN_UP: free_lquestions(questions, num_questions); *pnum_questions = 0; *pquestions = NULL; return nRes; } /* deallocate questions */ static SWIsltsResult free_lquestions(LQUESTION ** questions, int num_questions) { SWIsltsResult nRes = SWIsltsSuccess; int i; if (questions) { for (i=0; ilist) { FREE(questions[i]->list); questions[i]->list = NULL; } FREE(questions[i]); questions[i] = NULL; } FREE(questions); } return nRes; } static SWIsltsResult load_letter_mapping(PORT_FILE *fp, LM **ppLetterMap) { SWIsltsResult nRes = SWIsltsSuccess; unsigned char len; LM * lm; int i; /* pfprintf(PSTDOUT,"got len %d\n", len);*/ lm = (LM*) lts_alloc(1, sizeof(LM)); if (lm == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } PORT_FREAD_CHAR(&len, sizeof(char), 1, fp); lm->num_letters = len; lm->letters = (char*) lts_alloc(len, sizeof(char)); if (lm->letters == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } lm->type = (char*) lts_alloc(len, sizeof(char)); if (lm->type == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } PORT_FREAD_CHAR(lm->letters, sizeof(char), len, fp); PORT_FREAD_CHAR(lm->type, sizeof(char), len, fp); { unsigned int letter; for (letter=0; letter <= UCHAR_MAX; letter++) lm->letter_index_for_letter[letter] = LTS_MAXCHAR; } for (i=0;iletters[i]); lm->letters[i] = letter; lm->letter_index_for_letter[(unsigned char)letter] = i; } *ppLetterMap = lm; return SWIsltsSuccess; CLEAN_UP: free_letter_mapping(lm); *ppLetterMap = NULL; return nRes; } /* deallocate letter mapping */ static SWIsltsResult free_letter_mapping(LM *lm) { SWIsltsResult nRes = SWIsltsSuccess; if (lm) { if (lm->letters) { FREE(lm->letters); lm->letters = NULL; } if (lm->type) { FREE(lm->type); lm->type = NULL; } lm->num_letters = 0; FREE(lm); } return nRes; } static SWIsltsResult load_phone_mapping(PORT_FILE *fp, PM **ppPhoneMap) { SWIsltsResult nRes = SWIsltsSuccess; PM * pm; int i; unsigned char len; char * ph; pm = (PM*) lts_alloc(1, sizeof(PM)); if (pm == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } pm->num_phones = load_int(fp); pm->phones = (char**) lts_alloc(pm->num_phones, sizeof(char*)); if (pm->phones == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } for (i=0;inum_phones;i++) { PORT_FREAD_CHAR(&len, sizeof(unsigned char), 1, fp); pm->phoneH = NULL; pm->phones[i] = ph = (char*) lts_alloc(len+1, sizeof(char)); if (ph == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } PORT_FREAD_CHAR(ph, sizeof(char), len, fp); ph[len] = '\0'; } pm->phoneH = my_PHashTableCreate_FromStrings( (const char**)pm->phones, pm->num_phones, L("lts.phoneH")); if(pm->phoneH == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } *ppPhoneMap = pm; return SWIsltsSuccess; CLEAN_UP: free_phone_mapping(pm); *ppPhoneMap = NULL; return nRes; } /* deallocate phone mapping */ static SWIsltsResult free_phone_mapping(PM *pm) { SWIsltsResult nRes = SWIsltsSuccess; int i; if (pm) { if (pm->phones) { for (i=0; inum_phones; i++) { if (pm->phones[i]) { FREE(pm->phones[i]); pm->phones[i] = NULL; } } FREE(pm->phones); pm->phones = NULL; } if(pm->phoneH) PHashTableDestroy( (PHashTable*)pm->phoneH); pm->phoneH = NULL; FREE(pm); } return nRes; } static SWIsltsResult load_outputs(char ***poutputs, char ***pinputs, int *pnum, PORT_FILE *fp) { SWIsltsResult nRes = SWIsltsSuccess; int i; char ** outputs = NULL; char ** inputs = NULL; int num; unsigned char olen; char * out; unsigned char ilen; char * in; num = load_int(fp); *poutputs = outputs = (char **) lts_alloc(num, sizeof(char*)); if (outputs == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } *pinputs = inputs = (char **) lts_alloc(num, sizeof(char*)); if (inputs == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } for (i=0;i 0) { PORT_FREAD_CHAR(out, sizeof(char), olen, fp); } out[olen] = '\0'; PORT_FREAD_CHAR(&ilen, sizeof(char), 1, fp); in = inputs[i] = lts_alloc(ilen + 1, sizeof(char)); if (in == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } if (ilen > 0) { PORT_FREAD_CHAR(in, sizeof(char), ilen, fp); } in[ilen] = '\0'; #if PRINT_LOAD_TREE if (ilen > 0) pfprintf(PSTDOUT,"LOAD_TREE: got input %s out %s\n", in, outputs[i]); pfprintf(PSTDOUT,"LOAD_TREE: outputs[%d] len %d out %x out %s\n", i, olen, outputs[i], outputs[i]); #endif } *pnum = num; return SWIsltsSuccess; CLEAN_UP: free_outputs(outputs, inputs, num); *poutputs = NULL; *pinputs = NULL; *pnum = 0; return nRes; } static SWIsltsResult free_outputs(char **outputs, char **inputs, int num) { SWIsltsResult nRes = SWIsltsSuccess; int i; if (outputs) { for (i=0; inum_letters) { #ifndef NO_STDERR PLogError(L("Error loading data, num_letters %d doesn't match num from mapping %d\n"), *num_letters, (*plm)->num_letters); #endif nRes = SWIsltsInternalErr; goto CLEAN_UP; } *ptrees = trees = (RT_LTREE**) lts_alloc(*num_letters, sizeof(RT_LTREE*)); if (trees == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } for (let=0;let<*num_letters;let++) { /* pfprintf(PSTDOUT,"loading for t %d\n", t);*/ trees[let] = tree = (RT_LTREE*) lts_alloc(1, sizeof(RT_LTREE)); if (tree == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } tree->num_nodes = load_int(fp); tree->values_or_question1 = (short*) lts_alloc(tree->num_nodes, sizeof(short)); if (tree->values_or_question1 == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } tree->question2 = (short*) lts_alloc(tree->num_nodes, sizeof(short)); if (tree->question2 == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } tree->left_nodes = (short *) lts_alloc(tree->num_nodes, sizeof(short)); if (tree->left_nodes == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } #if PRINT_LOAD_TREE pfprintf(PSTDOUT,"LOAD_TREE: Tree for let %d num_nodes %d\n", let, tree->num_nodes); #endif for (i=0;inum_nodes;i++) { PORT_FREAD_INT16(&(tree->left_nodes[i]), sizeof(short), 1, fp); PORT_FREAD_INT16(&(tree->values_or_question1[i]), sizeof(short), 1, fp); #if PRINT_LOAD_TREE pfprintf(PSTDOUT,"LOAD_TREE: node[%d] %d %d", i, tree->left_nodes[i], tree->values_or_question1[i]); #endif PORT_FREAD_INT16(&(tree->question2[i]), sizeof(short), 1, fp); if (tree->left_nodes[i] != NO_NODE) { if (tree->question2[i] == -1) tree->question2[i] = 0; #if PRINT_LOAD_TREE pfprintf(PSTDOUT," %x", (unsigned short) tree->question2[i]); #endif } #if PRINT_LOAD_TREE pfprintf(PSTDOUT,"\n"); #endif } } return SWIsltsSuccess; CLEAN_UP: free_trees(trees, *num_letters, *pquestions, *num_questions, *plm); *ptrees = NULL; *pquestions = NULL; *plm = NULL; *num_letters = 0; *num_questions = 0; return nRes; } /* deallocate trees */ static SWIsltsResult free_trees(RT_LTREE **trees, int num_letters, LQUESTION **questions, int num_questions, LM *lm) { SWIsltsResult nRes = SWIsltsSuccess; int i; RT_LTREE * tree; if (lm) { free_letter_mapping(lm); } if (questions) { free_lquestions(questions, num_questions); } if (trees) { for (i=0; ivalues_or_question1) { FREE(tree->values_or_question1); tree->values_or_question1 = NULL; } if (tree->question2) { FREE(tree->question2); tree->question2 = NULL; } if (tree->left_nodes) { FREE(tree->left_nodes); tree->left_nodes = NULL; } FREE(trees[i]); trees[i] = NULL; } } FREE(trees); } return nRes; } static SWIsltsResult load_allowable_cons_comb(LTS *lts, PORT_FILE *fp) { SWIsltsResult nRes = SWIsltsSuccess; char line[50]; char tempstr[50]; char * tok; int i, toklen; int count; char seps[] = " \n"; lts->num_cons_comb = 0; lts->allowable_cons_combH = NULL; while (PORT_FGETS(line, 50, fp)) { #ifndef TI_DSP /*need to get rid of sme crud at the end of the line because it is being read in binary mode*/ for (i=strlen(line)-1;i>=0;i--) { if (!isalpha(line[i])) line[i] = ' '; } #endif count = 0; tok = safe_strtok(line, seps, &toklen); tempstr[0] = '\0'; /* get all available sequence of tokens */ while(tok && toklen > 0){ count += toklen; strncat(tempstr, tok, toklen); tempstr[count+1] = '\0'; strcat(tempstr, " "); count++; tok = safe_strtok(tok+toklen, seps, &toklen); } if (count > 0) { /* delete the final space */ tempstr[count-1] = '\0'; lts->allowable_cons_comb[lts->num_cons_comb] = (char*) lts_alloc(strlen(tempstr)+1, sizeof(char)); if (lts->allowable_cons_comb[lts->num_cons_comb] == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } strcpy(lts->allowable_cons_comb[lts->num_cons_comb], tempstr); #if PRINT_CONS_COMB pfprintf(PSTDOUT,"LOAD_TREE: allowable_cons_comb[%d]: %s\n", lts->num_cons_comb, tempstr); #endif lts->num_cons_comb++; if (lts->num_cons_comb >= MAX_CONS_COMB) { #ifndef NO_STDERR PLogError(L("MAX_CONS_COMB %d exceeded\n"), MAX_CONS_COMB); #endif nRes = SWIsltsInternalErr; goto CLEAN_UP; } } } if (lts->num_cons_comb == 0) { #ifndef NO_STDERR PLogError(L("Warning: the data file is missing consonant combinations - syllable boundaries will be incorrect\n")); #endif } lts->allowable_cons_combH = my_PHashTableCreate_FromStrings( (const char**)lts->allowable_cons_comb, lts->num_cons_comb, L("lts.allowable_cons_combH")); if(lts->allowable_cons_combH == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } #if PRINT_LOAD_TREE_SUMMARY pfprintf(PSTDOUT,"loaded %d cons combinations\n", lts->num_cons_comb); #endif return SWIsltsSuccess; CLEAN_UP: free_allowable_cons_comb(lts); return nRes; } static SWIsltsResult free_allowable_cons_comb(LTS *lts) { SWIsltsResult nRes = SWIsltsSuccess; int i; for (i=0; inum_cons_comb; i++) { if (lts->allowable_cons_comb[i]) { FREE(lts->allowable_cons_comb[i]); lts->allowable_cons_comb[i] = NULL; } } if(lts->allowable_cons_combH) PHashTableDestroy( (PHashTable*)lts->allowable_cons_combH); lts->allowable_cons_combH = NULL; return nRes; } static SWIsltsResult load_question_strings(LTS* lts, PORT_FILE* fp) { SWIsltsResult nRes = SWIsltsSuccess; int i; int num; unsigned char len; char ** strings; char * str; num = load_int(fp); lts->strings = strings = (char **) lts_alloc(num, sizeof(char*)); lts->string_lens = (char*)lts_alloc(num, sizeof(char)); if (strings == NULL || lts->string_lens == NULL ) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } for (i=0;i 0) { PORT_FREAD_CHAR(str, sizeof(char), len, fp); } str[len] = '\0'; bitarray_populate_from_list( lts->membership, lts->strings[i], len); lts->string_lens[i] = strlen(lts->strings[i]); } // *pnum = num; lts->num_strings = num; return SWIsltsSuccess; CLEAN_UP: free_question_strings(lts); return nRes; } /* deallocate question strings */ static SWIsltsResult free_question_strings(LTS* lts) { SWIsltsResult nRes = SWIsltsSuccess; int i; if (lts->strings) { for (i=0;inum_strings;i++) { if (lts->strings[i]) { FREE(lts->strings[i]); lts->strings[i] = NULL; } } FREE(lts->strings); if(lts->string_lens) FREE(lts->string_lens); lts->strings = NULL; lts->string_lens = NULL; } return nRes; } SWIsltsResult create_lts(char *data_filename, LTS_HANDLE *phLts) { SWIsltsResult nRes = SWIsltsSuccess; LTS * lts; #ifdef USE_STATIC_SLTS /* TODO: language-specific ID here? */ lts = &g_lts; #else /* !USE_STATIC_SLTS */ PORT_FILE *fp; lts = (LTS*) lts_alloc(1, sizeof(LTS)); if (lts == NULL) { nRes = SWIsltsErrAllocResource; goto CLEAN_UP; } fp = PORT_FOPEN(data_filename, "rb"); if (fp == NULL) { #ifndef NO_STDERR PLogError(L("Cannot open %s\n"), data_filename); #endif nRes = SWIsltsFileOpenErr; goto CLEAN_UP; } nRes = load_phone_mapping(fp, <s->phone_mapping); if (nRes != SWIsltsSuccess) { PLogError(L("SWIsltsErr: load_phone_mapping() failed: Err_code = %d\n"), nRes); goto CLEAN_UP; } nRes = load_question_strings(lts, fp); if (nRes != SWIsltsSuccess) { PLogError(L("SWIsltsErr: load_question_strings() failed: Err_code = %d\n"), nRes); goto CLEAN_UP; } nRes = load_outputs(&(lts->outputs), &(lts->input_for_output), <s->num_outputs, fp); if (nRes != SWIsltsSuccess) { PLogError(L("SWIsltsErr: load_outputs() failed: Err_code = %d\n"), nRes); goto CLEAN_UP; } #if PRINT_LOAD_TREE pfprintf(PSTDOUT,"LOAD_TREE: got %d outputs, loading trees\n", lts->num_outputs); #endif nRes = load_trees(&(lts->trees), &(lts->num_letters), &(lts->questions), &(lts->num_questions), &(lts->letter_mapping), fp); if (nRes != SWIsltsSuccess) { PLogError(L("SWIsltsErr: load_trees() failed: Err_code = %d\n"), nRes); goto CLEAN_UP; } nRes = load_allowable_cons_comb(lts, fp); if (nRes != SWIsltsSuccess) { PLogError(L("SWIsltsErr: load_allowable_cons_comb() failed: Err_code = %d\n"), nRes); goto CLEAN_UP; } PORT_FCLOSE(fp); #endif /* !USE_STATIC_SLTS */ *phLts = lts; return SWIsltsSuccess; CLEAN_UP: free_lts(lts); *phLts = NULL; return nRes; } /* deallocates LTS */ SWIsltsResult free_lts(LTS_HANDLE hlts) { SWIsltsResult nRes = SWIsltsSuccess; LTS * lts = (LTS *)hlts; if (lts) { #ifndef USE_STATIC_SLTS free_phone_mapping(lts->phone_mapping); free_question_strings(lts); lts->strings = NULL; lts->phone_mapping = NULL; free_outputs(lts->outputs, lts->input_for_output, lts->num_outputs); lts->input_for_output = lts->outputs = NULL; free_trees(lts->trees, lts->num_letters, lts->questions, lts->num_questions, lts->letter_mapping); lts->trees = NULL; lts->questions = NULL; lts->letter_mapping = NULL; free_allowable_cons_comb(lts); FREE(lts); #endif /* !USE_STATIC_LTS */ } return nRes; } int find_phone(const char *ph, PM *pm) { ESR_ReturnCode rc; int iRet = -1; rc = PHashTableGetValue((PHashTable*)pm->phoneH, ph, (void**)(void*)&iRet); if (rc != ESR_SUCCESS) PLogError("error while in find_phone(%s,%x)\n", ph, pm); return iRet; } int find_best_string(const char *str, LTS* lts) { int i, maxlen, maxi, len; int len_str; if(str[0] == '\0') return -1; len_str = strlen(str); maxi = -1; maxlen = 0; for (i=0;inum_strings;i++) { len = lts->string_lens[i]; if( len > len_str) continue; /* no point in comparison */ if (strncmp(str, lts->strings[i], len) == 0) { if (len > maxlen) { maxlen = len; maxi = i; } } } return maxi; } int find_best_prefix_string(const char *str, LTS* lts) { int i; int maxlen; int maxi; int len; int prelen; maxi = -1; maxlen = 0; prelen = strlen(str); for (i=0;inum_strings;i++) { len = lts->string_lens[i]; if (len <= prelen) { if (strncmp(str + (prelen - len), lts->strings[i], len) == 0) { if (len > maxlen) { maxlen = len; maxi = i; } } } } return maxi; } int fill_up_dp_for_letter(LTS *lts, const char *input_word, int word_len, int index, int root_start, int root_end, int left_phone) { int i,j; LDP *dp; unsigned char letter; int hit_wb; LM *lm; unsigned char word[MAX_WORD_LEN]; char tempstr[MAX_WORD_LEN]; int first_syl_end; int last_syl_start; dp = &(lts->dp); lm = lts->letter_mapping; /* the LTS decision tree does not seem to be well trained at all for the letter ' when followed by "s" ... It seems to result in the phoneme 'm', which is wrong. "'t" seems to be OK though. BAD: Kevin's : k6v6nmz ... pal's : palmz ... paul's : p{lz BAD: janice's : jan6s6mz ... tom's house : t)mmz&h?s ... tonya's : t)ny6mz BAD: jake's house : jAk6mz&h?s Ignoring ' as below we get ... BETTER: Kevin's : kev6nz ... pal's : palz ... paul's : p{lz BETTER: janice's : jan6s6s ... tom's house : t)mz&h?s ... tonya's : t)ny6s BETTER: jake's house : jAk6s&h?s The proper solution requires a legitimate text normalizer with special handling of cases like 's which would always put a "z" there, except if preceded by an unvoiced stop (ptk) which requires a "s" there. For now let's just skip the ' letter, which testing shows to be generally safe (janice's, jake's etc are better but still not quite right). */ if(input_word[index] == '\'') return 1; // same as unknown character letter = find_letter_index(input_word[index], lm); if (letter == LTS_MAXCHAR) { /* lisa - we need to decide how to handle this case. Do we just silently skip unknown characters or warn the app or user somehow*/ #ifdef NO_STDERR PrintError("unknown character on input %c - skipping\n", input_word[index], NULL, NULL); #else PLogError(L("unknown character on input %c - skipping\n"), input_word[index]); #endif return 1; } hit_wb = 0; /*pfprintf(PSTDOUT,"left context\n");*/ for (j=0;j<5;j++) { if (hit_wb) { dp->properties[ Left1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); } else { i = index - (j+1); if (i < 0) dp->properties[ Left1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); else { dp->properties[ Left1+j] = find_letter_index(input_word[i], lm); if (dp->properties[ Left1+j] == LTS_MAXCHAR) { /*assume an unknown character is a word boundary*/ dp->properties[ Left1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); hit_wb = 1; } } } } /*pfprintf(PSTDOUT,"right context\n");*/ hit_wb = 0; for (j=0;j<5;j++) { if (hit_wb) { dp->properties[ Right1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); } else { i = index + (j+1); if (i >= word_len) dp->properties[Right1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); else { dp->properties[ Right1+j] = find_letter_index(input_word[i], lm); if (dp->properties[ Right1+j] == LTS_MAXCHAR) { /*assume an unknown character is a word boundary*/ dp->properties[ Right1+j] = find_letter_index(LTS_MARKER_PIPESEP_CHAR, lm); hit_wb = 1; } } } } dp->letter = letter; // properties[ Letter] = letter; dp->properties[ LeftPhone1] = left_phone; /*pfprintf(PSTDOUT,"word stuff\n"); */ /*find word start and end - use unknown character as word boundaries*/ dp->properties[ WordLen] = word_len; if (index == 0) dp->properties[ LetInWord] = 0; else if (index == word_len-1) dp->properties[ LetInWord] = 2; else dp->properties[ LetInWord] = 1; for (i=0;itype[word[i]] == 1) { for (j=i+1;jtype[word[j]] != 1) break; } first_syl_end = j; break; } } last_syl_start = 0; for (i=word_len-1;i>=0;i--) { if (lm->type[word[i]] == 1) { for (j=i-1;j>=0;j--) { if (lm->type[word[j]] != 1) break; } last_syl_start = j; break; } } #if PRINT_DP_LETTER pfprintf(PSTDOUT,"first_syl_end %d last_syl_start %d\n", first_syl_end, last_syl_start); #endif if (index > last_syl_start) dp->properties[ SylInWord] = 2; else if (index < first_syl_end) dp->properties[ SylInWord] = 0; else dp->properties[ SylInWord] = 1; first_syl_end = word_len; for (i=0;itype[word[i]] == 1) { for (j=i+1;jtype[word[j]] != 1) break; } for (;jtype[word[j]] == 1) break; } first_syl_end = j; break; } } last_syl_start = 0; for (i=word_len-1;i>=0;i--) { if (lm->type[word[i]] == 1) { for (j=i-1;j>=0;j--) { if (lm->type[word[j]] != 1) break; } for (;j>=0;j--) { if (lm->type[word[j]] == 1) break; } last_syl_start = j; break; } } #if PRINT_DP_LETTER pfprintf(PSTDOUT,"first_syl_end %d last_syl_start %d\n", first_syl_end, last_syl_start); #endif if (index > last_syl_start) dp->properties[ Syl2InWord] = 2; else if (index < first_syl_end) dp->properties[ Syl2InWord] = 0; else dp->properties[Syl2InWord] = 1; first_syl_end = word_len; for (i=root_start;itype[word[i]] == 1) { for (j=i+1;jtype[word[j]] != 1) break; } first_syl_end = j; break; } } last_syl_start = 0; for (i=root_end-1;i>=root_start;i--) { if (lm->type[word[i]] == 1) { for (j=i-1;j>=0;j--) { if (lm->type[word[j]] != 1) break; } last_syl_start = j; break; } } #if PRINT_DP_LETTER pfprintf(PSTDOUT,"first_syl_end %d last_syl_start %d\n", first_syl_end, last_syl_start); #endif if (index > last_syl_start) dp->properties[SylInRoot] = 2; else if (index < first_syl_end) dp->properties[ SylInRoot] = 0; else dp->properties[ SylInRoot] = 1; first_syl_end = word_len; for (i=root_start;itype[word[i]] == 1) { for (j=i+1;jtype[word[j]] != 1) break; } for (;jtype[word[j]] == 1) break; } first_syl_end = j; break; } } last_syl_start = 0; for (i=root_end-1;i>=root_start;i--) { if (lm->type[word[i]] == 1) { for (j=i-1;j>=0;j--) { if (lm->type[word[j]] != 1) break; } for (;j>=0;j--) { if (lm->type[word[j]] == 1) break; } last_syl_start = j; break; } } #if PRINT_DP_LETTER pfprintf(PSTDOUT,"first_syl_end %d last_syl_start %d\n", first_syl_end, last_syl_start); #endif if (index > last_syl_start) dp->properties[Syl2InRoot] = 2; else if (index < first_syl_end) dp->properties[Syl2InRoot] = 0; else dp->properties[Syl2InRoot] = 1; dp->properties[Left_DFRE] = index - root_start; dp->properties[Right_DFRE] = (root_end - index) - 1; /* pfprintf(PSTDOUT,"strings\n");*/ #if PRINT_DP_LETTER pfprintf(PSTDOUT,"input word %s num_strings %d\n", input_word, lts->num_strings); #endif dp->properties[RightString] = find_best_string(input_word+index+1, lts); strcpy(tempstr, input_word); tempstr[index] = '\0'; dp->properties[LeftString] = find_best_prefix_string(tempstr, lts); #if PRINT_DP_LETTER pfprintf(PSTDOUT,"dp %c ", lm->letters[dp->letter]); for (i=0;iletters[word[i]]); } pfprintf(PSTDOUT," %c%c%c {%c} %c%c%c liw %d siw %d s2iw %d nw %d sir %d s2ir %d left_DFRE %d right_DFRE %d\n", lm->letters[dp->left_context[2]], lm->letters[dp->left_context[1]], lm->letters[dp->left_context[0]], lm->letters[dp->letter], lm->letters[dp->right_context[0]], lm->letters[dp->right_context[1]], lm->letters[dp->right_context[2]], dp->let_in_word, dp->syl_in_word, dp->syl2_in_word, dp->word_len, dp->syl_in_root, dp->syl2_in_root, dp->left_DFRE, dp->right_DFRE); #endif return 0; } int matches(LQUESTION *q1, LQUESTION *q2, int type, LDP *dp) { int m1, m2; switch(type) { case 0: return qmatches(q1, dp); case 1: m1 = qmatches(q1, dp); m2 = qmatches(q2, dp); return(m1 && m2); case 2: m1 = qmatches(q1, dp); m2 = qmatches(q2, dp); return(m1 && !m2); case 3: m1 = qmatches(q1, dp); m2 = qmatches(q2, dp); return(!m1 && m2); case 4: m1 = qmatches(q1, dp); m2 = qmatches(q2, dp); return(!m1 && !m2); default: return -1; } /* should not come here */ return -1; } int find_output_for_dp(LTS *lts, int *pbackoff_output) { LDP *dp; int index; RT_LTREE *tree; LQUESTION *q1; LQUESTION *q2; int comb_type; int q2_index; int left_index; dp = &(lts->dp); tree = lts->trees[dp->letter]; // properties[Letter]]; index = 0; while (1) { left_index = tree->left_nodes[index]; if (left_index == NO_NODE) { /*means its a leaf node*/ *pbackoff_output = tree->question2[index]; return tree->values_or_question1[index]; } q1 = lts->questions[tree->values_or_question1[index]]; q2_index = tree->question2[index] & 0x1FFF; comb_type = (tree->question2[index] & 0xE000) >> 13; q2 = lts->questions[q2_index]; if (matches(q1, q2, comb_type, dp)) { index = left_index; } else { index = left_index+1; } } } int add_output(char *output, char **output_phone_string, int out_len, int max_phone_length) { char *tok; int toklen; char seps[] = " "; if (strlen(output) == 0) return out_len; tok = safe_strtok(output, seps, &toklen); while (tok && toklen) { if ((toklen > 0) && (strncmp(tok, "null", 4) != 0)) { if (isdigit(tok[toklen-1])) { /*means it's a vowel. So, add a syllable boundary. It's position gets adjusted later by adjust_syllable_boundaries()*/ strcpy(output_phone_string[out_len++], LTS_MARKER_SYLL_START); if (out_len >= max_phone_length) return max_phone_length; } strncpy(output_phone_string[out_len], tok, toklen); output_phone_string[out_len++][toklen] = '\0'; if (out_len >= max_phone_length) return max_phone_length; } tok = safe_strtok(tok+toklen, seps, &toklen); } return out_len; } int is_allowable_cons_comb(LTS *lts, const char *cons_string) { /* int i; for (i=0;inum_cons_comb;i++) { #if PRINT_CONS_COMB pfprintf(PSTDOUT,"checking {%s} vs c[%d] {%s}\n", cons_string, i, lts->allowable_cons_comb[i]); #endif if (strcmp(cons_string, lts->allowable_cons_comb[i]) == 0) return 1; } return 0; */ ESR_ReturnCode rc; void* iVal = NULL; rc = PHashTableGetValue( (PHashTable*)lts->allowable_cons_combH, cons_string, &iVal); if(rc == ESR_SUCCESS) return 1; else return 0; } void adjust_syllable_boundaries(LTS *lts, char **output_phone_string, int num_out, int max_phone_length) { char *out; int i,j; int syl_start; int stress = 0; int first_syl_bound; char tempstr[20]; /*there should already be a syllable boundary before each vowel (add_output put one there)*/ /*so just find these, then shift back by allowable consonant combinations and move the syllable mark*/ for (i=0;i0;j--) { out = output_phone_string[j]; if (isdigit(out[strlen(out)-1])) { syl_start = j+1; break; /*means it's a vowel*/ } if (strcmp(out, LTS_MARKER_WORD_START) == 0) { syl_start = j+1; break; /*don't push syl boundaries before word boundaries*/ } if (strcmp(out, LTS_MARKER_PRON_START) == 0) { syl_start = j+1; break; /*don't push syl boundaries before phrase boundaries*/ } /* for sequences longer than 2, check 3-syllable onset first, then check 2-syllable onset */ if(j > 1){ sprintf(tempstr, "%s %s %s", output_phone_string[j-2], output_phone_string[j-1], output_phone_string[j]); if (!is_allowable_cons_comb(lts, tempstr)) { sprintf(tempstr, "%s %s", output_phone_string[j-1], output_phone_string[j]); if (!is_allowable_cons_comb(lts, tempstr)) { #if PRINT_CONS_COMB pfprintf(PSTDOUT,"cons comb %s %s not allowed\n", output_phone_string[j-1], output_phone_string[j]); #endif syl_start = j; break; } } } /* for sequences shorter than 2 */ else { sprintf(tempstr, "%s %s", output_phone_string[j-1], output_phone_string[j]); if (!is_allowable_cons_comb(lts, tempstr)) { #if PRINT_CONS_COMB pfprintf(PSTDOUT,"cons comb %s %s not allowed\n", output_phone_string[j-1], output_phone_string[j]); #endif syl_start = j; break; } } } /* end for j=i-1 */ /*shift over stuff between syl_start a gap*/ for (j=i;j>syl_start;j--) { strcpy(output_phone_string[j], output_phone_string[j-1]); } /*now find stress level from phone (and remove it) and add it to syl bound*/ if (i= 0){ for(; j>syl_start; j--){ strcpy(output_phone_string[j], output_phone_string[j-1]); } /* put syllable boundary after word boundary */ sprintf(output_phone_string[syl_start], LTS_MARKER_SYLL_START_DD, stress); /* advance i, reset variables */ i = first_syl_bound; first_syl_bound = syl_start = -1; } } } } SWIsltsResult lts_for_word(LTS *lts, char *word, int word_len, char **output_phone_string, int max_phone_length, int *pnum_out) { SWIsltsResult nRes = SWIsltsSuccess; int i,j; int root_start; int root_end; int output_index; int left_phone; char * input_seq; int found_match; int start_num_out; int backoff_output; int num_out; start_num_out = num_out = *pnum_out; root_start = 0; root_end = word_len; for (i=0;iphone_mapping); #if PRINT_LTS_WORD pfprintf(PSTDOUT,"got phone %d for initial | (LTS_MARKER_PIPESEP)\n", left_phone); #endif if (left_phone < 0) { #ifdef NO_STDERR PrintError("Error, cannot find | in phone mappings\n", NULL, NULL, NULL); #else PLogError(L("Error, cannot find | in phone mappings\n")); #endif nRes = SWIsltsInternalErr; goto CLEAN_UP; } } else { #if PRINT_LTS_WORD pfprintf(PSTDOUT,"about to call find_phone2 num_out %d\n", num_out); pfprintf(PSTDOUT,"out[%d] %s\n", num_out-1, output_phone_string[num_out-1]); #endif if (strcmp(output_phone_string[num_out-1], LTS_MARKER_PRON_START) == 0) left_phone = find_phone(LTS_MARKER_PIPESEP, lts->phone_mapping); else if (strcmp(output_phone_string[num_out-1], LTS_MARKER_WORD_START) == 0) left_phone = find_phone(LTS_MARKER_PIPESEP, lts->phone_mapping); else left_phone = find_phone(output_phone_string[num_out-1], lts->phone_mapping); #if PRINT_LTS_WORD pfprintf(PSTDOUT,"got phone %d for %s\n", left_phone, output_phone_string[num_out-1]); #endif if (left_phone < 0) { #ifdef NO_STDERR PrintError("Error, cannot find %s in phone mappings\n", (unsigned long)output_phone_string[num_out-1], NULL, NULL); #else PLogError(L("Error, cannot find %s in phone mappings\n"), output_phone_string[num_out-1]); #endif nRes = SWIsltsInternalErr; goto CLEAN_UP; } } /* pfprintf(PSTDOUT,"calling fill up dp\n");*/ if (fill_up_dp_for_letter(lts, word, word_len, i, root_start, root_end, left_phone)) continue; /* pfprintf(PSTDOUT,"calling find output\n");*/ output_index = find_output_for_dp(lts, &backoff_output); #if PRINT_LTS_WORD pfprintf(PSTDOUT,"got output %d\n", output_index); #endif found_match = 1; if (strlen(lts->input_for_output[output_index]) > 0) { /*some extra input string to use up*/ #if PRINT_LTS_WORD pfprintf(PSTDOUT,"GOT INPUT %s for %s letter %c\n", lts->input_for_output[output_index], word, word[i]); #endif input_seq = lts->input_for_output[output_index]; if (input_seq[0] == '=') { root_end = i; input_seq = input_seq+1; /*skip suffix indicator*/ } for (j=i+1;;j++) { if (input_seq[j-(i+1)] == '\0') break; if (input_seq[j-(i+1)] == '-') { root_start = j; break; } if (j >= word_len) { found_match = 0; break; } if (input_seq[j-(i+1)] != word[j]) { found_match = 0; break; } } if (found_match) { i = j-1; } } if (!found_match) { #if PRINT_LTS_WORD pfprintf(PSTDOUT,"using backoff output %s instead of regular %s\n", lts->outputs[backoff_output], ts->outputs[output_index]); #endif num_out = add_output(lts->outputs[backoff_output], output_phone_string, num_out, max_phone_length); } else { num_out = add_output(lts->outputs[output_index], output_phone_string, num_out, max_phone_length); } if (num_out >= max_phone_length) { nRes = SWIsltsMaxInputExceeded; goto CLEAN_UP; } } *pnum_out = num_out; return SWIsltsSuccess; CLEAN_UP: *pnum_out = 0; return nRes; } SWIsltsResult run_lts(LTS_HANDLE h, FSM_DICT_HANDLE hdict, char *input_sentence, char **output_phone_string, int *phone_length) { SWIsltsResult nRes = SWIsltsSuccess; int i; int len; int num_out = 0; LTS * lts; int was_in_phrase; char word[MAX_WORD_LEN]; int num_in_word; int max_phone_length; int pron_len; max_phone_length = *phone_length; len = strlen(input_sentence); lts = (LTS*) h; was_in_phrase = 0; /*add a phrase start then word start at beginning*/ strcpy(output_phone_string[num_out++], LTS_MARKER_PRON_START); if (num_out >= max_phone_length) { nRes = SWIsltsMaxInputExceeded; goto CLEAN_UP; } num_in_word = 0; pron_len = 1; // for the first time through for (i=0;i<=len;i++) { #if PRINT_LTS_WORD pfprintf(PSTDOUT,"WORKING on letter %d %c\n", i, input_sentence[i]); #endif /* Treat hyphen as word delimiter. Not quite right for German hyphenated compounds, but still an improvement. */ if ((input_sentence[i] == ' ') || (input_sentence[i] == '-') || (input_sentence[i] == '\t') || (i == len)) { if (num_in_word>0 ) { strcpy(output_phone_string[num_out++], LTS_MARKER_WORD_START); if (num_out >= max_phone_length) { nRes = SWIsltsMaxInputExceeded; goto CLEAN_UP; } word[num_in_word] = '\0'; if (1) { #if PRINT_DICT_LOOKUP pfprintf(PSTDOUT,"Did not find %s in dictionary\n", word); #endif pron_len = -num_out; nRes = lts_for_word(lts, word, num_in_word, output_phone_string, max_phone_length, &num_out); pron_len += num_out; // now pron_len is the number of phonemes/markers added if(pron_len == 0) num_out--; // to backspace on the LTS_MARKER_WORD_START !! if (nRes != SWIsltsSuccess) { goto CLEAN_UP; } } num_in_word = 0; } } else if ( (input_sentence[i] == '.') || (input_sentence[i] == ',') || (input_sentence[i] == '!') || (input_sentence[i] == '?') || (input_sentence[i] == '\n')) { if (was_in_phrase) { /*add a phrase boundary after lts is called*/ if (num_in_word > 0) { strcpy(output_phone_string[num_out++], LTS_MARKER_WORD_START); if (num_out >= max_phone_length) { nRes = SWIsltsMaxInputExceeded; goto CLEAN_UP; } word[num_in_word] = '\0'; if (1) { nRes = lts_for_word(lts, word, num_in_word, output_phone_string, max_phone_length, &num_out); if (nRes != SWIsltsSuccess) { goto CLEAN_UP; } } num_in_word = 0; } strcpy(output_phone_string[num_out++], LTS_MARKER_PRON_START); if (num_out >= max_phone_length) { nRes = SWIsltsMaxInputExceeded; goto CLEAN_UP; } was_in_phrase = 0; } } else { if (num_in_word < MAX_WORD_LEN-1) { word[num_in_word++] = toupper(input_sentence[i]); was_in_phrase = 1; } } } /*adjust syllable boundaries*/ adjust_syllable_boundaries(lts, output_phone_string, num_out, max_phone_length); *phone_length = num_out; return SWIsltsSuccess; CLEAN_UP: *phone_length = 0; return nRes; } #ifdef USE_STATIC_SLTS void *lts_alloc(int num, int size) { #ifdef NO_STDERR PrintError("USE_STATIC_SLTS: lts_alloc should not be called", NULL, NULL, NULL); #else PLogError(L("USE_STATIC_SLTS: lts_alloc should not be called")); #endif return NULL; } #else void *lts_alloc(int num, int size) { void *p; p = CALLOC(num, size, MTAG); return p; } #endif /* USE_STATIC_SLTS */