1 /*---------------------------------------------------------------------------*
2 * astar.c *
3 * *
4 * Copyright 2007, 2008 Nuance Communciations, Inc. *
5 * *
6 * Licensed under the Apache License, Version 2.0 (the 'License'); *
7 * you may not use this file except in compliance with the License. *
8 * *
9 * You may obtain a copy of the License at *
10 * http://www.apache.org/licenses/LICENSE-2.0 *
11 * *
12 * Unless required by applicable law or agreed to in writing, software *
13 * distributed under the License is distributed on an 'AS IS' BASIS, *
14 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. *
15 * See the License for the specific language governing permissions and *
16 * limitations under the License. *
17 * *
18 *---------------------------------------------------------------------------*/
19
20 #include "pstdio.h"
21 #include "passert.h"
22
23 #include"srec_sizes.h"
24 #include"search_network.h"
25 #include"srec.h"
26 #include"srec_context.h"
27 #include"word_lattice.h"
28 #include "portable.h"
29 #include "srec_stats.h"
30 #include "astar.h"
31 #include "astar_pphash.h"
32
33 #ifdef SET_RCSID
34 static const char *rcsid = 0 ? (const char *) &rcsid :
35 "$Id: astar.c,v 1.19.4.9 2008/04/30 15:12:15 dahan Exp $";
36 #endif
37
38 #define PRINT_ASTAR_SOMEWHAT 0
39 #define PRINT_ASTAR_DETAILS 0
40 #define PRINT_ASTAR_QBT_DETAILS 0 /* Quick Back Trace */
41 #define MAX_NBEST_LEN 32
42 #define NBEST_LEN_MARGIN 10
43 #define MAX_NUM_PARPS 400 /* 3*MAX_NBEST_LEN*MAX_WORDS_PER_COMPLETE_PATH need better dup
44 check on complete paths */
45 #define ASTAR_PRUNE_DELTA 20000
46 #define DEBUG_PARP_MANAGEMENT 0
47
48 #if PRINT_ASTAR_DETAILS
49 static int do_draw_as_dotty = 0;
50 static int do_draw_file_idx = 0;
51
52 int astar_draw_tree_as_dotty(const char* file, srec* rec, AstarStack* stack);
53 #endif
54
55 /*
56 The word graph is represented as an arc_token_list,
57 arc_token's are chained together 2 linked lists,
58 arc_token->first_next_arc ... like a "TO" node
59 arc_token->next_arc_index ... a linked list of arcs leaving the same node
60
61 get_arc_for_word() finds the arc_token for a particular extension
62 backward though the word graph (ie. forward through the reverse word graph)
63
64 */
65
66 #define ARC_TOKEN_ONE (arc_token*)1
get_arc_for_word(arc_token * atoken,wordID word,void * context_void,wordID terminal_word)67 arc_token* get_arc_for_word(arc_token* atoken, wordID word,
68 void* context_void,
69 wordID terminal_word)
70 {
71 srec_context* context = (srec_context*)context_void;
72 arc_token* arc_token_list = context->arc_token_list;
73 arc_token* tmp;
74 wordmap* wmap = context->olabels;
75
76 if (atoken == ARC_TOKEN_ONE)
77 {
78 /* log_report("Warning: bad thing is happening word=%d\n", word); */
79 return 0;
80 }
81 else if (atoken == 0)
82 {
83 arc_token root_arc;
84 root_arc.first_next_arc = ARC_TOKEN_LNK(arc_token_list, 0);
85 root_arc.next_token_index = ARC_TOKEN_NULL;
86 root_arc.ilabel = root_arc.olabel = 0;
87 return get_arc_for_word(&root_arc, word, context_void, terminal_word);
88
89 /* the arc token is NULL for partial paths just starting; but
90 the word graph has nasty epsilons at the beginning, we'll remove
91 them later, but must handle them in the mean time. */
92 atoken = &arc_token_list[0];
93 for (; atoken; atoken = ARC_TOKEN_PTR(arc_token_list, atoken->next_token_index))
94 {
95 if (atoken->ilabel == word)
96 return atoken;
97 else if (atoken->ilabel == WORD_EPSILON_LABEL)
98 {
99 for (tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc); tmp;
100 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->next_token_index))
101 if (tmp->ilabel == word)
102 return tmp;
103 }
104 else if (atoken->ilabel < wmap->num_slots)
105 {
106 if (wordmap_whether_in_rule(wmap, word, atoken->ilabel))
107 return atoken;
108 }
109 }
110 return 0;
111 }
112 else if (word == terminal_word)
113 {
114 /* -pau- LABEL, the word graph does not seem to have them! */
115 tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc);
116 if (!tmp)
117 return ARC_TOKEN_ONE;
118 else if (tmp->first_next_arc == ARC_TOKEN_NULL && (tmp->ilabel == MAXwordID || tmp->ilabel == terminal_word))
119 return ARC_TOKEN_ONE;
120 else
121 {
122 /* again more weirdness in the output graph format1
123 might be due to multiple endnodes? */
124 for (tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc); tmp;
125 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->next_token_index))
126 if (tmp->ilabel == MAXwordID && tmp->first_next_arc == ARC_TOKEN_NULL)
127 return ARC_TOKEN_ONE;
128 return 0;
129 }
130 }
131 else
132 {
133 #if PRINT_ASTAR_DETAILS
134 printf("word %d allowed? ", word);
135 #endif
136 if (atoken->first_next_arc == ARC_TOKEN_NULL)
137 return 0;
138 else
139 tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc);
140 /* handle single epsilons */
141 if (tmp->ilabel == WORD_EPSILON_LABEL && tmp->next_token_index == ARC_TOKEN_NULL)
142 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->first_next_arc);
143 for (; tmp; tmp = ARC_TOKEN_PTR(arc_token_list, tmp->next_token_index))
144 {
145 #if PRINT_ASTAR_DETAILS
146 printf(" W%d(%s)", tmp->ilabel, tmp->ilabel != MAXwordID ? wmap->words[tmp->ilabel] : "");
147 #endif
148 if (tmp->ilabel == word)
149 {
150 #if PRINT_ASTAR_DETAILS
151 printf("\n");
152 #endif
153 return tmp;
154 }
155 else if (tmp->ilabel < wmap->num_slots)
156 {
157 if (wordmap_whether_in_rule(wmap, word, tmp->ilabel))
158 return tmp;
159 }
160 }
161 #if PRINT_ASTAR_DETAILS
162 printf("\n");
163 #endif
164 return 0;
165 }
166 }
167
get_arc_for_word_without_slot_annotation(arc_token * atoken,const char * word,void * context_void,wordID terminal_word)168 arc_token* get_arc_for_word_without_slot_annotation(arc_token* atoken, const char* word,
169 void* context_void,
170 wordID terminal_word)
171 {
172 srec_context* context = (srec_context*)context_void;
173 arc_token* arc_token_list = context->arc_token_list;
174 arc_token* tmp;
175 wordmap* wmap = context->olabels;
176 wordID wdid = wordmap_find_index(wmap, word);
177
178 if (atoken == ARC_TOKEN_ONE)
179 {
180 /* log_report("Warning: bad thing is happening word=%d\n", word); */
181 return 0;
182 }
183 else if (atoken == NULL)
184 {
185 arc_token root_arc;
186 root_arc.first_next_arc = ARC_TOKEN_LNK(arc_token_list, 0);
187 root_arc.next_token_index = ARC_TOKEN_NULL;
188 root_arc.ilabel = root_arc.olabel = 0;
189 return get_arc_for_word_without_slot_annotation(&root_arc, word, context_void, terminal_word);
190 }
191 else if (word == NULL)
192 {
193 /* -pau- LABEL, the word graph does not seem to have them! */
194 tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc);
195 if (!tmp)
196 return ARC_TOKEN_ONE;
197 else if (!tmp->first_next_arc && (tmp->ilabel == MAXwordID || tmp->ilabel == terminal_word))
198 return ARC_TOKEN_ONE;
199 else
200 {
201 /* again more weirdness in the output graph format1
202 might be due to multiple endnodes? */
203 for (tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc); tmp;
204 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->next_token_index))
205 if (tmp->ilabel == MAXwordID && tmp->first_next_arc == ARC_TOKEN_NULL)
206 return ARC_TOKEN_ONE;
207 return 0;
208 }
209 }
210 else
211 {
212 for (tmp = ARC_TOKEN_PTR(arc_token_list, atoken->first_next_arc); tmp;
213 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->next_token_index))
214 {
215 if (tmp->ilabel == wdid)
216 {
217 return tmp;
218 }
219 else if (tmp->ilabel < wmap->num_slots)
220 {
221 wdid = wordmap_find_index_in_rule(wmap, word, tmp->ilabel);
222 if (wdid != MAXwordID)
223 return tmp;
224 }
225 else if (tmp->ilabel == WORD_EPSILON_LABEL)
226 {
227 tmp = ARC_TOKEN_PTR(arc_token_list, tmp->first_next_arc);
228 tmp = get_arc_for_word_without_slot_annotation(tmp, word, context_void, terminal_word);
229 if (tmp) return tmp;
230 }
231 }
232 return 0;
233 }
234 }
235
236 /* protos */
237 #if DEBUG_PARP_MANAGEMENT
238 void list_free_parps(AstarStack* stack, char* msg);
239 #else
240 #define list_free_parps(stack,msg)
241 #endif
242
243 void print_partial_paths(partial_path** parps, int num_parps, srec* rec, const char* msg);
244 void print_path(partial_path* path, srec* rec, char* msg);
245 void sort_partial_paths(partial_path** parps, int num_parps);
246 void insert_partial_path(partial_path** parps, int *pnum_parps,
247 partial_path* insert_parp);
248 partial_path* make_new_partial_path(AstarStack* stack);
249 /*void free_partial_path(AstarStack* stack, partial_path* parp); put the proto in astar.h */
250
251 /* functions */
252
append_arc_arriving(partial_path * path,partial_path * prev_path)253 void append_arc_arriving(partial_path* path, partial_path* prev_path)
254 {
255 partial_path** pprev;
256 for (pprev = &path->first_prev_arc; (*pprev); pprev = &(*pprev)->linkl_prev_arc)
257 ASSERT(*pprev != prev_path);
258 *pprev = prev_path;
259 #if DEBUG_PARP_MANAGEMENT
260 if (1)
261 {
262 int i, j;
263 partial_path* path_list[256], *k;
264 memset(path_list, 0, sizeof(partial_path*)*32);
265 for (i = 0, k = path->first_prev_arc; k; k = k->linkl_prev_arc)
266 {
267 for (j = 0; j < i; j++)
268 if (k == path_list[j])
269 ASSERT(0);
270 path_list[i++] = k;
271 }
272 }
273 #endif
274 }
275
remove_path_arriving(partial_path * path,partial_path * prev_path)276 static void remove_path_arriving(partial_path* path, partial_path* prev_path)
277 {
278 partial_path** pprev;
279 if (!path) return;
280 for (pprev = &path->first_prev_arc; (*pprev); pprev = &(*pprev)->linkl_prev_arc)
281 if (*pprev == prev_path)
282 {
283 *pprev = (*pprev)->linkl_prev_arc;
284 return;
285 }
286 ASSERT(0);
287 }
288
extend_path(AstarStack * stack,partial_path * parp,wtokenID extend_token_index,arc_token * arc_for_extend_token_index,bigcostdata max_cost,word_token * word_token_array,int * pwhether_complete)289 partial_path* extend_path(AstarStack* stack,
290 partial_path* parp,
291 wtokenID extend_token_index,
292 arc_token* arc_for_extend_token_index,
293 bigcostdata max_cost,
294 word_token* word_token_array,
295 int* pwhether_complete)
296 {
297 asr_int32_t netcost;
298 partial_path* extended_parp;
299 word_token* wtoken;
300 costdata best_cost_for_node;
301 wtokenID best_extend_token;
302 partial_path* alt_extension;
303 int sanity_count;
304
305 wtoken = &word_token_array[ extend_token_index];
306
307 if (wtoken->end_time > word_token_array[parp->token_index].end_time)
308 {
309 /* 20030921: this should never happen but we keep it for stop gap */
310 /* why does it happen: when in srec_process_word_boundary() we
311 occasionally kill_fsm_nodes_for_word_backtrace() but we did not kill the
312 stokens for this backtrace, neither did we kill the altword_tokens. it
313 would just take too long to go through all of them, and so occasionally
314 there may leak some bad backtraces */
315 return 0;
316 }
317
318 /* finding the netcost of this path extension */
319 best_extend_token = word_token_array[ parp->token_index].backtrace;
320 best_cost_for_node = word_token_array[ best_extend_token].cost;
321 wtoken = &word_token_array[ extend_token_index];
322 ASSERT(word_token_array[best_extend_token].end_time ==
323 word_token_array[extend_token_index].end_time);
324 netcost = wtoken->cost - best_cost_for_node;
325 /* ASSERT( netcost > 0); bug: sometimes this fails! fix: just use int32 */
326 if (netcost + parp->costsofar > max_cost)
327 {
328 #if PRINT_ASTAR_DETAILS
329 printf("netcost %d (%d+%d) + parp->costsofar > max_cost %d\n",
330 netcost, wtoken->cost, best_cost_for_node, parp->costsofar, max_cost);
331 #endif
332 return 0;
333 }
334
335 /* check if we have a similar thing already extended */
336 sanity_count = 0;
337 for (alt_extension = parp->first_prev_arc; alt_extension;
338 alt_extension = alt_extension->linkl_prev_arc)
339 {
340 wtokenID alt_token_index = alt_extension->token_index;
341 wtokenID alt_bt_token_index;
342 wtokenID bt_token_index;
343 word_token* alt_wtoken;
344 int join_frame_diff; /* need a signed frameID */
345
346 ASSERT(sanity_count++ < 30);
347 if (alt_token_index == MAXwtokenID)
348 continue;
349 alt_wtoken = &word_token_array[alt_token_index];
350 if (alt_wtoken->word != wtoken->word)
351 continue;
352
353 alt_bt_token_index = alt_wtoken->backtrace;
354 bt_token_index = wtoken->backtrace;
355 if (alt_bt_token_index == MAXwtokenID && bt_token_index != MAXwtokenID)
356 continue;
357 else if (alt_bt_token_index != MAXwtokenID && bt_token_index == MAXwtokenID)
358 continue;
359 else if (alt_bt_token_index != MAXwtokenID && bt_token_index != MAXwtokenID)
360 {
361 word_token* alt_wtoken_bt;
362 word_token* wtoken_bt;
363 alt_wtoken_bt = &word_token_array[ alt_wtoken->backtrace];
364 wtoken_bt = &word_token_array[ wtoken->backtrace];
365 if (alt_wtoken_bt->word != wtoken_bt->word)
366 continue;
367 }
368
369 join_frame_diff = alt_wtoken->end_time - wtoken->end_time;
370 if (join_frame_diff < 0) join_frame_diff = -join_frame_diff;
371 if (join_frame_diff > 5)
372 continue;
373
374 /* the proposed extension is similar in "all" ways to an existing
375 extension, so let's not make this new extension */
376 #if PRINT_ASTAR_DETAILS
377 printf("proposed extension already done elsewhere\n");
378 #endif
379 return 0;
380 }
381
382 /* this is a TRUE new extension, so let's extend for sure */
383 extended_parp = make_new_partial_path(stack);
384 if (!extended_parp)
385 {
386 #if PRINT_ASTAR_DETAILS
387 printf("make_new_partial_path returned 0\n");
388 #endif
389 return 0;
390 }
391 extended_parp->costsofar = parp->costsofar + netcost;
392 extended_parp->token_index = extend_token_index;
393 if (extend_token_index != MAXwtokenID)
394 extended_parp->word = word_token_array[ extend_token_index].word;
395 else
396 extended_parp->word = MAXwordID;
397 if (wtoken->backtrace == MAXwtokenID)
398 {
399 *pwhether_complete = 1;
400 extended_parp->first_prev_arc = PARP_TERMINAL;
401 }
402 else
403 {
404 *pwhether_complete = 0;
405 }
406 extended_parp->arc_for_wtoken = arc_for_extend_token_index;
407
408 extended_parp->refcount = 1;
409 parp->refcount++;
410
411 /* maintain the parp tree */
412 extended_parp->next = parp;
413 append_arc_arriving(parp, extended_parp);
414 #if PRINT_ASTAR_DETAILS
415 printf("extend path returned %x\n", extended_parp);
416 #endif
417
418 return extended_parp;
419 }
420
check_stack_root_sanity(AstarStack * stack)421 void check_stack_root_sanity(AstarStack* stack)
422 {
423 partial_path* parp1 = stack->root_path;
424 /* append_arc_arriving(stack->root_path, parp); */
425 for (; parp1->linkl_prev_arc != NULL; parp1 = parp1->linkl_prev_arc)
426 ASSERT(parp1 != parp1->linkl_prev_arc);
427 }
428
429 /*
430 * make a blank partial path, free one if necessary
431 */
432
make_new_partial_path(AstarStack * stack)433 partial_path* make_new_partial_path(AstarStack* stack)
434 {
435 partial_path* return_parp = stack->free_parp_list;
436 if (return_parp)
437 {
438 stack->free_parp_list = return_parp->next;
439 memset((void*)return_parp, 0, sizeof(*return_parp)); /* needed */
440 }
441 else
442 {
443 log_report("Warning: ran out of partial_paths, reprune\n");
444 #if PRINT_ASTAR_DETAILS
445 printf("Warning: ran out of partial_paths, reprune\n");
446 #endif
447 /* kill the last one, and return it, this may free more than one parp! */
448 if (stack->num_active_paths == 0)
449 return 0;
450 stack->num_active_paths--;
451 return_parp = stack->active_paths[stack->num_active_paths];
452 hash_del((FixedSizeHash*)stack->pphash, return_parp);
453 free_partial_path(stack, return_parp);
454 return_parp = stack->free_parp_list;
455 stack->free_parp_list = return_parp->next;
456 memset((void*)return_parp, 0, sizeof(*return_parp)); /* needed */
457 }
458 return return_parp;
459 }
460
461 /* free_partial_path
462 frees the path that was passed in, and also any backpointers.
463 refcount counts the number of parps that depend on this parp */
free_partial_path(AstarStack * stack,partial_path * parp)464 void free_partial_path(AstarStack* stack, partial_path* parp)
465 {
466 partial_path* next_parp;
467 for (; parp; parp = next_parp)
468 {
469 next_parp = parp->next;
470 parp->refcount--;
471 if (parp->refcount == 0)
472 { /* first time around this always passes */
473 remove_path_arriving(parp->next, parp);
474 parp->next = stack->free_parp_list;
475 stack->free_parp_list = parp;
476 }
477 else break;
478 }
479 }
480
481 /*
482 * make a partial path from a single word at the very end of the graph
483 */
484
make_partial_path(AstarStack * stack,wtokenID token_index,srec * rec,int * pwhether_complete)485 partial_path* make_partial_path(AstarStack* stack,
486 wtokenID token_index, srec* rec,
487 int* pwhether_complete)
488 {
489 partial_path* parp;
490 word_token* wtoken;
491
492 /* todo: replace this with partial_path_tokens! */
493 parp = make_new_partial_path(stack);
494 if (!parp) return parp;
495
496 wtoken = &rec->word_token_array[token_index];
497 parp->token_index = token_index;
498 if (token_index != MAXwtokenID)
499 parp->word = rec->word_token_array[ token_index].word;
500 else
501 parp->word = MAXwordID;
502 /* wtoken->end_time should be equal to rec->current_search_frame */
503 ASSERT(rec->accumulated_cost_offset[ wtoken->end_time] != 0);
504 parp->costsofar = rec->accumulated_cost_offset[ wtoken->end_time];
505 parp->costsofar += wtoken->cost;
506 /* BKWD: rec->word_token_array[ wtoken->backtrace].cost + acc[] */
507 /* FRWD: wtoken->cost + acc[] - rec->word_token_array[ wtoken->backtrace].cost + acc[] */
508 parp->next = 0;
509 parp->first_prev_arc = parp->linkl_prev_arc = 0;
510 if (wtoken->backtrace == MAXwtokenID)
511 *pwhether_complete = 1;
512 else
513 *pwhether_complete = 0;
514 parp->arc_for_wtoken = 0;
515 parp->refcount = 1;
516 return parp;
517 }
518
519 /* initialize astar search */
520
astar_stack_make(srec * rec,int max_nbest_len)521 AstarStack* astar_stack_make(srec* rec, int max_nbest_len)
522 {
523 int i;
524 AstarStack *stack;
525
526 /* allocations */
527 stack = (AstarStack*)CALLOC_CLR(1, sizeof(AstarStack), "search.astar.base");
528 stack->max_active_paths = max_nbest_len + NBEST_LEN_MARGIN * 3;
529 stack->max_complete_paths = max_nbest_len + NBEST_LEN_MARGIN;
530 stack->complete_paths = (partial_path**)CALLOC_CLR(stack->max_complete_paths, sizeof(partial_path*), "search.astar.cplist");
531 stack->complete_path_confidences = (int*)CALLOC_CLR(stack->max_complete_paths, sizeof(int), "search.astar.confvalues");
532 stack->active_paths = (partial_path**)CALLOC_CLR(stack->max_active_paths, sizeof(partial_path*), "search.astar.aplist");
533 stack->prune_delta = ASTAR_PRUNE_DELTA;
534
535 stack->num_complete_paths = 0;
536 stack->num_active_paths = 0;
537
538 stack->partial_path_array = (partial_path*)CALLOC_CLR(MAX_NUM_PARPS, sizeof(stack->partial_path_array[0]), "search.astar.pparray");
539 stack->partial_path_array_size = MAX_NUM_PARPS;
540
541 stack->free_parp_list = &stack->partial_path_array[0];
542 for (i = 1; i < MAX_NUM_PARPS; i++)
543 {
544 stack->partial_path_array[i-1].next = &stack->partial_path_array[i];
545 }
546 stack->partial_path_array[i-1].next = 0;
547 stack->root_path = 0;
548
549 stack->pphash = (void*)CALLOC_CLR(1, sizeof(FixedSizeHash), "search.astar.pphash");
550 astar_stack_clear(stack);
551 return stack;
552 }
553
astar_stack_destroy(srec * rec)554 int astar_stack_destroy(srec* rec)
555 {
556 AstarStack *stack = rec->astar_stack;
557 FREE(stack->active_paths);
558 FREE(stack->complete_paths);
559 FREE(stack->complete_path_confidences);
560 FREE(stack->partial_path_array);
561 FREE(stack->pphash);
562 FREE(stack);
563 rec->astar_stack = 0;
564 return 0;
565 }
566
567 /* prepares for astar after forward search on an utterance */
568
astar_stack_prepare(AstarStack * stack,int request_nbest_len,srec * rec)569 int astar_stack_prepare(AstarStack* stack, int request_nbest_len, srec* rec)
570 {
571 wtokenID token_index;
572 word_token* wtoken;
573 partial_path* parp;
574 int whether_complete;
575 frameID end_frame = rec->current_search_frame;
576 int num_wordends;
577
578 list_free_parps(stack, "astar_stack_prepare ");
579
580 stack->num_active_paths = 0;
581 stack->num_complete_paths = 0;
582
583 stack->root_path = make_new_partial_path(stack);
584 ASSERT(stack->root_path);
585 stack->root_path->refcount = 9999;
586 stack->root_path->token_index = MAXwtokenID;
587 stack->root_path->word = MAXwordID;
588
589 num_wordends = 0;
590 for (token_index = rec->word_lattice->words_for_frame[end_frame];
591 token_index != MAXwtokenID;
592 token_index = wtoken->next_token_index)
593 {
594 num_wordends++;
595 wtoken = &rec->word_token_array[ token_index];
596 parp = make_partial_path(stack, token_index, rec, &whether_complete);
597 if (!parp)
598 {
599 log_report("Error: out-of-memory in astar_stack_prepare(), "
600 "num_wordends %d\n", num_wordends);
601 stack->num_complete_paths = 0;
602 return 1;
603 }
604 append_arc_arriving(stack->root_path, parp);
605
606 if (parp && whether_complete)
607 {
608 /* here .. check for dups ?? */
609 stack->complete_paths[ stack->num_complete_paths++] = parp;
610 if (stack->num_complete_paths == request_nbest_len)
611 return 0;
612 }
613 else if (parp)
614 {
615 stack->active_paths[ stack->num_active_paths++] = parp;
616 }
617 }
618
619 list_free_parps(stack, "astar_stack_prepare ");
620
621 return 0;
622 }
623
624 /* cleans up astar after an utterance */
625
astar_stack_clear(AstarStack * stack)626 void astar_stack_clear(AstarStack* stack)
627 {
628 int i;
629
630 /* free the partial_path's that were allocated */
631 for (i = 0; i < stack->num_active_paths; i++)
632 free_partial_path(stack, stack->active_paths[i]);
633 for (i = 0; i < stack->num_complete_paths; i++)
634 free_partial_path(stack, stack->complete_paths[i]);
635 if (stack->root_path)
636 free_partial_path(stack, stack->root_path);
637
638 /* this shouldn't be necessary, but there are a couple of bugs
639 in parp management, so let's leave it for now */
640 stack->free_parp_list = &stack->partial_path_array[0];
641 for (i = 1; i < MAX_NUM_PARPS; i++)
642 stack->partial_path_array[i-1].next = &stack->partial_path_array[i];
643 stack->partial_path_array[i-1].next = 0;
644 stack->num_active_paths = 0;
645 stack->num_complete_paths = 0;
646 stack->root_path = 0;
647
648 list_free_parps(stack, "astar_stack_clear ");
649
650 }
651
652 /* do the astar search */
653
astar_stack_do_backwards_search(srec * rec,int request_nbest_len)654 int astar_stack_do_backwards_search(srec* rec, int request_nbest_len)
655 {
656 int i;
657 AstarStack *stack = rec->astar_stack;
658 word_token *wtoken, *btoken;
659 partial_path *parp, *extended_parp, *tparp;
660 wtokenID token_index, btoken_index;
661 int whether_complete = 0;
662 bigcostdata max_cost = 0;
663 arc_token* arc_for_token_index = NULL;
664
665 arc_token* arc_token_list; /* to skip graph constraints, just set this to NULL */
666 arcID arc_token_list_len;
667 srec_word_lattice* lattice;
668
669 int max_complete_paths;
670
671 if (!rec || !rec->context)
672 {
673 log_report("Error: bad arguments in astar_stack_do_backwards_search()\n");
674 return 1;
675 }
676 max_complete_paths = request_nbest_len < stack->max_complete_paths ?
677 request_nbest_len : stack->max_complete_paths;
678
679 arc_token_list = rec->context->arc_token_list;
680 arc_token_list_len = rec->context->arc_token_list_len;
681 lattice = rec->word_lattice;
682
683 /* initialization, now from calling function */
684 /* astar_stack_prepare(stack, request_nbest_len, rec); */
685 hash_init((FixedSizeHash*)stack->pphash, rec);
686
687 /* search */
688 while (stack->num_active_paths > 0)
689 {
690
691 list_free_parps(stack, "do_astar_back BEG");
692
693 /* extend top path */
694 parp = stack->active_paths[0];
695 wtoken = &rec->word_token_array[parp->token_index];
696 token_index = wtoken->backtrace;
697 wtoken = &rec->word_token_array[token_index];
698 ASSERT(token_index != MAXwtokenID); /* should have been "complete" */
699
700
701 #if PRINT_ASTAR_DETAILS
702 print_partial_paths(stack->complete_paths, stack->num_complete_paths,
703 rec, "=== Complete Paths ===\n");
704 print_partial_paths(stack->active_paths, stack->num_active_paths,
705 rec, "=== Active Paths ===\n");
706 #endif
707
708 /* pop this one */
709 for (i = 0; i < stack->num_active_paths - 1; i++)
710 stack->active_paths[i] = stack->active_paths[i+1];
711 stack->num_active_paths--;
712
713 if (wtoken->end_time != MAXframeID)
714 {
715 /* sort the word token array by score, so that we pick the best
716 scoring paths first */
717 /* later add a 'whether_sorted' flag to the lattice_at_frame information */
718 sort_word_lattice_at_frame(rec, (frameID)(wtoken->end_time + 1));
719
720 /* extend this path, with every word ending where this word began */
721 /* #warning there appear to be duplicates */
722
723 btoken_index = lattice->words_for_frame[ wtoken->end_time+1];
724 }
725 else
726 {
727 btoken_index = MAXwtokenID;
728 }
729
730 #if PRINT_ASTAR_DETAILS
731 print_path(parp, rec, "Now Processing Top of Stack(2): ");
732 printf("Frame %d\n", wtoken->end_time + 1);
733 print_word_token_list(rec, btoken_index, "List of Word at Frame\n");
734 #endif
735
736 for (; btoken_index != MAXwtokenID; btoken_index = btoken->next_token_index)
737 {
738 btoken = &rec->word_token_array[btoken_index];
739
740 /* alternate choice must end at same frame */
741 // ASSERT(btoken->end_time == wtoken->end_time);
742
743 #if PRINT_ASTAR_DETAILS
744 print_path(parp, rec, "Now Processing Top of Stack(3): ");
745 print_word_token(rec, btoken_index, "Extending word ");
746 #endif
747
748 /* check if this potential extension is allowed by the
749 word graph, if not just drop it! */
750
751 if (arc_token_list)
752 {
753 arc_for_token_index = get_arc_for_word(parp->arc_for_wtoken,
754 btoken->word,
755 rec->context,
756 rec->context->beg_silence_word);
757 if (arc_for_token_index == NULL)
758 {
759 #if PRINT_ASTAR_DETAILS
760 printf("Not allowed by graph!\n");
761 #endif
762 continue;
763 }
764 }
765
766 /* figure out the cost to beat ! */
767 if (stack->num_complete_paths)
768 {
769 max_cost = stack->complete_paths[0]->costsofar + stack->prune_delta;
770 }
771 else if (stack->num_active_paths == stack->max_active_paths)
772 {
773 max_cost = stack->active_paths[ stack->num_active_paths-1]->costsofar;
774 }
775 else if (stack->num_active_paths > 0)
776 {
777 max_cost = stack->active_paths[0]->costsofar + stack->prune_delta;
778 }
779 else
780 {
781 max_cost = MAXbcostdata;
782 }
783
784 extended_parp = extend_path(stack, parp, btoken_index, arc_for_token_index, max_cost, rec->word_token_array, &whether_complete);
785
786 if (extended_parp)
787 {
788 int fsh_rc = hash_set((FixedSizeHash*)stack->pphash, extended_parp);
789 if (fsh_rc == FSH_KEY_OCCUPIED)
790 {
791 /* seen this path before, let's not bother with it */
792 #if PRINT_ASTAR_DETAILS
793 print_path(extended_parp, rec, "dup!! ");
794 #endif
795 free_partial_path(stack, extended_parp);
796 extended_parp = 0;
797 }
798 }
799
800 if (extended_parp && whether_complete)
801 {
802 ASSERT(stack->num_complete_paths < stack->max_complete_paths);
803 stack->complete_paths[ stack->num_complete_paths++] = extended_parp;
804 /*if(stack->num_complete_paths >= request_nbest_len)
805 return 0;*/
806
807
808 #if PRINT_ASTAR_DETAILS
809 print_path(extended_parp, rec, "&&Extended, complete : ");
810 #endif
811 }
812 else if (extended_parp)
813 {
814 /* todo: check if this extended_parp is already completed on the
815 stack->complete_paths, if so just rejoin with that guy somehow */
816
817 #if PRINT_ASTAR_DETAILS
818 print_path(extended_parp, rec, "&&Extended, incomplete : ");
819 #endif
820 if (stack->num_active_paths == stack->max_active_paths)
821 {
822 /* kill the last one */
823 stack->num_active_paths--;
824 tparp = stack->active_paths[stack->num_active_paths];
825 hash_del((FixedSizeHash*)stack->pphash, tparp);
826 free_partial_path(stack, tparp);
827 }
828 insert_partial_path(stack->active_paths, &stack->num_active_paths,
829 extended_parp);
830 }
831 #if PRINT_ASTAR_DETAILS
832 else
833 {
834 printf("&&Extended, cost too high (>%d):\n", max_cost);
835 }
836 #endif
837 if (stack->num_complete_paths == max_complete_paths)
838 {
839 #if PRINT_ASTAR_DETAILS
840 printf("Complete paths are full %d, stopping\n", stack->num_complete_paths);
841 #endif
842 break;
843 }
844 }
845 #if PRINT_ASTAR_DETAILS
846 if (do_draw_as_dotty > 0)
847 {
848 char tmp[32];
849 sprintf(tmp, "astar.%.3d.dot", do_draw_file_idx++);
850 astar_draw_tree_as_dotty(tmp, rec, stack);
851 if (do_draw_as_dotty > 1)
852 system("C:/tools/graphviz/bin/dotty.exe astar.dot");
853 }
854 #endif
855
856 SREC_STATS_UPDATE_ASTAR(stack);
857 hash_del((FixedSizeHash*)stack->pphash, parp);
858 free_partial_path(stack, parp); /* done all extensions, now free */
859 if (stack->num_complete_paths == max_complete_paths)
860 {
861 #if PRINT_ASTAR_DETAILS
862 printf("Complete paths are full %d, stopping\n", stack->num_complete_paths);
863 #endif
864 break;
865 }
866
867 list_free_parps(stack, "do_astar_back END");
868 }
869 sort_partial_paths(stack->complete_paths, stack->num_complete_paths);
870 /* if we're doing a search within a grammar, then print the complete choices
871 else we're likely just doing reprune_word_tokens() */
872 #if PRINT_ASTAR_SOMEWHAT
873 if (rec->context->arc_token_list)
874 print_partial_paths(stack->complete_paths, stack->num_complete_paths,
875 rec, "=== Complete paths ===\n");
876 #endif
877 /* now the caller must call clear */
878 /* astar_stack_clear(stack); */
879
880 return 0;
881 }
882
sort_partial_paths(partial_path ** parps,int num_parps)883 void sort_partial_paths(partial_path** parps, int num_parps)
884 {
885 int i, j;
886 for (i = 0; i < num_parps; i++)
887 {
888 for (j = 0; j < num_parps - 1; j++)
889 {
890 if (parps[j]->costsofar > parps[j+1]->costsofar)
891 {
892 partial_path* parp = parps[j];
893 parps[j] = parps[j+1];
894 parps[j+1] = parp;
895 }
896 }
897 }
898 }
899
insert_partial_path(partial_path ** parps,int * pnum_parps,partial_path * insert_parp)900 void insert_partial_path(partial_path** parps, int *pnum_parps, partial_path* insert_parp)
901 {
902 int i, j, insert_index;
903 int num_parps = *pnum_parps;
904
905 /* maintain the list sorted, search the list linearly for now,
906 do priority_q type heap later */
907 insert_index = num_parps;
908 for (i = 0; i < num_parps; i++)
909 {
910 if (insert_parp->costsofar < parps[i]->costsofar)
911 {
912 insert_index = i;
913 break;
914 }
915 }
916 for (j = num_parps; j > insert_index; --j)
917 parps[j] = parps[j-1];
918 parps[j] = insert_parp;
919 num_parps++;
920 *pnum_parps = num_parps;
921 }
922
print_path(partial_path * ipath,srec * rec,char * msg)923 void print_path(partial_path* ipath, srec* rec, char* msg)
924 {
925 partial_path* path;
926 word_token* wtoken;
927 word_token* last_wtoken;
928 char* p;
929 char trans[256];
930 int max_trans_len = 255;
931 int rc;
932 #ifndef NDEBUG
933 int sanity_count = 0;
934 #endif
935 frameID end_time;
936
937 PLogMessage("%spath score=%d ", msg, ipath->costsofar);
938
939 rc = sprint_word_token_backtrace(trans, max_trans_len, rec, ipath->token_index);
940 ASSERT(rc == 0);
941
942 last_wtoken = 0;
943 end_time = (ipath && ipath->token_index != MAXwtokenID) ? rec->word_token_array[ipath->token_index].end_time : MAXframeID;
944 #if SHOW_END_TIMES
945 printf("%s@%d || ", trans, end_time);
946 #else
947 printf("%s || ", trans);
948 #endif
949
950 path = ipath->next; /* we've already printed this thing */
951 for (; path; path = path->next)
952 {
953 ASSERT(sanity_count++ < 256);
954 if (path->token_index == MAXwtokenID) break;
955 wtoken = &rec->word_token_array[ path->token_index];
956 p = "NULL";
957 if (rec->context->olabels->words[wtoken->word])
958 p = rec->context->olabels->words[wtoken->word];
959 #if SHOW_END_TIMES
960 printf("%s@%d ", p, wtoken->end_time);
961 #else
962 printf("%s ", p);
963 #endif
964 if (last_wtoken != NULL)
965 {
966 if (wtoken->end_time < last_wtoken->end_time)
967 {
968 printf(" Error: wt%d < lwt%d\n", wtoken->end_time, last_wtoken->end_time);
969 pfflush(PSTDOUT);
970 ASSERT(0);
971 }
972 }
973 last_wtoken = wtoken;
974 }
975 printf("\n");
976 }
977
print_partial_paths(partial_path ** parps,int num_parps,srec * rec,const char * msg)978 void print_partial_paths(partial_path** parps, int num_parps,
979 srec* rec, const char* msg)
980 {
981 int i;
982 char buf[32];
983 printf("%s", msg);
984 for (i = 0; i < num_parps; i++)
985 {
986 sprintf(buf, "%.3d ", i);
987 print_path(parps[i], rec, buf);
988 }
989 }
990
991
992 /*--------------------------------------------------------------------------*
993 * *
994 * visualization .. sometimes helps debugging *
995 * *
996 *--------------------------------------------------------------------------*/
997
998 #if PRINT_ASTAR_DETAILS
999
1000
astar_draw_arc_as_dotty(FILE * fp,partial_path * parp,int src_node,int * nodes_used,srec * rec)1001 int astar_draw_arc_as_dotty(FILE* fp, partial_path* parp, int src_node, int *nodes_used, srec* rec)
1002 {
1003 word_token* word_token_array = rec->word_token_array;
1004 partial_path* parp1;
1005 int sanity_count = 0;
1006 int to_nodes[32], *pto_nodes, inode;
1007 pto_nodes = to_nodes;
1008
1009 fprintf(fp, "%d [label = \"%d\", shape = circle, style = solid]\n",
1010 src_node, src_node);
1011 for (parp1 = parp->first_prev_arc; parp1; parp1 = parp1->linkl_prev_arc)
1012 {
1013 arc_token* arc = parp1->arc_for_wtoken;
1014 for (inode = 0; nodes_used[inode]; inode++) ;
1015 nodes_used[inode] = 1;
1016 *pto_nodes++ = inode;
1017 fprintf(fp, " %d -> %d [label = \"(%d).%d.%s@%d/%d\"];\n",
1018 src_node, inode, parp1->refcount,
1019 parp1->token_index,
1020 (arc && arc != (arc_token*)1) ? rec->context->olabels->words[arc->ilabel] : "NULL",
1021 word_token_array[ parp1->token_index].end_time,
1022 parp1->costsofar);
1023 if (sanity_count++ > 30) break;
1024 }
1025
1026 pto_nodes = to_nodes;
1027 sanity_count = 0;
1028 for (parp1 = parp->first_prev_arc; parp1; parp1 = parp1->linkl_prev_arc)
1029 {
1030 astar_draw_arc_as_dotty(fp, parp1, *pto_nodes, nodes_used, rec);
1031 pto_nodes++;
1032 if (sanity_count++ > 30) break;
1033 }
1034 return 0;
1035 }
1036
astar_draw_tree_as_dotty(const char * file,srec * rec,AstarStack * stack)1037 int astar_draw_tree_as_dotty(const char* file, srec* rec, AstarStack* stack)
1038 {
1039 word_token* word_token_array = rec->word_token_array;
1040 FILE* fp = fopen(file, "w");
1041 partial_path* parp;
1042 int nodes_used[1024];
1043 memset(nodes_used, 0, 1024*sizeof(int));
1044
1045 fprintf(fp,
1046 "digraph FSM {\n"
1047 "rankdir = LR;\n"
1048 "size = \"8.5,11\";\n"
1049 "fontsize = 14;\n"
1050 "label = \"\\n\\naaron.PCLG\"\n"
1051 "center = 1;\n"
1052 "orientation = Landscape\n"
1053 );
1054 nodes_used[0] = 1;
1055 for (parp = stack->root_path; parp; parp = parp->linkl_prev_arc)
1056 astar_draw_arc_as_dotty(fp, parp, 0, nodes_used, rec);
1057
1058 fprintf(fp, "}\n");
1059 fclose(fp);
1060 printf("....... dotty %s ......\n", file);
1061 return 0;
1062 }
1063
1064 #endif
1065
1066 /*--------------------------------------------------------------------------*
1067 * *
1068 * functions relating to in-recognition backtrace *
1069 * *
1070 *--------------------------------------------------------------------------*/
1071
1072 int maybe_add_to_active_paths(AstarStack* stack, word_token* word_token_array, bigcostdata cost, wtokenID wtoken_index);
astar_stack_prepare_from_active_search(AstarStack * stack,int nbestlen,srec * rec)1073 int astar_stack_prepare_from_active_search(AstarStack* stack, int nbestlen, srec* rec)
1074 {
1075 wtokenID wtoken_index;
1076 ftokenID ftoken_index;
1077 fsmnode_token* ftoken;
1078 stokenID stoken_index;
1079 fsmarc_token* stoken;
1080 /* word_token* wtoken; */
1081 frameID prune_frame = rec->current_search_frame;
1082 int i, rc = 0, rc1 = 0;
1083 bigcostdata parp_costsofar;
1084
1085 stack->num_active_paths = 0;
1086 stack->num_complete_paths = 0;
1087 stack->root_path = 0;
1088
1089 /* put it on the stack */
1090 stack->root_path = make_new_partial_path(stack);
1091 ASSERT(stack->root_path);
1092 stack->root_path->refcount = 9999;
1093 stack->root_path->token_index = MAXwtokenID;
1094 stack->root_path->word = MAXwordID;
1095
1096 ftoken_index = rec->active_fsmnode_tokens;
1097 for (; ftoken_index != MAXftokenID; ftoken_index = ftoken->next_token_index)
1098 {
1099 ftoken = &rec->fsmnode_token_array[ ftoken_index];
1100 wtoken_index = ftoken->word_backtrace;
1101 if (wtoken_index == MAXwtokenID)
1102 continue;
1103
1104 /* fix the score */
1105 parp_costsofar = ftoken->cost;
1106 parp_costsofar += rec->accumulated_cost_offset[ prune_frame];
1107
1108 rc += (rc1 = maybe_add_to_active_paths(stack, rec->word_token_array, parp_costsofar, wtoken_index));
1109 /* we can handle that a path was not added for this ftoken because
1110 we made sure to flag the wtokens along it's top backtrace */
1111 }
1112
1113 stoken_index = rec->active_fsmarc_tokens;
1114 for (; stoken_index != MAXstokenID; stoken_index = stoken->next_token_index)
1115 {
1116 stoken = &rec->fsmarc_token_array[ stoken_index];
1117 for (i = 0; i < stoken->num_hmm_states; i++)
1118 {
1119 wtoken_index = stoken->word_backtrace[i];
1120 if (wtoken_index == MAXwtokenID)
1121 continue;
1122 parp_costsofar = stoken->cost[i];
1123 parp_costsofar += rec->accumulated_cost_offset[ prune_frame];
1124
1125 rc += (rc1 = maybe_add_to_active_paths(stack, rec->word_token_array, parp_costsofar, wtoken_index));
1126 /* we can handle that a path was not added for this stoken because
1127 we made sure to flag the wtokens along it's top backtrace */
1128 }
1129 }
1130
1131 #if PRINT_ASTAR_DETAILS
1132 print_partial_paths(stack->active_paths, stack->num_active_paths,
1133 rec, "== active paths before sorting ==\n");
1134 sort_partial_paths(stack->active_paths, stack->num_active_paths);
1135 print_partial_paths(stack->active_paths, stack->num_active_paths,
1136 rec, "== active paths after sorting ==\n");
1137 #endif
1138 list_free_parps(stack, "astar_prepare_from_active_search");
1139 return 0;
1140 }
1141
maybe_add_to_active_paths(AstarStack * stack,word_token * word_token_array,bigcostdata parp_costsofar,wtokenID wtoken_index)1142 int maybe_add_to_active_paths(AstarStack* stack, word_token* word_token_array, bigcostdata parp_costsofar, wtokenID wtoken_index)
1143 {
1144 int i;
1145 int replace_index;
1146 int inserts_index;
1147 partial_path* parp;
1148 word_token* wtoken;
1149 wtoken = &word_token_array[ wtoken_index];
1150
1151 if (wtoken->backtrace == MAXwtokenID)
1152 {
1153 return 0;
1154 }
1155
1156 /* see if we already have this word token backtrace */
1157 replace_index = -1;
1158 inserts_index = -1;
1159 for (i = 0; i < stack->num_active_paths; i++)
1160 {
1161 if (stack->active_paths[i]->token_index == wtoken_index)
1162 {
1163 if (parp_costsofar < stack->active_paths[i]->costsofar)
1164 {
1165 /* this one is better than another we already have! */
1166 replace_index = i;
1167 if (inserts_index < 0)
1168 inserts_index = i;
1169 }
1170 break;
1171 }
1172 else if (parp_costsofar < stack->active_paths[i]->costsofar)
1173 {
1174 if (inserts_index < 0)
1175 inserts_index = i;
1176 }
1177 }
1178 #if PRINT_ASTAR_QBT_DETAILS
1179 printf("maybe_add replace %d insert %d\n", replace_index, inserts_index);
1180 #endif
1181
1182 if (replace_index >= 0)
1183 {
1184 free_partial_path(stack, stack->active_paths[replace_index]);
1185 /* stack->active_paths[replace_index] = 0; */
1186 for (i = replace_index; i > inserts_index; --i)
1187 stack->active_paths[i] = stack->active_paths[i-1];
1188 stack->active_paths[inserts_index] = 0;
1189 }
1190 else if (inserts_index >= 0)
1191 {
1192 if (stack->num_active_paths == stack->max_active_paths)
1193 {
1194 free_partial_path(stack, stack->active_paths[ stack->num_active_paths-1]);
1195 stack->num_active_paths--;
1196 }
1197 for (i = stack->num_active_paths; i > inserts_index; --i)
1198 stack->active_paths[i] = stack->active_paths[i-1];
1199 stack->active_paths[inserts_index] = 0;
1200 stack->num_active_paths++;
1201 }
1202 else if (stack->num_active_paths < stack->max_active_paths)
1203 {
1204 /* append if there's space */
1205 inserts_index = stack->num_active_paths;
1206 stack->num_active_paths++;
1207 stack->active_paths[inserts_index] = 0;
1208 }
1209 else
1210 {
1211 /* no space */
1212 return 1;
1213 }
1214
1215 /* create a parp */
1216 #if PRINT_ASTAR_QBT_DETAILS
1217 printf("maybe_add .. creating new parp %d\n", parp_costsofar);
1218 #endif
1219 /* this should always succeed because of above frees */
1220 ASSERT(stack->free_parp_list);
1221 parp = make_new_partial_path(stack);
1222 parp->token_index = wtoken_index;
1223 if (wtoken_index != MAXwtokenID)
1224 parp->word = word_token_array[ wtoken_index].word;
1225 else
1226 parp->word = MAXwordID;
1227 parp->next = stack->root_path;
1228 parp->first_prev_arc = parp->linkl_prev_arc = 0;
1229 parp->arc_for_wtoken = 0;
1230 parp->refcount = 1;
1231 parp->costsofar = parp_costsofar;
1232
1233 stack->active_paths[ inserts_index] = parp;
1234
1235 #if PRINT_ASTAR_QBT_DETAILS
1236 printf("maybe_add .. appending to root\n");
1237 #endif
1238 append_arc_arriving(stack->root_path, parp);
1239 return 0;
1240 }
1241
1242
astar_stack_flag_word_tokens_used(AstarStack * stack,srec * rec)1243 int astar_stack_flag_word_tokens_used(AstarStack* stack, srec* rec)
1244 {
1245 int i;
1246 wtokenID wtoken_index;
1247 partial_path* parp;
1248 int num_flagged_by_path;
1249
1250 #if PRINT_ASTAR_QBT_DETAILS
1251 print_partial_paths(stack->complete_paths, stack->num_complete_paths,
1252 rec, "=== Complete QBT paths ===\n");
1253 #endif
1254
1255 for (i = 0; i < stack->num_complete_paths; i++)
1256 {
1257 num_flagged_by_path = 0;
1258 for (parp = stack->complete_paths[i]; parp; parp = parp->next)
1259 {
1260 wtoken_index = parp->token_index;
1261 if (wtoken_index == MAXwtokenID) break;
1262 rec->word_token_array_flags[ wtoken_index]++;
1263 if (rec->word_token_array_flags[wtoken_index] > 0)
1264 {
1265 num_flagged_by_path++;
1266 #if PRINT_ASTAR_QBT_DETAILS
1267 printf("%d ", wtoken_index);
1268 #endif
1269 }
1270 }
1271
1272 /* also flag the main backtrace of every word token */
1273 /* we do we need this? I'm not sure, but it appears
1274 that some backtrace tokens are not flagged for whatever
1275 reason. It's worth revisiting this when other bugs are
1276 are resolved. This is in a separate loop from the
1277 above because it allows us to detect that this is
1278 happening in the first place */
1279 for (parp = stack->complete_paths[i]; parp; parp = parp->next)
1280 {
1281 word_token *btoken, *last_btoken;
1282 wtokenID btoken_index;
1283 wtoken_index = parp->token_index;
1284 if (wtoken_index == MAXwtokenID) break;
1285 last_btoken = NULL;
1286 btoken = &rec->word_token_array[ wtoken_index];
1287 btoken_index = btoken->backtrace;
1288 for (; btoken_index != MAXwtokenID; btoken_index = btoken->backtrace)
1289 {
1290 btoken = &rec->word_token_array[ btoken_index];
1291 rec->word_token_array_flags[ btoken_index]++;
1292 if (rec->word_token_array_flags[ btoken_index] == 1)
1293 {
1294 num_flagged_by_path++;
1295 #if PRINT_ASTAR_QBT_DETAILS
1296 printf("%db ", btoken_index);
1297 #endif
1298 }
1299 if (last_btoken && last_btoken->end_time <= btoken->end_time)
1300 {
1301 PLogError("bad looping path encountered, breaking");
1302 break;
1303 }
1304 last_btoken = btoken;
1305 }
1306 }
1307
1308 #if PRINT_ASTAR_QBT_DETAILS
1309 printf("complete path %.3d flagged %d\n", i, num_flagged_by_path);
1310 #endif
1311 }
1312 return 0;
1313 }
1314
1315
1316 #if DEBUG_PARP_MANAGEMENT
1317 #define PARP_FREE 1
1318 #define PARP_USED 2
list_free_parps(AstarStack * stack,char * msg)1319 void list_free_parps(AstarStack* stack, char* msg)
1320 {
1321 partial_path* parp;
1322 int i, num = 0;
1323 char x[MAX_NUM_PARPS];
1324 for (i = 0; i < MAX_NUM_PARPS; i++) x[i] = 0;
1325 for (parp = stack->free_parp_list; parp; parp = parp->next)
1326 {
1327 num++;
1328 x[(parp-stack->partial_path_array)] = PARP_FREE;
1329 }
1330 PLogMessage("%sstack->free_parp_list size %d ", msg, num);
1331 PLogMessage("active %d complete %d\n", stack->num_active_paths, stack->num_complete_paths);
1332
1333 for (i = 0; i < stack->num_active_paths; i++)
1334 {
1335 parp = stack->active_paths[i];
1336 for (; parp; parp = parp->next) x[(parp-stack->partial_path_array)] = PARP_USED;
1337 }
1338 for (i = 0; i < stack->num_complete_paths; i++)
1339 {
1340 parp = stack->complete_paths[i];
1341 for (; parp; parp = parp->next) x[(parp-stack->partial_path_array)] = PARP_USED;
1342 }
1343 if (stack->root_path)
1344 x[(stack->root_path-stack->partial_path_array)] = PARP_USED;
1345 printf("free: ");
1346 for (i = 0; i < MAX_NUM_PARPS; i++) if (x[i] == PARP_FREE) printf(" %d", i);
1347 printf("\n");
1348 printf("used: ");
1349 for (i = 0; i < MAX_NUM_PARPS; i++) if (x[i] == PARP_USED) printf(" %d", i);
1350 printf("\n");
1351 for (i = 0, num = 0; i < MAX_NUM_PARPS; i++) if (!x[i]) num++;
1352 printf("unaccounted for %d\n", num);
1353 ASSERT(num == 0);
1354
1355 }
1356 #endif
1357