1 /*
2 ******************************************************************************
3 *
4 * Copyright (C) 1999-2011, International Business Machines
5 * Corporation and others. All Rights Reserved.
6 *
7 ******************************************************************************
8 * file name: ubidiln.c
9 * encoding: US-ASCII
10 * tab size: 8 (not used)
11 * indentation:4
12 *
13 * created on: 1999aug06
14 * created by: Markus W. Scherer, updated by Matitiahu Allouche
15 */
16
17 #include "cmemory.h"
18 #include "unicode/utypes.h"
19 #include "unicode/ustring.h"
20 #include "unicode/uchar.h"
21 #include "unicode/ubidi.h"
22 #include "ubidiimp.h"
23 #include "uassert.h"
24
25 #ifndef U_COMMON_IMPLEMENTATION
26 #error U_COMMON_IMPLEMENTATION not set - must be set for all ICU source files in common/ - see http://userguide.icu-project.org/howtouseicu
27 #endif
28
/*
 * General remarks about the functions in this file:
 *
 * These functions deal with the aspects of potentially mixed-directional
 * text in a single paragraph or in a line of a single paragraph
 * which has already been processed according to
 * the Unicode 3.0 BiDi algorithm as defined in
 * http://www.unicode.org/unicode/reports/tr9/ , version 13,
 * also described in The Unicode Standard, Version 4.0.1 .
 *
 * This means that there is a UBiDi object with a levels
 * and a dirProps array.
 * paraLevel and direction are also set.
 * Only if the length of the text is zero, then levels==dirProps==NULL.
 *
 * The overall directionality of the paragraph
 * or line is used to bypass the reordering steps if possible.
 * Even purely RTL text does not need reordering there because
 * the ubidi_getLogical/VisualIndex() functions can compute the
 * index on the fly in such a case.
 *
 * The implementation of the access to same-level-runs and of the reordering
 * attempts to provide better performance and less memory usage compared to
 * a direct implementation of especially rule (L2) with an array of
 * one (32-bit) integer per text character.
 *
 * Here, the levels array is scanned as soon as necessary, and a vector of
 * same-level-runs is created. Reordering then is done on this vector.
 * For each run of text positions that were resolved to the same level,
 * only 8 bytes are stored: the first text position of the run and the visual
 * position behind the run after reordering.
 * One sign bit is used to hold the directionality of the run.
 * This is inefficient if there are many very short runs. If the average run
 * length is <2, then this uses more memory.
 *
 * In a further attempt to save memory, the levels array is never changed
 * after all the resolution rules (Xn, Wn, Nn, In).
 * Many functions have to consider the field trailingWSStart:
 * if it is less than length, then there is an implicit trailing run
 * at the paraLevel,
 * which is not reflected in the levels array.
 * This allows a line UBiDi object to use the same levels array as
 * its paragraph parent object.
 *
 * When a UBiDi object is created for a line of a paragraph, then the
 * paragraph's levels and dirProps arrays are reused by way of setting
 * a pointer into them, not by copying. This again saves memory and forbids
 * changing the now shared levels for (L1).
 */
78
79 /* handle trailing WS (L1) -------------------------------------------------- */
80
81 /*
82 * setTrailingWSStart() sets the start index for a trailing
83 * run of WS in the line. This is necessary because we do not modify
84 * the paragraph's levels array that we just point into.
85 * Using trailingWSStart is another form of performing (L1).
86 *
87 * To make subsequent operations easier, we also include the run
88 * before the WS if it is at the paraLevel - we merge the two here.
89 *
90 * This function is called only from ubidi_setLine(), so pBiDi->paraLevel is
91 * set correctly for the line even when contextual multiple paragraphs.
92 */
93 static void
setTrailingWSStart(UBiDi * pBiDi)94 setTrailingWSStart(UBiDi *pBiDi) {
95 /* pBiDi->direction!=UBIDI_MIXED */
96
97 const DirProp *dirProps=pBiDi->dirProps;
98 UBiDiLevel *levels=pBiDi->levels;
99 int32_t start=pBiDi->length;
100 UBiDiLevel paraLevel=pBiDi->paraLevel;
101
102 /* If the line is terminated by a block separator, all preceding WS etc...
103 are already set to paragraph level.
104 Setting trailingWSStart to pBidi->length will avoid changing the
105 level of B chars from 0 to paraLevel in ubidi_getLevels when
106 orderParagraphsLTR==TRUE.
107 */
108 if(NO_CONTEXT_RTL(dirProps[start-1])==B) {
109 pBiDi->trailingWSStart=start; /* currently == pBiDi->length */
110 return;
111 }
112 /* go backwards across all WS, BN, explicit codes */
113 while(start>0 && DIRPROP_FLAG_NC(dirProps[start-1])&MASK_WS) {
114 --start;
115 }
116
117 /* if the WS run can be merged with the previous run then do so here */
118 while(start>0 && levels[start-1]==paraLevel) {
119 --start;
120 }
121
122 pBiDi->trailingWSStart=start;
123 }
124
125 /* ubidi_setLine ------------------------------------------------------------ */
126
127 U_CAPI void U_EXPORT2
ubidi_setLine(const UBiDi * pParaBiDi,int32_t start,int32_t limit,UBiDi * pLineBiDi,UErrorCode * pErrorCode)128 ubidi_setLine(const UBiDi *pParaBiDi,
129 int32_t start, int32_t limit,
130 UBiDi *pLineBiDi,
131 UErrorCode *pErrorCode) {
132 int32_t length;
133
134 /* check the argument values */
135 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
136 RETURN_VOID_IF_NOT_VALID_PARA(pParaBiDi, *pErrorCode);
137 RETURN_VOID_IF_BAD_RANGE(start, 0, limit, *pErrorCode);
138 RETURN_VOID_IF_BAD_RANGE(limit, 0, pParaBiDi->length+1, *pErrorCode);
139 if(pLineBiDi==NULL) {
140 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
141 return;
142 }
143 if(ubidi_getParagraph(pParaBiDi, start, NULL, NULL, NULL, pErrorCode) !=
144 ubidi_getParagraph(pParaBiDi, limit-1, NULL, NULL, NULL, pErrorCode)) {
145 /* the line crosses a paragraph boundary */
146 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
147 return;
148 }
149
150 /* set the values in pLineBiDi from its pParaBiDi parent */
151 pLineBiDi->pParaBiDi=NULL; /* mark unfinished setLine */
152 pLineBiDi->text=pParaBiDi->text+start;
153 length=pLineBiDi->length=limit-start;
154 pLineBiDi->resultLength=pLineBiDi->originalLength=length;
155 pLineBiDi->paraLevel=GET_PARALEVEL(pParaBiDi, start);
156 pLineBiDi->paraCount=pParaBiDi->paraCount;
157 pLineBiDi->runs=NULL;
158 pLineBiDi->flags=0;
159 pLineBiDi->reorderingMode=pParaBiDi->reorderingMode;
160 pLineBiDi->reorderingOptions=pParaBiDi->reorderingOptions;
161 pLineBiDi->controlCount=0;
162 if(pParaBiDi->controlCount>0) {
163 int32_t j;
164 for(j=start; j<limit; j++) {
165 if(IS_BIDI_CONTROL_CHAR(pParaBiDi->text[j])) {
166 pLineBiDi->controlCount++;
167 }
168 }
169 pLineBiDi->resultLength-=pLineBiDi->controlCount;
170 }
171
172 pLineBiDi->dirProps=pParaBiDi->dirProps+start;
173 pLineBiDi->levels=pParaBiDi->levels+start;
174 pLineBiDi->runCount=-1;
175
176 if(pParaBiDi->direction!=UBIDI_MIXED) {
177 /* the parent is already trivial */
178 pLineBiDi->direction=pParaBiDi->direction;
179
180 /*
181 * The parent's levels are all either
182 * implicitly or explicitly ==paraLevel;
183 * do the same here.
184 */
185 if(pParaBiDi->trailingWSStart<=start) {
186 pLineBiDi->trailingWSStart=0;
187 } else if(pParaBiDi->trailingWSStart<limit) {
188 pLineBiDi->trailingWSStart=pParaBiDi->trailingWSStart-start;
189 } else {
190 pLineBiDi->trailingWSStart=length;
191 }
192 } else {
193 const UBiDiLevel *levels=pLineBiDi->levels;
194 int32_t i, trailingWSStart;
195 UBiDiLevel level;
196
197 setTrailingWSStart(pLineBiDi);
198 trailingWSStart=pLineBiDi->trailingWSStart;
199
200 /* recalculate pLineBiDi->direction */
201 if(trailingWSStart==0) {
202 /* all levels are at paraLevel */
203 pLineBiDi->direction=(UBiDiDirection)(pLineBiDi->paraLevel&1);
204 } else {
205 /* get the level of the first character */
206 level=(UBiDiLevel)(levels[0]&1);
207
208 /* if there is anything of a different level, then the line is mixed */
209 if(trailingWSStart<length && (pLineBiDi->paraLevel&1)!=level) {
210 /* the trailing WS is at paraLevel, which differs from levels[0] */
211 pLineBiDi->direction=UBIDI_MIXED;
212 } else {
213 /* see if levels[1..trailingWSStart-1] have the same direction as levels[0] and paraLevel */
214 i=1;
215 for(;;) {
216 if(i==trailingWSStart) {
217 /* the direction values match those in level */
218 pLineBiDi->direction=(UBiDiDirection)level;
219 break;
220 } else if((levels[i]&1)!=level) {
221 pLineBiDi->direction=UBIDI_MIXED;
222 break;
223 }
224 ++i;
225 }
226 }
227 }
228
229 switch(pLineBiDi->direction) {
230 case UBIDI_LTR:
231 /* make sure paraLevel is even */
232 pLineBiDi->paraLevel=(UBiDiLevel)((pLineBiDi->paraLevel+1)&~1);
233
234 /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
235 pLineBiDi->trailingWSStart=0;
236 break;
237 case UBIDI_RTL:
238 /* make sure paraLevel is odd */
239 pLineBiDi->paraLevel|=1;
240
241 /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
242 pLineBiDi->trailingWSStart=0;
243 break;
244 default:
245 break;
246 }
247 }
248 pLineBiDi->pParaBiDi=pParaBiDi; /* mark successful setLine */
249 return;
250 }
251
252 U_CAPI UBiDiLevel U_EXPORT2
ubidi_getLevelAt(const UBiDi * pBiDi,int32_t charIndex)253 ubidi_getLevelAt(const UBiDi *pBiDi, int32_t charIndex) {
254 /* return paraLevel if in the trailing WS run, otherwise the real level */
255 if(!IS_VALID_PARA_OR_LINE(pBiDi) || charIndex<0 || pBiDi->length<=charIndex) {
256 return 0;
257 } else if(pBiDi->direction!=UBIDI_MIXED || charIndex>=pBiDi->trailingWSStart) {
258 return GET_PARALEVEL(pBiDi, charIndex);
259 } else {
260 return pBiDi->levels[charIndex];
261 }
262 }
263
264 U_CAPI const UBiDiLevel * U_EXPORT2
ubidi_getLevels(UBiDi * pBiDi,UErrorCode * pErrorCode)265 ubidi_getLevels(UBiDi *pBiDi, UErrorCode *pErrorCode) {
266 int32_t start, length;
267
268 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, NULL);
269 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, NULL);
270 if((length=pBiDi->length)<=0) {
271 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
272 return NULL;
273 }
274 if((start=pBiDi->trailingWSStart)==length) {
275 /* the current levels array reflects the WS run */
276 return pBiDi->levels;
277 }
278
279 /*
280 * After the previous if(), we know that the levels array
281 * has an implicit trailing WS run and therefore does not fully
282 * reflect itself all the levels.
283 * This must be a UBiDi object for a line, and
284 * we need to create a new levels array.
285 */
286 if(getLevelsMemory(pBiDi, length)) {
287 UBiDiLevel *levels=pBiDi->levelsMemory;
288
289 if(start>0 && levels!=pBiDi->levels) {
290 uprv_memcpy(levels, pBiDi->levels, start);
291 }
292 /* pBiDi->paraLevel is ok even if contextual multiple paragraphs,
293 since pBidi is a line object */
294 uprv_memset(levels+start, pBiDi->paraLevel, length-start);
295
296 /* this new levels array is set for the line and reflects the WS run */
297 pBiDi->trailingWSStart=length;
298 return pBiDi->levels=levels;
299 } else {
300 /* out of memory */
301 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
302 return NULL;
303 }
304 }
305
306 U_CAPI void U_EXPORT2
ubidi_getLogicalRun(const UBiDi * pBiDi,int32_t logicalPosition,int32_t * pLogicalLimit,UBiDiLevel * pLevel)307 ubidi_getLogicalRun(const UBiDi *pBiDi, int32_t logicalPosition,
308 int32_t *pLogicalLimit, UBiDiLevel *pLevel) {
309 UErrorCode errorCode;
310 int32_t runCount, visualStart, logicalLimit, logicalFirst, i;
311 Run iRun;
312
313 errorCode=U_ZERO_ERROR;
314 RETURN_VOID_IF_BAD_RANGE(logicalPosition, 0, pBiDi->length, errorCode);
315 /* ubidi_countRuns will check VALID_PARA_OR_LINE */
316 runCount=ubidi_countRuns((UBiDi *)pBiDi, &errorCode);
317 if(U_FAILURE(errorCode)) {
318 return;
319 }
320 /* this is done based on runs rather than on levels since levels have
321 a special interpretation when UBIDI_REORDER_RUNS_ONLY
322 */
323 visualStart=logicalLimit=0;
324 iRun=pBiDi->runs[0];
325
326 for(i=0; i<runCount; i++) {
327 iRun = pBiDi->runs[i];
328 logicalFirst=GET_INDEX(iRun.logicalStart);
329 logicalLimit=logicalFirst+iRun.visualLimit-visualStart;
330 if((logicalPosition>=logicalFirst) &&
331 (logicalPosition<logicalLimit)) {
332 break;
333 }
334 visualStart = iRun.visualLimit;
335 }
336 if(pLogicalLimit) {
337 *pLogicalLimit=logicalLimit;
338 }
339 if(pLevel) {
340 if(pBiDi->reorderingMode==UBIDI_REORDER_RUNS_ONLY) {
341 *pLevel=(UBiDiLevel)GET_ODD_BIT(iRun.logicalStart);
342 }
343 else if(pBiDi->direction!=UBIDI_MIXED || logicalPosition>=pBiDi->trailingWSStart) {
344 *pLevel=GET_PARALEVEL(pBiDi, logicalPosition);
345 } else {
346 *pLevel=pBiDi->levels[logicalPosition];
347 }
348 }
349 }
350
351 /* runs API functions ------------------------------------------------------- */
352
353 U_CAPI int32_t U_EXPORT2
ubidi_countRuns(UBiDi * pBiDi,UErrorCode * pErrorCode)354 ubidi_countRuns(UBiDi *pBiDi, UErrorCode *pErrorCode) {
355 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
356 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
357 ubidi_getRuns(pBiDi, pErrorCode);
358 if(U_FAILURE(*pErrorCode)) {
359 return -1;
360 }
361 return pBiDi->runCount;
362 }
363
364 U_CAPI UBiDiDirection U_EXPORT2
ubidi_getVisualRun(UBiDi * pBiDi,int32_t runIndex,int32_t * pLogicalStart,int32_t * pLength)365 ubidi_getVisualRun(UBiDi *pBiDi, int32_t runIndex,
366 int32_t *pLogicalStart, int32_t *pLength)
367 {
368 int32_t start;
369 UErrorCode errorCode = U_ZERO_ERROR;
370 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, errorCode, UBIDI_LTR);
371 ubidi_getRuns(pBiDi, &errorCode);
372 if(U_FAILURE(errorCode)) {
373 return UBIDI_LTR;
374 }
375 RETURN_IF_BAD_RANGE(runIndex, 0, pBiDi->runCount, errorCode, UBIDI_LTR);
376
377 start=pBiDi->runs[runIndex].logicalStart;
378 if(pLogicalStart!=NULL) {
379 *pLogicalStart=GET_INDEX(start);
380 }
381 if(pLength!=NULL) {
382 if(runIndex>0) {
383 *pLength=pBiDi->runs[runIndex].visualLimit-
384 pBiDi->runs[runIndex-1].visualLimit;
385 } else {
386 *pLength=pBiDi->runs[0].visualLimit;
387 }
388 }
389 return (UBiDiDirection)GET_ODD_BIT(start);
390 }
391
392 /* in trivial cases there is only one trivial run; called by ubidi_getRuns() */
393 static void
getSingleRun(UBiDi * pBiDi,UBiDiLevel level)394 getSingleRun(UBiDi *pBiDi, UBiDiLevel level) {
395 /* simple, single-run case */
396 pBiDi->runs=pBiDi->simpleRuns;
397 pBiDi->runCount=1;
398
399 /* fill and reorder the single run */
400 pBiDi->runs[0].logicalStart=MAKE_INDEX_ODD_PAIR(0, level);
401 pBiDi->runs[0].visualLimit=pBiDi->length;
402 pBiDi->runs[0].insertRemove=0;
403 }
404
405 /* reorder the runs array (L2) ---------------------------------------------- */
406
407 /*
408 * Reorder the same-level runs in the runs array.
409 * Here, runCount>1 and maxLevel>=minLevel>=paraLevel.
410 * All the visualStart fields=logical start before reordering.
411 * The "odd" bits are not set yet.
412 *
413 * Reordering with this data structure lends itself to some handy shortcuts:
414 *
415 * Since each run is moved but not modified, and since at the initial maxLevel
416 * each sequence of same-level runs consists of only one run each, we
417 * don't need to do anything there and can predecrement maxLevel.
418 * In many simple cases, the reordering is thus done entirely in the
419 * index mapping.
420 * Also, reordering occurs only down to the lowest odd level that occurs,
421 * which is minLevel|1. However, if the lowest level itself is odd, then
422 * in the last reordering the sequence of the runs at this level or higher
423 * will be all runs, and we don't need the elaborate loop to search for them.
424 * This is covered by ++minLevel instead of minLevel|=1 followed
425 * by an extra reorder-all after the reorder-some loop.
426 * About a trailing WS run:
427 * Such a run would need special treatment because its level is not
428 * reflected in levels[] if this is not a paragraph object.
429 * Instead, all characters from trailingWSStart on are implicitly at
430 * paraLevel.
431 * However, for all maxLevel>paraLevel, this run will never be reordered
432 * and does not need to be taken into account. maxLevel==paraLevel is only reordered
433 * if minLevel==paraLevel is odd, which is done in the extra segment.
434 * This means that for the main reordering loop we don't need to consider
435 * this run and can --runCount. If it is later part of the all-runs
436 * reordering, then runCount is adjusted accordingly.
437 */
438 static void
reorderLine(UBiDi * pBiDi,UBiDiLevel minLevel,UBiDiLevel maxLevel)439 reorderLine(UBiDi *pBiDi, UBiDiLevel minLevel, UBiDiLevel maxLevel) {
440 Run *runs, tempRun;
441 UBiDiLevel *levels;
442 int32_t firstRun, endRun, limitRun, runCount;
443
444 /* nothing to do? */
445 if(maxLevel<=(minLevel|1)) {
446 return;
447 }
448
449 /*
450 * Reorder only down to the lowest odd level
451 * and reorder at an odd minLevel in a separate, simpler loop.
452 * See comments above for why minLevel is always incremented.
453 */
454 ++minLevel;
455
456 runs=pBiDi->runs;
457 levels=pBiDi->levels;
458 runCount=pBiDi->runCount;
459
460 /* do not include the WS run at paraLevel<=old minLevel except in the simple loop */
461 if(pBiDi->trailingWSStart<pBiDi->length) {
462 --runCount;
463 }
464
465 while(--maxLevel>=minLevel) {
466 firstRun=0;
467
468 /* loop for all sequences of runs */
469 for(;;) {
470 /* look for a sequence of runs that are all at >=maxLevel */
471 /* look for the first run of such a sequence */
472 while(firstRun<runCount && levels[runs[firstRun].logicalStart]<maxLevel) {
473 ++firstRun;
474 }
475 if(firstRun>=runCount) {
476 break; /* no more such runs */
477 }
478
479 /* look for the limit run of such a sequence (the run behind it) */
480 for(limitRun=firstRun; ++limitRun<runCount && levels[runs[limitRun].logicalStart]>=maxLevel;) {}
481
482 /* Swap the entire sequence of runs from firstRun to limitRun-1. */
483 endRun=limitRun-1;
484 while(firstRun<endRun) {
485 tempRun = runs[firstRun];
486 runs[firstRun]=runs[endRun];
487 runs[endRun]=tempRun;
488 ++firstRun;
489 --endRun;
490 }
491
492 if(limitRun==runCount) {
493 break; /* no more such runs */
494 } else {
495 firstRun=limitRun+1;
496 }
497 }
498 }
499
500 /* now do maxLevel==old minLevel (==odd!), see above */
501 if(!(minLevel&1)) {
502 firstRun=0;
503
504 /* include the trailing WS run in this complete reordering */
505 if(pBiDi->trailingWSStart==pBiDi->length) {
506 --runCount;
507 }
508
509 /* Swap the entire sequence of all runs. (endRun==runCount) */
510 while(firstRun<runCount) {
511 tempRun=runs[firstRun];
512 runs[firstRun]=runs[runCount];
513 runs[runCount]=tempRun;
514 ++firstRun;
515 --runCount;
516 }
517 }
518 }
519
520 /* compute the runs array --------------------------------------------------- */
521
getRunFromLogicalIndex(UBiDi * pBiDi,int32_t logicalIndex,UErrorCode * pErrorCode)522 static int32_t getRunFromLogicalIndex(UBiDi *pBiDi, int32_t logicalIndex, UErrorCode *pErrorCode) {
523 Run *runs=pBiDi->runs;
524 int32_t runCount=pBiDi->runCount, visualStart=0, i, length, logicalStart;
525
526 for(i=0; i<runCount; i++) {
527 length=runs[i].visualLimit-visualStart;
528 logicalStart=GET_INDEX(runs[i].logicalStart);
529 if((logicalIndex>=logicalStart) && (logicalIndex<(logicalStart+length))) {
530 return i;
531 }
532 visualStart+=length;
533 }
534 /* we should never get here */
535 U_ASSERT(FALSE);
536 *pErrorCode = U_INVALID_STATE_ERROR;
537 return 0;
538 }
539
540 /*
541 * Compute the runs array from the levels array.
542 * After ubidi_getRuns() returns TRUE, runCount is guaranteed to be >0
543 * and the runs are reordered.
544 * Odd-level runs have visualStart on their visual right edge and
545 * they progress visually to the left.
546 * If option UBIDI_OPTION_INSERT_MARKS is set, insertRemove will contain the
547 * sum of appropriate LRM/RLM_BEFORE/AFTER flags.
548 * If option UBIDI_OPTION_REMOVE_CONTROLS is set, insertRemove will contain the
549 * negative number of BiDi control characters within this run.
550 */
551 U_CFUNC UBool
ubidi_getRuns(UBiDi * pBiDi,UErrorCode * pErrorCode)552 ubidi_getRuns(UBiDi *pBiDi, UErrorCode *pErrorCode) {
553 /*
554 * This method returns immediately if the runs are already set. This
555 * includes the case of length==0 (handled in setPara)..
556 */
557 if (pBiDi->runCount>=0) {
558 return TRUE;
559 }
560
561 if(pBiDi->direction!=UBIDI_MIXED) {
562 /* simple, single-run case - this covers length==0 */
563 /* pBiDi->paraLevel is ok even for contextual multiple paragraphs */
564 getSingleRun(pBiDi, pBiDi->paraLevel);
565 } else /* UBIDI_MIXED, length>0 */ {
566 /* mixed directionality */
567 int32_t length=pBiDi->length, limit;
568 UBiDiLevel *levels=pBiDi->levels;
569 int32_t i, runCount;
570 UBiDiLevel level=UBIDI_DEFAULT_LTR; /* initialize with no valid level */
571 /*
572 * If there are WS characters at the end of the line
573 * and the run preceding them has a level different from
574 * paraLevel, then they will form their own run at paraLevel (L1).
575 * Count them separately.
576 * We need some special treatment for this in order to not
577 * modify the levels array which a line UBiDi object shares
578 * with its paragraph parent and its other line siblings.
579 * In other words, for the trailing WS, it may be
580 * levels[]!=paraLevel but we have to treat it like it were so.
581 */
582 limit=pBiDi->trailingWSStart;
583 /* count the runs, there is at least one non-WS run, and limit>0 */
584 runCount=0;
585 for(i=0; i<limit; ++i) {
586 /* increment runCount at the start of each run */
587 if(levels[i]!=level) {
588 ++runCount;
589 level=levels[i];
590 }
591 }
592
593 /*
594 * We don't need to see if the last run can be merged with a trailing
595 * WS run because setTrailingWSStart() would have done that.
596 */
597 if(runCount==1 && limit==length) {
598 /* There is only one non-WS run and no trailing WS-run. */
599 getSingleRun(pBiDi, levels[0]);
600 } else /* runCount>1 || limit<length */ {
601 /* allocate and set the runs */
602 Run *runs;
603 int32_t runIndex, start;
604 UBiDiLevel minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1, maxLevel=0;
605
606 /* now, count a (non-mergeable) WS run */
607 if(limit<length) {
608 ++runCount;
609 }
610
611 /* runCount>1 */
612 if(getRunsMemory(pBiDi, runCount)) {
613 runs=pBiDi->runsMemory;
614 } else {
615 return FALSE;
616 }
617
618 /* set the runs */
619 /* FOOD FOR THOUGHT: this could be optimized, e.g.:
620 * 464->444, 484->444, 575->555, 595->555
621 * However, that would take longer. Check also how it would
622 * interact with BiDi control removal and inserting Marks.
623 */
624 runIndex=0;
625
626 /* search for the run limits and initialize visualLimit values with the run lengths */
627 i=0;
628 do {
629 /* prepare this run */
630 start=i;
631 level=levels[i];
632 if(level<minLevel) {
633 minLevel=level;
634 }
635 if(level>maxLevel) {
636 maxLevel=level;
637 }
638
639 /* look for the run limit */
640 while(++i<limit && levels[i]==level) {}
641
642 /* i is another run limit */
643 runs[runIndex].logicalStart=start;
644 runs[runIndex].visualLimit=i-start;
645 runs[runIndex].insertRemove=0;
646 ++runIndex;
647 } while(i<limit);
648
649 if(limit<length) {
650 /* there is a separate WS run */
651 runs[runIndex].logicalStart=limit;
652 runs[runIndex].visualLimit=length-limit;
653 /* For the trailing WS run, pBiDi->paraLevel is ok even
654 if contextual multiple paragraphs. */
655 if(pBiDi->paraLevel<minLevel) {
656 minLevel=pBiDi->paraLevel;
657 }
658 }
659
660 /* set the object fields */
661 pBiDi->runs=runs;
662 pBiDi->runCount=runCount;
663
664 reorderLine(pBiDi, minLevel, maxLevel);
665
666 /* now add the direction flags and adjust the visualLimit's to be just that */
667 /* this loop will also handle the trailing WS run */
668 limit=0;
669 for(i=0; i<runCount; ++i) {
670 ADD_ODD_BIT_FROM_LEVEL(runs[i].logicalStart, levels[runs[i].logicalStart]);
671 limit+=runs[i].visualLimit;
672 runs[i].visualLimit=limit;
673 }
674
675 /* Set the "odd" bit for the trailing WS run. */
676 /* For a RTL paragraph, it will be the *first* run in visual order. */
677 /* For the trailing WS run, pBiDi->paraLevel is ok even if
678 contextual multiple paragraphs. */
679 if(runIndex<runCount) {
680 int32_t trailingRun = ((pBiDi->paraLevel & 1) != 0)? 0 : runIndex;
681
682 ADD_ODD_BIT_FROM_LEVEL(runs[trailingRun].logicalStart, pBiDi->paraLevel);
683 }
684 }
685 }
686
687 /* handle insert LRM/RLM BEFORE/AFTER run */
688 if(pBiDi->insertPoints.size>0) {
689 Point *point, *start=pBiDi->insertPoints.points,
690 *limit=start+pBiDi->insertPoints.size;
691 int32_t runIndex;
692 for(point=start; point<limit; point++) {
693 runIndex=getRunFromLogicalIndex(pBiDi, point->pos, pErrorCode);
694 pBiDi->runs[runIndex].insertRemove|=point->flag;
695 }
696 }
697
698 /* handle remove BiDi control characters */
699 if(pBiDi->controlCount>0) {
700 int32_t runIndex;
701 const UChar *start=pBiDi->text, *limit=start+pBiDi->length, *pu;
702 for(pu=start; pu<limit; pu++) {
703 if(IS_BIDI_CONTROL_CHAR(*pu)) {
704 runIndex=getRunFromLogicalIndex(pBiDi, (int32_t)(pu-start), pErrorCode);
705 pBiDi->runs[runIndex].insertRemove--;
706 }
707 }
708 }
709
710 return TRUE;
711 }
712
713 static UBool
prepareReorder(const UBiDiLevel * levels,int32_t length,int32_t * indexMap,UBiDiLevel * pMinLevel,UBiDiLevel * pMaxLevel)714 prepareReorder(const UBiDiLevel *levels, int32_t length,
715 int32_t *indexMap,
716 UBiDiLevel *pMinLevel, UBiDiLevel *pMaxLevel) {
717 int32_t start;
718 UBiDiLevel level, minLevel, maxLevel;
719
720 if(levels==NULL || length<=0) {
721 return FALSE;
722 }
723
724 /* determine minLevel and maxLevel */
725 minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1;
726 maxLevel=0;
727 for(start=length; start>0;) {
728 level=levels[--start];
729 if(level>UBIDI_MAX_EXPLICIT_LEVEL+1) {
730 return FALSE;
731 }
732 if(level<minLevel) {
733 minLevel=level;
734 }
735 if(level>maxLevel) {
736 maxLevel=level;
737 }
738 }
739 *pMinLevel=minLevel;
740 *pMaxLevel=maxLevel;
741
742 /* initialize the index map */
743 for(start=length; start>0;) {
744 --start;
745 indexMap[start]=start;
746 }
747
748 return TRUE;
749 }
750
751 /* reorder a line based on a levels array (L2) ------------------------------ */
752
753 U_CAPI void U_EXPORT2
ubidi_reorderLogical(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)754 ubidi_reorderLogical(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
755 int32_t start, limit, sumOfSosEos;
756 UBiDiLevel minLevel = 0, maxLevel = 0;
757
758 if(indexMap==NULL || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
759 return;
760 }
761
762 /* nothing to do? */
763 if(minLevel==maxLevel && (minLevel&1)==0) {
764 return;
765 }
766
767 /* reorder only down to the lowest odd level */
768 minLevel|=1;
769
770 /* loop maxLevel..minLevel */
771 do {
772 start=0;
773
774 /* loop for all sequences of levels to reorder at the current maxLevel */
775 for(;;) {
776 /* look for a sequence of levels that are all at >=maxLevel */
777 /* look for the first index of such a sequence */
778 while(start<length && levels[start]<maxLevel) {
779 ++start;
780 }
781 if(start>=length) {
782 break; /* no more such sequences */
783 }
784
785 /* look for the limit of such a sequence (the index behind it) */
786 for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
787
788 /*
789 * sos=start of sequence, eos=end of sequence
790 *
791 * The closed (inclusive) interval from sos to eos includes all the logical
792 * and visual indexes within this sequence. They are logically and
793 * visually contiguous and in the same range.
794 *
795 * For each run, the new visual index=sos+eos-old visual index;
796 * we pre-add sos+eos into sumOfSosEos ->
797 * new visual index=sumOfSosEos-old visual index;
798 */
799 sumOfSosEos=start+limit-1;
800
801 /* reorder each index in the sequence */
802 do {
803 indexMap[start]=sumOfSosEos-indexMap[start];
804 } while(++start<limit);
805
806 /* start==limit */
807 if(limit==length) {
808 break; /* no more such sequences */
809 } else {
810 start=limit+1;
811 }
812 }
813 } while(--maxLevel>=minLevel);
814 }
815
816 U_CAPI void U_EXPORT2
ubidi_reorderVisual(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)817 ubidi_reorderVisual(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
818 int32_t start, end, limit, temp;
819 UBiDiLevel minLevel = 0, maxLevel = 0;
820
821 if(indexMap==NULL || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
822 return;
823 }
824
825 /* nothing to do? */
826 if(minLevel==maxLevel && (minLevel&1)==0) {
827 return;
828 }
829
830 /* reorder only down to the lowest odd level */
831 minLevel|=1;
832
833 /* loop maxLevel..minLevel */
834 do {
835 start=0;
836
837 /* loop for all sequences of levels to reorder at the current maxLevel */
838 for(;;) {
839 /* look for a sequence of levels that are all at >=maxLevel */
840 /* look for the first index of such a sequence */
841 while(start<length && levels[start]<maxLevel) {
842 ++start;
843 }
844 if(start>=length) {
845 break; /* no more such runs */
846 }
847
848 /* look for the limit of such a sequence (the index behind it) */
849 for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
850
851 /*
852 * Swap the entire interval of indexes from start to limit-1.
853 * We don't need to swap the levels for the purpose of this
854 * algorithm: the sequence of levels that we look at does not
855 * move anyway.
856 */
857 end=limit-1;
858 while(start<end) {
859 temp=indexMap[start];
860 indexMap[start]=indexMap[end];
861 indexMap[end]=temp;
862
863 ++start;
864 --end;
865 }
866
867 if(limit==length) {
868 break; /* no more such sequences */
869 } else {
870 start=limit+1;
871 }
872 }
873 } while(--maxLevel>=minLevel);
874 }
875
876 /* API functions for logical<->visual mapping ------------------------------- */
877
878 U_CAPI int32_t U_EXPORT2
ubidi_getVisualIndex(UBiDi * pBiDi,int32_t logicalIndex,UErrorCode * pErrorCode)879 ubidi_getVisualIndex(UBiDi *pBiDi, int32_t logicalIndex, UErrorCode *pErrorCode) {
880 int32_t visualIndex=UBIDI_MAP_NOWHERE;
881 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
882 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
883 RETURN_IF_BAD_RANGE(logicalIndex, 0, pBiDi->length, *pErrorCode, -1);
884
885 /* we can do the trivial cases without the runs array */
886 switch(pBiDi->direction) {
887 case UBIDI_LTR:
888 visualIndex=logicalIndex;
889 break;
890 case UBIDI_RTL:
891 visualIndex=pBiDi->length-logicalIndex-1;
892 break;
893 default:
894 if(!ubidi_getRuns(pBiDi, pErrorCode)) {
895 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
896 return -1;
897 } else {
898 Run *runs=pBiDi->runs;
899 int32_t i, visualStart=0, offset, length;
900
901 /* linear search for the run, search on the visual runs */
902 for(i=0; i<pBiDi->runCount; ++i) {
903 length=runs[i].visualLimit-visualStart;
904 offset=logicalIndex-GET_INDEX(runs[i].logicalStart);
905 if(offset>=0 && offset<length) {
906 if(IS_EVEN_RUN(runs[i].logicalStart)) {
907 /* LTR */
908 visualIndex=visualStart+offset;
909 } else {
910 /* RTL */
911 visualIndex=visualStart+length-offset-1;
912 }
913 break; /* exit for loop */
914 }
915 visualStart+=length;
916 }
917 if(i>=pBiDi->runCount) {
918 return UBIDI_MAP_NOWHERE;
919 }
920 }
921 }
922
923 if(pBiDi->insertPoints.size>0) {
924 /* add the number of added marks until the calculated visual index */
925 Run *runs=pBiDi->runs;
926 int32_t i, length, insertRemove;
927 int32_t visualStart=0, markFound=0;
928 for(i=0; ; i++, visualStart+=length) {
929 length=runs[i].visualLimit-visualStart;
930 insertRemove=runs[i].insertRemove;
931 if(insertRemove & (LRM_BEFORE|RLM_BEFORE)) {
932 markFound++;
933 }
934 /* is it the run containing the visual index? */
935 if(visualIndex<runs[i].visualLimit) {
936 return visualIndex+markFound;
937 }
938 if(insertRemove & (LRM_AFTER|RLM_AFTER)) {
939 markFound++;
940 }
941 }
942 }
943 else if(pBiDi->controlCount>0) {
944 /* subtract the number of controls until the calculated visual index */
945 Run *runs=pBiDi->runs;
946 int32_t i, j, start, limit, length, insertRemove;
947 int32_t visualStart=0, controlFound=0;
948 UChar uchar=pBiDi->text[logicalIndex];
949 /* is the logical index pointing to a control ? */
950 if(IS_BIDI_CONTROL_CHAR(uchar)) {
951 return UBIDI_MAP_NOWHERE;
952 }
953 /* loop on runs */
954 for(i=0; ; i++, visualStart+=length) {
955 length=runs[i].visualLimit-visualStart;
956 insertRemove=runs[i].insertRemove;
957 /* calculated visual index is beyond this run? */
958 if(visualIndex>=runs[i].visualLimit) {
959 controlFound-=insertRemove;
960 continue;
961 }
962 /* calculated visual index must be within current run */
963 if(insertRemove==0) {
964 return visualIndex-controlFound;
965 }
966 if(IS_EVEN_RUN(runs[i].logicalStart)) {
967 /* LTR: check from run start to logical index */
968 start=runs[i].logicalStart;
969 limit=logicalIndex;
970 } else {
971 /* RTL: check from logical index to run end */
972 start=logicalIndex+1;
973 limit=GET_INDEX(runs[i].logicalStart)+length;
974 }
975 for(j=start; j<limit; j++) {
976 uchar=pBiDi->text[j];
977 if(IS_BIDI_CONTROL_CHAR(uchar)) {
978 controlFound++;
979 }
980 }
981 return visualIndex-controlFound;
982 }
983 }
984
985 return visualIndex;
986 }
987
988 U_CAPI int32_t U_EXPORT2
ubidi_getLogicalIndex(UBiDi * pBiDi,int32_t visualIndex,UErrorCode * pErrorCode)989 ubidi_getLogicalIndex(UBiDi *pBiDi, int32_t visualIndex, UErrorCode *pErrorCode) {
990 Run *runs;
991 int32_t i, runCount, start;
992 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
993 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
994 RETURN_IF_BAD_RANGE(visualIndex, 0, pBiDi->resultLength, *pErrorCode, -1);
995 /* we can do the trivial cases without the runs array */
996 if(pBiDi->insertPoints.size==0 && pBiDi->controlCount==0) {
997 if(pBiDi->direction==UBIDI_LTR) {
998 return visualIndex;
999 }
1000 else if(pBiDi->direction==UBIDI_RTL) {
1001 return pBiDi->length-visualIndex-1;
1002 }
1003 }
1004 if(!ubidi_getRuns(pBiDi, pErrorCode)) {
1005 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
1006 return -1;
1007 }
1008
1009 runs=pBiDi->runs;
1010 runCount=pBiDi->runCount;
1011 if(pBiDi->insertPoints.size>0) {
1012 /* handle inserted LRM/RLM */
1013 int32_t markFound=0, insertRemove;
1014 int32_t visualStart=0, length;
1015 runs=pBiDi->runs;
1016 /* subtract number of marks until visual index */
1017 for(i=0; ; i++, visualStart+=length) {
1018 length=runs[i].visualLimit-visualStart;
1019 insertRemove=runs[i].insertRemove;
1020 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1021 if(visualIndex<=(visualStart+markFound)) {
1022 return UBIDI_MAP_NOWHERE;
1023 }
1024 markFound++;
1025 }
1026 /* is adjusted visual index within this run? */
1027 if(visualIndex<(runs[i].visualLimit+markFound)) {
1028 visualIndex-=markFound;
1029 break;
1030 }
1031 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1032 if(visualIndex==(visualStart+length+markFound)) {
1033 return UBIDI_MAP_NOWHERE;
1034 }
1035 markFound++;
1036 }
1037 }
1038 }
1039 else if(pBiDi->controlCount>0) {
1040 /* handle removed BiDi control characters */
1041 int32_t controlFound=0, insertRemove, length;
1042 int32_t logicalStart, logicalEnd, visualStart=0, j, k;
1043 UChar uchar;
1044 UBool evenRun;
1045 /* add number of controls until visual index */
1046 for(i=0; ; i++, visualStart+=length) {
1047 length=runs[i].visualLimit-visualStart;
1048 insertRemove=runs[i].insertRemove;
1049 /* is adjusted visual index beyond current run? */
1050 if(visualIndex>=(runs[i].visualLimit-controlFound+insertRemove)) {
1051 controlFound-=insertRemove;
1052 continue;
1053 }
1054 /* adjusted visual index is within current run */
1055 if(insertRemove==0) {
1056 visualIndex+=controlFound;
1057 break;
1058 }
1059 /* count non-control chars until visualIndex */
1060 logicalStart=runs[i].logicalStart;
1061 evenRun=IS_EVEN_RUN(logicalStart);
1062 REMOVE_ODD_BIT(logicalStart);
1063 logicalEnd=logicalStart+length-1;
1064 for(j=0; j<length; j++) {
1065 k= evenRun ? logicalStart+j : logicalEnd-j;
1066 uchar=pBiDi->text[k];
1067 if(IS_BIDI_CONTROL_CHAR(uchar)) {
1068 controlFound++;
1069 }
1070 if((visualIndex+controlFound)==(visualStart+j)) {
1071 break;
1072 }
1073 }
1074 visualIndex+=controlFound;
1075 break;
1076 }
1077 }
1078 /* handle all cases */
1079 if(runCount<=10) {
1080 /* linear search for the run */
1081 for(i=0; visualIndex>=runs[i].visualLimit; ++i) {}
1082 } else {
1083 /* binary search for the run */
1084 int32_t begin=0, limit=runCount;
1085
1086 /* the middle if() is guaranteed to find the run, we don't need a loop limit */
1087 for(;;) {
1088 i=(begin+limit)/2;
1089 if(visualIndex>=runs[i].visualLimit) {
1090 begin=i+1;
1091 } else if(i==0 || visualIndex>=runs[i-1].visualLimit) {
1092 break;
1093 } else {
1094 limit=i;
1095 }
1096 }
1097 }
1098
1099 start=runs[i].logicalStart;
1100 if(IS_EVEN_RUN(start)) {
1101 /* LTR */
1102 /* the offset in runs[i] is visualIndex-runs[i-1].visualLimit */
1103 if(i>0) {
1104 visualIndex-=runs[i-1].visualLimit;
1105 }
1106 return start+visualIndex;
1107 } else {
1108 /* RTL */
1109 return GET_INDEX(start)+runs[i].visualLimit-visualIndex-1;
1110 }
1111 }
1112
1113 U_CAPI void U_EXPORT2
ubidi_getLogicalMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1114 ubidi_getLogicalMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1115 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1116 /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1117 ubidi_countRuns(pBiDi, pErrorCode);
1118 if(U_FAILURE(*pErrorCode)) {
1119 /* no op */
1120 } else if(indexMap==NULL) {
1121 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1122 } else {
1123 /* fill a logical-to-visual index map using the runs[] */
1124 int32_t visualStart, visualLimit, i, j, k;
1125 int32_t logicalStart, logicalLimit;
1126 Run *runs=pBiDi->runs;
1127 if (pBiDi->length<=0) {
1128 return;
1129 }
1130 if (pBiDi->length>pBiDi->resultLength) {
1131 uprv_memset(indexMap, 0xFF, pBiDi->length*sizeof(int32_t));
1132 }
1133
1134 visualStart=0;
1135 for(j=0; j<pBiDi->runCount; ++j) {
1136 logicalStart=GET_INDEX(runs[j].logicalStart);
1137 visualLimit=runs[j].visualLimit;
1138 if(IS_EVEN_RUN(runs[j].logicalStart)) {
1139 do { /* LTR */
1140 indexMap[logicalStart++]=visualStart++;
1141 } while(visualStart<visualLimit);
1142 } else {
1143 logicalStart+=visualLimit-visualStart; /* logicalLimit */
1144 do { /* RTL */
1145 indexMap[--logicalStart]=visualStart++;
1146 } while(visualStart<visualLimit);
1147 }
1148 /* visualStart==visualLimit; */
1149 }
1150
1151 if(pBiDi->insertPoints.size>0) {
1152 int32_t markFound=0, runCount=pBiDi->runCount;
1153 int32_t length, insertRemove;
1154 visualStart=0;
1155 /* add number of marks found until each index */
1156 for(i=0; i<runCount; i++, visualStart+=length) {
1157 length=runs[i].visualLimit-visualStart;
1158 insertRemove=runs[i].insertRemove;
1159 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1160 markFound++;
1161 }
1162 if(markFound>0) {
1163 logicalStart=GET_INDEX(runs[i].logicalStart);
1164 logicalLimit=logicalStart+length;
1165 for(j=logicalStart; j<logicalLimit; j++) {
1166 indexMap[j]+=markFound;
1167 }
1168 }
1169 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1170 markFound++;
1171 }
1172 }
1173 }
1174 else if(pBiDi->controlCount>0) {
1175 int32_t controlFound=0, runCount=pBiDi->runCount;
1176 int32_t length, insertRemove;
1177 UBool evenRun;
1178 UChar uchar;
1179 visualStart=0;
1180 /* subtract number of controls found until each index */
1181 for(i=0; i<runCount; i++, visualStart+=length) {
1182 length=runs[i].visualLimit-visualStart;
1183 insertRemove=runs[i].insertRemove;
1184 /* no control found within previous runs nor within this run */
1185 if((controlFound-insertRemove)==0) {
1186 continue;
1187 }
1188 logicalStart=runs[i].logicalStart;
1189 evenRun=IS_EVEN_RUN(logicalStart);
1190 REMOVE_ODD_BIT(logicalStart);
1191 logicalLimit=logicalStart+length;
1192 /* if no control within this run */
1193 if(insertRemove==0) {
1194 for(j=logicalStart; j<logicalLimit; j++) {
1195 indexMap[j]-=controlFound;
1196 }
1197 continue;
1198 }
1199 for(j=0; j<length; j++) {
1200 k= evenRun ? logicalStart+j : logicalLimit-j-1;
1201 uchar=pBiDi->text[k];
1202 if(IS_BIDI_CONTROL_CHAR(uchar)) {
1203 controlFound++;
1204 indexMap[k]=UBIDI_MAP_NOWHERE;
1205 continue;
1206 }
1207 indexMap[k]-=controlFound;
1208 }
1209 }
1210 }
1211 }
1212 }
1213
1214 U_CAPI void U_EXPORT2
ubidi_getVisualMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1215 ubidi_getVisualMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1216 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1217 if(indexMap==NULL) {
1218 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1219 return;
1220 }
1221 /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1222 ubidi_countRuns(pBiDi, pErrorCode);
1223 if(U_SUCCESS(*pErrorCode)) {
1224 /* fill a visual-to-logical index map using the runs[] */
1225 Run *runs=pBiDi->runs, *runsLimit=runs+pBiDi->runCount;
1226 int32_t logicalStart, visualStart, visualLimit, *pi=indexMap;
1227
1228 if (pBiDi->resultLength<=0) {
1229 return;
1230 }
1231 visualStart=0;
1232 for(; runs<runsLimit; ++runs) {
1233 logicalStart=runs->logicalStart;
1234 visualLimit=runs->visualLimit;
1235 if(IS_EVEN_RUN(logicalStart)) {
1236 do { /* LTR */
1237 *pi++ = logicalStart++;
1238 } while(++visualStart<visualLimit);
1239 } else {
1240 REMOVE_ODD_BIT(logicalStart);
1241 logicalStart+=visualLimit-visualStart; /* logicalLimit */
1242 do { /* RTL */
1243 *pi++ = --logicalStart;
1244 } while(++visualStart<visualLimit);
1245 }
1246 /* visualStart==visualLimit; */
1247 }
1248
1249 if(pBiDi->insertPoints.size>0) {
1250 int32_t markFound=0, runCount=pBiDi->runCount;
1251 int32_t insertRemove, i, j, k;
1252 runs=pBiDi->runs;
1253 /* count all inserted marks */
1254 for(i=0; i<runCount; i++) {
1255 insertRemove=runs[i].insertRemove;
1256 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1257 markFound++;
1258 }
1259 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1260 markFound++;
1261 }
1262 }
1263 /* move back indexes by number of preceding marks */
1264 k=pBiDi->resultLength;
1265 for(i=runCount-1; i>=0 && markFound>0; i--) {
1266 insertRemove=runs[i].insertRemove;
1267 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1268 indexMap[--k]= UBIDI_MAP_NOWHERE;
1269 markFound--;
1270 }
1271 visualStart= i>0 ? runs[i-1].visualLimit : 0;
1272 for(j=runs[i].visualLimit-1; j>=visualStart && markFound>0; j--) {
1273 indexMap[--k]=indexMap[j];
1274 }
1275 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1276 indexMap[--k]= UBIDI_MAP_NOWHERE;
1277 markFound--;
1278 }
1279 }
1280 }
1281 else if(pBiDi->controlCount>0) {
1282 int32_t runCount=pBiDi->runCount, logicalEnd;
1283 int32_t insertRemove, length, i, j, k, m;
1284 UChar uchar;
1285 UBool evenRun;
1286 runs=pBiDi->runs;
1287 visualStart=0;
1288 /* move forward indexes by number of preceding controls */
1289 k=0;
1290 for(i=0; i<runCount; i++, visualStart+=length) {
1291 length=runs[i].visualLimit-visualStart;
1292 insertRemove=runs[i].insertRemove;
1293 /* if no control found yet, nothing to do in this run */
1294 if((insertRemove==0)&&(k==visualStart)) {
1295 k+=length;
1296 continue;
1297 }
1298 /* if no control in this run */
1299 if(insertRemove==0) {
1300 visualLimit=runs[i].visualLimit;
1301 for(j=visualStart; j<visualLimit; j++) {
1302 indexMap[k++]=indexMap[j];
1303 }
1304 continue;
1305 }
1306 logicalStart=runs[i].logicalStart;
1307 evenRun=IS_EVEN_RUN(logicalStart);
1308 REMOVE_ODD_BIT(logicalStart);
1309 logicalEnd=logicalStart+length-1;
1310 for(j=0; j<length; j++) {
1311 m= evenRun ? logicalStart+j : logicalEnd-j;
1312 uchar=pBiDi->text[m];
1313 if(!IS_BIDI_CONTROL_CHAR(uchar)) {
1314 indexMap[k++]=m;
1315 }
1316 }
1317 }
1318 }
1319 }
1320 }
1321
1322 U_CAPI void U_EXPORT2
ubidi_invertMap(const int32_t * srcMap,int32_t * destMap,int32_t length)1323 ubidi_invertMap(const int32_t *srcMap, int32_t *destMap, int32_t length) {
1324 if(srcMap!=NULL && destMap!=NULL && length>0) {
1325 const int32_t *pi;
1326 int32_t destLength=-1, count=0;
1327 /* find highest value and count positive indexes in srcMap */
1328 pi=srcMap+length;
1329 while(pi>srcMap) {
1330 if(*--pi>destLength) {
1331 destLength=*pi;
1332 }
1333 if(*pi>=0) {
1334 count++;
1335 }
1336 }
1337 destLength++; /* add 1 for origin 0 */
1338 if(count<destLength) {
1339 /* we must fill unmatched destMap entries with -1 */
1340 uprv_memset(destMap, 0xFF, destLength*sizeof(int32_t));
1341 }
1342 pi=srcMap+length;
1343 while(length>0) {
1344 if(*--pi>=0) {
1345 destMap[*pi]=--length;
1346 } else {
1347 --length;
1348 }
1349 }
1350 }
1351 }
1352