• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ******************************************************************************
5 *
6 *   Copyright (C) 1999-2015, International Business Machines
7 *   Corporation and others.  All Rights Reserved.
8 *
9 ******************************************************************************
10 *   file name:  ubidiln.c
11 *   encoding:   UTF-8
12 *   tab size:   8 (not used)
13 *   indentation:4
14 *
15 *   created on: 1999aug06
16 *   created by: Markus W. Scherer, updated by Matitiahu Allouche
17 */
18 
19 #include "cmemory.h"
20 #include "unicode/utypes.h"
21 #include "unicode/ustring.h"
22 #include "unicode/uchar.h"
23 #include "unicode/ubidi.h"
24 #include "ubidiimp.h"
25 #include "uassert.h"
26 
27 /*
28  * General remarks about the functions in this file:
29  *
30  * These functions deal with the aspects of potentially mixed-directional
31  * text in a single paragraph or in a line of a single paragraph
32  * which has already been processed according to
33  * the Unicode 6.3 BiDi algorithm as defined in
34  * https://www.unicode.org/reports/tr9/ , version 28,
35  * also described in The Unicode Standard, Version 6.3.0 .
36  *
37  * This means that there is a UBiDi object with a levels
38  * and a dirProps array.
39  * paraLevel and direction are also set.
40  * Only if the length of the text is zero, then levels==dirProps==nullptr.
41  *
42  * The overall directionality of the paragraph
43  * or line is used to bypass the reordering steps if possible.
44  * Even purely RTL text does not need reordering there because
45  * the ubidi_getLogical/VisualIndex() functions can compute the
46  * index on the fly in such a case.
47  *
48  * The implementation of the access to same-level-runs and of the reordering
49  * do attempt to provide better performance and less memory usage compared to
50  * a direct implementation of especially rule (L2) with an array of
51  * one (32-bit) integer per text character.
52  *
53  * Here, the levels array is scanned as soon as necessary, and a vector of
54  * same-level-runs is created. Reordering then is done on this vector.
55  * For each run of text positions that were resolved to the same level,
56  * only 8 bytes are stored: the first text position of the run and the visual
57  * position behind the run after reordering.
58  * One sign bit is used to hold the directionality of the run.
59  * This is inefficient if there are many very short runs. If the average run
60  * length is <2, then this uses more memory.
61  *
62  * In a further attempt to save memory, the levels array is never changed
63  * after all the resolution rules (Xn, Wn, Nn, In).
64  * Many functions have to consider the field trailingWSStart:
65  * if it is less than length, then there is an implicit trailing run
66  * at the paraLevel,
67  * which is not reflected in the levels array.
68  * This allows a line UBiDi object to use the same levels array as
69  * its paragraph parent object.
70  *
71  * When a UBiDi object is created for a line of a paragraph, then the
72  * paragraph's levels and dirProps arrays are reused by way of setting
 * a pointer into them, not by copying. This again saves memory, and it means
 * that the now-shared levels must not be modified in order to apply (L1).
75  */
76 
77 /* handle trailing WS (L1) -------------------------------------------------- */
78 
79 /*
80  * setTrailingWSStart() sets the start index for a trailing
81  * run of WS in the line. This is necessary because we do not modify
82  * the paragraph's levels array that we just point into.
83  * Using trailingWSStart is another form of performing (L1).
84  *
85  * To make subsequent operations easier, we also include the run
86  * before the WS if it is at the paraLevel - we merge the two here.
87  *
88  * This function is called only from ubidi_setLine(), so pBiDi->paraLevel is
89  * set correctly for the line even when contextual multiple paragraphs.
90  */
91 static void
setTrailingWSStart(UBiDi * pBiDi)92 setTrailingWSStart(UBiDi *pBiDi) {
93     /* pBiDi->direction!=UBIDI_MIXED */
94 
95     const DirProp *dirProps=pBiDi->dirProps;
96     UBiDiLevel *levels=pBiDi->levels;
97     int32_t start=pBiDi->length;
98     UBiDiLevel paraLevel=pBiDi->paraLevel;
99 
100     /* If the line is terminated by a block separator, all preceding WS etc...
101        are already set to paragraph level.
102        Setting trailingWSStart to pBidi->length will avoid changing the
103        level of B chars from 0 to paraLevel in ubidi_getLevels when
104        orderParagraphsLTR==true.
105      */
106     if(dirProps[start-1]==B) {
107         pBiDi->trailingWSStart=start;   /* currently == pBiDi->length */
108         return;
109     }
110     /* go backwards across all WS, BN, explicit codes */
111     while(start>0 && DIRPROP_FLAG(dirProps[start-1])&MASK_WS) {
112         --start;
113     }
114 
115     /* if the WS run can be merged with the previous run then do so here */
116     while(start>0 && levels[start-1]==paraLevel) {
117         --start;
118     }
119 
120     pBiDi->trailingWSStart=start;
121 }
122 
123 /* ubidi_setLine ------------------------------------------------------------ */
124 
125 U_CAPI void U_EXPORT2
ubidi_setLine(const UBiDi * pParaBiDi,int32_t start,int32_t limit,UBiDi * pLineBiDi,UErrorCode * pErrorCode)126 ubidi_setLine(const UBiDi *pParaBiDi,
127               int32_t start, int32_t limit,
128               UBiDi *pLineBiDi,
129               UErrorCode *pErrorCode) {
130     int32_t length;
131 
132     /* check the argument values */
133     RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
134     RETURN_VOID_IF_NOT_VALID_PARA(pParaBiDi, *pErrorCode);
135     RETURN_VOID_IF_BAD_RANGE(start, 0, limit, *pErrorCode);
136     RETURN_VOID_IF_BAD_RANGE(limit, 0, pParaBiDi->length+1, *pErrorCode);
137     if(pLineBiDi==nullptr) {
138         *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
139         return;
140     }
141     if(ubidi_getParagraph(pParaBiDi, start, nullptr, nullptr, nullptr, pErrorCode) !=
142        ubidi_getParagraph(pParaBiDi, limit-1, nullptr, nullptr, nullptr, pErrorCode)) {
143         /* the line crosses a paragraph boundary */
144         *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
145         return;
146     }
147 
148     /* set the values in pLineBiDi from its pParaBiDi parent */
149     pLineBiDi->pParaBiDi=nullptr;          /* mark unfinished setLine */
150     pLineBiDi->text=pParaBiDi->text+start;
151     length=pLineBiDi->length=limit-start;
152     pLineBiDi->resultLength=pLineBiDi->originalLength=length;
153     pLineBiDi->paraLevel=GET_PARALEVEL(pParaBiDi, start);
154     pLineBiDi->paraCount=pParaBiDi->paraCount;
155     pLineBiDi->runs=nullptr;
156     pLineBiDi->flags=0;
157     pLineBiDi->reorderingMode=pParaBiDi->reorderingMode;
158     pLineBiDi->reorderingOptions=pParaBiDi->reorderingOptions;
159     pLineBiDi->controlCount=0;
160     if(pParaBiDi->controlCount>0) {
161         int32_t j;
162         for(j=start; j<limit; j++) {
163             if(IS_BIDI_CONTROL_CHAR(pParaBiDi->text[j])) {
164                 pLineBiDi->controlCount++;
165             }
166         }
167         pLineBiDi->resultLength-=pLineBiDi->controlCount;
168     }
169 
170     pLineBiDi->dirProps=pParaBiDi->dirProps+start;
171     pLineBiDi->levels=pParaBiDi->levels+start;
172     pLineBiDi->runCount=-1;
173 
174     if(pParaBiDi->direction!=UBIDI_MIXED) {
175         /* the parent is already trivial */
176         pLineBiDi->direction=pParaBiDi->direction;
177 
178         /*
179          * The parent's levels are all either
180          * implicitly or explicitly ==paraLevel;
181          * do the same here.
182          */
183         if(pParaBiDi->trailingWSStart<=start) {
184             pLineBiDi->trailingWSStart=0;
185         } else if(pParaBiDi->trailingWSStart<limit) {
186             pLineBiDi->trailingWSStart=pParaBiDi->trailingWSStart-start;
187         } else {
188             pLineBiDi->trailingWSStart=length;
189         }
190     } else {
191         const UBiDiLevel *levels=pLineBiDi->levels;
192         int32_t i, trailingWSStart;
193         UBiDiLevel level;
194 
195         setTrailingWSStart(pLineBiDi);
196         trailingWSStart=pLineBiDi->trailingWSStart;
197 
198         /* recalculate pLineBiDi->direction */
199         if(trailingWSStart==0) {
200             /* all levels are at paraLevel */
201             pLineBiDi->direction=(UBiDiDirection)(pLineBiDi->paraLevel&1);
202         } else {
203             /* get the level of the first character */
204             level=(UBiDiLevel)(levels[0]&1);
205 
206             /* if there is anything of a different level, then the line is mixed */
207             if(trailingWSStart<length && (pLineBiDi->paraLevel&1)!=level) {
208                 /* the trailing WS is at paraLevel, which differs from levels[0] */
209                 pLineBiDi->direction=UBIDI_MIXED;
210             } else {
211                 /* see if levels[1..trailingWSStart-1] have the same direction as levels[0] and paraLevel */
212                 i=1;
213                 for(;;) {
214                     if(i==trailingWSStart) {
215                         /* the direction values match those in level */
216                         pLineBiDi->direction=(UBiDiDirection)level;
217                         break;
218                     } else if((levels[i]&1)!=level) {
219                         pLineBiDi->direction=UBIDI_MIXED;
220                         break;
221                     }
222                     ++i;
223                 }
224             }
225         }
226 
227         switch(pLineBiDi->direction) {
228         case UBIDI_LTR:
229             /* make sure paraLevel is even */
230             pLineBiDi->paraLevel=(UBiDiLevel)((pLineBiDi->paraLevel+1)&~1);
231 
232             /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
233             pLineBiDi->trailingWSStart=0;
234             break;
235         case UBIDI_RTL:
236             /* make sure paraLevel is odd */
237             pLineBiDi->paraLevel|=1;
238 
239             /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
240             pLineBiDi->trailingWSStart=0;
241             break;
242         default:
243             break;
244         }
245     }
246     pLineBiDi->pParaBiDi=pParaBiDi;     /* mark successful setLine */
247 }
248 
249 U_CAPI UBiDiLevel U_EXPORT2
ubidi_getLevelAt(const UBiDi * pBiDi,int32_t charIndex)250 ubidi_getLevelAt(const UBiDi *pBiDi, int32_t charIndex) {
251     /* return paraLevel if in the trailing WS run, otherwise the real level */
252     if(!IS_VALID_PARA_OR_LINE(pBiDi) || charIndex<0 || pBiDi->length<=charIndex) {
253         return 0;
254     } else if(pBiDi->direction!=UBIDI_MIXED || charIndex>=pBiDi->trailingWSStart) {
255         return GET_PARALEVEL(pBiDi, charIndex);
256     } else {
257         return pBiDi->levels[charIndex];
258     }
259 }
260 
261 U_CAPI const UBiDiLevel * U_EXPORT2
ubidi_getLevels(UBiDi * pBiDi,UErrorCode * pErrorCode)262 ubidi_getLevels(UBiDi *pBiDi, UErrorCode *pErrorCode) {
263     int32_t start, length;
264 
265     RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, nullptr);
266     RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, nullptr);
267     if((length=pBiDi->length)<=0) {
268         *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
269         return nullptr;
270     }
271     if((start=pBiDi->trailingWSStart)==length) {
272         /* the current levels array reflects the WS run */
273         return pBiDi->levels;
274     }
275 
276     /*
277      * After the previous if(), we know that the levels array
278      * has an implicit trailing WS run and therefore does not fully
279      * reflect itself all the levels.
280      * This must be a UBiDi object for a line, and
281      * we need to create a new levels array.
282      */
283     if(getLevelsMemory(pBiDi, length)) {
284         UBiDiLevel *levels=pBiDi->levelsMemory;
285 
286         if(start>0 && levels!=pBiDi->levels) {
287             uprv_memcpy(levels, pBiDi->levels, start);
288         }
289         /* pBiDi->paraLevel is ok even if contextual multiple paragraphs,
290            since pBidi is a line object                                     */
291         uprv_memset(levels+start, pBiDi->paraLevel, length-start);
292 
293         /* this new levels array is set for the line and reflects the WS run */
294         pBiDi->trailingWSStart=length;
295         return pBiDi->levels=levels;
296     } else {
297         /* out of memory */
298         *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
299         return nullptr;
300     }
301 }
302 
303 U_CAPI void U_EXPORT2
ubidi_getLogicalRun(const UBiDi * pBiDi,int32_t logicalPosition,int32_t * pLogicalLimit,UBiDiLevel * pLevel)304 ubidi_getLogicalRun(const UBiDi *pBiDi, int32_t logicalPosition,
305                     int32_t *pLogicalLimit, UBiDiLevel *pLevel) {
306     UErrorCode errorCode;
307     int32_t runCount, visualStart, logicalLimit, logicalFirst, i;
308     Run iRun;
309 
310     errorCode=U_ZERO_ERROR;
311     RETURN_VOID_IF_BAD_RANGE(logicalPosition, 0, pBiDi->length, errorCode);
312     /* ubidi_countRuns will check VALID_PARA_OR_LINE */
313     runCount=ubidi_countRuns((UBiDi *)pBiDi, &errorCode);
314     if(U_FAILURE(errorCode)) {
315         return;
316     }
317     /* this is done based on runs rather than on levels since levels have
318        a special interpretation when UBIDI_REORDER_RUNS_ONLY
319      */
320     visualStart=logicalLimit=0;
321     iRun=pBiDi->runs[0];
322 
323     for(i=0; i<runCount; i++) {
324         iRun = pBiDi->runs[i];
325         logicalFirst=GET_INDEX(iRun.logicalStart);
326         logicalLimit=logicalFirst+iRun.visualLimit-visualStart;
327         if((logicalPosition>=logicalFirst) &&
328            (logicalPosition<logicalLimit)) {
329             break;
330         }
331         visualStart = iRun.visualLimit;
332     }
333     if(pLogicalLimit) {
334         *pLogicalLimit=logicalLimit;
335     }
336     if(pLevel) {
337         if(pBiDi->reorderingMode==UBIDI_REORDER_RUNS_ONLY) {
338             *pLevel=(UBiDiLevel)GET_ODD_BIT(iRun.logicalStart);
339         }
340         else if(pBiDi->direction!=UBIDI_MIXED || logicalPosition>=pBiDi->trailingWSStart) {
341             *pLevel=GET_PARALEVEL(pBiDi, logicalPosition);
342         } else {
343         *pLevel=pBiDi->levels[logicalPosition];
344         }
345     }
346 }
347 
348 /* runs API functions ------------------------------------------------------- */
349 
350 U_CAPI int32_t U_EXPORT2
ubidi_countRuns(UBiDi * pBiDi,UErrorCode * pErrorCode)351 ubidi_countRuns(UBiDi *pBiDi, UErrorCode *pErrorCode) {
352     RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
353     RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
354     ubidi_getRuns(pBiDi, pErrorCode);
355     if(U_FAILURE(*pErrorCode)) {
356         return -1;
357     }
358     return pBiDi->runCount;
359 }
360 
361 U_CAPI UBiDiDirection U_EXPORT2
ubidi_getVisualRun(UBiDi * pBiDi,int32_t runIndex,int32_t * pLogicalStart,int32_t * pLength)362 ubidi_getVisualRun(UBiDi *pBiDi, int32_t runIndex,
363                    int32_t *pLogicalStart, int32_t *pLength)
364 {
365     int32_t start;
366     UErrorCode errorCode = U_ZERO_ERROR;
367     RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, errorCode, UBIDI_LTR);
368     ubidi_getRuns(pBiDi, &errorCode);
369     if(U_FAILURE(errorCode)) {
370         return UBIDI_LTR;
371     }
372     RETURN_IF_BAD_RANGE(runIndex, 0, pBiDi->runCount, errorCode, UBIDI_LTR);
373 
374     start=pBiDi->runs[runIndex].logicalStart;
375     if(pLogicalStart!=nullptr) {
376         *pLogicalStart=GET_INDEX(start);
377     }
378     if(pLength!=nullptr) {
379         if(runIndex>0) {
380             *pLength=pBiDi->runs[runIndex].visualLimit-
381                      pBiDi->runs[runIndex-1].visualLimit;
382         } else {
383             *pLength=pBiDi->runs[0].visualLimit;
384         }
385     }
386     return (UBiDiDirection)GET_ODD_BIT(start);
387 }
388 
389 /* in trivial cases there is only one trivial run; called by ubidi_getRuns() */
390 static void
getSingleRun(UBiDi * pBiDi,UBiDiLevel level)391 getSingleRun(UBiDi *pBiDi, UBiDiLevel level) {
392     /* simple, single-run case */
393     pBiDi->runs=pBiDi->simpleRuns;
394     pBiDi->runCount=1;
395 
396     /* fill and reorder the single run */
397     pBiDi->runs[0].logicalStart=MAKE_INDEX_ODD_PAIR(0, level);
398     pBiDi->runs[0].visualLimit=pBiDi->length;
399     pBiDi->runs[0].insertRemove=0;
400 }
401 
402 /* reorder the runs array (L2) ---------------------------------------------- */
403 
404 /*
405  * Reorder the same-level runs in the runs array.
406  * Here, runCount>1 and maxLevel>=minLevel>=paraLevel.
407  * All the visualStart fields=logical start before reordering.
408  * The "odd" bits are not set yet.
409  *
410  * Reordering with this data structure lends itself to some handy shortcuts:
411  *
412  * Since each run is moved but not modified, and since at the initial maxLevel
413  * each sequence of same-level runs consists of only one run each, we
414  * don't need to do anything there and can predecrement maxLevel.
415  * In many simple cases, the reordering is thus done entirely in the
416  * index mapping.
417  * Also, reordering occurs only down to the lowest odd level that occurs,
418  * which is minLevel|1. However, if the lowest level itself is odd, then
419  * in the last reordering the sequence of the runs at this level or higher
420  * will be all runs, and we don't need the elaborate loop to search for them.
421  * This is covered by ++minLevel instead of minLevel|=1 followed
422  * by an extra reorder-all after the reorder-some loop.
423  * About a trailing WS run:
424  * Such a run would need special treatment because its level is not
425  * reflected in levels[] if this is not a paragraph object.
426  * Instead, all characters from trailingWSStart on are implicitly at
427  * paraLevel.
428  * However, for all maxLevel>paraLevel, this run will never be reordered
429  * and does not need to be taken into account. maxLevel==paraLevel is only reordered
430  * if minLevel==paraLevel is odd, which is done in the extra segment.
431  * This means that for the main reordering loop we don't need to consider
432  * this run and can --runCount. If it is later part of the all-runs
433  * reordering, then runCount is adjusted accordingly.
434  */
435 static void
reorderLine(UBiDi * pBiDi,UBiDiLevel minLevel,UBiDiLevel maxLevel)436 reorderLine(UBiDi *pBiDi, UBiDiLevel minLevel, UBiDiLevel maxLevel) {
437     Run *runs, tempRun;
438     UBiDiLevel *levels;
439     int32_t firstRun, endRun, limitRun, runCount;
440 
441     /* nothing to do? */
442     if(maxLevel<=(minLevel|1)) {
443         return;
444     }
445 
446     /*
447      * Reorder only down to the lowest odd level
448      * and reorder at an odd minLevel in a separate, simpler loop.
449      * See comments above for why minLevel is always incremented.
450      */
451     ++minLevel;
452 
453     runs=pBiDi->runs;
454     levels=pBiDi->levels;
455     runCount=pBiDi->runCount;
456 
457     /* do not include the WS run at paraLevel<=old minLevel except in the simple loop */
458     if(pBiDi->trailingWSStart<pBiDi->length) {
459         --runCount;
460     }
461 
462     while(--maxLevel>=minLevel) {
463         firstRun=0;
464 
465         /* loop for all sequences of runs */
466         for(;;) {
467             /* look for a sequence of runs that are all at >=maxLevel */
468             /* look for the first run of such a sequence */
469             while(firstRun<runCount && levels[runs[firstRun].logicalStart]<maxLevel) {
470                 ++firstRun;
471             }
472             if(firstRun>=runCount) {
473                 break;  /* no more such runs */
474             }
475 
476             /* look for the limit run of such a sequence (the run behind it) */
477             for(limitRun=firstRun; ++limitRun<runCount && levels[runs[limitRun].logicalStart]>=maxLevel;) {}
478 
479             /* Swap the entire sequence of runs from firstRun to limitRun-1. */
480             endRun=limitRun-1;
481             while(firstRun<endRun) {
482                 tempRun = runs[firstRun];
483                 runs[firstRun]=runs[endRun];
484                 runs[endRun]=tempRun;
485                 ++firstRun;
486                 --endRun;
487             }
488 
489             if(limitRun==runCount) {
490                 break;  /* no more such runs */
491             } else {
492                 firstRun=limitRun+1;
493             }
494         }
495     }
496 
497     /* now do maxLevel==old minLevel (==odd!), see above */
498     if(!(minLevel&1)) {
499         firstRun=0;
500 
501         /* include the trailing WS run in this complete reordering */
502         if(pBiDi->trailingWSStart==pBiDi->length) {
503             --runCount;
504         }
505 
506         /* Swap the entire sequence of all runs. (endRun==runCount) */
507         while(firstRun<runCount) {
508             tempRun=runs[firstRun];
509             runs[firstRun]=runs[runCount];
510             runs[runCount]=tempRun;
511             ++firstRun;
512             --runCount;
513         }
514     }
515 }
516 
517 /* compute the runs array --------------------------------------------------- */
518 
getRunFromLogicalIndex(UBiDi * pBiDi,int32_t logicalIndex)519 static int32_t getRunFromLogicalIndex(UBiDi *pBiDi, int32_t logicalIndex) {
520     Run *runs=pBiDi->runs;
521     int32_t runCount=pBiDi->runCount, visualStart=0, i, length, logicalStart;
522 
523     for(i=0; i<runCount; i++) {
524         length=runs[i].visualLimit-visualStart;
525         logicalStart=GET_INDEX(runs[i].logicalStart);
526         if((logicalIndex>=logicalStart) && (logicalIndex<(logicalStart+length))) {
527             return i;
528         }
529         visualStart+=length;
530     }
531     /* we should never get here */
532     UPRV_UNREACHABLE_EXIT;
533 }
534 
535 /*
536  * Compute the runs array from the levels array.
537  * After ubidi_getRuns() returns true, runCount is guaranteed to be >0
538  * and the runs are reordered.
539  * Odd-level runs have visualStart on their visual right edge and
540  * they progress visually to the left.
541  * If option UBIDI_OPTION_INSERT_MARKS is set, insertRemove will contain the
542  * sum of appropriate LRM/RLM_BEFORE/AFTER flags.
543  * If option UBIDI_OPTION_REMOVE_CONTROLS is set, insertRemove will contain the
544  * negative number of BiDi control characters within this run.
545  */
546 U_CFUNC UBool
ubidi_getRuns(UBiDi * pBiDi,UErrorCode *)547 ubidi_getRuns(UBiDi *pBiDi, UErrorCode*) {
548     /*
549      * This method returns immediately if the runs are already set. This
550      * includes the case of length==0 (handled in setPara)..
551      */
552     if (pBiDi->runCount>=0) {
553         return true;
554     }
555 
556     if(pBiDi->direction!=UBIDI_MIXED) {
557         /* simple, single-run case - this covers length==0 */
558         /* pBiDi->paraLevel is ok even for contextual multiple paragraphs */
559         getSingleRun(pBiDi, pBiDi->paraLevel);
560     } else /* UBIDI_MIXED, length>0 */ {
561         /* mixed directionality */
562         int32_t length=pBiDi->length, limit;
563         UBiDiLevel *levels=pBiDi->levels;
564         int32_t i, runCount;
565         UBiDiLevel level=UBIDI_DEFAULT_LTR;   /* initialize with no valid level */
566         /*
567          * If there are WS characters at the end of the line
568          * and the run preceding them has a level different from
569          * paraLevel, then they will form their own run at paraLevel (L1).
570          * Count them separately.
571          * We need some special treatment for this in order to not
572          * modify the levels array which a line UBiDi object shares
573          * with its paragraph parent and its other line siblings.
574          * In other words, for the trailing WS, it may be
575          * levels[]!=paraLevel but we have to treat it like it were so.
576          */
577         limit=pBiDi->trailingWSStart;
578         /* count the runs, there is at least one non-WS run, and limit>0 */
579         runCount=0;
580         for(i=0; i<limit; ++i) {
581             /* increment runCount at the start of each run */
582             if(levels[i]!=level) {
583                 ++runCount;
584                 level=levels[i];
585             }
586         }
587 
588         /*
589          * We don't need to see if the last run can be merged with a trailing
590          * WS run because setTrailingWSStart() would have done that.
591          */
592         if(runCount==1 && limit==length) {
593             /* There is only one non-WS run and no trailing WS-run. */
594             getSingleRun(pBiDi, levels[0]);
595         } else /* runCount>1 || limit<length */ {
596             /* allocate and set the runs */
597             Run *runs;
598             int32_t runIndex, start;
599             UBiDiLevel minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1, maxLevel=0;
600 
601             /* now, count a (non-mergeable) WS run */
602             if(limit<length) {
603                 ++runCount;
604             }
605 
606             /* runCount>1 */
607             if(getRunsMemory(pBiDi, runCount)) {
608                 runs=pBiDi->runsMemory;
609             } else {
610                 return false;
611             }
612 
613             /* set the runs */
614             /* FOOD FOR THOUGHT: this could be optimized, e.g.:
615              * 464->444, 484->444, 575->555, 595->555
616              * However, that would take longer. Check also how it would
617              * interact with BiDi control removal and inserting Marks.
618              */
619             runIndex=0;
620 
621             /* search for the run limits and initialize visualLimit values with the run lengths */
622             i=0;
623             do {
624                 /* prepare this run */
625                 start=i;
626                 level=levels[i];
627                 if(level<minLevel) {
628                     minLevel=level;
629                 }
630                 if(level>maxLevel) {
631                     maxLevel=level;
632                 }
633 
634                 /* look for the run limit */
635                 while(++i<limit && levels[i]==level) {}
636 
637                 /* i is another run limit */
638                 runs[runIndex].logicalStart=start;
639                 runs[runIndex].visualLimit=i-start;
640                 runs[runIndex].insertRemove=0;
641                 ++runIndex;
642             } while(i<limit);
643 
644             if(limit<length) {
645                 /* there is a separate WS run */
646                 runs[runIndex].logicalStart=limit;
647                 runs[runIndex].visualLimit=length-limit;
648                 /* For the trailing WS run, pBiDi->paraLevel is ok even
649                    if contextual multiple paragraphs.                   */
650                 if(pBiDi->paraLevel<minLevel) {
651                     minLevel=pBiDi->paraLevel;
652                 }
653             }
654 
655             /* set the object fields */
656             pBiDi->runs=runs;
657             pBiDi->runCount=runCount;
658 
659             reorderLine(pBiDi, minLevel, maxLevel);
660 
661             /* now add the direction flags and adjust the visualLimit's to be just that */
662             /* this loop will also handle the trailing WS run */
663             limit=0;
664             for(i=0; i<runCount; ++i) {
665                 ADD_ODD_BIT_FROM_LEVEL(runs[i].logicalStart, levels[runs[i].logicalStart]);
666                 limit+=runs[i].visualLimit;
667                 runs[i].visualLimit=limit;
668             }
669 
670             /* Set the "odd" bit for the trailing WS run. */
671             /* For a RTL paragraph, it will be the *first* run in visual order. */
672             /* For the trailing WS run, pBiDi->paraLevel is ok even if
673                contextual multiple paragraphs.                          */
674             if(runIndex<runCount) {
675                 int32_t trailingRun = ((pBiDi->paraLevel & 1) != 0)? 0 : runIndex;
676 
677                 ADD_ODD_BIT_FROM_LEVEL(runs[trailingRun].logicalStart, pBiDi->paraLevel);
678             }
679         }
680     }
681 
682     /* handle insert LRM/RLM BEFORE/AFTER run */
683     if(pBiDi->insertPoints.size>0) {
684         Point *point, *start=pBiDi->insertPoints.points,
685                       *limit=start+pBiDi->insertPoints.size;
686         int32_t runIndex;
687         for(point=start; point<limit; point++) {
688             runIndex=getRunFromLogicalIndex(pBiDi, point->pos);
689             pBiDi->runs[runIndex].insertRemove|=point->flag;
690         }
691     }
692 
693     /* handle remove BiDi control characters */
694     if(pBiDi->controlCount>0) {
695         int32_t runIndex;
696         const char16_t *start=pBiDi->text, *limit=start+pBiDi->length, *pu;
697         for(pu=start; pu<limit; pu++) {
698             if(IS_BIDI_CONTROL_CHAR(*pu)) {
699                 runIndex=getRunFromLogicalIndex(pBiDi, (int32_t)(pu-start));
700                 pBiDi->runs[runIndex].insertRemove--;
701             }
702         }
703     }
704 
705     return true;
706 }
707 
708 static UBool
prepareReorder(const UBiDiLevel * levels,int32_t length,int32_t * indexMap,UBiDiLevel * pMinLevel,UBiDiLevel * pMaxLevel)709 prepareReorder(const UBiDiLevel *levels, int32_t length,
710                int32_t *indexMap,
711                UBiDiLevel *pMinLevel, UBiDiLevel *pMaxLevel) {
712     int32_t start;
713     UBiDiLevel level, minLevel, maxLevel;
714 
715     if(levels==nullptr || length<=0) {
716         return false;
717     }
718 
719     /* determine minLevel and maxLevel */
720     minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1;
721     maxLevel=0;
722     for(start=length; start>0;) {
723         level=levels[--start];
724         if(level>UBIDI_MAX_EXPLICIT_LEVEL+1) {
725             return false;
726         }
727         if(level<minLevel) {
728             minLevel=level;
729         }
730         if(level>maxLevel) {
731             maxLevel=level;
732         }
733     }
734     *pMinLevel=minLevel;
735     *pMaxLevel=maxLevel;
736 
737     /* initialize the index map */
738     for(start=length; start>0;) {
739         --start;
740         indexMap[start]=start;
741     }
742 
743     return true;
744 }
745 
746 /* reorder a line based on a levels array (L2) ------------------------------ */
747 
748 U_CAPI void U_EXPORT2
ubidi_reorderLogical(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)749 ubidi_reorderLogical(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
750     int32_t start, limit, sumOfSosEos;
751     UBiDiLevel minLevel = 0, maxLevel = 0;
752 
753     if(indexMap==nullptr || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
754         return;
755     }
756 
757     /* nothing to do? */
758     if(minLevel==maxLevel && (minLevel&1)==0) {
759         return;
760     }
761 
762     /* reorder only down to the lowest odd level */
763     minLevel|=1;
764 
765     /* loop maxLevel..minLevel */
766     do {
767         start=0;
768 
769         /* loop for all sequences of levels to reorder at the current maxLevel */
770         for(;;) {
771             /* look for a sequence of levels that are all at >=maxLevel */
772             /* look for the first index of such a sequence */
773             while(start<length && levels[start]<maxLevel) {
774                 ++start;
775             }
776             if(start>=length) {
777                 break;  /* no more such sequences */
778             }
779 
780             /* look for the limit of such a sequence (the index behind it) */
781             for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
782 
783             /*
784              * sos=start of sequence, eos=end of sequence
785              *
786              * The closed (inclusive) interval from sos to eos includes all the logical
787              * and visual indexes within this sequence. They are logically and
788              * visually contiguous and in the same range.
789              *
790              * For each run, the new visual index=sos+eos-old visual index;
791              * we pre-add sos+eos into sumOfSosEos ->
792              * new visual index=sumOfSosEos-old visual index;
793              */
794             sumOfSosEos=start+limit-1;
795 
796             /* reorder each index in the sequence */
797             do {
798                 indexMap[start]=sumOfSosEos-indexMap[start];
799             } while(++start<limit);
800 
801             /* start==limit */
802             if(limit==length) {
803                 break;  /* no more such sequences */
804             } else {
805                 start=limit+1;
806             }
807         }
808     } while(--maxLevel>=minLevel);
809 }
810 
811 U_CAPI void U_EXPORT2
ubidi_reorderVisual(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)812 ubidi_reorderVisual(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
813     int32_t start, end, limit, temp;
814     UBiDiLevel minLevel = 0, maxLevel = 0;
815 
816     if(indexMap==nullptr || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
817         return;
818     }
819 
820     /* nothing to do? */
821     if(minLevel==maxLevel && (minLevel&1)==0) {
822         return;
823     }
824 
825     /* reorder only down to the lowest odd level */
826     minLevel|=1;
827 
828     /* loop maxLevel..minLevel */
829     do {
830         start=0;
831 
832         /* loop for all sequences of levels to reorder at the current maxLevel */
833         for(;;) {
834             /* look for a sequence of levels that are all at >=maxLevel */
835             /* look for the first index of such a sequence */
836             while(start<length && levels[start]<maxLevel) {
837                 ++start;
838             }
839             if(start>=length) {
840                 break;  /* no more such runs */
841             }
842 
843             /* look for the limit of such a sequence (the index behind it) */
844             for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
845 
846             /*
847              * Swap the entire interval of indexes from start to limit-1.
848              * We don't need to swap the levels for the purpose of this
849              * algorithm: the sequence of levels that we look at does not
850              * move anyway.
851              */
852             end=limit-1;
853             while(start<end) {
854                 temp=indexMap[start];
855                 indexMap[start]=indexMap[end];
856                 indexMap[end]=temp;
857 
858                 ++start;
859                 --end;
860             }
861 
862             if(limit==length) {
863                 break;  /* no more such sequences */
864             } else {
865                 start=limit+1;
866             }
867         }
868     } while(--maxLevel>=minLevel);
869 }
870 
871 /* API functions for logical<->visual mapping ------------------------------- */
872 
873 U_CAPI int32_t U_EXPORT2
ubidi_getVisualIndex(UBiDi * pBiDi,int32_t logicalIndex,UErrorCode * pErrorCode)874 ubidi_getVisualIndex(UBiDi *pBiDi, int32_t logicalIndex, UErrorCode *pErrorCode) {
875     int32_t visualIndex=UBIDI_MAP_NOWHERE;
876     RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
877     RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
878     RETURN_IF_BAD_RANGE(logicalIndex, 0, pBiDi->length, *pErrorCode, -1);
879 
880     /* we can do the trivial cases without the runs array */
881     switch(pBiDi->direction) {
882     case UBIDI_LTR:
883         visualIndex=logicalIndex;
884         break;
885     case UBIDI_RTL:
886         visualIndex=pBiDi->length-logicalIndex-1;
887         break;
888     default:
889         if(!ubidi_getRuns(pBiDi, pErrorCode)) {
890             *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
891             return -1;
892         } else {
893             Run *runs=pBiDi->runs;
894             int32_t i, visualStart=0, offset, length;
895 
896             /* linear search for the run, search on the visual runs */
897             for(i=0; i<pBiDi->runCount; ++i) {
898                 length=runs[i].visualLimit-visualStart;
899                 offset=logicalIndex-GET_INDEX(runs[i].logicalStart);
900                 if(offset>=0 && offset<length) {
901                     if(IS_EVEN_RUN(runs[i].logicalStart)) {
902                         /* LTR */
903                         visualIndex=visualStart+offset;
904                     } else {
905                         /* RTL */
906                         visualIndex=visualStart+length-offset-1;
907                     }
908                     break;          /* exit for loop */
909                 }
910                 visualStart+=length;
911             }
912             if(i>=pBiDi->runCount) {
913                 return UBIDI_MAP_NOWHERE;
914             }
915         }
916     }
917 
918     if(pBiDi->insertPoints.size>0) {
919         /* add the number of added marks until the calculated visual index */
920         Run *runs=pBiDi->runs;
921         int32_t i, length, insertRemove;
922         int32_t visualStart=0, markFound=0;
923         for(i=0; ; i++, visualStart+=length) {
924             length=runs[i].visualLimit-visualStart;
925             insertRemove=runs[i].insertRemove;
926             if(insertRemove & (LRM_BEFORE|RLM_BEFORE)) {
927                 markFound++;
928             }
929             /* is it the run containing the visual index? */
930             if(visualIndex<runs[i].visualLimit) {
931                 return visualIndex+markFound;
932             }
933             if(insertRemove & (LRM_AFTER|RLM_AFTER)) {
934                 markFound++;
935             }
936         }
937     }
938     else if(pBiDi->controlCount>0) {
939         /* subtract the number of controls until the calculated visual index */
940         Run *runs=pBiDi->runs;
941         int32_t i, j, start, limit, length, insertRemove;
942         int32_t visualStart=0, controlFound=0;
943         char16_t uchar=pBiDi->text[logicalIndex];
944         /* is the logical index pointing to a control ? */
945         if(IS_BIDI_CONTROL_CHAR(uchar)) {
946             return UBIDI_MAP_NOWHERE;
947         }
948         /* loop on runs */
949         for(i=0; ; i++, visualStart+=length) {
950             length=runs[i].visualLimit-visualStart;
951             insertRemove=runs[i].insertRemove;
952             /* calculated visual index is beyond this run? */
953             if(visualIndex>=runs[i].visualLimit) {
954                 controlFound-=insertRemove;
955                 continue;
956             }
957             /* calculated visual index must be within current run */
958             if(insertRemove==0) {
959                 return visualIndex-controlFound;
960             }
961             if(IS_EVEN_RUN(runs[i].logicalStart)) {
962                 /* LTR: check from run start to logical index */
963                 start=runs[i].logicalStart;
964                 limit=logicalIndex;
965             } else {
966                 /* RTL: check from logical index to run end */
967                 start=logicalIndex+1;
968                 limit=GET_INDEX(runs[i].logicalStart)+length;
969             }
970             for(j=start; j<limit; j++) {
971                 uchar=pBiDi->text[j];
972                 if(IS_BIDI_CONTROL_CHAR(uchar)) {
973                     controlFound++;
974                 }
975             }
976             return visualIndex-controlFound;
977         }
978     }
979 
980     return visualIndex;
981 }
982 
983 U_CAPI int32_t U_EXPORT2
ubidi_getLogicalIndex(UBiDi * pBiDi,int32_t visualIndex,UErrorCode * pErrorCode)984 ubidi_getLogicalIndex(UBiDi *pBiDi, int32_t visualIndex, UErrorCode *pErrorCode) {
985     Run *runs;
986     int32_t i, runCount, start;
987     RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
988     RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
989     RETURN_IF_BAD_RANGE(visualIndex, 0, pBiDi->resultLength, *pErrorCode, -1);
990     /* we can do the trivial cases without the runs array */
991     if(pBiDi->insertPoints.size==0 && pBiDi->controlCount==0) {
992         if(pBiDi->direction==UBIDI_LTR) {
993             return visualIndex;
994         }
995         else if(pBiDi->direction==UBIDI_RTL) {
996             return pBiDi->length-visualIndex-1;
997         }
998     }
999     if(!ubidi_getRuns(pBiDi, pErrorCode)) {
1000         *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
1001         return -1;
1002     }
1003 
1004     runs=pBiDi->runs;
1005     runCount=pBiDi->runCount;
1006     if(pBiDi->insertPoints.size>0) {
1007         /* handle inserted LRM/RLM */
1008         int32_t markFound=0, insertRemove;
1009         int32_t visualStart=0, length;
1010         runs=pBiDi->runs;
1011         /* subtract number of marks until visual index */
1012         for(i=0; ; i++, visualStart+=length) {
1013             length=runs[i].visualLimit-visualStart;
1014             insertRemove=runs[i].insertRemove;
1015             if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1016                 if(visualIndex<=(visualStart+markFound)) {
1017                     return UBIDI_MAP_NOWHERE;
1018                 }
1019                 markFound++;
1020             }
1021             /* is adjusted visual index within this run? */
1022             if(visualIndex<(runs[i].visualLimit+markFound)) {
1023                 visualIndex-=markFound;
1024                 break;
1025             }
1026             if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1027                 if(visualIndex==(visualStart+length+markFound)) {
1028                     return UBIDI_MAP_NOWHERE;
1029                 }
1030                 markFound++;
1031             }
1032         }
1033     }
1034     else if(pBiDi->controlCount>0) {
1035         /* handle removed BiDi control characters */
1036         int32_t controlFound=0, insertRemove, length;
1037         int32_t logicalStart, logicalEnd, visualStart=0, j, k;
1038         char16_t uchar;
1039         UBool evenRun;
1040         /* add number of controls until visual index */
1041         for(i=0; ; i++, visualStart+=length) {
1042             length=runs[i].visualLimit-visualStart;
1043             insertRemove=runs[i].insertRemove;
1044             /* is adjusted visual index beyond current run? */
1045             if(visualIndex>=(runs[i].visualLimit-controlFound+insertRemove)) {
1046                 controlFound-=insertRemove;
1047                 continue;
1048             }
1049             /* adjusted visual index is within current run */
1050             if(insertRemove==0) {
1051                 visualIndex+=controlFound;
1052                 break;
1053             }
1054             /* count non-control chars until visualIndex */
1055             logicalStart=runs[i].logicalStart;
1056             evenRun=IS_EVEN_RUN(logicalStart);
1057             REMOVE_ODD_BIT(logicalStart);
1058             logicalEnd=logicalStart+length-1;
1059             for(j=0; j<length; j++) {
1060                 k= evenRun ? logicalStart+j : logicalEnd-j;
1061                 uchar=pBiDi->text[k];
1062                 if(IS_BIDI_CONTROL_CHAR(uchar)) {
1063                     controlFound++;
1064                 }
1065                 if((visualIndex+controlFound)==(visualStart+j)) {
1066                     break;
1067                 }
1068             }
1069             visualIndex+=controlFound;
1070             break;
1071         }
1072     }
1073     /* handle all cases */
1074     if(runCount<=10) {
1075         /* linear search for the run */
1076         for(i=0; visualIndex>=runs[i].visualLimit; ++i) {}
1077     } else {
1078         /* binary search for the run */
1079         int32_t begin=0, limit=runCount;
1080 
1081         /* the middle if() is guaranteed to find the run, we don't need a loop limit */
1082         for(;;) {
1083             i=(begin+limit)/2;
1084             if(visualIndex>=runs[i].visualLimit) {
1085                 begin=i+1;
1086             } else if(i==0 || visualIndex>=runs[i-1].visualLimit) {
1087                 break;
1088             } else {
1089                 limit=i;
1090             }
1091         }
1092     }
1093 
1094     start=runs[i].logicalStart;
1095     if(IS_EVEN_RUN(start)) {
1096         /* LTR */
1097         /* the offset in runs[i] is visualIndex-runs[i-1].visualLimit */
1098         if(i>0) {
1099             visualIndex-=runs[i-1].visualLimit;
1100         }
1101         return start+visualIndex;
1102     } else {
1103         /* RTL */
1104         return GET_INDEX(start)+runs[i].visualLimit-visualIndex-1;
1105     }
1106 }
1107 
1108 U_CAPI void U_EXPORT2
ubidi_getLogicalMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1109 ubidi_getLogicalMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1110     RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1111     /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1112     ubidi_countRuns(pBiDi, pErrorCode);
1113     if(U_FAILURE(*pErrorCode)) {
1114         /* no op */
1115     } else if(indexMap==nullptr) {
1116         *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1117     } else {
1118         /* fill a logical-to-visual index map using the runs[] */
1119         int32_t visualStart, visualLimit, i, j, k;
1120         int32_t logicalStart, logicalLimit;
1121         Run *runs=pBiDi->runs;
1122         if (pBiDi->length<=0) {
1123             return;
1124         }
1125         if (pBiDi->length>pBiDi->resultLength) {
1126             uprv_memset(indexMap, 0xFF, pBiDi->length*sizeof(int32_t));
1127         }
1128 
1129         visualStart=0;
1130         for(j=0; j<pBiDi->runCount; ++j) {
1131             logicalStart=GET_INDEX(runs[j].logicalStart);
1132             visualLimit=runs[j].visualLimit;
1133             if(IS_EVEN_RUN(runs[j].logicalStart)) {
1134                 do { /* LTR */
1135                     indexMap[logicalStart++]=visualStart++;
1136                 } while(visualStart<visualLimit);
1137             } else {
1138                 logicalStart+=visualLimit-visualStart;  /* logicalLimit */
1139                 do { /* RTL */
1140                     indexMap[--logicalStart]=visualStart++;
1141                 } while(visualStart<visualLimit);
1142             }
1143             /* visualStart==visualLimit; */
1144         }
1145 
1146         if(pBiDi->insertPoints.size>0) {
1147             int32_t markFound=0, runCount=pBiDi->runCount;
1148             int32_t length, insertRemove;
1149             visualStart=0;
1150             /* add number of marks found until each index */
1151             for(i=0; i<runCount; i++, visualStart+=length) {
1152                 length=runs[i].visualLimit-visualStart;
1153                 insertRemove=runs[i].insertRemove;
1154                 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1155                     markFound++;
1156                 }
1157                 if(markFound>0) {
1158                     logicalStart=GET_INDEX(runs[i].logicalStart);
1159                     logicalLimit=logicalStart+length;
1160                     for(j=logicalStart; j<logicalLimit; j++) {
1161                         indexMap[j]+=markFound;
1162                     }
1163                 }
1164                 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1165                     markFound++;
1166                 }
1167             }
1168         }
1169         else if(pBiDi->controlCount>0) {
1170             int32_t controlFound=0, runCount=pBiDi->runCount;
1171             int32_t length, insertRemove;
1172             UBool evenRun;
1173             char16_t uchar;
1174             visualStart=0;
1175             /* subtract number of controls found until each index */
1176             for(i=0; i<runCount; i++, visualStart+=length) {
1177                 length=runs[i].visualLimit-visualStart;
1178                 insertRemove=runs[i].insertRemove;
1179                 /* no control found within previous runs nor within this run */
1180                 if((controlFound-insertRemove)==0) {
1181                     continue;
1182                 }
1183                 logicalStart=runs[i].logicalStart;
1184                 evenRun=IS_EVEN_RUN(logicalStart);
1185                 REMOVE_ODD_BIT(logicalStart);
1186                 logicalLimit=logicalStart+length;
1187                 /* if no control within this run */
1188                 if(insertRemove==0) {
1189                     for(j=logicalStart; j<logicalLimit; j++) {
1190                         indexMap[j]-=controlFound;
1191                     }
1192                     continue;
1193                 }
1194                 for(j=0; j<length; j++) {
1195                     k= evenRun ? logicalStart+j : logicalLimit-j-1;
1196                     uchar=pBiDi->text[k];
1197                     if(IS_BIDI_CONTROL_CHAR(uchar)) {
1198                         controlFound++;
1199                         indexMap[k]=UBIDI_MAP_NOWHERE;
1200                         continue;
1201                     }
1202                     indexMap[k]-=controlFound;
1203                 }
1204             }
1205         }
1206     }
1207 }
1208 
1209 U_CAPI void U_EXPORT2
ubidi_getVisualMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1210 ubidi_getVisualMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1211     RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1212     if(indexMap==nullptr) {
1213         *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1214         return;
1215     }
1216     /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1217     ubidi_countRuns(pBiDi, pErrorCode);
1218     if(U_SUCCESS(*pErrorCode)) {
1219         /* fill a visual-to-logical index map using the runs[] */
1220         Run *runs=pBiDi->runs, *runsLimit=runs+pBiDi->runCount;
1221         int32_t logicalStart, visualStart, visualLimit, *pi=indexMap;
1222 
1223         if (pBiDi->resultLength<=0) {
1224             return;
1225         }
1226         visualStart=0;
1227         for(; runs<runsLimit; ++runs) {
1228             logicalStart=runs->logicalStart;
1229             visualLimit=runs->visualLimit;
1230             if(IS_EVEN_RUN(logicalStart)) {
1231                 do { /* LTR */
1232                     *pi++ = logicalStart++;
1233                 } while(++visualStart<visualLimit);
1234             } else {
1235                 REMOVE_ODD_BIT(logicalStart);
1236                 logicalStart+=visualLimit-visualStart;  /* logicalLimit */
1237                 do { /* RTL */
1238                     *pi++ = --logicalStart;
1239                 } while(++visualStart<visualLimit);
1240             }
1241             /* visualStart==visualLimit; */
1242         }
1243 
1244         if(pBiDi->insertPoints.size>0) {
1245             int32_t markFound=0, runCount=pBiDi->runCount;
1246             int32_t insertRemove, i, j, k;
1247             runs=pBiDi->runs;
1248             /* count all inserted marks */
1249             for(i=0; i<runCount; i++) {
1250                 insertRemove=runs[i].insertRemove;
1251                 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1252                     markFound++;
1253                 }
1254                 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1255                     markFound++;
1256                 }
1257             }
1258             /* move back indexes by number of preceding marks */
1259             k=pBiDi->resultLength;
1260             for(i=runCount-1; i>=0 && markFound>0; i--) {
1261                 insertRemove=runs[i].insertRemove;
1262                 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1263                     indexMap[--k]= UBIDI_MAP_NOWHERE;
1264                     markFound--;
1265                 }
1266                 visualStart= i>0 ? runs[i-1].visualLimit : 0;
1267                 for(j=runs[i].visualLimit-1; j>=visualStart && markFound>0; j--) {
1268                     indexMap[--k]=indexMap[j];
1269                 }
1270                 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1271                     indexMap[--k]= UBIDI_MAP_NOWHERE;
1272                     markFound--;
1273                 }
1274             }
1275         }
1276         else if(pBiDi->controlCount>0) {
1277             int32_t runCount=pBiDi->runCount, logicalEnd;
1278             int32_t insertRemove, length, i, j, k, m;
1279             char16_t uchar;
1280             UBool evenRun;
1281             runs=pBiDi->runs;
1282             visualStart=0;
1283             /* move forward indexes by number of preceding controls */
1284             k=0;
1285             for(i=0; i<runCount; i++, visualStart+=length) {
1286                 length=runs[i].visualLimit-visualStart;
1287                 insertRemove=runs[i].insertRemove;
1288                 /* if no control found yet, nothing to do in this run */
1289                 if((insertRemove==0)&&(k==visualStart)) {
1290                     k+=length;
1291                     continue;
1292                 }
1293                 /* if no control in this run */
1294                 if(insertRemove==0) {
1295                     visualLimit=runs[i].visualLimit;
1296                     for(j=visualStart; j<visualLimit; j++) {
1297                         indexMap[k++]=indexMap[j];
1298                     }
1299                     continue;
1300                 }
1301                 logicalStart=runs[i].logicalStart;
1302                 evenRun=IS_EVEN_RUN(logicalStart);
1303                 REMOVE_ODD_BIT(logicalStart);
1304                 logicalEnd=logicalStart+length-1;
1305                 for(j=0; j<length; j++) {
1306                     m= evenRun ? logicalStart+j : logicalEnd-j;
1307                     uchar=pBiDi->text[m];
1308                     if(!IS_BIDI_CONTROL_CHAR(uchar)) {
1309                         indexMap[k++]=m;
1310                     }
1311                 }
1312             }
1313         }
1314     }
1315 }
1316 
1317 U_CAPI void U_EXPORT2
ubidi_invertMap(const int32_t * srcMap,int32_t * destMap,int32_t length)1318 ubidi_invertMap(const int32_t *srcMap, int32_t *destMap, int32_t length) {
1319     if(srcMap!=nullptr && destMap!=nullptr && length>0) {
1320         const int32_t *pi;
1321         int32_t destLength=-1, count=0;
1322         /* find highest value and count positive indexes in srcMap */
1323         pi=srcMap+length;
1324         while(pi>srcMap) {
1325             if(*--pi>destLength) {
1326                 destLength=*pi;
1327             }
1328             if(*pi>=0) {
1329                 count++;
1330             }
1331         }
1332         destLength++;           /* add 1 for origin 0 */
1333         if(count<destLength) {
1334             /* we must fill unmatched destMap entries with -1 */
1335             uprv_memset(destMap, 0xFF, destLength*sizeof(int32_t));
1336         }
1337         pi=srcMap+length;
1338         while(length>0) {
1339             if(*--pi>=0) {
1340                 destMap[*pi]=--length;
1341             } else {
1342                 --length;
1343             }
1344         }
1345     }
1346 }
1347