1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ******************************************************************************
5 *
6 * Copyright (C) 1999-2015, International Business Machines
7 * Corporation and others. All Rights Reserved.
8 *
9 ******************************************************************************
10 * file name: ubidiln.c
11 * encoding: UTF-8
12 * tab size: 8 (not used)
13 * indentation:4
14 *
15 * created on: 1999aug06
16 * created by: Markus W. Scherer, updated by Matitiahu Allouche
17 */
18
19 #include "cmemory.h"
20 #include "unicode/utypes.h"
21 #include "unicode/ustring.h"
22 #include "unicode/uchar.h"
23 #include "unicode/ubidi.h"
24 #include "ubidiimp.h"
25 #include "uassert.h"
26
27 /*
28 * General remarks about the functions in this file:
29 *
30 * These functions deal with the aspects of potentially mixed-directional
31 * text in a single paragraph or in a line of a single paragraph
32 * which has already been processed according to
33 * the Unicode 6.3 BiDi algorithm as defined in
34 * https://www.unicode.org/reports/tr9/ , version 28,
35 * also described in The Unicode Standard, Version 6.3.0 .
36 *
37 * This means that there is a UBiDi object with a levels
38 * and a dirProps array.
39 * paraLevel and direction are also set.
40 * Only if the length of the text is zero, then levels==dirProps==nullptr.
41 *
42 * The overall directionality of the paragraph
43 * or line is used to bypass the reordering steps if possible.
44 * Even purely RTL text does not need reordering there because
45 * the ubidi_getLogical/VisualIndex() functions can compute the
46 * index on the fly in such a case.
47 *
48 * The implementation of the access to same-level-runs and of the reordering
49 * do attempt to provide better performance and less memory usage compared to
50 * a direct implementation of especially rule (L2) with an array of
51 * one (32-bit) integer per text character.
52 *
53 * Here, the levels array is scanned as soon as necessary, and a vector of
54 * same-level-runs is created. Reordering then is done on this vector.
55 * For each run of text positions that were resolved to the same level,
56 * only 8 bytes are stored: the first text position of the run and the visual
57 * position behind the run after reordering.
58 * One sign bit is used to hold the directionality of the run.
59 * This is inefficient if there are many very short runs. If the average run
60 * length is <2, then this uses more memory.
61 *
62 * In a further attempt to save memory, the levels array is never changed
63 * after all the resolution rules (Xn, Wn, Nn, In).
64 * Many functions have to consider the field trailingWSStart:
65 * if it is less than length, then there is an implicit trailing run
66 * at the paraLevel,
67 * which is not reflected in the levels array.
68 * This allows a line UBiDi object to use the same levels array as
69 * its paragraph parent object.
70 *
71 * When a UBiDi object is created for a line of a paragraph, then the
72 * paragraph's levels and dirProps arrays are reused by way of setting
73 * a pointer into them, not by copying. This again saves memory and forbids to
74 * change the now shared levels for (L1).
75 */
76
77 /* handle trailing WS (L1) -------------------------------------------------- */
78
79 /*
80 * setTrailingWSStart() sets the start index for a trailing
81 * run of WS in the line. This is necessary because we do not modify
82 * the paragraph's levels array that we just point into.
83 * Using trailingWSStart is another form of performing (L1).
84 *
85 * To make subsequent operations easier, we also include the run
86 * before the WS if it is at the paraLevel - we merge the two here.
87 *
88 * This function is called only from ubidi_setLine(), so pBiDi->paraLevel is
89 * set correctly for the line even when contextual multiple paragraphs.
90 */
91 static void
setTrailingWSStart(UBiDi * pBiDi)92 setTrailingWSStart(UBiDi *pBiDi) {
93 /* pBiDi->direction!=UBIDI_MIXED */
94
95 const DirProp *dirProps=pBiDi->dirProps;
96 UBiDiLevel *levels=pBiDi->levels;
97 int32_t start=pBiDi->length;
98 UBiDiLevel paraLevel=pBiDi->paraLevel;
99
100 /* If the line is terminated by a block separator, all preceding WS etc...
101 are already set to paragraph level.
102 Setting trailingWSStart to pBidi->length will avoid changing the
103 level of B chars from 0 to paraLevel in ubidi_getLevels when
104 orderParagraphsLTR==true.
105 */
106 if(dirProps[start-1]==B) {
107 pBiDi->trailingWSStart=start; /* currently == pBiDi->length */
108 return;
109 }
110 /* go backwards across all WS, BN, explicit codes */
111 while(start>0 && DIRPROP_FLAG(dirProps[start-1])&MASK_WS) {
112 --start;
113 }
114
115 /* if the WS run can be merged with the previous run then do so here */
116 while(start>0 && levels[start-1]==paraLevel) {
117 --start;
118 }
119
120 pBiDi->trailingWSStart=start;
121 }
122
123 /* ubidi_setLine ------------------------------------------------------------ */
124
125 U_CAPI void U_EXPORT2
ubidi_setLine(const UBiDi * pParaBiDi,int32_t start,int32_t limit,UBiDi * pLineBiDi,UErrorCode * pErrorCode)126 ubidi_setLine(const UBiDi *pParaBiDi,
127 int32_t start, int32_t limit,
128 UBiDi *pLineBiDi,
129 UErrorCode *pErrorCode) {
130 int32_t length;
131
132 /* check the argument values */
133 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
134 RETURN_VOID_IF_NOT_VALID_PARA(pParaBiDi, *pErrorCode);
135 RETURN_VOID_IF_BAD_RANGE(start, 0, limit, *pErrorCode);
136 RETURN_VOID_IF_BAD_RANGE(limit, 0, pParaBiDi->length+1, *pErrorCode);
137 if(pLineBiDi==nullptr) {
138 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
139 return;
140 }
141 if(ubidi_getParagraph(pParaBiDi, start, nullptr, nullptr, nullptr, pErrorCode) !=
142 ubidi_getParagraph(pParaBiDi, limit-1, nullptr, nullptr, nullptr, pErrorCode)) {
143 /* the line crosses a paragraph boundary */
144 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
145 return;
146 }
147
148 /* set the values in pLineBiDi from its pParaBiDi parent */
149 pLineBiDi->pParaBiDi=nullptr; /* mark unfinished setLine */
150 pLineBiDi->text=pParaBiDi->text+start;
151 length=pLineBiDi->length=limit-start;
152 pLineBiDi->resultLength=pLineBiDi->originalLength=length;
153 pLineBiDi->paraLevel=GET_PARALEVEL(pParaBiDi, start);
154 pLineBiDi->paraCount=pParaBiDi->paraCount;
155 pLineBiDi->runs=nullptr;
156 pLineBiDi->flags=0;
157 pLineBiDi->reorderingMode=pParaBiDi->reorderingMode;
158 pLineBiDi->reorderingOptions=pParaBiDi->reorderingOptions;
159 pLineBiDi->controlCount=0;
160 if(pParaBiDi->controlCount>0) {
161 int32_t j;
162 for(j=start; j<limit; j++) {
163 if(IS_BIDI_CONTROL_CHAR(pParaBiDi->text[j])) {
164 pLineBiDi->controlCount++;
165 }
166 }
167 pLineBiDi->resultLength-=pLineBiDi->controlCount;
168 }
169
170 pLineBiDi->dirProps=pParaBiDi->dirProps+start;
171 pLineBiDi->levels=pParaBiDi->levels+start;
172 pLineBiDi->runCount=-1;
173
174 if(pParaBiDi->direction!=UBIDI_MIXED) {
175 /* the parent is already trivial */
176 pLineBiDi->direction=pParaBiDi->direction;
177
178 /*
179 * The parent's levels are all either
180 * implicitly or explicitly ==paraLevel;
181 * do the same here.
182 */
183 if(pParaBiDi->trailingWSStart<=start) {
184 pLineBiDi->trailingWSStart=0;
185 } else if(pParaBiDi->trailingWSStart<limit) {
186 pLineBiDi->trailingWSStart=pParaBiDi->trailingWSStart-start;
187 } else {
188 pLineBiDi->trailingWSStart=length;
189 }
190 } else {
191 const UBiDiLevel *levels=pLineBiDi->levels;
192 int32_t i, trailingWSStart;
193 UBiDiLevel level;
194
195 setTrailingWSStart(pLineBiDi);
196 trailingWSStart=pLineBiDi->trailingWSStart;
197
198 /* recalculate pLineBiDi->direction */
199 if(trailingWSStart==0) {
200 /* all levels are at paraLevel */
201 pLineBiDi->direction=(UBiDiDirection)(pLineBiDi->paraLevel&1);
202 } else {
203 /* get the level of the first character */
204 level=(UBiDiLevel)(levels[0]&1);
205
206 /* if there is anything of a different level, then the line is mixed */
207 if(trailingWSStart<length && (pLineBiDi->paraLevel&1)!=level) {
208 /* the trailing WS is at paraLevel, which differs from levels[0] */
209 pLineBiDi->direction=UBIDI_MIXED;
210 } else {
211 /* see if levels[1..trailingWSStart-1] have the same direction as levels[0] and paraLevel */
212 i=1;
213 for(;;) {
214 if(i==trailingWSStart) {
215 /* the direction values match those in level */
216 pLineBiDi->direction=(UBiDiDirection)level;
217 break;
218 } else if((levels[i]&1)!=level) {
219 pLineBiDi->direction=UBIDI_MIXED;
220 break;
221 }
222 ++i;
223 }
224 }
225 }
226
227 switch(pLineBiDi->direction) {
228 case UBIDI_LTR:
229 /* make sure paraLevel is even */
230 pLineBiDi->paraLevel=(UBiDiLevel)((pLineBiDi->paraLevel+1)&~1);
231
232 /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
233 pLineBiDi->trailingWSStart=0;
234 break;
235 case UBIDI_RTL:
236 /* make sure paraLevel is odd */
237 pLineBiDi->paraLevel|=1;
238
239 /* all levels are implicitly at paraLevel (important for ubidi_getLevels()) */
240 pLineBiDi->trailingWSStart=0;
241 break;
242 default:
243 break;
244 }
245 }
246 pLineBiDi->pParaBiDi=pParaBiDi; /* mark successful setLine */
247 }
248
249 U_CAPI UBiDiLevel U_EXPORT2
ubidi_getLevelAt(const UBiDi * pBiDi,int32_t charIndex)250 ubidi_getLevelAt(const UBiDi *pBiDi, int32_t charIndex) {
251 /* return paraLevel if in the trailing WS run, otherwise the real level */
252 if(!IS_VALID_PARA_OR_LINE(pBiDi) || charIndex<0 || pBiDi->length<=charIndex) {
253 return 0;
254 } else if(pBiDi->direction!=UBIDI_MIXED || charIndex>=pBiDi->trailingWSStart) {
255 return GET_PARALEVEL(pBiDi, charIndex);
256 } else {
257 return pBiDi->levels[charIndex];
258 }
259 }
260
261 U_CAPI const UBiDiLevel * U_EXPORT2
ubidi_getLevels(UBiDi * pBiDi,UErrorCode * pErrorCode)262 ubidi_getLevels(UBiDi *pBiDi, UErrorCode *pErrorCode) {
263 int32_t start, length;
264
265 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, nullptr);
266 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, nullptr);
267 if((length=pBiDi->length)<=0) {
268 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
269 return nullptr;
270 }
271 if((start=pBiDi->trailingWSStart)==length) {
272 /* the current levels array reflects the WS run */
273 return pBiDi->levels;
274 }
275
276 /*
277 * After the previous if(), we know that the levels array
278 * has an implicit trailing WS run and therefore does not fully
279 * reflect itself all the levels.
280 * This must be a UBiDi object for a line, and
281 * we need to create a new levels array.
282 */
283 if(getLevelsMemory(pBiDi, length)) {
284 UBiDiLevel *levels=pBiDi->levelsMemory;
285
286 if(start>0 && levels!=pBiDi->levels) {
287 uprv_memcpy(levels, pBiDi->levels, start);
288 }
289 /* pBiDi->paraLevel is ok even if contextual multiple paragraphs,
290 since pBidi is a line object */
291 uprv_memset(levels+start, pBiDi->paraLevel, length-start);
292
293 /* this new levels array is set for the line and reflects the WS run */
294 pBiDi->trailingWSStart=length;
295 return pBiDi->levels=levels;
296 } else {
297 /* out of memory */
298 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
299 return nullptr;
300 }
301 }
302
303 U_CAPI void U_EXPORT2
ubidi_getLogicalRun(const UBiDi * pBiDi,int32_t logicalPosition,int32_t * pLogicalLimit,UBiDiLevel * pLevel)304 ubidi_getLogicalRun(const UBiDi *pBiDi, int32_t logicalPosition,
305 int32_t *pLogicalLimit, UBiDiLevel *pLevel) {
306 UErrorCode errorCode;
307 int32_t runCount, visualStart, logicalLimit, logicalFirst, i;
308 Run iRun;
309
310 errorCode=U_ZERO_ERROR;
311 RETURN_VOID_IF_BAD_RANGE(logicalPosition, 0, pBiDi->length, errorCode);
312 /* ubidi_countRuns will check VALID_PARA_OR_LINE */
313 runCount=ubidi_countRuns((UBiDi *)pBiDi, &errorCode);
314 if(U_FAILURE(errorCode)) {
315 return;
316 }
317 /* this is done based on runs rather than on levels since levels have
318 a special interpretation when UBIDI_REORDER_RUNS_ONLY
319 */
320 visualStart=logicalLimit=0;
321 iRun=pBiDi->runs[0];
322
323 for(i=0; i<runCount; i++) {
324 iRun = pBiDi->runs[i];
325 logicalFirst=GET_INDEX(iRun.logicalStart);
326 logicalLimit=logicalFirst+iRun.visualLimit-visualStart;
327 if((logicalPosition>=logicalFirst) &&
328 (logicalPosition<logicalLimit)) {
329 break;
330 }
331 visualStart = iRun.visualLimit;
332 }
333 if(pLogicalLimit) {
334 *pLogicalLimit=logicalLimit;
335 }
336 if(pLevel) {
337 if(pBiDi->reorderingMode==UBIDI_REORDER_RUNS_ONLY) {
338 *pLevel=(UBiDiLevel)GET_ODD_BIT(iRun.logicalStart);
339 }
340 else if(pBiDi->direction!=UBIDI_MIXED || logicalPosition>=pBiDi->trailingWSStart) {
341 *pLevel=GET_PARALEVEL(pBiDi, logicalPosition);
342 } else {
343 *pLevel=pBiDi->levels[logicalPosition];
344 }
345 }
346 }
347
348 /* runs API functions ------------------------------------------------------- */
349
350 U_CAPI int32_t U_EXPORT2
ubidi_countRuns(UBiDi * pBiDi,UErrorCode * pErrorCode)351 ubidi_countRuns(UBiDi *pBiDi, UErrorCode *pErrorCode) {
352 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
353 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
354 ubidi_getRuns(pBiDi, pErrorCode);
355 if(U_FAILURE(*pErrorCode)) {
356 return -1;
357 }
358 return pBiDi->runCount;
359 }
360
361 U_CAPI UBiDiDirection U_EXPORT2
ubidi_getVisualRun(UBiDi * pBiDi,int32_t runIndex,int32_t * pLogicalStart,int32_t * pLength)362 ubidi_getVisualRun(UBiDi *pBiDi, int32_t runIndex,
363 int32_t *pLogicalStart, int32_t *pLength)
364 {
365 int32_t start;
366 UErrorCode errorCode = U_ZERO_ERROR;
367 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, errorCode, UBIDI_LTR);
368 ubidi_getRuns(pBiDi, &errorCode);
369 if(U_FAILURE(errorCode)) {
370 return UBIDI_LTR;
371 }
372 RETURN_IF_BAD_RANGE(runIndex, 0, pBiDi->runCount, errorCode, UBIDI_LTR);
373
374 start=pBiDi->runs[runIndex].logicalStart;
375 if(pLogicalStart!=nullptr) {
376 *pLogicalStart=GET_INDEX(start);
377 }
378 if(pLength!=nullptr) {
379 if(runIndex>0) {
380 *pLength=pBiDi->runs[runIndex].visualLimit-
381 pBiDi->runs[runIndex-1].visualLimit;
382 } else {
383 *pLength=pBiDi->runs[0].visualLimit;
384 }
385 }
386 return (UBiDiDirection)GET_ODD_BIT(start);
387 }
388
389 /* in trivial cases there is only one trivial run; called by ubidi_getRuns() */
390 static void
getSingleRun(UBiDi * pBiDi,UBiDiLevel level)391 getSingleRun(UBiDi *pBiDi, UBiDiLevel level) {
392 /* simple, single-run case */
393 pBiDi->runs=pBiDi->simpleRuns;
394 pBiDi->runCount=1;
395
396 /* fill and reorder the single run */
397 pBiDi->runs[0].logicalStart=MAKE_INDEX_ODD_PAIR(0, level);
398 pBiDi->runs[0].visualLimit=pBiDi->length;
399 pBiDi->runs[0].insertRemove=0;
400 }
401
402 /* reorder the runs array (L2) ---------------------------------------------- */
403
404 /*
405 * Reorder the same-level runs in the runs array.
406 * Here, runCount>1 and maxLevel>=minLevel>=paraLevel.
407 * All the visualStart fields=logical start before reordering.
408 * The "odd" bits are not set yet.
409 *
410 * Reordering with this data structure lends itself to some handy shortcuts:
411 *
412 * Since each run is moved but not modified, and since at the initial maxLevel
413 * each sequence of same-level runs consists of only one run each, we
414 * don't need to do anything there and can predecrement maxLevel.
415 * In many simple cases, the reordering is thus done entirely in the
416 * index mapping.
417 * Also, reordering occurs only down to the lowest odd level that occurs,
418 * which is minLevel|1. However, if the lowest level itself is odd, then
419 * in the last reordering the sequence of the runs at this level or higher
420 * will be all runs, and we don't need the elaborate loop to search for them.
421 * This is covered by ++minLevel instead of minLevel|=1 followed
422 * by an extra reorder-all after the reorder-some loop.
423 * About a trailing WS run:
424 * Such a run would need special treatment because its level is not
425 * reflected in levels[] if this is not a paragraph object.
426 * Instead, all characters from trailingWSStart on are implicitly at
427 * paraLevel.
428 * However, for all maxLevel>paraLevel, this run will never be reordered
429 * and does not need to be taken into account. maxLevel==paraLevel is only reordered
430 * if minLevel==paraLevel is odd, which is done in the extra segment.
431 * This means that for the main reordering loop we don't need to consider
432 * this run and can --runCount. If it is later part of the all-runs
433 * reordering, then runCount is adjusted accordingly.
434 */
435 static void
reorderLine(UBiDi * pBiDi,UBiDiLevel minLevel,UBiDiLevel maxLevel)436 reorderLine(UBiDi *pBiDi, UBiDiLevel minLevel, UBiDiLevel maxLevel) {
437 Run *runs, tempRun;
438 UBiDiLevel *levels;
439 int32_t firstRun, endRun, limitRun, runCount;
440
441 /* nothing to do? */
442 if(maxLevel<=(minLevel|1)) {
443 return;
444 }
445
446 /*
447 * Reorder only down to the lowest odd level
448 * and reorder at an odd minLevel in a separate, simpler loop.
449 * See comments above for why minLevel is always incremented.
450 */
451 ++minLevel;
452
453 runs=pBiDi->runs;
454 levels=pBiDi->levels;
455 runCount=pBiDi->runCount;
456
457 /* do not include the WS run at paraLevel<=old minLevel except in the simple loop */
458 if(pBiDi->trailingWSStart<pBiDi->length) {
459 --runCount;
460 }
461
462 while(--maxLevel>=minLevel) {
463 firstRun=0;
464
465 /* loop for all sequences of runs */
466 for(;;) {
467 /* look for a sequence of runs that are all at >=maxLevel */
468 /* look for the first run of such a sequence */
469 while(firstRun<runCount && levels[runs[firstRun].logicalStart]<maxLevel) {
470 ++firstRun;
471 }
472 if(firstRun>=runCount) {
473 break; /* no more such runs */
474 }
475
476 /* look for the limit run of such a sequence (the run behind it) */
477 for(limitRun=firstRun; ++limitRun<runCount && levels[runs[limitRun].logicalStart]>=maxLevel;) {}
478
479 /* Swap the entire sequence of runs from firstRun to limitRun-1. */
480 endRun=limitRun-1;
481 while(firstRun<endRun) {
482 tempRun = runs[firstRun];
483 runs[firstRun]=runs[endRun];
484 runs[endRun]=tempRun;
485 ++firstRun;
486 --endRun;
487 }
488
489 if(limitRun==runCount) {
490 break; /* no more such runs */
491 } else {
492 firstRun=limitRun+1;
493 }
494 }
495 }
496
497 /* now do maxLevel==old minLevel (==odd!), see above */
498 if(!(minLevel&1)) {
499 firstRun=0;
500
501 /* include the trailing WS run in this complete reordering */
502 if(pBiDi->trailingWSStart==pBiDi->length) {
503 --runCount;
504 }
505
506 /* Swap the entire sequence of all runs. (endRun==runCount) */
507 while(firstRun<runCount) {
508 tempRun=runs[firstRun];
509 runs[firstRun]=runs[runCount];
510 runs[runCount]=tempRun;
511 ++firstRun;
512 --runCount;
513 }
514 }
515 }
516
517 /* compute the runs array --------------------------------------------------- */
518
getRunFromLogicalIndex(UBiDi * pBiDi,int32_t logicalIndex)519 static int32_t getRunFromLogicalIndex(UBiDi *pBiDi, int32_t logicalIndex) {
520 Run *runs=pBiDi->runs;
521 int32_t runCount=pBiDi->runCount, visualStart=0, i, length, logicalStart;
522
523 for(i=0; i<runCount; i++) {
524 length=runs[i].visualLimit-visualStart;
525 logicalStart=GET_INDEX(runs[i].logicalStart);
526 if((logicalIndex>=logicalStart) && (logicalIndex<(logicalStart+length))) {
527 return i;
528 }
529 visualStart+=length;
530 }
531 /* we should never get here */
532 UPRV_UNREACHABLE_EXIT;
533 }
534
535 /*
536 * Compute the runs array from the levels array.
537 * After ubidi_getRuns() returns true, runCount is guaranteed to be >0
538 * and the runs are reordered.
539 * Odd-level runs have visualStart on their visual right edge and
540 * they progress visually to the left.
541 * If option UBIDI_OPTION_INSERT_MARKS is set, insertRemove will contain the
542 * sum of appropriate LRM/RLM_BEFORE/AFTER flags.
543 * If option UBIDI_OPTION_REMOVE_CONTROLS is set, insertRemove will contain the
544 * negative number of BiDi control characters within this run.
545 */
546 U_CFUNC UBool
ubidi_getRuns(UBiDi * pBiDi,UErrorCode *)547 ubidi_getRuns(UBiDi *pBiDi, UErrorCode*) {
548 /*
549 * This method returns immediately if the runs are already set. This
550 * includes the case of length==0 (handled in setPara)..
551 */
552 if (pBiDi->runCount>=0) {
553 return true;
554 }
555
556 if(pBiDi->direction!=UBIDI_MIXED) {
557 /* simple, single-run case - this covers length==0 */
558 /* pBiDi->paraLevel is ok even for contextual multiple paragraphs */
559 getSingleRun(pBiDi, pBiDi->paraLevel);
560 } else /* UBIDI_MIXED, length>0 */ {
561 /* mixed directionality */
562 int32_t length=pBiDi->length, limit;
563 UBiDiLevel *levels=pBiDi->levels;
564 int32_t i, runCount;
565 UBiDiLevel level=UBIDI_DEFAULT_LTR; /* initialize with no valid level */
566 /*
567 * If there are WS characters at the end of the line
568 * and the run preceding them has a level different from
569 * paraLevel, then they will form their own run at paraLevel (L1).
570 * Count them separately.
571 * We need some special treatment for this in order to not
572 * modify the levels array which a line UBiDi object shares
573 * with its paragraph parent and its other line siblings.
574 * In other words, for the trailing WS, it may be
575 * levels[]!=paraLevel but we have to treat it like it were so.
576 */
577 limit=pBiDi->trailingWSStart;
578 /* count the runs, there is at least one non-WS run, and limit>0 */
579 runCount=0;
580 for(i=0; i<limit; ++i) {
581 /* increment runCount at the start of each run */
582 if(levels[i]!=level) {
583 ++runCount;
584 level=levels[i];
585 }
586 }
587
588 /*
589 * We don't need to see if the last run can be merged with a trailing
590 * WS run because setTrailingWSStart() would have done that.
591 */
592 if(runCount==1 && limit==length) {
593 /* There is only one non-WS run and no trailing WS-run. */
594 getSingleRun(pBiDi, levels[0]);
595 } else /* runCount>1 || limit<length */ {
596 /* allocate and set the runs */
597 Run *runs;
598 int32_t runIndex, start;
599 UBiDiLevel minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1, maxLevel=0;
600
601 /* now, count a (non-mergeable) WS run */
602 if(limit<length) {
603 ++runCount;
604 }
605
606 /* runCount>1 */
607 if(getRunsMemory(pBiDi, runCount)) {
608 runs=pBiDi->runsMemory;
609 } else {
610 return false;
611 }
612
613 /* set the runs */
614 /* FOOD FOR THOUGHT: this could be optimized, e.g.:
615 * 464->444, 484->444, 575->555, 595->555
616 * However, that would take longer. Check also how it would
617 * interact with BiDi control removal and inserting Marks.
618 */
619 runIndex=0;
620
621 /* search for the run limits and initialize visualLimit values with the run lengths */
622 i=0;
623 do {
624 /* prepare this run */
625 start=i;
626 level=levels[i];
627 if(level<minLevel) {
628 minLevel=level;
629 }
630 if(level>maxLevel) {
631 maxLevel=level;
632 }
633
634 /* look for the run limit */
635 while(++i<limit && levels[i]==level) {}
636
637 /* i is another run limit */
638 runs[runIndex].logicalStart=start;
639 runs[runIndex].visualLimit=i-start;
640 runs[runIndex].insertRemove=0;
641 ++runIndex;
642 } while(i<limit);
643
644 if(limit<length) {
645 /* there is a separate WS run */
646 runs[runIndex].logicalStart=limit;
647 runs[runIndex].visualLimit=length-limit;
648 /* For the trailing WS run, pBiDi->paraLevel is ok even
649 if contextual multiple paragraphs. */
650 if(pBiDi->paraLevel<minLevel) {
651 minLevel=pBiDi->paraLevel;
652 }
653 }
654
655 /* set the object fields */
656 pBiDi->runs=runs;
657 pBiDi->runCount=runCount;
658
659 reorderLine(pBiDi, minLevel, maxLevel);
660
661 /* now add the direction flags and adjust the visualLimit's to be just that */
662 /* this loop will also handle the trailing WS run */
663 limit=0;
664 for(i=0; i<runCount; ++i) {
665 ADD_ODD_BIT_FROM_LEVEL(runs[i].logicalStart, levels[runs[i].logicalStart]);
666 limit+=runs[i].visualLimit;
667 runs[i].visualLimit=limit;
668 }
669
670 /* Set the "odd" bit for the trailing WS run. */
671 /* For a RTL paragraph, it will be the *first* run in visual order. */
672 /* For the trailing WS run, pBiDi->paraLevel is ok even if
673 contextual multiple paragraphs. */
674 if(runIndex<runCount) {
675 int32_t trailingRun = ((pBiDi->paraLevel & 1) != 0)? 0 : runIndex;
676
677 ADD_ODD_BIT_FROM_LEVEL(runs[trailingRun].logicalStart, pBiDi->paraLevel);
678 }
679 }
680 }
681
682 /* handle insert LRM/RLM BEFORE/AFTER run */
683 if(pBiDi->insertPoints.size>0) {
684 Point *point, *start=pBiDi->insertPoints.points,
685 *limit=start+pBiDi->insertPoints.size;
686 int32_t runIndex;
687 for(point=start; point<limit; point++) {
688 runIndex=getRunFromLogicalIndex(pBiDi, point->pos);
689 pBiDi->runs[runIndex].insertRemove|=point->flag;
690 }
691 }
692
693 /* handle remove BiDi control characters */
694 if(pBiDi->controlCount>0) {
695 int32_t runIndex;
696 const char16_t *start=pBiDi->text, *limit=start+pBiDi->length, *pu;
697 for(pu=start; pu<limit; pu++) {
698 if(IS_BIDI_CONTROL_CHAR(*pu)) {
699 runIndex=getRunFromLogicalIndex(pBiDi, (int32_t)(pu-start));
700 pBiDi->runs[runIndex].insertRemove--;
701 }
702 }
703 }
704
705 return true;
706 }
707
708 static UBool
prepareReorder(const UBiDiLevel * levels,int32_t length,int32_t * indexMap,UBiDiLevel * pMinLevel,UBiDiLevel * pMaxLevel)709 prepareReorder(const UBiDiLevel *levels, int32_t length,
710 int32_t *indexMap,
711 UBiDiLevel *pMinLevel, UBiDiLevel *pMaxLevel) {
712 int32_t start;
713 UBiDiLevel level, minLevel, maxLevel;
714
715 if(levels==nullptr || length<=0) {
716 return false;
717 }
718
719 /* determine minLevel and maxLevel */
720 minLevel=UBIDI_MAX_EXPLICIT_LEVEL+1;
721 maxLevel=0;
722 for(start=length; start>0;) {
723 level=levels[--start];
724 if(level>UBIDI_MAX_EXPLICIT_LEVEL+1) {
725 return false;
726 }
727 if(level<minLevel) {
728 minLevel=level;
729 }
730 if(level>maxLevel) {
731 maxLevel=level;
732 }
733 }
734 *pMinLevel=minLevel;
735 *pMaxLevel=maxLevel;
736
737 /* initialize the index map */
738 for(start=length; start>0;) {
739 --start;
740 indexMap[start]=start;
741 }
742
743 return true;
744 }
745
746 /* reorder a line based on a levels array (L2) ------------------------------ */
747
748 U_CAPI void U_EXPORT2
ubidi_reorderLogical(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)749 ubidi_reorderLogical(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
750 int32_t start, limit, sumOfSosEos;
751 UBiDiLevel minLevel = 0, maxLevel = 0;
752
753 if(indexMap==nullptr || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
754 return;
755 }
756
757 /* nothing to do? */
758 if(minLevel==maxLevel && (minLevel&1)==0) {
759 return;
760 }
761
762 /* reorder only down to the lowest odd level */
763 minLevel|=1;
764
765 /* loop maxLevel..minLevel */
766 do {
767 start=0;
768
769 /* loop for all sequences of levels to reorder at the current maxLevel */
770 for(;;) {
771 /* look for a sequence of levels that are all at >=maxLevel */
772 /* look for the first index of such a sequence */
773 while(start<length && levels[start]<maxLevel) {
774 ++start;
775 }
776 if(start>=length) {
777 break; /* no more such sequences */
778 }
779
780 /* look for the limit of such a sequence (the index behind it) */
781 for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
782
783 /*
784 * sos=start of sequence, eos=end of sequence
785 *
786 * The closed (inclusive) interval from sos to eos includes all the logical
787 * and visual indexes within this sequence. They are logically and
788 * visually contiguous and in the same range.
789 *
790 * For each run, the new visual index=sos+eos-old visual index;
791 * we pre-add sos+eos into sumOfSosEos ->
792 * new visual index=sumOfSosEos-old visual index;
793 */
794 sumOfSosEos=start+limit-1;
795
796 /* reorder each index in the sequence */
797 do {
798 indexMap[start]=sumOfSosEos-indexMap[start];
799 } while(++start<limit);
800
801 /* start==limit */
802 if(limit==length) {
803 break; /* no more such sequences */
804 } else {
805 start=limit+1;
806 }
807 }
808 } while(--maxLevel>=minLevel);
809 }
810
811 U_CAPI void U_EXPORT2
ubidi_reorderVisual(const UBiDiLevel * levels,int32_t length,int32_t * indexMap)812 ubidi_reorderVisual(const UBiDiLevel *levels, int32_t length, int32_t *indexMap) {
813 int32_t start, end, limit, temp;
814 UBiDiLevel minLevel = 0, maxLevel = 0;
815
816 if(indexMap==nullptr || !prepareReorder(levels, length, indexMap, &minLevel, &maxLevel)) {
817 return;
818 }
819
820 /* nothing to do? */
821 if(minLevel==maxLevel && (minLevel&1)==0) {
822 return;
823 }
824
825 /* reorder only down to the lowest odd level */
826 minLevel|=1;
827
828 /* loop maxLevel..minLevel */
829 do {
830 start=0;
831
832 /* loop for all sequences of levels to reorder at the current maxLevel */
833 for(;;) {
834 /* look for a sequence of levels that are all at >=maxLevel */
835 /* look for the first index of such a sequence */
836 while(start<length && levels[start]<maxLevel) {
837 ++start;
838 }
839 if(start>=length) {
840 break; /* no more such runs */
841 }
842
843 /* look for the limit of such a sequence (the index behind it) */
844 for(limit=start; ++limit<length && levels[limit]>=maxLevel;) {}
845
846 /*
847 * Swap the entire interval of indexes from start to limit-1.
848 * We don't need to swap the levels for the purpose of this
849 * algorithm: the sequence of levels that we look at does not
850 * move anyway.
851 */
852 end=limit-1;
853 while(start<end) {
854 temp=indexMap[start];
855 indexMap[start]=indexMap[end];
856 indexMap[end]=temp;
857
858 ++start;
859 --end;
860 }
861
862 if(limit==length) {
863 break; /* no more such sequences */
864 } else {
865 start=limit+1;
866 }
867 }
868 } while(--maxLevel>=minLevel);
869 }
870
871 /* API functions for logical<->visual mapping ------------------------------- */
872
873 U_CAPI int32_t U_EXPORT2
ubidi_getVisualIndex(UBiDi * pBiDi,int32_t logicalIndex,UErrorCode * pErrorCode)874 ubidi_getVisualIndex(UBiDi *pBiDi, int32_t logicalIndex, UErrorCode *pErrorCode) {
875 int32_t visualIndex=UBIDI_MAP_NOWHERE;
876 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
877 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
878 RETURN_IF_BAD_RANGE(logicalIndex, 0, pBiDi->length, *pErrorCode, -1);
879
880 /* we can do the trivial cases without the runs array */
881 switch(pBiDi->direction) {
882 case UBIDI_LTR:
883 visualIndex=logicalIndex;
884 break;
885 case UBIDI_RTL:
886 visualIndex=pBiDi->length-logicalIndex-1;
887 break;
888 default:
889 if(!ubidi_getRuns(pBiDi, pErrorCode)) {
890 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
891 return -1;
892 } else {
893 Run *runs=pBiDi->runs;
894 int32_t i, visualStart=0, offset, length;
895
896 /* linear search for the run, search on the visual runs */
897 for(i=0; i<pBiDi->runCount; ++i) {
898 length=runs[i].visualLimit-visualStart;
899 offset=logicalIndex-GET_INDEX(runs[i].logicalStart);
900 if(offset>=0 && offset<length) {
901 if(IS_EVEN_RUN(runs[i].logicalStart)) {
902 /* LTR */
903 visualIndex=visualStart+offset;
904 } else {
905 /* RTL */
906 visualIndex=visualStart+length-offset-1;
907 }
908 break; /* exit for loop */
909 }
910 visualStart+=length;
911 }
912 if(i>=pBiDi->runCount) {
913 return UBIDI_MAP_NOWHERE;
914 }
915 }
916 }
917
918 if(pBiDi->insertPoints.size>0) {
919 /* add the number of added marks until the calculated visual index */
920 Run *runs=pBiDi->runs;
921 int32_t i, length, insertRemove;
922 int32_t visualStart=0, markFound=0;
923 for(i=0; ; i++, visualStart+=length) {
924 length=runs[i].visualLimit-visualStart;
925 insertRemove=runs[i].insertRemove;
926 if(insertRemove & (LRM_BEFORE|RLM_BEFORE)) {
927 markFound++;
928 }
929 /* is it the run containing the visual index? */
930 if(visualIndex<runs[i].visualLimit) {
931 return visualIndex+markFound;
932 }
933 if(insertRemove & (LRM_AFTER|RLM_AFTER)) {
934 markFound++;
935 }
936 }
937 }
938 else if(pBiDi->controlCount>0) {
939 /* subtract the number of controls until the calculated visual index */
940 Run *runs=pBiDi->runs;
941 int32_t i, j, start, limit, length, insertRemove;
942 int32_t visualStart=0, controlFound=0;
943 char16_t uchar=pBiDi->text[logicalIndex];
944 /* is the logical index pointing to a control ? */
945 if(IS_BIDI_CONTROL_CHAR(uchar)) {
946 return UBIDI_MAP_NOWHERE;
947 }
948 /* loop on runs */
949 for(i=0; ; i++, visualStart+=length) {
950 length=runs[i].visualLimit-visualStart;
951 insertRemove=runs[i].insertRemove;
952 /* calculated visual index is beyond this run? */
953 if(visualIndex>=runs[i].visualLimit) {
954 controlFound-=insertRemove;
955 continue;
956 }
957 /* calculated visual index must be within current run */
958 if(insertRemove==0) {
959 return visualIndex-controlFound;
960 }
961 if(IS_EVEN_RUN(runs[i].logicalStart)) {
962 /* LTR: check from run start to logical index */
963 start=runs[i].logicalStart;
964 limit=logicalIndex;
965 } else {
966 /* RTL: check from logical index to run end */
967 start=logicalIndex+1;
968 limit=GET_INDEX(runs[i].logicalStart)+length;
969 }
970 for(j=start; j<limit; j++) {
971 uchar=pBiDi->text[j];
972 if(IS_BIDI_CONTROL_CHAR(uchar)) {
973 controlFound++;
974 }
975 }
976 return visualIndex-controlFound;
977 }
978 }
979
980 return visualIndex;
981 }
982
983 U_CAPI int32_t U_EXPORT2
ubidi_getLogicalIndex(UBiDi * pBiDi,int32_t visualIndex,UErrorCode * pErrorCode)984 ubidi_getLogicalIndex(UBiDi *pBiDi, int32_t visualIndex, UErrorCode *pErrorCode) {
985 Run *runs;
986 int32_t i, runCount, start;
987 RETURN_IF_NULL_OR_FAILING_ERRCODE(pErrorCode, -1);
988 RETURN_IF_NOT_VALID_PARA_OR_LINE(pBiDi, *pErrorCode, -1);
989 RETURN_IF_BAD_RANGE(visualIndex, 0, pBiDi->resultLength, *pErrorCode, -1);
990 /* we can do the trivial cases without the runs array */
991 if(pBiDi->insertPoints.size==0 && pBiDi->controlCount==0) {
992 if(pBiDi->direction==UBIDI_LTR) {
993 return visualIndex;
994 }
995 else if(pBiDi->direction==UBIDI_RTL) {
996 return pBiDi->length-visualIndex-1;
997 }
998 }
999 if(!ubidi_getRuns(pBiDi, pErrorCode)) {
1000 *pErrorCode=U_MEMORY_ALLOCATION_ERROR;
1001 return -1;
1002 }
1003
1004 runs=pBiDi->runs;
1005 runCount=pBiDi->runCount;
1006 if(pBiDi->insertPoints.size>0) {
1007 /* handle inserted LRM/RLM */
1008 int32_t markFound=0, insertRemove;
1009 int32_t visualStart=0, length;
1010 runs=pBiDi->runs;
1011 /* subtract number of marks until visual index */
1012 for(i=0; ; i++, visualStart+=length) {
1013 length=runs[i].visualLimit-visualStart;
1014 insertRemove=runs[i].insertRemove;
1015 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1016 if(visualIndex<=(visualStart+markFound)) {
1017 return UBIDI_MAP_NOWHERE;
1018 }
1019 markFound++;
1020 }
1021 /* is adjusted visual index within this run? */
1022 if(visualIndex<(runs[i].visualLimit+markFound)) {
1023 visualIndex-=markFound;
1024 break;
1025 }
1026 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1027 if(visualIndex==(visualStart+length+markFound)) {
1028 return UBIDI_MAP_NOWHERE;
1029 }
1030 markFound++;
1031 }
1032 }
1033 }
1034 else if(pBiDi->controlCount>0) {
1035 /* handle removed BiDi control characters */
1036 int32_t controlFound=0, insertRemove, length;
1037 int32_t logicalStart, logicalEnd, visualStart=0, j, k;
1038 char16_t uchar;
1039 UBool evenRun;
1040 /* add number of controls until visual index */
1041 for(i=0; ; i++, visualStart+=length) {
1042 length=runs[i].visualLimit-visualStart;
1043 insertRemove=runs[i].insertRemove;
1044 /* is adjusted visual index beyond current run? */
1045 if(visualIndex>=(runs[i].visualLimit-controlFound+insertRemove)) {
1046 controlFound-=insertRemove;
1047 continue;
1048 }
1049 /* adjusted visual index is within current run */
1050 if(insertRemove==0) {
1051 visualIndex+=controlFound;
1052 break;
1053 }
1054 /* count non-control chars until visualIndex */
1055 logicalStart=runs[i].logicalStart;
1056 evenRun=IS_EVEN_RUN(logicalStart);
1057 REMOVE_ODD_BIT(logicalStart);
1058 logicalEnd=logicalStart+length-1;
1059 for(j=0; j<length; j++) {
1060 k= evenRun ? logicalStart+j : logicalEnd-j;
1061 uchar=pBiDi->text[k];
1062 if(IS_BIDI_CONTROL_CHAR(uchar)) {
1063 controlFound++;
1064 }
1065 if((visualIndex+controlFound)==(visualStart+j)) {
1066 break;
1067 }
1068 }
1069 visualIndex+=controlFound;
1070 break;
1071 }
1072 }
1073 /* handle all cases */
1074 if(runCount<=10) {
1075 /* linear search for the run */
1076 for(i=0; visualIndex>=runs[i].visualLimit; ++i) {}
1077 } else {
1078 /* binary search for the run */
1079 int32_t begin=0, limit=runCount;
1080
1081 /* the middle if() is guaranteed to find the run, we don't need a loop limit */
1082 for(;;) {
1083 i=(begin+limit)/2;
1084 if(visualIndex>=runs[i].visualLimit) {
1085 begin=i+1;
1086 } else if(i==0 || visualIndex>=runs[i-1].visualLimit) {
1087 break;
1088 } else {
1089 limit=i;
1090 }
1091 }
1092 }
1093
1094 start=runs[i].logicalStart;
1095 if(IS_EVEN_RUN(start)) {
1096 /* LTR */
1097 /* the offset in runs[i] is visualIndex-runs[i-1].visualLimit */
1098 if(i>0) {
1099 visualIndex-=runs[i-1].visualLimit;
1100 }
1101 return start+visualIndex;
1102 } else {
1103 /* RTL */
1104 return GET_INDEX(start)+runs[i].visualLimit-visualIndex-1;
1105 }
1106 }
1107
1108 U_CAPI void U_EXPORT2
ubidi_getLogicalMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1109 ubidi_getLogicalMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1110 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1111 /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1112 ubidi_countRuns(pBiDi, pErrorCode);
1113 if(U_FAILURE(*pErrorCode)) {
1114 /* no op */
1115 } else if(indexMap==nullptr) {
1116 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1117 } else {
1118 /* fill a logical-to-visual index map using the runs[] */
1119 int32_t visualStart, visualLimit, i, j, k;
1120 int32_t logicalStart, logicalLimit;
1121 Run *runs=pBiDi->runs;
1122 if (pBiDi->length<=0) {
1123 return;
1124 }
1125 if (pBiDi->length>pBiDi->resultLength) {
1126 uprv_memset(indexMap, 0xFF, pBiDi->length*sizeof(int32_t));
1127 }
1128
1129 visualStart=0;
1130 for(j=0; j<pBiDi->runCount; ++j) {
1131 logicalStart=GET_INDEX(runs[j].logicalStart);
1132 visualLimit=runs[j].visualLimit;
1133 if(IS_EVEN_RUN(runs[j].logicalStart)) {
1134 do { /* LTR */
1135 indexMap[logicalStart++]=visualStart++;
1136 } while(visualStart<visualLimit);
1137 } else {
1138 logicalStart+=visualLimit-visualStart; /* logicalLimit */
1139 do { /* RTL */
1140 indexMap[--logicalStart]=visualStart++;
1141 } while(visualStart<visualLimit);
1142 }
1143 /* visualStart==visualLimit; */
1144 }
1145
1146 if(pBiDi->insertPoints.size>0) {
1147 int32_t markFound=0, runCount=pBiDi->runCount;
1148 int32_t length, insertRemove;
1149 visualStart=0;
1150 /* add number of marks found until each index */
1151 for(i=0; i<runCount; i++, visualStart+=length) {
1152 length=runs[i].visualLimit-visualStart;
1153 insertRemove=runs[i].insertRemove;
1154 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1155 markFound++;
1156 }
1157 if(markFound>0) {
1158 logicalStart=GET_INDEX(runs[i].logicalStart);
1159 logicalLimit=logicalStart+length;
1160 for(j=logicalStart; j<logicalLimit; j++) {
1161 indexMap[j]+=markFound;
1162 }
1163 }
1164 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1165 markFound++;
1166 }
1167 }
1168 }
1169 else if(pBiDi->controlCount>0) {
1170 int32_t controlFound=0, runCount=pBiDi->runCount;
1171 int32_t length, insertRemove;
1172 UBool evenRun;
1173 char16_t uchar;
1174 visualStart=0;
1175 /* subtract number of controls found until each index */
1176 for(i=0; i<runCount; i++, visualStart+=length) {
1177 length=runs[i].visualLimit-visualStart;
1178 insertRemove=runs[i].insertRemove;
1179 /* no control found within previous runs nor within this run */
1180 if((controlFound-insertRemove)==0) {
1181 continue;
1182 }
1183 logicalStart=runs[i].logicalStart;
1184 evenRun=IS_EVEN_RUN(logicalStart);
1185 REMOVE_ODD_BIT(logicalStart);
1186 logicalLimit=logicalStart+length;
1187 /* if no control within this run */
1188 if(insertRemove==0) {
1189 for(j=logicalStart; j<logicalLimit; j++) {
1190 indexMap[j]-=controlFound;
1191 }
1192 continue;
1193 }
1194 for(j=0; j<length; j++) {
1195 k= evenRun ? logicalStart+j : logicalLimit-j-1;
1196 uchar=pBiDi->text[k];
1197 if(IS_BIDI_CONTROL_CHAR(uchar)) {
1198 controlFound++;
1199 indexMap[k]=UBIDI_MAP_NOWHERE;
1200 continue;
1201 }
1202 indexMap[k]-=controlFound;
1203 }
1204 }
1205 }
1206 }
1207 }
1208
1209 U_CAPI void U_EXPORT2
ubidi_getVisualMap(UBiDi * pBiDi,int32_t * indexMap,UErrorCode * pErrorCode)1210 ubidi_getVisualMap(UBiDi *pBiDi, int32_t *indexMap, UErrorCode *pErrorCode) {
1211 RETURN_VOID_IF_NULL_OR_FAILING_ERRCODE(pErrorCode);
1212 if(indexMap==nullptr) {
1213 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1214 return;
1215 }
1216 /* ubidi_countRuns() checks for VALID_PARA_OR_LINE */
1217 ubidi_countRuns(pBiDi, pErrorCode);
1218 if(U_SUCCESS(*pErrorCode)) {
1219 /* fill a visual-to-logical index map using the runs[] */
1220 Run *runs=pBiDi->runs, *runsLimit=runs+pBiDi->runCount;
1221 int32_t logicalStart, visualStart, visualLimit, *pi=indexMap;
1222
1223 if (pBiDi->resultLength<=0) {
1224 return;
1225 }
1226 visualStart=0;
1227 for(; runs<runsLimit; ++runs) {
1228 logicalStart=runs->logicalStart;
1229 visualLimit=runs->visualLimit;
1230 if(IS_EVEN_RUN(logicalStart)) {
1231 do { /* LTR */
1232 *pi++ = logicalStart++;
1233 } while(++visualStart<visualLimit);
1234 } else {
1235 REMOVE_ODD_BIT(logicalStart);
1236 logicalStart+=visualLimit-visualStart; /* logicalLimit */
1237 do { /* RTL */
1238 *pi++ = --logicalStart;
1239 } while(++visualStart<visualLimit);
1240 }
1241 /* visualStart==visualLimit; */
1242 }
1243
1244 if(pBiDi->insertPoints.size>0) {
1245 int32_t markFound=0, runCount=pBiDi->runCount;
1246 int32_t insertRemove, i, j, k;
1247 runs=pBiDi->runs;
1248 /* count all inserted marks */
1249 for(i=0; i<runCount; i++) {
1250 insertRemove=runs[i].insertRemove;
1251 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1252 markFound++;
1253 }
1254 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1255 markFound++;
1256 }
1257 }
1258 /* move back indexes by number of preceding marks */
1259 k=pBiDi->resultLength;
1260 for(i=runCount-1; i>=0 && markFound>0; i--) {
1261 insertRemove=runs[i].insertRemove;
1262 if(insertRemove&(LRM_AFTER|RLM_AFTER)) {
1263 indexMap[--k]= UBIDI_MAP_NOWHERE;
1264 markFound--;
1265 }
1266 visualStart= i>0 ? runs[i-1].visualLimit : 0;
1267 for(j=runs[i].visualLimit-1; j>=visualStart && markFound>0; j--) {
1268 indexMap[--k]=indexMap[j];
1269 }
1270 if(insertRemove&(LRM_BEFORE|RLM_BEFORE)) {
1271 indexMap[--k]= UBIDI_MAP_NOWHERE;
1272 markFound--;
1273 }
1274 }
1275 }
1276 else if(pBiDi->controlCount>0) {
1277 int32_t runCount=pBiDi->runCount, logicalEnd;
1278 int32_t insertRemove, length, i, j, k, m;
1279 char16_t uchar;
1280 UBool evenRun;
1281 runs=pBiDi->runs;
1282 visualStart=0;
1283 /* move forward indexes by number of preceding controls */
1284 k=0;
1285 for(i=0; i<runCount; i++, visualStart+=length) {
1286 length=runs[i].visualLimit-visualStart;
1287 insertRemove=runs[i].insertRemove;
1288 /* if no control found yet, nothing to do in this run */
1289 if((insertRemove==0)&&(k==visualStart)) {
1290 k+=length;
1291 continue;
1292 }
1293 /* if no control in this run */
1294 if(insertRemove==0) {
1295 visualLimit=runs[i].visualLimit;
1296 for(j=visualStart; j<visualLimit; j++) {
1297 indexMap[k++]=indexMap[j];
1298 }
1299 continue;
1300 }
1301 logicalStart=runs[i].logicalStart;
1302 evenRun=IS_EVEN_RUN(logicalStart);
1303 REMOVE_ODD_BIT(logicalStart);
1304 logicalEnd=logicalStart+length-1;
1305 for(j=0; j<length; j++) {
1306 m= evenRun ? logicalStart+j : logicalEnd-j;
1307 uchar=pBiDi->text[m];
1308 if(!IS_BIDI_CONTROL_CHAR(uchar)) {
1309 indexMap[k++]=m;
1310 }
1311 }
1312 }
1313 }
1314 }
1315 }
1316
1317 U_CAPI void U_EXPORT2
ubidi_invertMap(const int32_t * srcMap,int32_t * destMap,int32_t length)1318 ubidi_invertMap(const int32_t *srcMap, int32_t *destMap, int32_t length) {
1319 if(srcMap!=nullptr && destMap!=nullptr && length>0) {
1320 const int32_t *pi;
1321 int32_t destLength=-1, count=0;
1322 /* find highest value and count positive indexes in srcMap */
1323 pi=srcMap+length;
1324 while(pi>srcMap) {
1325 if(*--pi>destLength) {
1326 destLength=*pi;
1327 }
1328 if(*pi>=0) {
1329 count++;
1330 }
1331 }
1332 destLength++; /* add 1 for origin 0 */
1333 if(count<destLength) {
1334 /* we must fill unmatched destMap entries with -1 */
1335 uprv_memset(destMap, 0xFF, destLength*sizeof(int32_t));
1336 }
1337 pi=srcMap+length;
1338 while(length>0) {
1339 if(*--pi>=0) {
1340 destMap[*pi]=--length;
1341 } else {
1342 --length;
1343 }
1344 }
1345 }
1346 }
1347