1 /*
2 ******************************************************************************
3 *
4 * Copyright (C) 1999-2009, International Business Machines
5 * Corporation and others. All Rights Reserved.
6 *
7 ******************************************************************************
8 * file name: udata.c
9 * encoding: US-ASCII
10 * tab size: 8 (not used)
11 * indentation:4
12 *
13 * created on: 1999oct25
14 * created by: Markus W. Scherer
15 */
16
17 #include "unicode/utypes.h"
18 #include "unicode/putil.h"
19 #include "umutex.h"
20 #include "cmemory.h"
21 #include "cstring.h"
22 #include "unicode/udata.h"
23 #include "unicode/uversion.h"
24 #include "uhash.h"
25 #include "ucln_cmn.h"
26 #include "putilimp.h"
27
28 #include "udatamem.h"
29 #include "umapfile.h"
30 #include "ucmndata.h"
31
32 /***********************************************************************
33 *
34 * Notes on the organization of the ICU data implementation
35 *
36 * All of the public API is defined in udata.h
37 *
38 * The implementation is split into several files...
39 *
40 * - udata.c (this file) contains higher level code that knows about
41 * the search paths for locating data, caching opened data, etc.
42 *
43 * - umapfile.c contains the low level platform-specific code for actually loading
44 * (memory mapping, file reading, whatever) data into memory.
45 *
46 * - ucmndata.c deals with the tables of contents of ICU data items within
47 * an ICU common format data file. The implementation includes
48 * an abstract interface and support for multiple TOC formats.
49 * All knowledge of any specific TOC format is encapsulated here.
50 *
51 * - udatamem.c has code for managing UDataMemory structs. These are little
52 * descriptor objects for blocks of memory holding ICU data of
53 * various types.
54 */
55
56 /* configuration ---------------------------------------------------------- */
57
58 /* If you are excruciatingly bored turn this on .. */
59 /* #define UDATA_DEBUG 1 */
60
61 #if defined(UDATA_DEBUG)
62 # include <stdio.h>
63 #endif
64
65
66 /***********************************************************************
67 *
68 * static (Global) data
69 *
70 ************************************************************************/
71 static UDataMemory *gCommonICUData = NULL; /* Pointer to the common ICU data. */
72 /* May be updated once, if we started with */
73 /* a stub or subset library. */
74
75 static UDataMemory *gStubICUData = NULL; /* If gCommonICUData does get updated, remember */
76 /* the original one so that it can be cleaned */
77 /* up when ICU is shut down. */
78
79 static UHashtable *gCommonDataCache = NULL; /* Global hash table of opened ICU data files. */
80
81 static UDataFileAccess gDataFileAccess = UDATA_DEFAULT_ACCESS;
82
83 static UBool U_CALLCONV
udata_cleanup(void)84 udata_cleanup(void)
85 {
86 if (gCommonDataCache) { /* Delete the cache of user data mappings. */
87 uhash_close(gCommonDataCache); /* Table owns the contents, and will delete them. */
88 gCommonDataCache = NULL; /* Cleanup is not thread safe. */
89 }
90
91 if (gCommonICUData != NULL) {
92 udata_close(gCommonICUData); /* Clean up common ICU Data */
93 gCommonICUData = NULL;
94 }
95
96 if (gStubICUData != NULL) {
97 udata_close(gStubICUData); /* Clean up the stub ICU Data */
98 gStubICUData = NULL;
99 }
100
101
102 return TRUE; /* Everything was cleaned up */
103 }
104
105
106
107
108 /*
109 * setCommonICUData. Set a UDataMemory to be the global ICU Data
110 */
111 static void
setCommonICUData(UDataMemory * pData,UDataMemory * oldData,UBool warn,UErrorCode * pErr)112 setCommonICUData(UDataMemory *pData, /* The new common data. Belongs to caller, we copy it. */
113 UDataMemory *oldData, /* Old ICUData ptr. Overwrite of this value is ok, */
114 /* of any others is not. */
115 UBool warn, /* If true, set USING_DEFAULT warning if ICUData was */
116 /* changed by another thread before we got to it. */
117 UErrorCode *pErr)
118 {
119 UDataMemory *newCommonData = UDataMemory_createNewInstance(pErr);
120 if (U_FAILURE(*pErr)) {
121 return;
122 }
123
124 /* For the assignment, other threads must cleanly see either the old */
125 /* or the new, not some partially initialized new. The old can not be */
126 /* deleted - someone may still have a pointer to it lying around in */
127 /* their locals. */
128 UDatamemory_assign(newCommonData, pData);
129 umtx_lock(NULL);
130 if (gCommonICUData==oldData) {
131 gStubICUData = gCommonICUData; /* remember the old Common Data, so it can be cleaned up. */
132 gCommonICUData = newCommonData;
133 ucln_common_registerCleanup(UCLN_COMMON_UDATA, udata_cleanup);
134 }
135 else {
136 if (warn==TRUE) {
137 *pErr = U_USING_DEFAULT_WARNING;
138 }
139 uprv_free(newCommonData);
140 }
141 umtx_unlock(NULL);
142 }
143
144 static const char *
findBasename(const char * path)145 findBasename(const char *path) {
146 const char *basename=uprv_strrchr(path, U_FILE_SEP_CHAR);
147 if(basename==NULL) {
148 return path;
149 } else {
150 return basename+1;
151 }
152 }
153
154 #ifdef UDATA_DEBUG
155 static const char *
packageNameFromPath(const char * path)156 packageNameFromPath(const char *path)
157 {
158 if((path == NULL) || (*path == 0)) {
159 return U_ICUDATA_NAME;
160 }
161
162 path = findBasename(path);
163
164 if((path == NULL) || (*path == 0)) {
165 return U_ICUDATA_NAME;
166 }
167
168 return path;
169 }
170 #endif
171
172 /*----------------------------------------------------------------------*
173 * *
174 * Cache for common data *
175 * Functions for looking up or adding entries to a cache of *
176 * data that has been previously opened. Avoids a potentially *
177 * expensive operation of re-opening the data for subsequent *
178 * uses. *
179 * *
180 * Data remains cached for the duration of the process. *
181 * *
182 *----------------------------------------------------------------------*/
183
184 typedef struct DataCacheElement {
185 char *name;
186 UDataMemory *item;
187 } DataCacheElement;
188
189
190
191 /*
192 * Deleter function for DataCacheElements.
193 * udata cleanup function closes the hash table; hash table in turn calls back to
194 * here for each entry.
195 */
DataCacheElement_deleter(void * pDCEl)196 static void U_CALLCONV DataCacheElement_deleter(void *pDCEl) {
197 DataCacheElement *p = (DataCacheElement *)pDCEl;
198 udata_close(p->item); /* unmaps storage */
199 uprv_free(p->name); /* delete the hash key string. */
200 uprv_free(pDCEl); /* delete 'this' */
201 }
202
203 /* udata_getCacheHashTable()
204 * Get the hash table used to store the data cache entries.
205 * Lazy create it if it doesn't yet exist.
206 */
udata_getHashTable()207 static UHashtable *udata_getHashTable() {
208 UErrorCode err = U_ZERO_ERROR;
209 UBool cacheIsInitialized;
210 UHashtable *tHT = NULL;
211
212 UMTX_CHECK(NULL, (gCommonDataCache != NULL), cacheIsInitialized);
213
214 if (cacheIsInitialized) {
215 return gCommonDataCache;
216 }
217
218 tHT = uhash_open(uhash_hashChars, uhash_compareChars, NULL, &err);
219 /* Check for null pointer. */
220 if (tHT == NULL) {
221 return NULL; /* TODO: Handle this error better. */
222 }
223 uhash_setValueDeleter(tHT, DataCacheElement_deleter);
224
225 umtx_lock(NULL);
226 if (gCommonDataCache == NULL) {
227 gCommonDataCache = tHT;
228 tHT = NULL;
229 ucln_common_registerCleanup(UCLN_COMMON_UDATA, udata_cleanup);
230 }
231 umtx_unlock(NULL);
232 if (tHT != NULL) {
233 uhash_close(tHT);
234 }
235
236 if (U_FAILURE(err)) {
237 return NULL; /* TODO: handle this error better. */
238 }
239 return gCommonDataCache;
240 }
241
242
243
udata_findCachedData(const char * path)244 static UDataMemory *udata_findCachedData(const char *path)
245 {
246 UHashtable *htable;
247 UDataMemory *retVal = NULL;
248 DataCacheElement *el;
249 const char *baseName;
250
251 baseName = findBasename(path); /* Cache remembers only the base name, not the full path. */
252 htable = udata_getHashTable();
253 umtx_lock(NULL);
254 el = (DataCacheElement *)uhash_get(htable, baseName);
255 umtx_unlock(NULL);
256 if (el != NULL) {
257 retVal = el->item;
258 }
259 #ifdef UDATA_DEBUG
260 fprintf(stderr, "Cache: [%s] -> %p\n", baseName, retVal);
261 #endif
262 return retVal;
263 }
264
265
/*
 * Add a copy of 'item' to the cache under the base name of 'path'.
 *
 * @param path  Name or path of the data; only its base name is used as key.
 * @param item  Descriptor to copy into the cache. Still belongs to the caller.
 * @param pErr  In/out error code. Set to U_USING_DEFAULT_WARNING if an entry
 *              with the same base name already exists, or to a failure code
 *              if the new entry could not be created or stored.
 * @return the cached UDataMemory: the new copy, or the previously cached one
 *         if an entry already existed; NULL on failure.
 */
static UDataMemory *udata_cacheDataItem(const char *path, UDataMemory *item, UErrorCode *pErr) {
    DataCacheElement *newElement;
    DataCacheElement *oldValue = NULL;
    const char       *baseName;
    int32_t           nameLen;
    UHashtable       *htable;
    UErrorCode        subErr = U_ZERO_ERROR;

    if (U_FAILURE(*pErr)) {
        return NULL;
    }

    /* Without a table there is nowhere to store the entry. */
    htable = udata_getHashTable();
    if (htable == NULL) {
        *pErr = U_MEMORY_ALLOCATION_ERROR;
        return NULL;
    }

    /* Create a new DataCacheElement - the thingy we store in the hash table -
     * and copy the supplied path and UDataMemoryItems into it.
     */
    newElement = (DataCacheElement *)uprv_malloc(sizeof(DataCacheElement));
    if (newElement == NULL) {
        *pErr = U_MEMORY_ALLOCATION_ERROR;
        return NULL;
    }
    newElement->item = UDataMemory_createNewInstance(pErr);
    if (U_FAILURE(*pErr)) {
        uprv_free(newElement);
        return NULL;
    }
    UDatamemory_assign(newElement->item, item);

    baseName = findBasename(path);
    nameLen = (int32_t)uprv_strlen(baseName);
    newElement->name = (char *)uprv_malloc(nameLen+1);
    if (newElement->name == NULL) {
        *pErr = U_MEMORY_ALLOCATION_ERROR;
        uprv_free(newElement->item);
        uprv_free(newElement);
        return NULL;
    }
    uprv_strcpy(newElement->name, baseName);

    /* Stick the new DataCacheElement into the hash table.
     * Entries are keyed by base name, so the duplicate check must use the
     * base name too; the table stores DataCacheElements, not UDataMemory.
     */
    umtx_lock(NULL);
    oldValue = (DataCacheElement *)uhash_get(htable, baseName);
    if (oldValue != NULL) {
        subErr = U_USING_DEFAULT_WARNING;
    }
    else {
        uhash_put(
            htable,
            newElement->name,               /* Key   */
            newElement,                     /* Value */
            &subErr);
    }
    umtx_unlock(NULL);

#ifdef UDATA_DEBUG
    fprintf(stderr, "Cache: [%s] <<< %p : %s. vFunc=%p\n", newElement->name,
    newElement->item, u_errorName(subErr), newElement->item->vFuncs);
#endif

    if (subErr == U_USING_DEFAULT_WARNING || U_FAILURE(subErr)) {
        *pErr = subErr; /* copy sub err unto fillin ONLY if something happens. */
        /* NOTE(review): if uhash_put() invokes the value deleter on failure,
         * these frees would release the element twice - confirm against uhash. */
        uprv_free(newElement->name);
        uprv_free(newElement->item);
        uprv_free(newElement);
        return (oldValue != NULL) ? oldValue->item : NULL;
    }

    return newElement->item;
}
336
337
338
339 /*-------------------------------------------------------------------------------
340 *
341 * TinyString - a small set of really simple string functions, for
342 * the purpose of consolidating buffer overflow code in one place
343 *
344 * Use wherever you would otherwise declare a fixed sized char[xx] buffer.
345 * Do non-growing ops by accessing fields of struct directly
346 * Grow using the append function to automatically extend buffer
347 * as needed.
348 *
349 *-------------------------------------------------------------------------------*/
350 typedef struct TinyString {
351 char *s;
352 int32_t length;
353 char fStaticBuf[100];
354 int32_t fCapacity;
355 } TinyString;
356
/* Set 'This' to the empty string, stored in its built-in static buffer. */
static void TinyString_init(TinyString *This) {
    This->fStaticBuf[0] = 0;
    This->s             = This->fStaticBuf;
    This->length        = 0;
    This->fCapacity     = sizeof(This->fStaticBuf)-1;
}
363
/*
 * Append the NUL-terminated string 'what' to 'This', moving the text to a
 * larger heap buffer when the current capacity would be reached.
 * If the larger buffer cannot be allocated, the string is left unchanged.
 */
static void TinyString_append(TinyString *This, const char *what) {
    int32_t total = This->length + (int32_t)uprv_strlen(what);

    if (total >= This->fCapacity) {
        /* Grow to twice the needed length. */
        int32_t  grownCapacity = total * 2;
        char    *grown = (char *)uprv_malloc(grownCapacity+1);
        if (grown != NULL) {
            uprv_strcpy(grown, This->s);
            if (This->s != This->fStaticBuf) {
                uprv_free(This->s);
            }
            This->s = grown;
            This->fCapacity = grownCapacity;
        }
    }

    if (total >= This->fCapacity) {
        return;   /* growing failed; nothing is appended */
    }
    uprv_strcat(This->s+This->length, what);
    This->length = total;
}
384
/*
 * Append at most 'n' chars of 'what' to 'This', stopping early at a NUL.
 * The text moves to a larger heap buffer when the current capacity would be
 * reached. If the larger buffer cannot be allocated, the string is left
 * unchanged. A non-positive 'n' appends nothing.
 */
static void TinyString_appendn(TinyString *This, const char *what, int32_t n) {
    int32_t   copyLen = 0;
    int32_t   newLen;

    /* Count what will really be copied, so that 'length' cannot end up
     * past the terminator when 'what' is shorter than 'n'. */
    while (copyLen < n && what[copyLen] != 0) {
        ++copyLen;
    }

    newLen = This->length + copyLen;
    if (newLen >= This->fCapacity) {
        int32_t newCapacity = newLen * 2;
        char *newBuf = (char *)uprv_malloc(newCapacity+1);
        if (newBuf != NULL) {
            uprv_strcpy(newBuf, This->s);
            if (This->s != This->fStaticBuf) {
                uprv_free(This->s);
            }
            This->s = newBuf;
            This->fCapacity = newCapacity;
        }
    }
    if (newLen < This->fCapacity) {
        uprv_strncat(This->s+This->length, what, copyLen);
        This->length = newLen;
    }
}
405
/* Destructor: release a heap buffer, if there is one, and reset to empty. */
static void TinyString_dt(TinyString *This) {
    UBool onHeap = (UBool)(This->s != This->fStaticBuf);

    if (onHeap) {
        uprv_free(This->s);
    }
    TinyString_init(This);
}
412
413
414
415
416 /*----------------------------------------------------------------------*==============
417 * *
418 * Path management. Could be shared with other tools/etc if need be *
419 * later on. *
420 * *
421 *----------------------------------------------------------------------*/
422
423 #define U_DATA_PATHITER_BUFSIZ 128 /* Size of local buffer for paths */
424 /* Overflow causes malloc of larger buf */
425
426 typedef struct
427 {
428 const char *path; /* working path (u_icudata_Dir) */
429 const char *nextPath; /* path following this one */
430 const char *basename; /* item's basename (icudt22e_mt.res)*/
431 const char *suffix; /* item suffix (can be null) */
432
433 uint32_t basenameLen; /* length of basename */
434
435 char *itemPath; /* path passed in with item name */
436 char itemPathBuf[U_DATA_PATHITER_BUFSIZ];
437
438 char *pathBuffer; /* output path for this it'ion */
439 char pathBufferA[U_DATA_PATHITER_BUFSIZ];
440
441 char *packageStub; /* example: "/icudt28b". Will ignore that leaf in set paths. */
442 char packageStubBuf[U_DATA_PATHITER_BUFSIZ];
443 uint32_t packageStubLen;
444
445 UBool checkLastFour; /* if TRUE then allow paths such as '/foo/myapp.dat'
446 * to match, checks last 4 chars of suffix with
447 * last 4 of path, then previous chars. */
448
449 } UDataPathIterator;
450
451 /**
452 * Initialize (or re-initialize) a user-supplied UDataPathIterator
453 * Note: UDataPathIterator does not allocate storage, so it doesn't need to be closed.
454 *
455 * @param iter The iterator to be initialized. Its current state does not matter.
456 * @param path The full pathname to be iterated over. If NULL, defaults to U_ICUDATA_NAME
457 * @param pkg Package which is being searched for, ex "icudt28l". Will ignore leave directories such as /icudt28l
458 * @param item Item to be searched for. Can include full path, such as /a/b/foo.dat
459 * @param suffix Optional item suffix, if not-null (ex. ".dat") then 'path' can contain 'item' explicitly.
460 * Ex: 'stuff.dat' would be found in '/a/foo:/tmp/stuff.dat:/bar/baz' as item #2.
461 * '/blarg/stuff.dat' would also be found.
462 */
udata_pathiter_init(UDataPathIterator * iter,const char * path,const char * pkg,const char * item,const char * suffix,UBool doCheckLastFour)463 static void udata_pathiter_init(UDataPathIterator *iter, const char *path, const char *pkg,
464 const char *item, const char *suffix, UBool doCheckLastFour)
465 {
466 #ifdef UDATA_DEBUG
467 fprintf(stderr, "SUFFIX1=%s PATH=%s\n", suffix, path);
468 #endif
469 /** Path **/
470 if(path == NULL) {
471 iter->path = u_getDataDirectory();
472 } else {
473 iter->path = path;
474 }
475
476 /** Package **/
477 if(pkg == NULL) {
478 iter->packageStubLen = 0;
479 iter->packageStub=iter->packageStubBuf;
480 iter->packageStub[0] = 0;
481 } else {
482 if(uprv_strlen(pkg) + 2 > U_DATA_PATHITER_BUFSIZ) {
483 iter->packageStub = uprv_malloc(uprv_strlen(pkg)+2);
484 /* Check for null pointer. */
485 if (iter->packageStub == NULL) {
486 return;
487 }
488 } else {
489 iter->packageStub = iter->packageStubBuf;
490 }
491 iter->packageStub[0] = U_FILE_SEP_CHAR;
492 uprv_strcpy(iter->packageStub+1, pkg);
493 iter->packageStubLen = (int32_t)uprv_strlen(iter->packageStub);
494
495 #ifdef UDATA_DEBUG
496 fprintf(stderr, "STUB=%s [%d]\n", iter->packageStub, iter->packageStubLen);
497 #endif
498 }
499
500 /** Item **/
501 iter->basename = findBasename(item);
502 iter->basenameLen = (int32_t)uprv_strlen(iter->basename);
503
504 /** Item path **/
505 iter->itemPath = iter->itemPathBuf;
506 if(iter->basename == item) {
507 iter->itemPath[0] = 0;
508 iter->nextPath = iter->path;
509 } else {
510 int32_t itemPathLen = (int32_t)(iter->basename-item);
511 if (itemPathLen >= U_DATA_PATHITER_BUFSIZ) {
512 char *t = (char *)uprv_malloc(itemPathLen+1);
513 if (t != NULL) {
514 iter->itemPath = t;
515 } else {
516 /* Malloc failed. Ignore the itemPath. */
517 itemPathLen = 0;
518 }
519 }
520 uprv_strncpy(iter->itemPath, item, itemPathLen);
521 iter->itemPath[itemPathLen]=0;
522 iter->nextPath = iter->itemPath;
523 }
524 #ifdef UDATA_DEBUG
525 fprintf(stderr, "SUFFIX=%s [%p]\n", suffix, suffix);
526 #endif
527
528 /** Suffix **/
529 if(suffix != NULL) {
530 iter->suffix = suffix;
531 } else {
532 iter->suffix = "";
533 }
534
535 iter->checkLastFour = doCheckLastFour;
536
537 /* pathBuffer will hold the output path strings returned by the this iterator
538 * Get an upper bound of possible string size, and make sure that the buffer
539 * is big enough (sum of length of each piece, 2 extra delimiters, + trailing NULL) */
540 {
541 int32_t maxPathLen = (int32_t)(uprv_strlen(iter->path) + uprv_strlen(item) + uprv_strlen(iter->suffix) + iter->packageStubLen + 3);
542 iter->pathBuffer = iter->pathBufferA;
543 if (maxPathLen >= U_DATA_PATHITER_BUFSIZ) {
544 iter->pathBuffer = (char *)uprv_malloc(maxPathLen);
545 if (iter->pathBuffer == NULL) {
546 iter->pathBuffer = iter->pathBufferA;
547 iter->path = "";
548 }
549 }
550 }
551
552 #ifdef UDATA_DEBUG
553 fprintf(stderr, "%p: init %s -> [path=%s], [base=%s], [suff=%s], [itempath=%s], [nextpath=%s], [checklast4=%s]\n",
554 iter,
555 item,
556 iter->path,
557 iter->basename,
558 iter->suffix,
559 iter->itemPath,
560 iter->nextPath,
561 iter->checkLastFour?"TRUE":"false");
562 #endif
563
564 }
565
566 /**
567 * Get the next path on the list.
568 *
569 * @param iter The Iter to be used
570 * @param len If set, pointer to the length of the returned path, for convenience.
571 * @return Pointer to the next path segment, or NULL if there are no more.
572 */
udata_pathiter_next(UDataPathIterator * iter)573 static const char *udata_pathiter_next(UDataPathIterator *iter)
574 {
575 const char *path = NULL;
576 uint32_t pathLen = 0;
577 const char *pathBasename;
578
579 do
580 {
581 if( iter->nextPath == NULL ) {
582 break;
583 }
584
585 path = iter->nextPath;
586
587 if(iter->nextPath == iter->itemPath) { /* we were processing item's path. */
588 iter->nextPath = iter->path; /* start with regular path next tm. */
589 pathLen = (int32_t)uprv_strlen(path);
590 } else {
591 /* fix up next for next time */
592 iter->nextPath = uprv_strchr(path, U_PATH_SEP_CHAR);
593 if(iter->nextPath == NULL) {
594 /* segment: entire path */
595 pathLen = (int32_t)uprv_strlen(path);
596 } else {
597 /* segment: until next segment */
598 pathLen = (int32_t)(iter->nextPath - path);
599 if(*iter->nextPath) { /* skip divider */
600 iter->nextPath ++;
601 }
602 }
603 }
604
605 if(pathLen == 0) {
606 continue;
607 }
608
609 #ifdef UDATA_DEBUG
610 fprintf(stderr, "rest of path (IDD) = %s\n", path);
611 fprintf(stderr, " ");
612 {
613 uint32_t qqq;
614 for(qqq=0;qqq<pathLen;qqq++)
615 {
616 fprintf(stderr, " ");
617 }
618
619 fprintf(stderr, "^\n");
620 }
621 #endif
622 uprv_strncpy(iter->pathBuffer, path, pathLen);
623 iter->pathBuffer[pathLen] = 0;
624
625 /* check for .dat files */
626 pathBasename = findBasename(iter->pathBuffer);
627
628 if(iter->checkLastFour == TRUE &&
629 (pathLen>=4) &&
630 uprv_strncmp(iter->pathBuffer +(pathLen-4),iter->suffix,4)==0 && /* suffix matches */
631 uprv_strncmp(findBasename(iter->pathBuffer),iter->basename,iter->basenameLen)==0 && /* base matches */
632 uprv_strlen(pathBasename)==(iter->basenameLen+4)) { /* base+suffix = full len */
633
634 #ifdef UDATA_DEBUG
635 fprintf(stderr, "Have %s file on the path: %s\n", iter->suffix, iter->pathBuffer);
636 #endif
637 /* do nothing */
638 }
639 else
640 { /* regular dir path */
641 if(iter->pathBuffer[pathLen-1] != U_FILE_SEP_CHAR) {
642 if((pathLen>=4) &&
643 uprv_strncmp(iter->pathBuffer+(pathLen-4), ".dat", 4) == 0)
644 {
645 #ifdef UDATA_DEBUG
646 fprintf(stderr, "skipping non-directory .dat file %s\n", iter->pathBuffer);
647 #endif
648 continue;
649 }
650
651 /* Check if it is a directory with the same name as our package */
652 if(iter->packageStubLen &&
653 (pathLen > iter->packageStubLen) &&
654 !uprv_strcmp(iter->pathBuffer + pathLen - iter->packageStubLen, iter->packageStub)) {
655 #ifdef UDATA_DEBUG
656 fprintf(stderr, "Found stub %s ( will add package %s of len %d)\n", iter->packageStub, iter->basename, iter->basenameLen);
657 #endif
658 pathLen -= iter->packageStubLen;
659 }
660
661 iter->pathBuffer[pathLen++] = U_FILE_SEP_CHAR;
662 }
663
664 uprv_strncpy(iter->pathBuffer + pathLen, /* + basename */
665 iter->packageStub+1,
666 iter->packageStubLen-1);
667
668 pathLen += iter->packageStubLen-1;
669
670 if(*iter->suffix) /* tack on suffix */
671 {
672 uprv_strcpy(iter->pathBuffer + pathLen,
673 iter->suffix);
674 pathLen += (int32_t)uprv_strlen(iter->suffix);
675 }
676
677 }
678
679 #ifdef UDATA_DEBUG
680 fprintf(stderr, " --> %s\n", iter->pathBuffer);
681 #endif
682
683 return iter->pathBuffer;
684
685 } while(iter->path);
686
687 /* fell way off the end */
688 return NULL;
689 }
690
691
692 /*
693 * Path Iterator Destructor. Clean up any allocated storage
694 */
udata_pathiter_dt(UDataPathIterator * iter)695 static void udata_pathiter_dt(UDataPathIterator *iter) {
696 if (iter->itemPath != iter->itemPathBuf) {
697 uprv_free(iter->itemPath);
698 iter->itemPath = NULL;
699 }
700 if (iter->pathBuffer != iter->pathBufferA) {
701 uprv_free(iter->pathBuffer);
702 iter->pathBuffer = NULL;
703 }
704 if (iter->packageStub != iter->packageStubBuf) {
705 uprv_free(iter->packageStub);
706 iter->packageStub = NULL;
707 }
708 }
709
710 /* ==================================================================================*/
711
712
713 /*----------------------------------------------------------------------*
714 * *
715 * Add a static reference to the common data library *
716 * Unless overridden by an explicit udata_setCommonData, this will be *
717 * our common data. *
718 * *
719 *----------------------------------------------------------------------*/
720 extern const ICU_Data_Header U_DATA_API U_ICUDATA_ENTRY_POINT;
721
722
723 /*----------------------------------------------------------------------*
724 * *
725 * openCommonData Attempt to open a common format (.dat) file *
726 * Map it into memory (if it's not there already) *
727 * and return a UDataMemory object for it. *
728 * *
729 * If the requested data is already open and cached *
730 * just return the cached UDataMem object. *
731 * *
732 *----------------------------------------------------------------------*/
733 static UDataMemory *
openCommonData(const char * path,UBool isICUData,UErrorCode * pErrorCode)734 openCommonData(const char *path, /* Path from OpenChoice? */
735 UBool isICUData, /* ICU Data true if path == NULL */
736 UErrorCode *pErrorCode)
737 {
738 UDataMemory tData;
739 UDataPathIterator iter;
740 const char *pathBuffer;
741 const char *inBasename;
742
743 if (U_FAILURE(*pErrorCode)) {
744 return NULL;
745 }
746
747 UDataMemory_init(&tData);
748
749 /* ??????? TODO revisit this */
750 if (isICUData) {
751 /* "mini-cache" for common ICU data */
752 if(gCommonICUData != NULL) {
753 return gCommonICUData;
754 }
755
756 tData.pHeader = &U_ICUDATA_ENTRY_POINT.hdr;
757 udata_checkCommonData(&tData, pErrorCode);
758 setCommonICUData(&tData, NULL, FALSE, pErrorCode);
759 return gCommonICUData;
760 }
761
762
763 /* request is NOT for ICU Data. */
764
765 /* Find the base name portion of the supplied path. */
766 /* inBasename will be left pointing somewhere within the original path string. */
767 inBasename = findBasename(path);
768 #ifdef UDATA_DEBUG
769 fprintf(stderr, "inBasename = %s\n", inBasename);
770 #endif
771
772 if(*inBasename==0) {
773 /* no basename. This will happen if the original path was a directory name, */
774 /* like "a/b/c/". (Fallback to separate files will still work.) */
775 #ifdef UDATA_DEBUG
776 fprintf(stderr, "ocd: no basename in %s, bailing.\n", path);
777 #endif
778 *pErrorCode=U_FILE_ACCESS_ERROR;
779 return NULL;
780 }
781
782 /* Is the requested common data file already open and cached? */
783 /* Note that the cache is keyed by the base name only. The rest of the path, */
784 /* if any, is not considered. */
785 {
786 UDataMemory *dataToReturn = udata_findCachedData(inBasename);
787 if (dataToReturn != NULL) {
788 return dataToReturn;
789 }
790 }
791
792 /* Requested item is not in the cache.
793 * Hunt it down, trying all the path locations
794 */
795
796 udata_pathiter_init(&iter, u_getDataDirectory(), inBasename, path, ".dat", TRUE);
797
798 while((UDataMemory_isLoaded(&tData)==FALSE) &&
799 (pathBuffer = udata_pathiter_next(&iter)) != NULL)
800 {
801 #ifdef UDATA_DEBUG
802 fprintf(stderr, "ocd: trying path %s - ", pathBuffer);
803 #endif
804 uprv_mapFile(&tData, pathBuffer);
805 #ifdef UDATA_DEBUG
806 fprintf(stderr, "%s\n", UDataMemory_isLoaded(&tData)?"LOADED":"not loaded");
807 #endif
808 }
809 udata_pathiter_dt(&iter); /* Note: this call may invalidate "pathBuffer" */
810
811 #if defined(OS390_STUBDATA) && defined(OS390BATCH)
812 if (!UDataMemory_isLoaded(&tData)) {
813 char ourPathBuffer[1024];
814 /* One more chance, for extendCommonData() */
815 uprv_strncpy(ourPathBuffer, path, 1019);
816 ourPathBuffer[1019]=0;
817 uprv_strcat(ourPathBuffer, ".dat");
818 uprv_mapFile(&tData, ourPathBuffer);
819 }
820 #endif
821
822 if (!UDataMemory_isLoaded(&tData)) {
823 /* no common data */
824 *pErrorCode=U_FILE_ACCESS_ERROR;
825 return NULL;
826 }
827
828 /* we have mapped a file, check its header */
829 udata_checkCommonData(&tData, pErrorCode);
830
831
832 /* Cache the UDataMemory struct for this .dat file,
833 * so we won't need to hunt it down and map it again next time
834 * something is needed from it. */
835 return udata_cacheDataItem(inBasename, &tData, pErrorCode);
836 }
837
838
/* Largest number of TOC entries that common data may have and still be
 * treated as a stub by extendICUData(). */
#if defined(OS390)
#   define MAX_STUB_ENTRIES 8
#else
#   define MAX_STUB_ENTRIES 0
#endif
844
845
846 /*----------------------------------------------------------------------*
847 * *
848 * extendICUData If the full set of ICU data was not loaded at *
849 * program startup, load it now. This function will *
850 * be called when the lookup of an ICU data item in *
851 * the common ICU data fails. *
852 * *
853 * The parameter is the UDataMemory in which the *
854 * search for a requested item failed. *
855 * *
856 * return true if new data is loaded, false otherwise.*
857 * *
858 *----------------------------------------------------------------------*/
extendICUData(UDataMemory * failedData,UErrorCode * pErr)859 static UBool extendICUData(UDataMemory *failedData, UErrorCode *pErr)
860 {
861 /* If the data library that we are running with turns out to be the
862 * stub library (or, on the 390, the subset library), we will try to
863 * load a .dat file instead. The stub library has no entries in its
864 * TOC, which is how we identify it here.
865 */
866 UDataMemory *pData;
867 UDataMemory copyPData;
868
869 if (failedData->vFuncs->NumEntries(failedData) > MAX_STUB_ENTRIES) {
870 /* Not the stub. We can't extend. */
871 return FALSE;
872 }
873
874 /* See if we can explicitly open a .dat file for the ICUData. */
875 pData = openCommonData(
876 U_ICUDATA_NAME, /* "icudt20l" , for example. */
877 FALSE, /* Pretend we're not opening ICUData */
878 pErr);
879
880 /* How about if there is no pData, eh... */
881
882 UDataMemory_init(©PData);
883 if(pData != NULL) {
884 UDatamemory_assign(©PData, pData);
885 copyPData.map = 0; /* The mapping for this data is owned by the hash table */
886 copyPData.mapAddr = 0; /* which will unmap it when ICU is shut down. */
887 /* CommonICUData is also unmapped when ICU is shut down.*/
888 /* To avoid unmapping the data twice, zero out the map */
889 /* fields in the UDataMemory that we're assigning */
890 /* to CommonICUData. */
891
892 setCommonICUData(©PData, /* The new common data. */
893 failedData, /* Old ICUData ptr. Overwrite of this value is ok, */
894 FALSE, /* No warnings if write didn't happen */
895 pErr); /* setCommonICUData honors errors; NOP if error set */
896 }
897
898
899 return gCommonICUData != failedData; /* Return true if ICUData pointer was updated. */
900 /* (Could potentialy have been done by another thread racing */
901 /* us through here, but that's fine, we still return true */
902 /* so that current thread will also examine extended data. */
903 }
904
905
906
907
908 /*----------------------------------------------------------------------*
909 * *
910 * udata_setCommonData *
911 * *
912 *----------------------------------------------------------------------*/
913 U_CAPI void U_EXPORT2
udata_setCommonData(const void * data,UErrorCode * pErrorCode)914 udata_setCommonData(const void *data, UErrorCode *pErrorCode) {
915 UDataMemory dataMemory;
916
917 if(pErrorCode==NULL || U_FAILURE(*pErrorCode)) {
918 return;
919 }
920
921 if(data==NULL) {
922 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
923 return;
924 }
925
926 /* do we already have common ICU data set? */
927 if(gCommonICUData != NULL) {
928 *pErrorCode=U_USING_DEFAULT_WARNING;
929 return;
930 }
931
932 /* set the data pointer and test for validity */
933 UDataMemory_init(&dataMemory);
934 UDataMemory_setData(&dataMemory, data);
935 udata_checkCommonData(&dataMemory, pErrorCode);
936 if (U_FAILURE(*pErrorCode)) {return;}
937
938 /* we have good data */
939 /* Set it up as the ICU Common Data. */
940 setCommonICUData(&dataMemory, NULL, TRUE, pErrorCode);
941 }
942
943
944
945
946 /*---------------------------------------------------------------------------
947 *
948 * udata_setAppData
949 *
950 *---------------------------------------------------------------------------- */
951 U_CAPI void U_EXPORT2
udata_setAppData(const char * path,const void * data,UErrorCode * err)952 udata_setAppData(const char *path, const void *data, UErrorCode *err)
953 {
954 UDataMemory udm;
955
956 if(err==NULL || U_FAILURE(*err)) {
957 return;
958 }
959 if(data==NULL) {
960 *err=U_ILLEGAL_ARGUMENT_ERROR;
961 return;
962 }
963
964 UDataMemory_init(&udm);
965 UDataMemory_setData(&udm, data);
966 udata_checkCommonData(&udm, err);
967 udata_cacheDataItem(path, &udm, err);
968 }
969
970 /*----------------------------------------------------------------------------*
971 * *
972 * checkDataItem Given a freshly located/loaded data item, either *
973 * an entry in a common file or a separately loaded file, *
974 * sanity check its header, and see if the data is *
975 * acceptable to the app. *
976 * If the data is good, create and return a UDataMemory *
977 * object that can be returned to the application. *
978 * Return NULL on any sort of failure. *
979 * *
980 *----------------------------------------------------------------------------*/
981 static UDataMemory *
checkDataItem(const DataHeader * pHeader,UDataMemoryIsAcceptable * isAcceptable,void * context,const char * type,const char * name,UErrorCode * nonFatalErr,UErrorCode * fatalErr)982 checkDataItem
983 (
984 const DataHeader *pHeader, /* The data item to be checked. */
985 UDataMemoryIsAcceptable *isAcceptable, /* App's call-back function */
986 void *context, /* pass-thru param for above. */
987 const char *type, /* pass-thru param for above. */
988 const char *name, /* pass-thru param for above. */
989 UErrorCode *nonFatalErr, /* Error code if this data was not acceptable */
990 /* but openChoice should continue with */
991 /* trying to get data from fallback path. */
992 UErrorCode *fatalErr /* Bad error, caller should return immediately */
993 )
994 {
995 UDataMemory *rDataMem = NULL; /* the new UDataMemory, to be returned. */
996
997 if (U_FAILURE(*fatalErr)) {
998 return NULL;
999 }
1000
1001 if(pHeader->dataHeader.magic1==0xda &&
1002 pHeader->dataHeader.magic2==0x27 &&
1003 (isAcceptable==NULL || isAcceptable(context, type, name, &pHeader->info))
1004 ) {
1005 rDataMem=UDataMemory_createNewInstance(fatalErr);
1006 if (U_FAILURE(*fatalErr)) {
1007 return NULL;
1008 }
1009 rDataMem->pHeader = pHeader;
1010 } else {
1011 /* the data is not acceptable, look further */
1012 /* If we eventually find something good, this errorcode will be */
1013 /* cleared out. */
1014 *nonFatalErr=U_INVALID_FORMAT_ERROR;
1015 }
1016 return rDataMem;
1017 }
1018
1019 /**
1020 * @return 0 if not loaded, 1 if loaded or err
1021 */
doLoadFromIndividualFiles(const char * pkgName,const char * dataPath,const char * tocEntryPathSuffix,const char * path,const char * type,const char * name,UDataMemoryIsAcceptable * isAcceptable,void * context,UErrorCode * subErrorCode,UErrorCode * pErrorCode)1022 static UDataMemory *doLoadFromIndividualFiles(const char *pkgName,
1023 const char *dataPath, const char *tocEntryPathSuffix,
1024 /* following arguments are the same as doOpenChoice itself */
1025 const char *path, const char *type, const char *name,
1026 UDataMemoryIsAcceptable *isAcceptable, void *context,
1027 UErrorCode *subErrorCode,
1028 UErrorCode *pErrorCode)
1029 {
1030 UDataMemory *retVal = NULL;
1031 const char *pathBuffer;
1032 UDataMemory dataMemory;
1033 UDataMemory *pEntryData;
1034
1035 UDataPathIterator iter;
1036 /* look in ind. files: package\nam.typ ========================= */
1037 /* init path iterator for individual files */
1038 udata_pathiter_init(&iter, dataPath, pkgName, path, tocEntryPathSuffix, FALSE);
1039
1040 while((pathBuffer = udata_pathiter_next(&iter)))
1041 {
1042 #ifdef UDATA_DEBUG
1043 fprintf(stderr, "UDATA: trying individual file %s\n", pathBuffer);
1044 #endif
1045 if(uprv_mapFile(&dataMemory, pathBuffer))
1046 {
1047 pEntryData = checkDataItem(dataMemory.pHeader, isAcceptable, context, type, name, subErrorCode, pErrorCode);
1048 if (pEntryData != NULL) {
1049 /* Data is good.
1050 * Hand off ownership of the backing memory to the user's UDataMemory.
1051 * and return it. */
1052 pEntryData->mapAddr = dataMemory.mapAddr;
1053 pEntryData->map = dataMemory.map;
1054
1055 #ifdef UDATA_DEBUG
1056 fprintf(stderr, "** Mapped file: %s\n", pathBuffer);
1057 #endif
1058 retVal = pEntryData;
1059 goto commonReturn;
1060 }
1061
1062 /* the data is not acceptable, or some error occured. Either way, unmap the memory */
1063 udata_close(&dataMemory);
1064
1065 /* If we had a nasty error, bail out completely. */
1066 if (U_FAILURE(*pErrorCode)) {
1067 retVal = NULL;
1068 goto commonReturn;
1069 }
1070
1071 /* Otherwise remember that we found data but didn't like it for some reason */
1072 *subErrorCode=U_INVALID_FORMAT_ERROR;
1073 }
1074 #ifdef UDATA_DEBUG
1075 fprintf(stderr, "%s\n", UDataMemory_isLoaded(&dataMemory)?"LOADED":"not loaded");
1076 #endif
1077 }
1078 commonReturn:
1079 udata_pathiter_dt(&iter);
1080 return retVal;
1081 }
1082
1083 /**
1084 * @return 0 if not loaded, 1 if loaded or err
1085 */
doLoadFromCommonData(UBool isICUData,const char * pkgName,const char * dataPath,const char * tocEntryPathSuffix,const char * tocEntryName,const char * path,const char * type,const char * name,UDataMemoryIsAcceptable * isAcceptable,void * context,UErrorCode * subErrorCode,UErrorCode * pErrorCode)1086 static UDataMemory *doLoadFromCommonData(UBool isICUData, const char *pkgName,
1087 const char *dataPath, const char *tocEntryPathSuffix, const char *tocEntryName,
1088 /* following arguments are the same as doOpenChoice itself */
1089 const char *path, const char *type, const char *name,
1090 UDataMemoryIsAcceptable *isAcceptable, void *context,
1091 UErrorCode *subErrorCode,
1092 UErrorCode *pErrorCode)
1093 {
1094 UDataMemory *retVal = NULL;
1095 UDataMemory *pEntryData;
1096 const DataHeader *pHeader;
1097 UDataMemory *pCommonData;
1098 /* try to get common data. The loop is for platforms such as the 390 that do
1099 * not initially load the full set of ICU data. If the lookup of an ICU data item
1100 * fails, the full (but slower to load) set is loaded, the and the loop repeats,
1101 * trying the lookup again. Once the full set of ICU data is loaded, the loop wont
1102 * repeat because the full set will be checked the first time through.
1103 *
1104 * The loop also handles the fallback to a .dat file if the application linked
1105 * to the stub data library rather than a real library.
1106 */
1107 for (;;) {
1108 pCommonData=openCommonData(path, isICUData, subErrorCode); /** search for pkg **/
1109
1110 if(U_SUCCESS(*subErrorCode)) {
1111 int32_t length;
1112
1113 /* look up the data piece in the common data */
1114 pHeader=pCommonData->vFuncs->Lookup(pCommonData, tocEntryName, &length, subErrorCode);
1115 #ifdef UDATA_DEBUG
1116 fprintf(stderr, "%s: pHeader=%p - %s\n", tocEntryName, pHeader, u_errorName(*subErrorCode));
1117 #endif
1118
1119 if(pHeader!=NULL) {
1120 pEntryData = checkDataItem(pHeader, isAcceptable, context, type, name, subErrorCode, pErrorCode);
1121 #ifdef UDATA_DEBUG
1122 fprintf(stderr, "pEntryData=%p\n", pEntryData);
1123 #endif
1124 if (U_FAILURE(*pErrorCode)) {
1125 retVal = NULL;
1126 goto commonReturn;
1127 }
1128 if (pEntryData != NULL) {
1129 pEntryData->length = length;
1130 retVal = pEntryData;
1131 goto commonReturn;
1132 }
1133 }
1134 }
1135 /* Data wasn't found. If we were looking for an ICUData item and there is
1136 * more data available, load it and try again,
1137 * otherwise break out of this loop. */
1138 if (!(isICUData && pCommonData && extendICUData(pCommonData, subErrorCode))) {
1139 break;
1140 }
1141 }
1142
1143 commonReturn:
1144 return retVal;
1145 }
1146
1147 /*
1148 * A note on the ownership of Mapped Memory
1149 *
1150 * For common format files, ownership resides with the UDataMemory object
1151 * that lives in the cache of opened common data. These UDataMemorys are private
1152 * to the udata implementation, and are never seen directly by users.
1153 *
1154 * The UDataMemory objects returned to users will have the address of some desired
 *   data within the mapped region, but they won't have the mapping info itself, and thus
1156 * won't cause anything to be removed from memory when they are closed.
1157 *
1158 * For individual data files, the UDataMemory returned to the user holds the
1159 * information necessary to unmap the data on close. If the user independently
1160 * opens the same data file twice, two completely independent mappings will be made.
1161 * (There is no cache of opened data items from individual files, only a cache of
1162 * opened Common Data files, that is, files containing a collection of data items.)
1163 *
1164 * For common data passed in from the user via udata_setAppData() or
1165 * udata_setCommonData(), ownership remains with the user.
1166 *
1167 * UDataMemory objects themselves, as opposed to the memory they describe,
1168 * can be anywhere - heap, stack/local or global.
1169 * They have a flag to indicate when they're heap allocated and thus
1170 * must be deleted when closed.
1171 */
1172
1173
1174 /*----------------------------------------------------------------------------*
1175 * *
1176 * main data loading functions *
1177 * *
1178 *----------------------------------------------------------------------------*/
1179 static UDataMemory *
doOpenChoice(const char * path,const char * type,const char * name,UDataMemoryIsAcceptable * isAcceptable,void * context,UErrorCode * pErrorCode)1180 doOpenChoice(const char *path, const char *type, const char *name,
1181 UDataMemoryIsAcceptable *isAcceptable, void *context,
1182 UErrorCode *pErrorCode)
1183 {
1184 UDataMemory *retVal = NULL;
1185
1186 TinyString tocEntryName; /* entry name in tree format. ex: 'icudt28b/coll/ar.res' */
1187 TinyString tocEntryPath; /* entry name in path format. ex: 'icudt28b\\coll\\ar.res' */
1188
1189 TinyString pkgName;
1190 TinyString treeName;
1191 #if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR) /* '/' vs '\' */
1192 TinyString altSepPath;
1193 #endif
1194
1195 const char *dataPath;
1196
1197 int32_t tocEntrySuffixIndex;
1198 const char *tocEntryPathSuffix;
1199 UErrorCode subErrorCode=U_ZERO_ERROR;
1200 const char *treeChar;
1201
1202 UBool isICUData = FALSE;
1203
1204
1205 /* Is this path ICU data? */
1206 if(path == NULL ||
1207 !strcmp(path, U_ICUDATA_ALIAS) || /* "ICUDATA" */
1208 !uprv_strncmp(path, U_ICUDATA_NAME U_TREE_SEPARATOR_STRING, /* "icudt26e-" */
1209 uprv_strlen(U_ICUDATA_NAME U_TREE_SEPARATOR_STRING)) ||
1210 !uprv_strncmp(path, U_ICUDATA_ALIAS U_TREE_SEPARATOR_STRING, /* "ICUDATA-" */
1211 uprv_strlen(U_ICUDATA_ALIAS U_TREE_SEPARATOR_STRING))) {
1212 isICUData = TRUE;
1213 }
1214
1215 #if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR) /* Windows: try "foo\bar" and "foo/bar" */
1216 /* remap from alternate path char to the main one */
1217 TinyString_init(&altSepPath);
1218 if(path) {
1219 char *p;
1220 if((p=uprv_strchr(path,U_FILE_ALT_SEP_CHAR))) {
1221 TinyString_append(&altSepPath, path);
1222 while((p=uprv_strchr(altSepPath.s,U_FILE_ALT_SEP_CHAR))) {
1223 *p = U_FILE_SEP_CHAR;
1224 }
1225 #if defined (UDATA_DEBUG)
1226 fprintf(stderr, "Changed path from [%s] to [%s]\n", path, altSepPath.s);
1227 #endif
1228 path = altSepPath.s;
1229 }
1230 }
1231 #endif
1232
1233 TinyString_init(&tocEntryName);
1234 TinyString_init(&tocEntryPath);
1235
1236 TinyString_init(&pkgName);
1237 TinyString_init(&treeName);
1238
1239 /* ======= Set up strings */
1240 if(path==NULL) {
1241 TinyString_append(&pkgName, U_ICUDATA_NAME);
1242 } else {
1243 const char *pkg;
1244 const char *first;
1245 pkg = uprv_strrchr(path, U_FILE_SEP_CHAR);
1246 first = uprv_strchr(path, U_FILE_SEP_CHAR);
1247 if(uprv_pathIsAbsolute(path) || (pkg != first)) { /* more than one slash in the path- not a tree name */
1248 /* see if this is an /absolute/path/to/package path */
1249 if(pkg) {
1250 TinyString_append(&pkgName, pkg+1);
1251 } else {
1252 TinyString_append(&pkgName, path);
1253 }
1254 } else {
1255 treeChar = uprv_strchr(path, U_TREE_SEPARATOR);
1256 if(treeChar) {
1257 TinyString_append(&treeName, treeChar+1); /* following '-' */
1258 if(isICUData) {
1259 TinyString_append(&pkgName, U_ICUDATA_NAME);
1260 } else {
1261 TinyString_appendn(&pkgName, path, (int32_t)(treeChar-path));
1262 if (first == NULL) {
1263 /*
1264 This user data has no path, but there is a tree name.
1265 Look up the correct path from the data cache later.
1266 */
1267 path = pkgName.s;
1268 }
1269 }
1270 } else {
1271 if(isICUData) {
1272 TinyString_append(&pkgName, U_ICUDATA_NAME);
1273 } else {
1274 TinyString_append(&pkgName, path);
1275 }
1276 }
1277 }
1278 }
1279
1280 #ifdef UDATA_DEBUG
1281 fprintf(stderr, " P=%s T=%s\n", pkgName.s, treeName.s);
1282 #endif
1283
1284 /* setting up the entry name and file name
1285 * Make up a full name by appending the type to the supplied
1286 * name, assuming that a type was supplied.
1287 */
1288
1289 /* prepend the package */
1290 TinyString_append(&tocEntryName, pkgName.s);
1291 TinyString_append(&tocEntryPath, pkgName.s);
1292 tocEntrySuffixIndex = tocEntryName.length;
1293
1294 if(treeName.s[0]) {
1295 TinyString_append(&tocEntryName, U_TREE_ENTRY_SEP_STRING);
1296 TinyString_append(&tocEntryName, treeName.s);
1297
1298 TinyString_append(&tocEntryPath, U_FILE_SEP_STRING);
1299 TinyString_append(&tocEntryPath, treeName.s);
1300 }
1301
1302 TinyString_append(&tocEntryName, U_TREE_ENTRY_SEP_STRING);
1303 TinyString_append(&tocEntryPath, U_FILE_SEP_STRING);
1304 TinyString_append(&tocEntryName, name);
1305 TinyString_append(&tocEntryPath, name);
1306 if(type!=NULL && *type!=0) {
1307 TinyString_append(&tocEntryName, ".");
1308 TinyString_append(&tocEntryName, type);
1309 TinyString_append(&tocEntryPath, ".");
1310 TinyString_append(&tocEntryPath, type);
1311 }
1312 tocEntryPathSuffix = tocEntryPath.s+tocEntrySuffixIndex; /* suffix starts here */
1313
1314 #ifdef UDATA_DEBUG
1315 fprintf(stderr, " tocEntryName = %s\n", tocEntryName.s);
1316 fprintf(stderr, " tocEntryPath = %s\n", tocEntryName.s);
1317 #endif
1318
1319 if(path == NULL) {
1320 path = COMMON_DATA_NAME; /* "icudt26e" */
1321 }
1322
1323 /************************ Begin loop looking for ind. files ***************/
1324 #ifdef UDATA_DEBUG
1325 fprintf(stderr, "IND: inBasename = %s, pkg=%s\n", "(n/a)", packageNameFromPath(path));
1326 #endif
1327
1328 /* End of dealing with a null basename */
1329 dataPath = u_getDataDirectory();
1330
1331 /**** COMMON PACKAGE - only if packages are first. */
1332 if(gDataFileAccess == UDATA_PACKAGES_FIRST) {
1333 #ifdef UDATA_DEBUG
1334 fprintf(stderr, "Trying packages (UDATA_PACKAGES_FIRST)\n");
1335 #endif
1336 /* #2 */
1337 retVal = doLoadFromCommonData(isICUData,
1338 pkgName.s, dataPath, tocEntryPathSuffix, tocEntryName.s,
1339 path, type, name, isAcceptable, context, &subErrorCode, pErrorCode);
1340 if((retVal != NULL) || U_FAILURE(*pErrorCode)) {
1341 goto commonReturn;
1342 }
1343 }
1344
1345 /**** INDIVIDUAL FILES */
1346 if((gDataFileAccess==UDATA_PACKAGES_FIRST) ||
1347 (gDataFileAccess==UDATA_FILES_FIRST)) {
1348 #ifdef UDATA_DEBUG
1349 fprintf(stderr, "Trying individual files\n");
1350 #endif
1351 /* Check to make sure that there is a dataPath to iterate over */
1352 if ((dataPath && *dataPath) || !isICUData) {
1353 retVal = doLoadFromIndividualFiles(pkgName.s, dataPath, tocEntryPathSuffix,
1354 path, type, name, isAcceptable, context, &subErrorCode, pErrorCode);
1355 if((retVal != NULL) || U_FAILURE(*pErrorCode)) {
1356 goto commonReturn;
1357 }
1358 }
1359 }
1360
1361 /**** COMMON PACKAGE */
1362 if((gDataFileAccess==UDATA_ONLY_PACKAGES) ||
1363 (gDataFileAccess==UDATA_FILES_FIRST)) {
1364 #ifdef UDATA_DEBUG
1365 fprintf(stderr, "Trying packages (UDATA_ONLY_PACKAGES || UDATA_FILES_FIRST)\n");
1366 #endif
1367 retVal = doLoadFromCommonData(isICUData,
1368 pkgName.s, dataPath, tocEntryPathSuffix, tocEntryName.s,
1369 path, type, name, isAcceptable, context, &subErrorCode, pErrorCode);
1370 if((retVal != NULL) || U_FAILURE(*pErrorCode)) {
1371 goto commonReturn;
1372 }
1373 }
1374
1375 /* Load from DLL. If we haven't attempted package load, we also haven't had any chance to
1376 try a DLL (static or setCommonData/etc) load.
1377 If we ever have a "UDATA_ONLY_FILES", add it to the or list here. */
1378 if(gDataFileAccess==UDATA_NO_FILES) {
1379 #ifdef UDATA_DEBUG
1380 fprintf(stderr, "Trying common data (UDATA_NO_FILES)\n");
1381 #endif
1382 retVal = doLoadFromCommonData(isICUData,
1383 pkgName.s, "", tocEntryPathSuffix, tocEntryName.s,
1384 path, type, name, isAcceptable, context, &subErrorCode, pErrorCode);
1385 if((retVal != NULL) || U_FAILURE(*pErrorCode)) {
1386 goto commonReturn;
1387 }
1388 }
1389
1390 /* data not found */
1391 if(U_SUCCESS(*pErrorCode)) {
1392 if(U_SUCCESS(subErrorCode)) {
1393 /* file not found */
1394 *pErrorCode=U_FILE_ACCESS_ERROR;
1395 } else {
1396 /* entry point not found or rejected */
1397 *pErrorCode=subErrorCode;
1398 }
1399 }
1400
1401 commonReturn:
1402 TinyString_dt(&tocEntryName);
1403 TinyString_dt(&tocEntryPath);
1404 TinyString_dt(&pkgName);
1405 TinyString_dt(&treeName);
1406 #if (U_FILE_SEP_CHAR != U_FILE_ALT_SEP_CHAR)
1407 TinyString_dt(&altSepPath);
1408 #endif
1409 return retVal;
1410 }
1411
1412
1413
1414 /* API ---------------------------------------------------------------------- */
1415
1416 U_CAPI UDataMemory * U_EXPORT2
udata_open(const char * path,const char * type,const char * name,UErrorCode * pErrorCode)1417 udata_open(const char *path, const char *type, const char *name,
1418 UErrorCode *pErrorCode) {
1419 #ifdef UDATA_DEBUG
1420 fprintf(stderr, "udata_open(): Opening: %s : %s . %s\n", (path?path:"NULL"), name, type);
1421 fflush(stderr);
1422 #endif
1423
1424 if(pErrorCode==NULL || U_FAILURE(*pErrorCode)) {
1425 return NULL;
1426 } else if(name==NULL || *name==0) {
1427 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1428 return NULL;
1429 } else {
1430 return doOpenChoice(path, type, name, NULL, NULL, pErrorCode);
1431 }
1432 }
1433
1434
1435
1436 U_CAPI UDataMemory * U_EXPORT2
udata_openChoice(const char * path,const char * type,const char * name,UDataMemoryIsAcceptable * isAcceptable,void * context,UErrorCode * pErrorCode)1437 udata_openChoice(const char *path, const char *type, const char *name,
1438 UDataMemoryIsAcceptable *isAcceptable, void *context,
1439 UErrorCode *pErrorCode) {
1440 #ifdef UDATA_DEBUG
1441 fprintf(stderr, "udata_openChoice(): Opening: %s : %s . %s\n", (path?path:"NULL"), name, type);
1442 #endif
1443
1444 if(pErrorCode==NULL || U_FAILURE(*pErrorCode)) {
1445 return NULL;
1446 } else if(name==NULL || *name==0 || isAcceptable==NULL) {
1447 *pErrorCode=U_ILLEGAL_ARGUMENT_ERROR;
1448 return NULL;
1449 } else {
1450 return doOpenChoice(path, type, name, isAcceptable, context, pErrorCode);
1451 }
1452 }
1453
1454
1455
1456 U_CAPI void U_EXPORT2
udata_getInfo(UDataMemory * pData,UDataInfo * pInfo)1457 udata_getInfo(UDataMemory *pData, UDataInfo *pInfo) {
1458 if(pInfo!=NULL) {
1459 if(pData!=NULL && pData->pHeader!=NULL) {
1460 const UDataInfo *info=&pData->pHeader->info;
1461 uint16_t dataInfoSize=udata_getInfoSize(info);
1462 if(pInfo->size>dataInfoSize) {
1463 pInfo->size=dataInfoSize;
1464 }
1465 uprv_memcpy((uint16_t *)pInfo+1, (const uint16_t *)info+1, pInfo->size-2);
1466 if(info->isBigEndian!=U_IS_BIG_ENDIAN) {
1467 /* opposite endianness */
1468 uint16_t x=info->reservedWord;
1469 pInfo->reservedWord=(uint16_t)((x<<8)|(x>>8));
1470 }
1471 } else {
1472 pInfo->size=0;
1473 }
1474 }
1475 }
1476
1477
udata_setFileAccess(UDataFileAccess access,UErrorCode * status)1478 U_CAPI void U_EXPORT2 udata_setFileAccess(UDataFileAccess access, UErrorCode *status)
1479 {
1480 gDataFileAccess = access;
1481 }
1482
1483