1 // © 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ****************************************************************************** 5 * Copyright (C) 2015, International Business Machines Corporation and 6 * others. All Rights Reserved. 7 ****************************************************************************** 8 * 9 * File UNIFIEDCACHE.H - The ICU Unified cache. 10 ****************************************************************************** 11 */ 12 13 #ifndef __UNIFIED_CACHE_H__ 14 #define __UNIFIED_CACHE_H__ 15 16 #include "utypeinfo.h" // for 'typeid' to work 17 18 #include "unicode/uobject.h" 19 #include "unicode/locid.h" 20 #include "sharedobject.h" 21 #include "unicode/unistr.h" 22 #include "cstring.h" 23 #include "ustr_imp.h" 24 25 struct UHashtable; 26 struct UHashElement; 27 28 U_NAMESPACE_BEGIN 29 30 class UnifiedCache; 31 32 /** 33 * A base class for all cache keys. 34 */ 35 class U_COMMON_API CacheKeyBase : public UObject { 36 public: CacheKeyBase()37 CacheKeyBase() : fCreationStatus(U_ZERO_ERROR), fIsPrimary(false) {} 38 39 /** 40 * Copy constructor. Needed to support cloning. 41 */ CacheKeyBase(const CacheKeyBase & other)42 CacheKeyBase(const CacheKeyBase &other) 43 : UObject(other), fCreationStatus(other.fCreationStatus), fIsPrimary(false) { } 44 virtual ~CacheKeyBase(); 45 46 /** 47 * Returns the hash code for this object. 48 */ 49 virtual int32_t hashCode() const = 0; 50 51 /** 52 * Clones this object polymorphically. Caller owns returned value. 53 */ 54 virtual CacheKeyBase *clone() const = 0; 55 56 /** 57 * Equality operator. 58 */ 59 virtual UBool operator == (const CacheKeyBase &other) const = 0; 60 61 /** 62 * Create a new object for this key. Called by cache on cache miss. 63 * createObject must add a reference to the object it returns. Note 64 * that getting an object from the cache and returning it without calling 65 * removeRef on it satisfies this requirement. It can also return NULL 66 * and set status to an error. 67 * 68 * @param creationContext the context in which the object is being 69 * created. May be NULL. 70 * @param status Implementations can return a failure here. 71 * In addition, implementations may return a 72 * non NULL object and set a warning status. 73 */ 74 virtual const SharedObject *createObject( 75 const void *creationContext, UErrorCode &status) const = 0; 76 77 /** 78 * Writes a description of this key to buffer and returns buffer. Written 79 * description is NULL terminated. 80 */ 81 virtual char *writeDescription(char *buffer, int32_t bufSize) const = 0; 82 83 /** 84 * Inequality operator. 85 */ 86 UBool operator != (const CacheKeyBase &other) const { 87 return !(*this == other); 88 } 89 private: 90 mutable UErrorCode fCreationStatus; 91 mutable UBool fIsPrimary; 92 friend class UnifiedCache; 93 }; 94 95 96 97 /** 98 * Templated version of CacheKeyBase. 99 * A key of type LocaleCacheKey<T> maps to a value of type T. 100 */ 101 template<typename T> 102 class CacheKey : public CacheKeyBase { 103 public: ~CacheKey()104 virtual ~CacheKey() { } 105 /** 106 * The template parameter, T, determines the hash code returned. 107 */ hashCode()108 virtual int32_t hashCode() const { 109 const char *s = typeid(T).name(); 110 return ustr_hashCharsN(s, static_cast<int32_t>(uprv_strlen(s))); 111 } 112 113 /** 114 * Use the value type, T, as the description. 115 */ writeDescription(char * buffer,int32_t bufLen)116 virtual char *writeDescription(char *buffer, int32_t bufLen) const { 117 const char *s = typeid(T).name(); 118 uprv_strncpy(buffer, s, bufLen); 119 buffer[bufLen - 1] = 0; 120 return buffer; 121 } 122 123 /** 124 * Two objects are equal if they are of the same type. 125 */ 126 virtual UBool operator == (const CacheKeyBase &other) const { 127 return typeid(*this) == typeid(other); 128 } 129 }; 130 131 /** 132 * Cache key based on locale. 133 * A key of type LocaleCacheKey<T> maps to a value of type T. 134 */ 135 template<typename T> 136 class LocaleCacheKey : public CacheKey<T> { 137 protected: 138 Locale fLoc; 139 public: LocaleCacheKey(const Locale & loc)140 LocaleCacheKey(const Locale &loc) : fLoc(loc) {} LocaleCacheKey(const LocaleCacheKey<T> & other)141 LocaleCacheKey(const LocaleCacheKey<T> &other) 142 : CacheKey<T>(other), fLoc(other.fLoc) { } ~LocaleCacheKey()143 virtual ~LocaleCacheKey() { } hashCode()144 virtual int32_t hashCode() const { 145 return (int32_t)(37u * (uint32_t)CacheKey<T>::hashCode() + (uint32_t)fLoc.hashCode()); 146 } 147 virtual UBool operator == (const CacheKeyBase &other) const { 148 // reflexive 149 if (this == &other) { 150 return true; 151 } 152 if (!CacheKey<T>::operator == (other)) { 153 return false; 154 } 155 // We know this and other are of same class because operator== on 156 // CacheKey returned true. 157 const LocaleCacheKey<T> *fOther = 158 static_cast<const LocaleCacheKey<T> *>(&other); 159 return fLoc == fOther->fLoc; 160 } clone()161 virtual CacheKeyBase *clone() const { 162 return new LocaleCacheKey<T>(*this); 163 } 164 virtual const T *createObject( 165 const void *creationContext, UErrorCode &status) const; 166 /** 167 * Use the locale id as the description. 168 */ writeDescription(char * buffer,int32_t bufLen)169 virtual char *writeDescription(char *buffer, int32_t bufLen) const { 170 const char *s = fLoc.getName(); 171 uprv_strncpy(buffer, s, bufLen); 172 buffer[bufLen - 1] = 0; 173 return buffer; 174 } 175 176 }; 177 178 /** 179 * The unified cache. A singleton type. 180 * Design doc here: 181 * https://docs.google.com/document/d/1RwGQJs4N4tawNbf809iYDRCvXoMKqDJihxzYt1ysmd8/edit?usp=sharing 182 */ 183 class U_COMMON_API UnifiedCache : public UnifiedCacheBase { 184 public: 185 /** 186 * @internal 187 * Do not call directly. Instead use UnifiedCache::getInstance() as 188 * there should be only one UnifiedCache in an application. 189 */ 190 UnifiedCache(UErrorCode &status); 191 192 /** 193 * Return a pointer to the global cache instance. 194 */ 195 static UnifiedCache *getInstance(UErrorCode &status); 196 197 /** 198 * Fetches a value from the cache by key. Equivalent to 199 * get(key, NULL, ptr, status); 200 */ 201 template<typename T> get(const CacheKey<T> & key,const T * & ptr,UErrorCode & status)202 void get( 203 const CacheKey<T>& key, 204 const T *&ptr, 205 UErrorCode &status) const { 206 get(key, NULL, ptr, status); 207 } 208 209 /** 210 * Fetches value from the cache by key. 211 * 212 * @param key the cache key. 213 * @param creationContext passed verbatim to createObject method of key 214 * @param ptr On entry, ptr must be NULL or be included if 215 * the reference count of the object it points 216 * to. On exit, ptr points to the fetched object 217 * from the cache or is left unchanged on 218 * failure. Caller must call removeRef on ptr 219 * if set to a non NULL value. 220 * @param status Any error returned here. May be set to a 221 * warning value even if ptr is set. 222 */ 223 template<typename T> get(const CacheKey<T> & key,const void * creationContext,const T * & ptr,UErrorCode & status)224 void get( 225 const CacheKey<T>& key, 226 const void *creationContext, 227 const T *&ptr, 228 UErrorCode &status) const { 229 if (U_FAILURE(status)) { 230 return; 231 } 232 UErrorCode creationStatus = U_ZERO_ERROR; 233 const SharedObject *value = NULL; 234 _get(key, value, creationContext, creationStatus); 235 const T *tvalue = (const T *) value; 236 if (U_SUCCESS(creationStatus)) { 237 SharedObject::copyPtr(tvalue, ptr); 238 } 239 SharedObject::clearPtr(tvalue); 240 // Take care not to overwrite a warning status passed in with 241 // another warning or U_ZERO_ERROR. 242 if (status == U_ZERO_ERROR || U_FAILURE(creationStatus)) { 243 status = creationStatus; 244 } 245 } 246 247 #ifdef UNIFIED_CACHE_DEBUG 248 /** 249 * Dumps the contents of this cache to standard error. Used for testing of 250 * cache only. 251 */ 252 void dumpContents() const; 253 #endif 254 255 /** 256 * Convenience method to get a value of type T from cache for a 257 * particular locale with creationContext == NULL. 258 * @param loc the locale 259 * @param ptr On entry, must be NULL or included in the ref count 260 * of the object to which it points. 261 * On exit, fetched value stored here or is left 262 * unchanged on failure. Caller must call removeRef on 263 * ptr if set to a non NULL value. 264 * @param status Any error returned here. May be set to a 265 * warning value even if ptr is set. 266 */ 267 template<typename T> getByLocale(const Locale & loc,const T * & ptr,UErrorCode & status)268 static void getByLocale( 269 const Locale &loc, const T *&ptr, UErrorCode &status) { 270 const UnifiedCache *cache = getInstance(status); 271 if (U_FAILURE(status)) { 272 return; 273 } 274 cache->get(LocaleCacheKey<T>(loc), ptr, status); 275 } 276 277 #ifdef UNIFIED_CACHE_DEBUG 278 /** 279 * Dumps the cache contents to stderr. For testing only. 280 */ 281 static void dump(); 282 #endif 283 284 /** 285 * Returns the number of keys in this cache. For testing only. 286 */ 287 int32_t keyCount() const; 288 289 /** 290 * Removes any values from cache that are not referenced outside 291 * the cache. 292 */ 293 void flush() const; 294 295 /** 296 * Configures at what point evcition of unused entries will begin. 297 * Eviction is triggered whenever the number of evictable keys exeeds 298 * BOTH count AND (number of in-use items) * (percentageOfInUseItems / 100). 299 * Once the number of unused entries drops below one of these, 300 * eviction ceases. Because eviction happens incrementally, 301 * the actual unused entry count may exceed both these numbers 302 * from time to time. 303 * 304 * A cache entry is defined as unused if it is not essential to guarantee 305 * that for a given key X, the cache returns the same reference to the 306 * same value as long as the client already holds a reference to that 307 * value. 308 * 309 * If this method is never called, the default settings are 1000 and 100%. 310 * 311 * Although this method is thread-safe, it is designed to be called at 312 * application startup. If it is called in the middle of execution, it 313 * will have no immediate effect on the cache. However over time, the 314 * cache will perform eviction slices in an attempt to honor the new 315 * settings. 316 * 317 * If a client already holds references to many different unique values 318 * in the cache such that the number of those unique values far exeeds 319 * "count" then the cache may not be able to maintain this maximum. 320 * However, if this happens, the cache still guarantees that the number of 321 * unused entries will remain only a small percentage of the total cache 322 * size. 323 * 324 * If the parameters passed are negative, setEvctionPolicy sets status to 325 * U_ILLEGAL_ARGUMENT_ERROR. 326 */ 327 void setEvictionPolicy( 328 int32_t count, int32_t percentageOfInUseItems, UErrorCode &status); 329 330 331 /** 332 * Returns how many entries have been auto evicted during the lifetime 333 * of this cache. This only includes auto evicted entries, not 334 * entries evicted because of a call to flush(). 335 */ 336 int64_t autoEvictedCount() const; 337 338 /** 339 * Returns the unused entry count in this cache. For testing only, 340 * Regular clients will not need this. 341 */ 342 int32_t unusedCount() const; 343 344 virtual void handleUnreferencedObject() const; 345 virtual ~UnifiedCache(); 346 347 private: 348 UHashtable *fHashtable; 349 mutable int32_t fEvictPos; 350 mutable int32_t fNumValuesTotal; 351 mutable int32_t fNumValuesInUse; 352 int32_t fMaxUnused; 353 int32_t fMaxPercentageOfInUse; 354 mutable int64_t fAutoEvictedCount; 355 SharedObject *fNoValue; 356 357 UnifiedCache(const UnifiedCache &other); 358 UnifiedCache &operator=(const UnifiedCache &other); 359 360 /** 361 * Flushes the contents of the cache. If cache values hold references to other 362 * cache values then _flush should be called in a loop until it returns false. 363 * 364 * On entry, gCacheMutex must be held. 365 * On exit, those values with are evictable are flushed. 366 * 367 * @param all if false flush evictable items only, which are those with no external 368 * references, plus those that can be safely recreated.<br> 369 * if true, flush all elements. Any values (sharedObjects) with remaining 370 * hard (external) references are not deleted, but are detached from 371 * the cache, so that a subsequent removeRefs can delete them. 372 * _flush is not thread safe when all is true. 373 * @return true if any value in cache was flushed or false otherwise. 374 */ 375 UBool _flush(UBool all) const; 376 377 /** 378 * Gets value out of cache. 379 * On entry. gCacheMutex must not be held. value must be NULL. status 380 * must be U_ZERO_ERROR. 381 * On exit. value and status set to what is in cache at key or on cache 382 * miss the key's createObject() is called and value and status are set to 383 * the result of that. In this latter case, best effort is made to add the 384 * value and status to the cache. If createObject() fails to create a value, 385 * fNoValue is stored in cache, and value is set to NULL. Caller must call 386 * removeRef on value if non NULL. 387 */ 388 void _get( 389 const CacheKeyBase &key, 390 const SharedObject *&value, 391 const void *creationContext, 392 UErrorCode &status) const; 393 394 /** 395 * Attempts to fetch value and status for key from cache. 396 * On entry, gCacheMutex must not be held value must be NULL and status must 397 * be U_ZERO_ERROR. 398 * On exit, either returns false (In this 399 * case caller should try to create the object) or returns true with value 400 * pointing to the fetched value and status set to fetched status. When 401 * false is returned status may be set to failure if an in progress hash 402 * entry could not be made but value will remain unchanged. When true is 403 * returned, caller must call removeRef() on value. 404 */ 405 UBool _poll( 406 const CacheKeyBase &key, 407 const SharedObject *&value, 408 UErrorCode &status) const; 409 410 /** 411 * Places a new value and creationStatus in the cache for the given key. 412 * On entry, gCacheMutex must be held. key must not exist in the cache. 413 * On exit, value and creation status placed under key. Soft reference added 414 * to value on successful add. On error sets status. 415 */ 416 void _putNew( 417 const CacheKeyBase &key, 418 const SharedObject *value, 419 const UErrorCode creationStatus, 420 UErrorCode &status) const; 421 422 /** 423 * Places value and status at key if there is no value at key or if cache 424 * entry for key is in progress. Otherwise, it leaves the current value and 425 * status there. 426 * 427 * On entry. gCacheMutex must not be held. Value must be 428 * included in the reference count of the object to which it points. 429 * 430 * On exit, value and status are changed to what was already in the cache if 431 * something was there and not in progress. Otherwise, value and status are left 432 * unchanged in which case they are placed in the cache on a best-effort basis. 433 * Caller must call removeRef() on value. 434 */ 435 void _putIfAbsentAndGet( 436 const CacheKeyBase &key, 437 const SharedObject *&value, 438 UErrorCode &status) const; 439 440 /** 441 * Returns the next element in the cache round robin style. 442 * Returns nullptr if the cache is empty. 443 * On entry, gCacheMutex must be held. 444 */ 445 const UHashElement *_nextElement() const; 446 447 /** 448 * Return the number of cache items that would need to be evicted 449 * to bring usage into conformance with eviction policy. 450 * 451 * An item corresponds to an entry in the hash table, a hash table element. 452 * 453 * On entry, gCacheMutex must be held. 454 */ 455 int32_t _computeCountOfItemsToEvict() const; 456 457 /** 458 * Run an eviction slice. 459 * On entry, gCacheMutex must be held. 460 * _runEvictionSlice runs a slice of the evict pipeline by examining the next 461 * 10 entries in the cache round robin style evicting them if they are eligible. 462 */ 463 void _runEvictionSlice() const; 464 465 /** 466 * Register a primary cache entry. A primary key is the first key to create 467 * a given SharedObject value. Subsequent keys whose create function 468 * produce referneces to an already existing SharedObject are not primary - 469 * they can be evicted and subsequently recreated. 470 * 471 * On entry, gCacheMutex must be held. 472 * On exit, items in use count incremented, entry is marked as a primary 473 * entry, and value registered with cache so that subsequent calls to 474 * addRef() and removeRef() on it correctly interact with the cache. 475 */ 476 void _registerPrimary(const CacheKeyBase *theKey, const SharedObject *value) const; 477 478 /** 479 * Store a value and creation error status in given hash entry. 480 * On entry, gCacheMutex must be held. Hash entry element must be in progress. 481 * value must be non NULL. 482 * On Exit, soft reference added to value. value and status stored in hash 483 * entry. Soft reference removed from previous stored value. Waiting 484 * threads notified. 485 */ 486 void _put( 487 const UHashElement *element, 488 const SharedObject *value, 489 const UErrorCode status) const; 490 /** 491 * Remove a soft reference, and delete the SharedObject if no references remain. 492 * To be used from within the UnifiedCache implementation only. 493 * gCacheMutex must be held by caller. 494 * @param value the SharedObject to be acted on. 495 */ 496 void removeSoftRef(const SharedObject *value) const; 497 498 /** 499 * Increment the hard reference count of the given SharedObject. 500 * gCacheMutex must be held by the caller. 501 * Update numValuesEvictable on transitions between zero and one reference. 502 * 503 * @param value The SharedObject to be referenced. 504 * @return the hard reference count after the addition. 505 */ 506 int32_t addHardRef(const SharedObject *value) const; 507 508 /** 509 * Decrement the hard reference count of the given SharedObject. 510 * gCacheMutex must be held by the caller. 511 * Update numValuesEvictable on transitions between one and zero reference. 512 * 513 * @param value The SharedObject to be referenced. 514 * @return the hard reference count after the removal. 515 */ 516 int32_t removeHardRef(const SharedObject *value) const; 517 518 519 #ifdef UNIFIED_CACHE_DEBUG 520 void _dumpContents() const; 521 #endif 522 523 /** 524 * Fetch value and error code from a particular hash entry. 525 * On entry, gCacheMutex must be held. value must be either NULL or must be 526 * included in the ref count of the object to which it points. 527 * On exit, value and status set to what is in the hash entry. Caller must 528 * eventually call removeRef on value. 529 * If hash entry is in progress, value will be set to gNoValue and status will 530 * be set to U_ZERO_ERROR. 531 */ 532 void _fetch(const UHashElement *element, const SharedObject *&value, 533 UErrorCode &status) const; 534 535 /** 536 * Determine if given hash entry is in progress. 537 * On entry, gCacheMutex must be held. 538 */ 539 UBool _inProgress(const UHashElement *element) const; 540 541 /** 542 * Determine if given hash entry is in progress. 543 * On entry, gCacheMutex must be held. 544 */ 545 UBool _inProgress(const SharedObject *theValue, UErrorCode creationStatus) const; 546 547 /** 548 * Determine if given hash entry is eligible for eviction. 549 * On entry, gCacheMutex must be held. 550 */ 551 UBool _isEvictable(const UHashElement *element) const; 552 }; 553 554 U_NAMESPACE_END 555 556 #endif 557