1 // © 2016 and later: Unicode, Inc. and others.
2 // License & terms of use: http://www.unicode.org/copyright.html
3 /*
4 ******************************************************************************
5 * Copyright (C) 2015, International Business Machines Corporation and
6 * others. All Rights Reserved.
7 ******************************************************************************
8 *
9 * File UNIFIEDCACHE.H - The ICU Unified cache.
10 ******************************************************************************
11 */
12 
13 #ifndef __UNIFIED_CACHE_H__
14 #define __UNIFIED_CACHE_H__
15 
16 #include "utypeinfo.h"  // for 'typeid' to work
17 
18 #include "unicode/uobject.h"
19 #include "unicode/locid.h"
20 #include "sharedobject.h"
21 #include "unicode/unistr.h"
22 #include "cstring.h"
23 #include "ustr_imp.h"
24 
25 struct UHashtable;
26 struct UHashElement;
27 
28 U_NAMESPACE_BEGIN
29 
30 class UnifiedCache;
31 
32 /**
33  * A base class for all cache keys.
34  */
35 class U_COMMON_API CacheKeyBase : public UObject {
36  public:
CacheKeyBase()37    CacheKeyBase() : fCreationStatus(U_ZERO_ERROR), fIsPrimary(false) {}
38 
39    /**
40     * Copy constructor. Needed to support cloning.
41     */
CacheKeyBase(const CacheKeyBase & other)42    CacheKeyBase(const CacheKeyBase &other)
43            : UObject(other), fCreationStatus(other.fCreationStatus), fIsPrimary(false) { }
44    virtual ~CacheKeyBase();
45 
46    /**
47     * Returns the hash code for this object.
48     */
49    virtual int32_t hashCode() const = 0;
50 
51    /**
52     * Clones this object polymorphically. Caller owns returned value.
53     */
54    virtual CacheKeyBase *clone() const = 0;
55 
56    /**
57     * Equality operator.
58     */
59    virtual UBool operator == (const CacheKeyBase &other) const = 0;
60 
61    /**
62     * Create a new object for this key. Called by cache on cache miss.
63     * createObject must add a reference to the object it returns. Note
64     * that getting an object from the cache and returning it without calling
65     * removeRef on it satisfies this requirement. It can also return NULL
66     * and set status to an error.
67     *
68     * @param creationContext the context in which the object is being
69     *                        created. May be NULL.
70     * @param status          Implementations can return a failure here.
71     *                        In addition, implementations may return a
72     *                        non NULL object and set a warning status.
73     */
74    virtual const SharedObject *createObject(
75            const void *creationContext, UErrorCode &status) const = 0;
76 
77    /**
78     * Writes a description of this key to buffer and returns buffer. Written
79     * description is NULL terminated.
80     */
81    virtual char *writeDescription(char *buffer, int32_t bufSize) const = 0;
82 
83    /**
84     * Inequality operator.
85     */
86    UBool operator != (const CacheKeyBase &other) const {
87        return !(*this == other);
88    }
89  private:
90    mutable UErrorCode fCreationStatus;
91    mutable UBool fIsPrimary;
92    friend class UnifiedCache;
93 };
94 
95 
96 
97 /**
98  * Templated version of CacheKeyBase.
99  * A key of type LocaleCacheKey<T> maps to a value of type T.
100  */
101 template<typename T>
102 class CacheKey : public CacheKeyBase {
103  public:
~CacheKey()104    virtual ~CacheKey() { }
105    /**
106     * The template parameter, T, determines the hash code returned.
107     */
hashCode()108    virtual int32_t hashCode() const {
109        const char *s = typeid(T).name();
110        return ustr_hashCharsN(s, static_cast<int32_t>(uprv_strlen(s)));
111    }
112 
113    /**
114     * Use the value type, T,  as the description.
115     */
writeDescription(char * buffer,int32_t bufLen)116    virtual char *writeDescription(char *buffer, int32_t bufLen) const {
117        const char *s = typeid(T).name();
118        uprv_strncpy(buffer, s, bufLen);
119        buffer[bufLen - 1] = 0;
120        return buffer;
121    }
122 
123    /**
124     * Two objects are equal if they are of the same type.
125     */
126    virtual UBool operator == (const CacheKeyBase &other) const {
127        return typeid(*this) == typeid(other);
128    }
129 };
130 
131 /**
132  * Cache key based on locale.
133  * A key of type LocaleCacheKey<T> maps to a value of type T.
134  */
135 template<typename T>
136 class LocaleCacheKey : public CacheKey<T> {
137  protected:
138    Locale   fLoc;
139  public:
LocaleCacheKey(const Locale & loc)140    LocaleCacheKey(const Locale &loc) : fLoc(loc) {}
LocaleCacheKey(const LocaleCacheKey<T> & other)141    LocaleCacheKey(const LocaleCacheKey<T> &other)
142            : CacheKey<T>(other), fLoc(other.fLoc) { }
~LocaleCacheKey()143    virtual ~LocaleCacheKey() { }
hashCode()144    virtual int32_t hashCode() const {
145        return (int32_t)(37u * (uint32_t)CacheKey<T>::hashCode() + (uint32_t)fLoc.hashCode());
146    }
147    virtual UBool operator == (const CacheKeyBase &other) const {
148        // reflexive
149        if (this == &other) {
150            return true;
151        }
152        if (!CacheKey<T>::operator == (other)) {
153            return false;
154        }
155        // We know this and other are of same class because operator== on
156        // CacheKey returned true.
157        const LocaleCacheKey<T> *fOther =
158                static_cast<const LocaleCacheKey<T> *>(&other);
159        return fLoc == fOther->fLoc;
160    }
clone()161    virtual CacheKeyBase *clone() const {
162        return new LocaleCacheKey<T>(*this);
163    }
164    virtual const T *createObject(
165            const void *creationContext, UErrorCode &status) const;
166    /**
167     * Use the locale id as the description.
168     */
writeDescription(char * buffer,int32_t bufLen)169    virtual char *writeDescription(char *buffer, int32_t bufLen) const {
170        const char *s = fLoc.getName();
171        uprv_strncpy(buffer, s, bufLen);
172        buffer[bufLen - 1] = 0;
173        return buffer;
174    }
175 
176 };
177 
178 /**
179  * The unified cache. A singleton type.
180  * Design doc here:
181  * https://docs.google.com/document/d/1RwGQJs4N4tawNbf809iYDRCvXoMKqDJihxzYt1ysmd8/edit?usp=sharing
182  */
183 class U_COMMON_API UnifiedCache : public UnifiedCacheBase {
184  public:
185    /**
186     * @internal
187     * Do not call directly. Instead use UnifiedCache::getInstance() as
188     * there should be only one UnifiedCache in an application.
189     */
190    UnifiedCache(UErrorCode &status);
191 
192    /**
193     * Return a pointer to the global cache instance.
194     */
195    static UnifiedCache *getInstance(UErrorCode &status);
196 
197    /**
198     * Fetches a value from the cache by key. Equivalent to
199     * get(key, NULL, ptr, status);
200     */
201    template<typename T>
get(const CacheKey<T> & key,const T * & ptr,UErrorCode & status)202    void get(
203            const CacheKey<T>& key,
204            const T *&ptr,
205            UErrorCode &status) const {
206        get(key, NULL, ptr, status);
207    }
208 
209    /**
210     * Fetches value from the cache by key.
211     *
212     * @param key             the cache key.
213     * @param creationContext passed verbatim to createObject method of key
214     * @param ptr             On entry, ptr must be NULL or be included if
215     *                        the reference count of the object it points
216     *                        to. On exit, ptr points to the fetched object
217     *                        from the cache or is left unchanged on
218     *                        failure. Caller must call removeRef on ptr
219     *                        if set to a non NULL value.
220     * @param status          Any error returned here. May be set to a
221     *                        warning value even if ptr is set.
222     */
223    template<typename T>
get(const CacheKey<T> & key,const void * creationContext,const T * & ptr,UErrorCode & status)224    void get(
225            const CacheKey<T>& key,
226            const void *creationContext,
227            const T *&ptr,
228            UErrorCode &status) const {
229        if (U_FAILURE(status)) {
230            return;
231        }
232        UErrorCode creationStatus = U_ZERO_ERROR;
233        const SharedObject *value = NULL;
234        _get(key, value, creationContext, creationStatus);
235        const T *tvalue = (const T *) value;
236        if (U_SUCCESS(creationStatus)) {
237            SharedObject::copyPtr(tvalue, ptr);
238        }
239        SharedObject::clearPtr(tvalue);
240        // Take care not to overwrite a warning status passed in with
241        // another warning or U_ZERO_ERROR.
242        if (status == U_ZERO_ERROR || U_FAILURE(creationStatus)) {
243            status = creationStatus;
244        }
245    }
246 
247 #ifdef UNIFIED_CACHE_DEBUG
248    /**
249     * Dumps the contents of this cache to standard error. Used for testing of
250     * cache only.
251     */
252    void dumpContents() const;
253 #endif
254 
255    /**
256     * Convenience method to get a value of type T from cache for a
257     * particular locale with creationContext == NULL.
258     * @param loc    the locale
259     * @param ptr    On entry, must be NULL or included in the ref count
260     *               of the object to which it points.
261     *               On exit, fetched value stored here or is left
262     *               unchanged on failure. Caller must call removeRef on
263     *               ptr if set to a non NULL value.
264     * @param status Any error returned here. May be set to a
265     *               warning value even if ptr is set.
266     */
267    template<typename T>
getByLocale(const Locale & loc,const T * & ptr,UErrorCode & status)268    static void getByLocale(
269            const Locale &loc, const T *&ptr, UErrorCode &status) {
270        const UnifiedCache *cache = getInstance(status);
271        if (U_FAILURE(status)) {
272            return;
273        }
274        cache->get(LocaleCacheKey<T>(loc), ptr, status);
275    }
276 
277 #ifdef UNIFIED_CACHE_DEBUG
278    /**
279     * Dumps the cache contents to stderr. For testing only.
280     */
281    static void dump();
282 #endif
283 
284    /**
285     * Returns the number of keys in this cache. For testing only.
286     */
287    int32_t keyCount() const;
288 
289    /**
290     * Removes any values from cache that are not referenced outside
291     * the cache.
292     */
293    void flush() const;
294 
295    /**
296     * Configures at what point evcition of unused entries will begin.
297     * Eviction is triggered whenever the number of evictable keys exeeds
298     * BOTH count AND (number of in-use items) * (percentageOfInUseItems / 100).
299     * Once the number of unused entries drops below one of these,
300     * eviction ceases. Because eviction happens incrementally,
301     * the actual unused entry count may exceed both these numbers
302     * from time to time.
303     *
304     * A cache entry is defined as unused if it is not essential to guarantee
305     * that for a given key X, the cache returns the same reference to the
306     * same value as long as the client already holds a reference to that
307     * value.
308     *
309     * If this method is never called, the default settings are 1000 and 100%.
310     *
311     * Although this method is thread-safe, it is designed to be called at
312     * application startup. If it is called in the middle of execution, it
313     * will have no immediate effect on the cache. However over time, the
314     * cache will perform eviction slices in an attempt to honor the new
315     * settings.
316     *
317     * If a client already holds references to many different unique values
318     * in the cache such that the number of those unique values far exeeds
319     * "count" then the cache may not be able to maintain this maximum.
320     * However, if this happens, the cache still guarantees that the number of
321     * unused entries will remain only a small percentage of the total cache
322     * size.
323     *
324     * If the parameters passed are negative, setEvctionPolicy sets status to
325     * U_ILLEGAL_ARGUMENT_ERROR.
326     */
327    void setEvictionPolicy(
328            int32_t count, int32_t percentageOfInUseItems, UErrorCode &status);
329 
330 
331    /**
332     * Returns how many entries have been auto evicted during the lifetime
333     * of this cache. This only includes auto evicted entries, not
334     * entries evicted because of a call to flush().
335     */
336    int64_t autoEvictedCount() const;
337 
338    /**
339     * Returns the unused entry count in this cache. For testing only,
340     * Regular clients will not need this.
341     */
342    int32_t unusedCount() const;
343 
344    virtual void handleUnreferencedObject() const;
345    virtual ~UnifiedCache();
346 
347  private:
348    UHashtable *fHashtable;
349    mutable int32_t fEvictPos;
350    mutable int32_t fNumValuesTotal;
351    mutable int32_t fNumValuesInUse;
352    int32_t fMaxUnused;
353    int32_t fMaxPercentageOfInUse;
354    mutable int64_t fAutoEvictedCount;
355    SharedObject *fNoValue;
356 
357    UnifiedCache(const UnifiedCache &other);
358    UnifiedCache &operator=(const UnifiedCache &other);
359 
360    /**
361     * Flushes the contents of the cache. If cache values hold references to other
362     * cache values then _flush should be called in a loop until it returns false.
363     *
364     * On entry, gCacheMutex must be held.
365     * On exit, those values with are evictable are flushed.
366     *
367     *  @param all if false flush evictable items only, which are those with no external
368     *                    references, plus those that can be safely recreated.<br>
369     *            if true, flush all elements. Any values (sharedObjects) with remaining
370     *                     hard (external) references are not deleted, but are detached from
371     *                     the cache, so that a subsequent removeRefs can delete them.
372     *                     _flush is not thread safe when all is true.
373     *   @return true if any value in cache was flushed or false otherwise.
374     */
375    UBool _flush(UBool all) const;
376 
377    /**
378     * Gets value out of cache.
379     * On entry. gCacheMutex must not be held. value must be NULL. status
380     * must be U_ZERO_ERROR.
381     * On exit. value and status set to what is in cache at key or on cache
382     * miss the key's createObject() is called and value and status are set to
383     * the result of that. In this latter case, best effort is made to add the
384     * value and status to the cache. If createObject() fails to create a value,
385     * fNoValue is stored in cache, and value is set to NULL. Caller must call
386     * removeRef on value if non NULL.
387     */
388    void _get(
389            const CacheKeyBase &key,
390            const SharedObject *&value,
391            const void *creationContext,
392            UErrorCode &status) const;
393 
394     /**
395      * Attempts to fetch value and status for key from cache.
396      * On entry, gCacheMutex must not be held value must be NULL and status must
397      * be U_ZERO_ERROR.
398      * On exit, either returns false (In this
399      * case caller should try to create the object) or returns true with value
400      * pointing to the fetched value and status set to fetched status. When
401      * false is returned status may be set to failure if an in progress hash
402      * entry could not be made but value will remain unchanged. When true is
403      * returned, caller must call removeRef() on value.
404      */
405     UBool _poll(
406             const CacheKeyBase &key,
407             const SharedObject *&value,
408             UErrorCode &status) const;
409 
410     /**
411      * Places a new value and creationStatus in the cache for the given key.
412      * On entry, gCacheMutex must be held. key must not exist in the cache.
413      * On exit, value and creation status placed under key. Soft reference added
414      * to value on successful add. On error sets status.
415      */
416     void _putNew(
417         const CacheKeyBase &key,
418         const SharedObject *value,
419         const UErrorCode creationStatus,
420         UErrorCode &status) const;
421 
422     /**
423      * Places value and status at key if there is no value at key or if cache
424      * entry for key is in progress. Otherwise, it leaves the current value and
425      * status there.
426      *
427      * On entry. gCacheMutex must not be held. Value must be
428      * included in the reference count of the object to which it points.
429      *
430      * On exit, value and status are changed to what was already in the cache if
431      * something was there and not in progress. Otherwise, value and status are left
432      * unchanged in which case they are placed in the cache on a best-effort basis.
433      * Caller must call removeRef() on value.
434      */
435    void _putIfAbsentAndGet(
436            const CacheKeyBase &key,
437            const SharedObject *&value,
438            UErrorCode &status) const;
439 
440     /**
441      * Returns the next element in the cache round robin style.
442      * Returns nullptr if the cache is empty.
443      * On entry, gCacheMutex must be held.
444      */
445     const UHashElement *_nextElement() const;
446 
447    /**
448     * Return the number of cache items that would need to be evicted
449     * to bring usage into conformance with eviction policy.
450     *
451     * An item corresponds to an entry in the hash table, a hash table element.
452     *
453     * On entry, gCacheMutex must be held.
454     */
455    int32_t _computeCountOfItemsToEvict() const;
456 
457    /**
458     * Run an eviction slice.
459     * On entry, gCacheMutex must be held.
460     * _runEvictionSlice runs a slice of the evict pipeline by examining the next
461     * 10 entries in the cache round robin style evicting them if they are eligible.
462     */
463    void _runEvictionSlice() const;
464 
465    /**
466     * Register a primary cache entry. A primary key is the first key to create
467     * a given  SharedObject value. Subsequent keys whose create function
468     * produce referneces to an already existing SharedObject are not primary -
469     * they can be evicted and subsequently recreated.
470     *
471     * On entry, gCacheMutex must be held.
472     * On exit, items in use count incremented, entry is marked as a primary
473     * entry, and value registered with cache so that subsequent calls to
474     * addRef() and removeRef() on it correctly interact with the cache.
475     */
476    void _registerPrimary(const CacheKeyBase *theKey, const SharedObject *value) const;
477 
478    /**
479     * Store a value and creation error status in given hash entry.
480     * On entry, gCacheMutex must be held. Hash entry element must be in progress.
481     * value must be non NULL.
482     * On Exit, soft reference added to value. value and status stored in hash
483     * entry. Soft reference removed from previous stored value. Waiting
484     * threads notified.
485     */
486    void _put(
487            const UHashElement *element,
488            const SharedObject *value,
489            const UErrorCode status) const;
490     /**
491      * Remove a soft reference, and delete the SharedObject if no references remain.
492      * To be used from within the UnifiedCache implementation only.
493      * gCacheMutex must be held by caller.
494      * @param value the SharedObject to be acted on.
495      */
496    void removeSoftRef(const SharedObject *value) const;
497 
498    /**
499     * Increment the hard reference count of the given SharedObject.
500     * gCacheMutex must be held by the caller.
501     * Update numValuesEvictable on transitions between zero and one reference.
502     *
503     * @param value The SharedObject to be referenced.
504     * @return the hard reference count after the addition.
505     */
506    int32_t addHardRef(const SharedObject *value) const;
507 
508   /**
509     * Decrement the hard reference count of the given SharedObject.
510     * gCacheMutex must be held by the caller.
511     * Update numValuesEvictable on transitions between one and zero reference.
512     *
513     * @param value The SharedObject to be referenced.
514     * @return the hard reference count after the removal.
515     */
516    int32_t removeHardRef(const SharedObject *value) const;
517 
518 
519 #ifdef UNIFIED_CACHE_DEBUG
520    void _dumpContents() const;
521 #endif
522 
523    /**
524     *  Fetch value and error code from a particular hash entry.
525     *  On entry, gCacheMutex must be held. value must be either NULL or must be
526     *  included in the ref count of the object to which it points.
527     *  On exit, value and status set to what is in the hash entry. Caller must
528     *  eventually call removeRef on value.
529     *  If hash entry is in progress, value will be set to gNoValue and status will
530     *  be set to U_ZERO_ERROR.
531     */
532    void _fetch(const UHashElement *element, const SharedObject *&value,
533                        UErrorCode &status) const;
534 
535     /**
536      * Determine if given hash entry is in progress.
537      * On entry, gCacheMutex must be held.
538      */
539    UBool _inProgress(const UHashElement *element) const;
540 
541    /**
542     * Determine if given hash entry is in progress.
543     * On entry, gCacheMutex must be held.
544     */
545    UBool _inProgress(const SharedObject *theValue, UErrorCode creationStatus) const;
546 
547    /**
548     * Determine if given hash entry is eligible for eviction.
549     * On entry, gCacheMutex must be held.
550     */
551    UBool _isEvictable(const UHashElement *element) const;
552 };
553 
554 U_NAMESPACE_END
555 
556 #endif
557