1 // © 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ********************************************************************** 5 * Copyright (c) 2002-2011, International Business Machines Corporation 6 * and others. All Rights Reserved. 7 ********************************************************************** 8 * Date Name Description 9 * 01/21/2002 aliu Creation. 10 ********************************************************************** 11 */ 12 13 #ifndef STRREPL_H 14 #define STRREPL_H 15 16 #include "unicode/utypes.h" 17 18 #if !UCONFIG_NO_TRANSLITERATION 19 20 #include "unicode/unifunct.h" 21 #include "unicode/unirepl.h" 22 #include "unicode/unistr.h" 23 24 U_NAMESPACE_BEGIN 25 26 class TransliterationRuleData; 27 28 /** 29 * A replacer that produces static text as its output. The text may 30 * contain transliterator stand-in characters that represent nested 31 * UnicodeReplacer objects, making it possible to encode a tree of 32 * replacers in a StringReplacer. A StringReplacer that contains such 33 * stand-ins is called a <em>complex</em> StringReplacer. A complex 34 * StringReplacer has a slower processing loop than a non-complex one. 35 * @author Alan Liu 36 */ 37 class StringReplacer : public UnicodeFunctor, public UnicodeReplacer { 38 39 private: 40 41 /** 42 * Output text, possibly containing stand-in characters that 43 * represent nested UnicodeReplacers. 44 */ 45 UnicodeString output; 46 47 /** 48 * Cursor position. Value is ignored if hasCursor is false. 49 */ 50 int32_t cursorPos; 51 52 /** 53 * True if this object outputs a cursor position. 54 */ 55 UBool hasCursor; 56 57 /** 58 * A complex object contains nested replacers and requires more 59 * complex processing. StringReplacers are initially assumed to 60 * be complex. If no nested replacers are seen during processing, 61 * then isComplex is set to false, and future replacements are 62 * short circuited for better performance. 63 */ 64 UBool isComplex; 65 66 /** 67 * Object that translates stand-in characters in 'output' to 68 * UnicodeReplacer objects. 69 */ 70 const TransliterationRuleData* data; 71 72 public: 73 74 /** 75 * Construct a StringReplacer that sets the emits the given output 76 * text and sets the cursor to the given position. 77 * @param theOutput text that will replace input text when the 78 * replace() method is called. May contain stand-in characters 79 * that represent nested replacers. 80 * @param theCursorPos cursor position that will be returned by 81 * the replace() method 82 * @param theData transliterator context object that translates 83 * stand-in characters to UnicodeReplacer objects 84 */ 85 StringReplacer(const UnicodeString& theOutput, 86 int32_t theCursorPos, 87 const TransliterationRuleData* theData); 88 89 /** 90 * Construct a StringReplacer that sets the emits the given output 91 * text and does not modify the cursor. 92 * @param theOutput text that will replace input text when the 93 * replace() method is called. May contain stand-in characters 94 * that represent nested replacers. 95 * @param theData transliterator context object that translates 96 * stand-in characters to UnicodeReplacer objects 97 */ 98 StringReplacer(const UnicodeString& theOutput, 99 const TransliterationRuleData* theData); 100 101 /** 102 * Copy constructor. 103 */ 104 StringReplacer(const StringReplacer& other); 105 106 /** 107 * Destructor 108 */ 109 virtual ~StringReplacer(); 110 111 /** 112 * Implement UnicodeFunctor 113 */ 114 virtual UnicodeFunctor* clone() const; 115 116 /** 117 * UnicodeFunctor API. Cast 'this' to a UnicodeReplacer* pointer 118 * and return the pointer. 119 */ 120 virtual UnicodeReplacer* toReplacer() const; 121 122 /** 123 * UnicodeReplacer API 124 */ 125 virtual int32_t replace(Replaceable& text, 126 int32_t start, 127 int32_t limit, 128 int32_t& cursor); 129 130 /** 131 * UnicodeReplacer API 132 */ 133 virtual UnicodeString& toReplacerPattern(UnicodeString& result, 134 UBool escapeUnprintable) const; 135 136 /** 137 * Implement UnicodeReplacer 138 */ 139 virtual void addReplacementSetTo(UnicodeSet& toUnionTo) const; 140 141 /** 142 * UnicodeFunctor API 143 */ 144 virtual void setData(const TransliterationRuleData*); 145 146 /** 147 * ICU "poor man's RTTI", returns a UClassID for this class. 148 */ 149 static UClassID U_EXPORT2 getStaticClassID(); 150 151 /** 152 * ICU "poor man's RTTI", returns a UClassID for the actual class. 153 */ 154 virtual UClassID getDynamicClassID() const; 155 }; 156 157 U_NAMESPACE_END 158 159 #endif /* #if !UCONFIG_NO_TRANSLITERATION */ 160 161 #endif 162 163 //eof 164