1 // © 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ********************************************************************** 5 * Copyright (c) 2001-2015, International Business Machines 6 * Corporation and others. All Rights Reserved. 7 ********************************************************************** 8 * Date Name Description 9 * 11/19/2001 aliu Creation. 10 * 05/19/2010 markus Rewritten from scratch 11 ********************************************************************** 12 */ 13 14 #ifndef CHARSTRING_H 15 #define CHARSTRING_H 16 17 #include "unicode/utypes.h" 18 #include "unicode/unistr.h" 19 #include "unicode/uobject.h" 20 #include "cmemory.h" 21 22 U_NAMESPACE_BEGIN 23 24 // Windows needs us to DLL-export the MaybeStackArray template specialization, 25 // but MacOS X cannot handle it. Same as in digitlst.h. 26 #if !U_PLATFORM_IS_DARWIN_BASED 27 template class U_COMMON_API MaybeStackArray<char, 40>; 28 #endif 29 30 /** 31 * ICU-internal char * string class. 32 * This class does not assume or enforce any particular character encoding. 33 * Raw bytes can be stored. The string object owns its characters. 34 * A terminating NUL is stored, but the class does not prevent embedded NUL characters. 35 * 36 * This class wants to be convenient but is also deliberately minimalist. 37 * Please do not add methods if they only add minor convenience. 38 * For example: 39 * cs.data()[5]='a'; // no need for setCharAt(5, 'a') 40 */ 41 class U_COMMON_API CharString : public UMemory { 42 public: CharString()43 CharString() : len(0) { buffer[0]=0; } CharString(StringPiece s,UErrorCode & errorCode)44 CharString(StringPiece s, UErrorCode &errorCode) : len(0) { 45 buffer[0]=0; 46 append(s, errorCode); 47 } CharString(const CharString & s,UErrorCode & errorCode)48 CharString(const CharString &s, UErrorCode &errorCode) : len(0) { 49 buffer[0]=0; 50 append(s, errorCode); 51 } CharString(const char * s,int32_t sLength,UErrorCode & errorCode)52 CharString(const char *s, int32_t sLength, UErrorCode &errorCode) : len(0) { 53 buffer[0]=0; 54 append(s, sLength, errorCode); 55 } ~CharString()56 ~CharString() {} 57 58 /** 59 * Move constructor; might leave src in an undefined state. 60 * This string will have the same contents and state that the source string had. 61 */ 62 CharString(CharString &&src) U_NOEXCEPT; 63 /** 64 * Move assignment operator; might leave src in an undefined state. 65 * This string will have the same contents and state that the source string had. 66 * The behavior is undefined if *this and src are the same object. 67 */ 68 CharString &operator=(CharString &&src) U_NOEXCEPT; 69 70 /** 71 * Replaces this string's contents with the other string's contents. 72 * CharString does not support the standard copy constructor nor 73 * the assignment operator, to make copies explicit and to 74 * use a UErrorCode where memory allocations might be needed. 75 */ 76 CharString ©From(const CharString &other, UErrorCode &errorCode); 77 isEmpty()78 UBool isEmpty() const { return len==0; } length()79 int32_t length() const { return len; } 80 char operator[](int32_t index) const { return buffer[index]; } toStringPiece()81 StringPiece toStringPiece() const { return StringPiece(buffer.getAlias(), len); } 82 data()83 const char *data() const { return buffer.getAlias(); } data()84 char *data() { return buffer.getAlias(); } 85 /** 86 * Allocates length()+1 chars and copies the NUL-terminated data(). 87 * The caller must uprv_free() the result. 88 */ 89 char *cloneData(UErrorCode &errorCode) const; 90 /** 91 * Copies the contents of the string into dest. 92 * Checks if there is enough space in dest, extracts the entire string if possible, 93 * and NUL-terminates dest if possible. 94 * 95 * If the string fits into dest but cannot be NUL-terminated (length()==capacity), 96 * then the error code is set to U_STRING_NOT_TERMINATED_WARNING. 97 * If the string itself does not fit into dest (length()>capacity), 98 * then the error code is set to U_BUFFER_OVERFLOW_ERROR. 99 * 100 * @param dest Destination string buffer. 101 * @param capacity Size of the dest buffer (number of chars). 102 * @param errorCode ICU error code. 103 * @return length() 104 */ 105 int32_t extract(char *dest, int32_t capacity, UErrorCode &errorCode) const; 106 107 bool operator==(StringPiece other) const { 108 return len == other.length() && (len == 0 || uprv_memcmp(data(), other.data(), len) == 0); 109 } 110 bool operator!=(StringPiece other) const { 111 return !operator==(other); 112 } 113 114 /** @return last index of c, or -1 if c is not in this string */ 115 int32_t lastIndexOf(char c) const; 116 117 bool contains(StringPiece s) const; 118 clear()119 CharString &clear() { len=0; buffer[0]=0; return *this; } 120 CharString &truncate(int32_t newLength); 121 122 CharString &append(char c, UErrorCode &errorCode); append(StringPiece s,UErrorCode & errorCode)123 CharString &append(StringPiece s, UErrorCode &errorCode) { 124 return append(s.data(), s.length(), errorCode); 125 } append(const CharString & s,UErrorCode & errorCode)126 CharString &append(const CharString &s, UErrorCode &errorCode) { 127 return append(s.data(), s.length(), errorCode); 128 } 129 CharString &append(const char *s, int32_t sLength, UErrorCode &status); 130 131 CharString &appendNumber(int32_t number, UErrorCode &status); 132 133 /** 134 * Returns a writable buffer for appending and writes the buffer's capacity to 135 * resultCapacity. Guarantees resultCapacity>=minCapacity if U_SUCCESS(). 136 * There will additionally be space for a terminating NUL right at resultCapacity. 137 * (This function is similar to ByteSink.GetAppendBuffer().) 138 * 139 * The returned buffer is only valid until the next write operation 140 * on this string. 141 * 142 * After writing at most resultCapacity bytes, call append() with the 143 * pointer returned from this function and the number of bytes written. 144 * 145 * @param minCapacity required minimum capacity of the returned buffer; 146 * must be non-negative 147 * @param desiredCapacityHint desired capacity of the returned buffer; 148 * must be non-negative 149 * @param resultCapacity will be set to the capacity of the returned buffer 150 * @param errorCode in/out error code 151 * @return a buffer with resultCapacity>=min_capacity 152 */ 153 char *getAppendBuffer(int32_t minCapacity, 154 int32_t desiredCapacityHint, 155 int32_t &resultCapacity, 156 UErrorCode &errorCode); 157 158 CharString &appendInvariantChars(const UnicodeString &s, UErrorCode &errorCode); 159 CharString &appendInvariantChars(const UChar* uchars, int32_t ucharsLen, UErrorCode& errorCode); 160 161 /** 162 * Appends a filename/path part, e.g., a directory name. 163 * First appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if necessary. 164 * Does nothing if s is empty. 165 */ 166 CharString &appendPathPart(StringPiece s, UErrorCode &errorCode); 167 168 /** 169 * Appends a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR if this string is not empty 170 * and does not already end with a U_FILE_SEP_CHAR or U_FILE_ALT_SEP_CHAR. 171 */ 172 CharString &ensureEndsWithFileSeparator(UErrorCode &errorCode); 173 174 private: 175 MaybeStackArray<char, 40> buffer; 176 int32_t len; 177 178 UBool ensureCapacity(int32_t capacity, int32_t desiredCapacityHint, UErrorCode &errorCode); 179 180 CharString(const CharString &other); // forbid copying of this class 181 CharString &operator=(const CharString &other); // forbid copying of this class 182 183 /** 184 * Returns U_FILE_ALT_SEP_CHAR if found in string, and U_FILE_SEP_CHAR is not found. 185 * Otherwise returns U_FILE_SEP_CHAR. 186 */ 187 char getDirSepChar() const; 188 }; 189 190 U_NAMESPACE_END 191 192 #endif 193 //eof 194