• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 /*
2  * (C) 1999 Lars Knoll (knoll@kde.org)
3  * Copyright (C) 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2012, 2013 Apple Inc. All rights reserved.
4  *
5  * This library is free software; you can redistribute it and/or
6  * modify it under the terms of the GNU Library General Public
7  * License as published by the Free Software Foundation; either
8  * version 2 of the License, or (at your option) any later version.
9  *
10  * This library is distributed in the hope that it will be useful,
11  * but WITHOUT ANY WARRANTY; without even the implied warranty of
12  * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
13  * Library General Public License for more details.
14  *
15  * You should have received a copy of the GNU Library General Public License
16  * along with this library; see the file COPYING.LIB.  If not, write to
17  * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
18  * Boston, MA 02110-1301, USA.
19  *
20  */
21 
22 #ifndef WTFString_h
23 #define WTFString_h
24 
25 // This file would be called String.h, but that conflicts with <string.h>
26 // on systems without case-sensitive file systems.
27 
28 #include "wtf/HashTableDeletedValueType.h"
29 #include "wtf/WTFExport.h"
30 #include "wtf/text/ASCIIFastPath.h"
31 #include "wtf/text/StringImpl.h"
32 #include "wtf/text/StringView.h"
33 
34 #ifdef __OBJC__
35 #include <objc/objc.h>
36 #endif
37 
38 namespace WTF {
39 
40 class CString;
41 struct StringHash;
42 
43 // Declarations of string operations
44 
45 WTF_EXPORT int charactersToIntStrict(const LChar*, size_t, bool* ok = 0, int base = 10);
46 WTF_EXPORT int charactersToIntStrict(const UChar*, size_t, bool* ok = 0, int base = 10);
47 WTF_EXPORT unsigned charactersToUIntStrict(const LChar*, size_t, bool* ok = 0, int base = 10);
48 WTF_EXPORT unsigned charactersToUIntStrict(const UChar*, size_t, bool* ok = 0, int base = 10);
49 WTF_EXPORT int64_t charactersToInt64Strict(const LChar*, size_t, bool* ok = 0, int base = 10);
50 WTF_EXPORT int64_t charactersToInt64Strict(const UChar*, size_t, bool* ok = 0, int base = 10);
51 WTF_EXPORT uint64_t charactersToUInt64Strict(const LChar*, size_t, bool* ok = 0, int base = 10);
52 WTF_EXPORT uint64_t charactersToUInt64Strict(const UChar*, size_t, bool* ok = 0, int base = 10);
53 WTF_EXPORT intptr_t charactersToIntPtrStrict(const LChar*, size_t, bool* ok = 0, int base = 10);
54 WTF_EXPORT intptr_t charactersToIntPtrStrict(const UChar*, size_t, bool* ok = 0, int base = 10);
55 
56 WTF_EXPORT int charactersToInt(const LChar*, size_t, bool* ok = 0); // ignores trailing garbage
57 WTF_EXPORT int charactersToInt(const UChar*, size_t, bool* ok = 0); // ignores trailing garbage
58 WTF_EXPORT unsigned charactersToUInt(const LChar*, size_t, bool* ok = 0); // ignores trailing garbage
59 WTF_EXPORT unsigned charactersToUInt(const UChar*, size_t, bool* ok = 0); // ignores trailing garbage
60 WTF_EXPORT int64_t charactersToInt64(const LChar*, size_t, bool* ok = 0); // ignores trailing garbage
61 WTF_EXPORT int64_t charactersToInt64(const UChar*, size_t, bool* ok = 0); // ignores trailing garbage
62 WTF_EXPORT uint64_t charactersToUInt64(const LChar*, size_t, bool* ok = 0); // ignores trailing garbage
63 WTF_EXPORT uint64_t charactersToUInt64(const UChar*, size_t, bool* ok = 0); // ignores trailing garbage
64 WTF_EXPORT intptr_t charactersToIntPtr(const LChar*, size_t, bool* ok = 0); // ignores trailing garbage
65 WTF_EXPORT intptr_t charactersToIntPtr(const UChar*, size_t, bool* ok = 0); // ignores trailing garbage
66 
67 // FIXME: Like the strict functions above, these give false for "ok" when there is trailing garbage.
68 // Like the non-strict functions above, these return the value when there is trailing garbage.
69 // It would be better if these were more consistent with the above functions instead.
70 WTF_EXPORT double charactersToDouble(const LChar*, size_t, bool* ok = 0);
71 WTF_EXPORT double charactersToDouble(const UChar*, size_t, bool* ok = 0);
72 WTF_EXPORT float charactersToFloat(const LChar*, size_t, bool* ok = 0);
73 WTF_EXPORT float charactersToFloat(const UChar*, size_t, bool* ok = 0);
74 WTF_EXPORT float charactersToFloat(const LChar*, size_t, size_t& parsedLength);
75 WTF_EXPORT float charactersToFloat(const UChar*, size_t, size_t& parsedLength);
76 
// Policy argument of String::number(double, precision, policy), where it
// defaults to TruncateTrailingZeros. Judging by the enumerator names it selects
// whether trailing zeros of the formatted number are kept or dropped; the
// formatting code itself is not in this header.
enum TrailingZerosTruncatingPolicy {
    KeepTrailingZeros,
    TruncateTrailingZeros
};
81 
82 template<bool isSpecialCharacter(UChar), typename CharacterType>
83 bool isAllSpecialCharacters(const CharacterType*, size_t);
84 
85 // You can find documentation about this class in this doc:
86 // https://docs.google.com/document/d/1kOCUlJdh2WJMJGDf-WoEQhmnjKLaOYRbiHz5TiGJl14/edit?usp=sharing
87 class WTF_EXPORT String {
88 public:
89     // Construct a null string, distinguishable from an empty string.
String()90     String() { }
91 
92     // Construct a string with UTF-16 data.
93     String(const UChar* characters, unsigned length);
94 
95     // Construct a string by copying the contents of a vector.
96     // This method will never create a null string. Vectors with size() == 0
97     // will return the empty string.
98     // NOTE: This is different from String(vector.data(), vector.size())
99     // which will sometimes return a null string when vector.data() is null
100     // which can only occur for vectors without inline capacity.
101     // See: https://bugs.webkit.org/show_bug.cgi?id=109792
102     template<size_t inlineCapacity>
103     explicit String(const Vector<UChar, inlineCapacity>&);
104 
105     // Construct a string with UTF-16 data, from a null-terminated source.
106     String(const UChar*);
107 
108     // Construct a string with latin1 data.
109     String(const LChar* characters, unsigned length);
110     String(const char* characters, unsigned length);
111 
112     // Construct a string with latin1 data, from a null-terminated source.
113     String(const LChar* characters);
114     String(const char* characters);
115 
116     // Construct a string referencing an existing StringImpl.
String(StringImpl * impl)117     String(StringImpl* impl) : m_impl(impl) { }
String(PassRefPtr<StringImpl> impl)118     String(PassRefPtr<StringImpl> impl) : m_impl(impl) { }
119 
120 #if COMPILER_SUPPORTS(CXX_RVALUE_REFERENCES)
121     // We have to declare the copy constructor and copy assignment operator as well, otherwise
122     // they'll be implicitly deleted by adding the move constructor and move assignment operator.
String(const String & other)123     String(const String& other) : m_impl(other.m_impl) { }
String(String && other)124     String(String&& other) : m_impl(other.m_impl.release()) { }
125     String& operator=(const String& other) { m_impl = other.m_impl; return *this; }
126     String& operator=(String&& other) { m_impl = other.m_impl.release(); return *this; }
127 #endif
128 
129     // Inline the destructor.
~String()130     ALWAYS_INLINE ~String() { }
131 
swap(String & o)132     void swap(String& o) { m_impl.swap(o.m_impl); }
133 
134     template<typename CharType>
adopt(StringBuffer<CharType> & buffer)135     static String adopt(StringBuffer<CharType>& buffer)
136     {
137         if (!buffer.length())
138             return StringImpl::empty();
139         return String(buffer.release());
140     }
141 
isNull()142     bool isNull() const { return !m_impl; }
isEmpty()143     bool isEmpty() const { return !m_impl || !m_impl->length(); }
144 
impl()145     StringImpl* impl() const { return m_impl.get(); }
releaseImpl()146     PassRefPtr<StringImpl> releaseImpl() { return m_impl.release(); }
147 
length()148     unsigned length() const
149     {
150         if (!m_impl)
151             return 0;
152         return m_impl->length();
153     }
154 
characters8()155     const LChar* characters8() const
156     {
157         if (!m_impl)
158             return 0;
159         ASSERT(m_impl->is8Bit());
160         return m_impl->characters8();
161     }
162 
characters16()163     const UChar* characters16() const
164     {
165         if (!m_impl)
166             return 0;
167         ASSERT(!m_impl->is8Bit());
168         return m_impl->characters16();
169     }
170 
171     // Return characters8() or characters16() depending on CharacterType.
172     template <typename CharacterType>
173     inline const CharacterType* getCharacters() const;
174 
is8Bit()175     bool is8Bit() const { return m_impl->is8Bit(); }
176 
sizeInBytes()177     unsigned sizeInBytes() const
178     {
179         if (!m_impl)
180             return 0;
181         return m_impl->length() * (is8Bit() ? sizeof(LChar) : sizeof(UChar));
182     }
183 
184     CString ascii() const;
185     CString latin1() const;
186 
187     typedef enum {
188         LenientConversion,
189         StrictConversion,
190         StrictConversionReplacingUnpairedSurrogatesWithFFFD,
191     } ConversionMode;
192 
193     CString utf8(ConversionMode = LenientConversion) const;
194 
195     UChar operator[](unsigned index) const
196     {
197         if (!m_impl || index >= m_impl->length())
198             return 0;
199         return (*m_impl)[index];
200     }
201 
202     static String number(int);
203     static String number(unsigned);
204     static String number(long);
205     static String number(unsigned long);
206     static String number(long long);
207     static String number(unsigned long long);
208 
209     static String number(double, unsigned precision = 6, TrailingZerosTruncatingPolicy = TruncateTrailingZeros);
210 
211     // Number to String conversion following the ECMAScript definition.
212     static String numberToStringECMAScript(double);
213     static String numberToStringFixedWidth(double, unsigned decimalPlaces);
214 
215     // Find a single character or string, also with match function & latin1 forms.
216     size_t find(UChar c, unsigned start = 0) const
217         { return m_impl ? m_impl->find(c, start) : kNotFound; }
218 
find(const String & str)219     size_t find(const String& str) const
220         { return m_impl ? m_impl->find(str.impl()) : kNotFound; }
find(const String & str,unsigned start)221     size_t find(const String& str, unsigned start) const
222         { return m_impl ? m_impl->find(str.impl(), start) : kNotFound; }
223 
224     size_t find(CharacterMatchFunctionPtr matchFunction, unsigned start = 0) const
225         { return m_impl ? m_impl->find(matchFunction, start) : kNotFound; }
226     size_t find(const LChar* str, unsigned start = 0) const
227         { return m_impl ? m_impl->find(str, start) : kNotFound; }
228 
229     size_t findNextLineStart(unsigned start = 0) const
230         { return m_impl ? m_impl->findNextLineStart(start) : kNotFound; }
231 
232     // Find the last instance of a single character or string.
233     size_t reverseFind(UChar c, unsigned start = UINT_MAX) const
234         { return m_impl ? m_impl->reverseFind(c, start) : kNotFound; }
235     size_t reverseFind(const String& str, unsigned start = UINT_MAX) const
236         { return m_impl ? m_impl->reverseFind(str.impl(), start) : kNotFound; }
237 
238     // Case insensitive string matching.
239     size_t findIgnoringCase(const LChar* str, unsigned start = 0) const
240         { return m_impl ? m_impl->findIgnoringCase(str, start) : kNotFound; }
241     size_t findIgnoringCase(const String& str, unsigned start = 0) const
242         { return m_impl ? m_impl->findIgnoringCase(str.impl(), start) : kNotFound; }
243     size_t reverseFindIgnoringCase(const String& str, unsigned start = UINT_MAX) const
244         { return m_impl ? m_impl->reverseFindIgnoringCase(str.impl(), start) : kNotFound; }
245 
246     // Wrappers for find & reverseFind adding dynamic sensitivity check.
find(const LChar * str,unsigned start,bool caseSensitive)247     size_t find(const LChar* str, unsigned start, bool caseSensitive) const
248         { return caseSensitive ? find(str, start) : findIgnoringCase(str, start); }
find(const String & str,unsigned start,bool caseSensitive)249     size_t find(const String& str, unsigned start, bool caseSensitive) const
250         { return caseSensitive ? find(str, start) : findIgnoringCase(str, start); }
reverseFind(const String & str,unsigned start,bool caseSensitive)251     size_t reverseFind(const String& str, unsigned start, bool caseSensitive) const
252         { return caseSensitive ? reverseFind(str, start) : reverseFindIgnoringCase(str, start); }
253 
254     Vector<UChar> charactersWithNullTermination() const;
255     unsigned copyTo(UChar* buffer, unsigned pos, unsigned maxLength) const;
256 
257     template<size_t inlineCapacity>
258     void appendTo(Vector<UChar, inlineCapacity>&, unsigned pos = 0, unsigned len = UINT_MAX) const;
259 
260     template<typename BufferType>
261     void appendTo(BufferType&, unsigned pos = 0, unsigned len = UINT_MAX) const;
262 
263     template<size_t inlineCapacity>
264     void prependTo(Vector<UChar, inlineCapacity>&, unsigned pos = 0, unsigned len = UINT_MAX) const;
265 
266     UChar32 characterStartingAt(unsigned) const;
267 
contains(UChar c)268     bool contains(UChar c) const { return find(c) != kNotFound; }
269     bool contains(const LChar* str, bool caseSensitive = true) const { return find(str, 0, caseSensitive) != kNotFound; }
270     bool contains(const String& str, bool caseSensitive = true) const { return find(str, 0, caseSensitive) != kNotFound; }
271 
272     bool startsWith(const String& s, bool caseSensitive = true) const
273         { return m_impl ? m_impl->startsWith(s.impl(), caseSensitive) : s.isEmpty(); }
startsWith(UChar character)274     bool startsWith(UChar character) const
275         { return m_impl ? m_impl->startsWith(character) : false; }
276     template<unsigned matchLength>
277     bool startsWith(const char (&prefix)[matchLength], bool caseSensitive = true) const
278         { return m_impl ? m_impl->startsWith<matchLength>(prefix, caseSensitive) : !matchLength; }
279 
280     bool endsWith(const String& s, bool caseSensitive = true) const
281         { return m_impl ? m_impl->endsWith(s.impl(), caseSensitive) : s.isEmpty(); }
endsWith(UChar character)282     bool endsWith(UChar character) const
283         { return m_impl ? m_impl->endsWith(character) : false; }
284     template<unsigned matchLength>
285     bool endsWith(const char (&prefix)[matchLength], bool caseSensitive = true) const
286         { return m_impl ? m_impl->endsWith<matchLength>(prefix, caseSensitive) : !matchLength; }
287 
288     void append(const String&);
289     void append(LChar);
append(char c)290     void append(char c) { append(static_cast<LChar>(c)); };
291     void append(UChar);
292     void append(const LChar*, unsigned length);
293     void append(const UChar*, unsigned length);
294     void insert(const String&, unsigned pos);
295     void insert(const LChar*, unsigned length, unsigned pos);
296     void insert(const UChar*, unsigned length, unsigned pos);
297 
replace(UChar a,UChar b)298     String& replace(UChar a, UChar b) { if (m_impl) m_impl = m_impl->replace(a, b); return *this; }
replace(UChar a,const String & b)299     String& replace(UChar a, const String& b) { if (m_impl) m_impl = m_impl->replace(a, b.impl()); return *this; }
replace(const String & a,const String & b)300     String& replace(const String& a, const String& b) { if (m_impl) m_impl = m_impl->replace(a.impl(), b.impl()); return *this; }
replace(unsigned index,unsigned len,const String & b)301     String& replace(unsigned index, unsigned len, const String& b) { if (m_impl) m_impl = m_impl->replace(index, len, b.impl()); return *this; }
302 
303     template<unsigned charactersCount>
replaceWithLiteral(UChar a,const char (& characters)[charactersCount])304     ALWAYS_INLINE String& replaceWithLiteral(UChar a, const char (&characters)[charactersCount])
305     {
306         if (m_impl)
307             m_impl = m_impl->replace(a, characters, charactersCount - 1);
308 
309         return *this;
310     }
311 
fill(UChar c)312     void fill(UChar c) { if (m_impl) m_impl = m_impl->fill(c); }
313 
314     void ensure16Bit();
315 
316     void truncate(unsigned len);
317     void remove(unsigned pos, int len = 1);
318 
319     String substring(unsigned pos, unsigned len = UINT_MAX) const;
left(unsigned len)320     String left(unsigned len) const { return substring(0, len); }
right(unsigned len)321     String right(unsigned len) const { return substring(length() - len, len); }
322 
createView()323     StringView createView() const { return StringView(impl()); }
createView(unsigned offset,unsigned length)324     StringView createView(unsigned offset, unsigned length) const { return StringView(impl(), offset, length); }
325 
326     // Returns a lowercase/uppercase version of the string
327     String lower() const;
328     String upper() const;
329 
330     String lower(const AtomicString& localeIdentifier) const;
331     String upper(const AtomicString& localeIdentifier) const;
332 
333     String stripWhiteSpace() const;
334     String stripWhiteSpace(IsWhiteSpaceFunctionPtr) const;
335     String simplifyWhiteSpace(StripBehavior stripBehavior = StripExtraWhiteSpace) const;
336     String simplifyWhiteSpace(IsWhiteSpaceFunctionPtr, StripBehavior stripBehavior = StripExtraWhiteSpace) const;
337 
338     String removeCharacters(CharacterMatchFunctionPtr) const;
339     template<bool isSpecialCharacter(UChar)> bool isAllSpecialCharacters() const;
340 
341     // Return the string with case folded for case insensitive comparison.
342     String foldCase() const;
343 
344     static String format(const char *, ...) WTF_ATTRIBUTE_PRINTF(1, 2);
345 
346     // Returns an uninitialized string. The characters needs to be written
347     // into the buffer returned in data before the returned string is used.
348     // Failure to do this will have unpredictable results.
createUninitialized(unsigned length,UChar * & data)349     static String createUninitialized(unsigned length, UChar*& data) { return StringImpl::createUninitialized(length, data); }
createUninitialized(unsigned length,LChar * & data)350     static String createUninitialized(unsigned length, LChar*& data) { return StringImpl::createUninitialized(length, data); }
351 
352     void split(const String& separator, bool allowEmptyEntries, Vector<String>& result) const;
split(const String & separator,Vector<String> & result)353     void split(const String& separator, Vector<String>& result) const
354     {
355         split(separator, false, result);
356     }
357     void split(UChar separator, bool allowEmptyEntries, Vector<String>& result) const;
split(UChar separator,Vector<String> & result)358     void split(UChar separator, Vector<String>& result) const
359     {
360         split(separator, false, result);
361     }
362 
363     int toIntStrict(bool* ok = 0, int base = 10) const;
364     unsigned toUIntStrict(bool* ok = 0, int base = 10) const;
365     int64_t toInt64Strict(bool* ok = 0, int base = 10) const;
366     uint64_t toUInt64Strict(bool* ok = 0, int base = 10) const;
367     intptr_t toIntPtrStrict(bool* ok = 0, int base = 10) const;
368 
369     int toInt(bool* ok = 0) const;
370     unsigned toUInt(bool* ok = 0) const;
371     int64_t toInt64(bool* ok = 0) const;
372     uint64_t toUInt64(bool* ok = 0) const;
373     intptr_t toIntPtr(bool* ok = 0) const;
374 
375     // FIXME: Like the strict functions above, these give false for "ok" when there is trailing garbage.
376     // Like the non-strict functions above, these return the value when there is trailing garbage.
377     // It would be better if these were more consistent with the above functions instead.
378     double toDouble(bool* ok = 0) const;
379     float toFloat(bool* ok = 0) const;
380 
381     bool percentage(int& percentage) const;
382 
383     String isolatedCopy() const;
384     bool isSafeToSendToAnotherThread() const;
385 
386     // Prevent Strings from being implicitly convertable to bool as it will be ambiguous on any platform that
387     // allows implicit conversion to another pointer type (e.g., Mac allows implicit conversion to NSString*).
388     typedef struct ImplicitConversionFromWTFStringToBoolDisallowedA* (String::*UnspecifiedBoolTypeA);
389     typedef struct ImplicitConversionFromWTFStringToBoolDisallowedB* (String::*UnspecifiedBoolTypeB);
390     operator UnspecifiedBoolTypeA() const;
391     operator UnspecifiedBoolTypeB() const;
392 
393 #if USE(CF)
394     String(CFStringRef);
395     RetainPtr<CFStringRef> createCFString() const;
396 #endif
397 
398 #ifdef __OBJC__
399     String(NSString*);
400 
401     // This conversion maps NULL to "", which loses the meaning of NULL, but we
402     // need this mapping because AppKit crashes when passed nil NSStrings.
403     operator NSString*() const { if (!m_impl) return @""; return *m_impl; }
404 #endif
405 
406     static String make8BitFrom16BitSource(const UChar*, size_t);
407     template<size_t inlineCapacity>
make8BitFrom16BitSource(const Vector<UChar,inlineCapacity> & buffer)408     static String make8BitFrom16BitSource(const Vector<UChar, inlineCapacity>& buffer)
409     {
410         return make8BitFrom16BitSource(buffer.data(), buffer.size());
411     }
412 
413     static String make16BitFrom8BitSource(const LChar*, size_t);
414 
415     // String::fromUTF8 will return a null string if
416     // the input data contains invalid UTF-8 sequences.
417     static String fromUTF8(const LChar*, size_t);
418     static String fromUTF8(const LChar*);
fromUTF8(const char * s,size_t length)419     static String fromUTF8(const char* s, size_t length) { return fromUTF8(reinterpret_cast<const LChar*>(s), length); };
fromUTF8(const char * s)420     static String fromUTF8(const char* s) { return fromUTF8(reinterpret_cast<const LChar*>(s)); };
421     static String fromUTF8(const CString&);
422 
423     // Tries to convert the passed in string to UTF-8, but will fall back to Latin-1 if the string is not valid UTF-8.
424     static String fromUTF8WithLatin1Fallback(const LChar*, size_t);
fromUTF8WithLatin1Fallback(const char * s,size_t length)425     static String fromUTF8WithLatin1Fallback(const char* s, size_t length) { return fromUTF8WithLatin1Fallback(reinterpret_cast<const LChar*>(s), length); };
426 
427     bool containsOnlyASCII() const;
428     bool containsOnlyLatin1() const;
containsOnlyWhitespace()429     bool containsOnlyWhitespace() const { return !m_impl || m_impl->containsOnlyWhitespace(); }
430 
431     // Hash table deleted values, which are only constructed and never copied or destroyed.
String(WTF::HashTableDeletedValueType)432     String(WTF::HashTableDeletedValueType) : m_impl(WTF::HashTableDeletedValue) { }
isHashTableDeletedValue()433     bool isHashTableDeletedValue() const { return m_impl.isHashTableDeletedValue(); }
434 
435 #ifndef NDEBUG
436     void show() const;
437 #endif
438 
439     // Workaround for a compiler bug. Use operator[] instead.
characterAt(unsigned index)440     UChar characterAt(unsigned index) const
441     {
442         if (!m_impl || index >= m_impl->length())
443             return 0;
444         return (*m_impl)[index];
445     }
446 
447 private:
448     template <typename CharacterType>
449     void removeInternal(const CharacterType*, unsigned, int);
450 
451     template <typename CharacterType>
452     void appendInternal(CharacterType);
453 
454     RefPtr<StringImpl> m_impl;
455 };
456 
457 inline bool operator==(const String& a, const String& b) { return equal(a.impl(), b.impl()); }
458 inline bool operator==(const String& a, const LChar* b) { return equal(a.impl(), b); }
459 inline bool operator==(const String& a, const char* b) { return equal(a.impl(), reinterpret_cast<const LChar*>(b)); }
460 inline bool operator==(const LChar* a, const String& b) { return equal(a, b.impl()); }
461 inline bool operator==(const char* a, const String& b) { return equal(reinterpret_cast<const LChar*>(a), b.impl()); }
462 template<size_t inlineCapacity>
463 inline bool operator==(const Vector<char, inlineCapacity>& a, const String& b) { return equal(b.impl(), a.data(), a.size()); }
464 template<size_t inlineCapacity>
465 inline bool operator==(const String& a, const Vector<char, inlineCapacity>& b) { return b == a; }
466 
467 
468 inline bool operator!=(const String& a, const String& b) { return !equal(a.impl(), b.impl()); }
469 inline bool operator!=(const String& a, const LChar* b) { return !equal(a.impl(), b); }
470 inline bool operator!=(const String& a, const char* b) { return !equal(a.impl(), reinterpret_cast<const LChar*>(b)); }
471 inline bool operator!=(const LChar* a, const String& b) { return !equal(a, b.impl()); }
472 inline bool operator!=(const char* a, const String& b) { return !equal(reinterpret_cast<const LChar*>(a), b.impl()); }
473 template<size_t inlineCapacity>
474 inline bool operator!=(const Vector<char, inlineCapacity>& a, const String& b) { return !(a == b); }
475 template<size_t inlineCapacity>
476 inline bool operator!=(const String& a, const Vector<char, inlineCapacity>& b) { return b != a; }
477 
equalIgnoringCase(const String & a,const String & b)478 inline bool equalIgnoringCase(const String& a, const String& b) { return equalIgnoringCase(a.impl(), b.impl()); }
equalIgnoringCase(const String & a,const LChar * b)479 inline bool equalIgnoringCase(const String& a, const LChar* b) { return equalIgnoringCase(a.impl(), b); }
equalIgnoringCase(const String & a,const char * b)480 inline bool equalIgnoringCase(const String& a, const char* b) { return equalIgnoringCase(a.impl(), reinterpret_cast<const LChar*>(b)); }
equalIgnoringCase(const LChar * a,const String & b)481 inline bool equalIgnoringCase(const LChar* a, const String& b) { return equalIgnoringCase(a, b.impl()); }
equalIgnoringCase(const char * a,const String & b)482 inline bool equalIgnoringCase(const char* a, const String& b) { return equalIgnoringCase(reinterpret_cast<const LChar*>(a), b.impl()); }
483 
equalPossiblyIgnoringCase(const String & a,const String & b,bool ignoreCase)484 inline bool equalPossiblyIgnoringCase(const String& a, const String& b, bool ignoreCase)
485 {
486     return ignoreCase ? equalIgnoringCase(a, b) : (a == b);
487 }
488 
equalIgnoringNullity(const String & a,const String & b)489 inline bool equalIgnoringNullity(const String& a, const String& b) { return equalIgnoringNullity(a.impl(), b.impl()); }
490 
491 template<size_t inlineCapacity>
equalIgnoringNullity(const Vector<UChar,inlineCapacity> & a,const String & b)492 inline bool equalIgnoringNullity(const Vector<UChar, inlineCapacity>& a, const String& b) { return equalIgnoringNullity(a, b.impl()); }
493 
494 inline bool operator!(const String& str) { return str.isNull(); }
495 
swap(String & a,String & b)496 inline void swap(String& a, String& b) { a.swap(b); }
497 
498 // Definitions of string operations
499 
500 template<size_t inlineCapacity>
String(const Vector<UChar,inlineCapacity> & vector)501 String::String(const Vector<UChar, inlineCapacity>& vector)
502     : m_impl(vector.size() ? StringImpl::create(vector.data(), vector.size()) : StringImpl::empty())
503 {
504 }
505 
506 template<>
507 inline const LChar* String::getCharacters<LChar>() const
508 {
509     ASSERT(is8Bit());
510     return characters8();
511 }
512 
513 template<>
514 inline const UChar* String::getCharacters<UChar>() const
515 {
516     ASSERT(!is8Bit());
517     return characters16();
518 }
519 
containsOnlyLatin1()520 inline bool String::containsOnlyLatin1() const
521 {
522     if (isEmpty())
523         return true;
524 
525     if (is8Bit())
526         return true;
527 
528     const UChar* characters = characters16();
529     UChar ored = 0;
530     for (size_t i = 0; i < m_impl->length(); ++i)
531         ored |= characters[i];
532     return !(ored & 0xFF00);
533 }
534 
535 
536 #ifdef __OBJC__
537 // This is for situations in WebKit where the long standing behavior has been
538 // "nil if empty", so we try to maintain longstanding behavior for the sake of
539 // entrenched clients
nsStringNilIfEmpty(const String & str)540 inline NSString* nsStringNilIfEmpty(const String& str) {  return str.isEmpty() ? nil : (NSString*)str; }
541 #endif
542 
containsOnlyASCII()543 inline bool String::containsOnlyASCII() const
544 {
545     if (isEmpty())
546         return true;
547 
548     if (is8Bit())
549         return charactersAreAllASCII(characters8(), m_impl->length());
550 
551     return charactersAreAllASCII(characters16(), m_impl->length());
552 }
553 
554 WTF_EXPORT int codePointCompare(const String&, const String&);
555 
codePointCompareLessThan(const String & a,const String & b)556 inline bool codePointCompareLessThan(const String& a, const String& b)
557 {
558     return codePointCompare(a.impl(), b.impl()) < 0;
559 }
560 
561 template<size_t inlineCapacity>
append(Vector<UChar,inlineCapacity> & vector,const String & string)562 inline void append(Vector<UChar, inlineCapacity>& vector, const String& string)
563 {
564     unsigned length = string.length();
565     if (!length)
566         return;
567     if (string.is8Bit()) {
568         const LChar* characters8 = string.characters8();
569         vector.reserveCapacity(vector.size() + length);
570         for (size_t i = 0; i < length; ++i)
571             vector.uncheckedAppend(characters8[i]);
572     } else {
573         vector.append(string.characters16(), length);
574     }
575 }
576 
577 template<typename CharacterType>
appendNumber(Vector<CharacterType> & vector,unsigned char number)578 inline void appendNumber(Vector<CharacterType>& vector, unsigned char number)
579 {
580     int numberLength = number > 99 ? 3 : (number > 9 ? 2 : 1);
581     size_t vectorSize = vector.size();
582     vector.grow(vectorSize + numberLength);
583 
584     switch (numberLength) {
585     case 3:
586         vector[vectorSize + 2] = number % 10 + '0';
587         number /= 10;
588 
589     case 2:
590         vector[vectorSize + 1] = number % 10 + '0';
591         number /= 10;
592 
593     case 1:
594         vector[vectorSize] = number % 10 + '0';
595     }
596 }
597 
598 template<bool isSpecialCharacter(UChar), typename CharacterType>
isAllSpecialCharacters(const CharacterType * characters,size_t length)599 inline bool isAllSpecialCharacters(const CharacterType* characters, size_t length)
600 {
601     for (size_t i = 0; i < length; ++i) {
602         if (!isSpecialCharacter(characters[i]))
603             return false;
604     }
605     return true;
606 }
607 
608 template<bool isSpecialCharacter(UChar)>
isAllSpecialCharacters()609 inline bool String::isAllSpecialCharacters() const
610 {
611     size_t len = length();
612 
613     if (!len)
614         return true;
615 
616     if (is8Bit())
617         return WTF::isAllSpecialCharacters<isSpecialCharacter, LChar>(characters8(), len);
618     return WTF::isAllSpecialCharacters<isSpecialCharacter, UChar>(characters16(), len);
619 }
620 
621 template<size_t inlineCapacity>
appendTo(Vector<UChar,inlineCapacity> & result,unsigned pos,unsigned len)622 inline void String::appendTo(Vector<UChar, inlineCapacity>& result, unsigned pos, unsigned len) const
623 {
624     unsigned numberOfCharactersToCopy = std::min(len, length() - pos);
625     if (numberOfCharactersToCopy <= 0)
626         return;
627     result.reserveCapacity(result.size() + numberOfCharactersToCopy);
628     if (is8Bit()) {
629         const LChar* characters8 = m_impl->characters8();
630         for (size_t i = 0; i < numberOfCharactersToCopy; ++i)
631             result.uncheckedAppend(characters8[pos + i]);
632     } else {
633         const UChar* characters16 = m_impl->characters16();
634         result.append(characters16 + pos, numberOfCharactersToCopy);
635     }
636 }
637 
638 template<typename BufferType>
appendTo(BufferType & result,unsigned pos,unsigned len)639 inline void String::appendTo(BufferType& result, unsigned pos, unsigned len) const
640 {
641     unsigned numberOfCharactersToCopy = std::min(len, length() - pos);
642     if (numberOfCharactersToCopy <= 0)
643         return;
644     if (is8Bit())
645         result.append(m_impl->characters8() + pos, numberOfCharactersToCopy);
646     else
647         result.append(m_impl->characters16() + pos, numberOfCharactersToCopy);
648 }
649 
650 template<size_t inlineCapacity>
prependTo(Vector<UChar,inlineCapacity> & result,unsigned pos,unsigned len)651 inline void String::prependTo(Vector<UChar, inlineCapacity>& result, unsigned pos, unsigned len) const
652 {
653     unsigned numberOfCharactersToCopy = std::min(len, length() - pos);
654     if (numberOfCharactersToCopy <= 0)
655         return;
656     if (is8Bit()) {
657         size_t oldSize = result.size();
658         result.resize(oldSize + numberOfCharactersToCopy);
659         memmove(result.data() + numberOfCharactersToCopy, result.data(), oldSize * sizeof(UChar));
660         StringImpl::copyChars(result.data(), m_impl->characters8() + pos, numberOfCharactersToCopy);
661     } else {
662         result.prepend(m_impl->characters16() + pos, numberOfCharactersToCopy);
663     }
664 }
665 
666 // StringHash is the default hash for String
667 template<typename T> struct DefaultHash;
668 template<> struct DefaultHash<String> {
669     typedef StringHash Hash;
670 };
671 
672 template <> struct VectorTraits<String> : SimpleClassVectorTraits {
673     static const bool canCompareWithMemcmp = false;
674 };
675 
676 // Shared global empty string.
677 WTF_EXPORT const String& emptyString();
678 
679 }
680 
681 using WTF::CString;
682 using WTF::KeepTrailingZeros;
683 using WTF::String;
684 using WTF::emptyString;
685 using WTF::append;
686 using WTF::appendNumber;
687 using WTF::charactersAreAllASCII;
688 using WTF::charactersToIntStrict;
689 using WTF::charactersToUIntStrict;
690 using WTF::charactersToInt64Strict;
691 using WTF::charactersToUInt64Strict;
692 using WTF::charactersToIntPtrStrict;
693 using WTF::charactersToInt;
694 using WTF::charactersToUInt;
695 using WTF::charactersToInt64;
696 using WTF::charactersToUInt64;
697 using WTF::charactersToIntPtr;
698 using WTF::charactersToDouble;
699 using WTF::charactersToFloat;
700 using WTF::equal;
701 using WTF::equalIgnoringCase;
702 using WTF::find;
703 using WTF::isAllSpecialCharacters;
704 using WTF::isSpaceOrNewline;
705 using WTF::reverseFind;
706 
707 #include "wtf/text/AtomicString.h"
708 #endif
709