1 /* 2 * The authors of this software are Rob Pike and Ken Thompson. 3 * Copyright (c) 2002 by Lucent Technologies. 4 * Permission to use, copy, modify, and distribute this software for any 5 * purpose without fee is hereby granted, provided that this entire notice 6 * is included in all copies of any software which is or includes a copy 7 * or modification of this software and in all copies of the supporting 8 * documentation for such software. 9 * THIS SOFTWARE IS BEING PROVIDED "AS IS", WITHOUT ANY EXPRESS OR IMPLIED 10 * WARRANTY. IN PARTICULAR, NEITHER THE AUTHORS NOR LUCENT TECHNOLOGIES MAKE ANY 11 * REPRESENTATION OR WARRANTY OF ANY KIND CONCERNING THE MERCHANTABILITY 12 * OF THIS SOFTWARE OR ITS FITNESS FOR ANY PARTICULAR PURPOSE. 13 * 14 * This file and rune.cc have been converted to compile as C++ code 15 * in name space re2. 16 */ 17 #ifndef RE2_UTIL_UTF_H__ 18 #define RE2_UTIL_UTF_H__ 19 20 #include <stdint.h> 21 22 namespace re2 { 23 24 typedef signed int Rune; /* Code-point values in Unicode 4.0 are 21 bits wide.*/ 25 26 enum 27 { 28 UTFmax = 4, /* maximum bytes per rune */ 29 Runesync = 0x80, /* cannot represent part of a UTF sequence (<) */ 30 Runeself = 0x80, /* rune and UTF sequences are the same (<) */ 31 Runeerror = 0xFFFD, /* decoding error in UTF */ 32 Runemax = 0x10FFFF, /* maximum rune value */ 33 }; 34 35 int runetochar(char* s, const Rune* r); 36 int chartorune(Rune* r, const char* s); 37 int fullrune(const char* s, int n); 38 int utflen(const char* s); 39 char* utfrune(const char*, Rune); 40 41 } // namespace re2 42 43 #endif // RE2_UTIL_UTF_H__ 44