1 /* 2 * The authors of this software are Rob Pike and Ken Thompson. 3 * Copyright (c) 2002 by Lucent Technologies. 4 * Permission to use, copy, modify, and distribute this software for any 5 * purpose without fee is hereby granted, provided that this entire notice 6 * is included in all copies of any software which is or includes a copy 7 * or modification of this software and in all copies of the supporting 8 * documentation for such software. 9 * THIS SOFTWARE IS BEING PROVIDED "AS IS", WITHOUT ANY EXPRESS OR IMPLIED 10 * WARRANTY. IN PARTICULAR, NEITHER THE AUTHORS NOR LUCENT TECHNOLOGIES MAKE ANY 11 * REPRESENTATION OR WARRANTY OF ANY KIND CONCERNING THE MERCHANTABILITY 12 * OF THIS SOFTWARE OR ITS FITNESS FOR ANY PARTICULAR PURPOSE. 13 * 14 * This file and rune.cc have been converted to compile as C++ code 15 * in name space re2. 16 */ 17 18 #ifndef UTIL_UTF_H_ 19 #define UTIL_UTF_H_ 20 21 #include <stdint.h> 22 23 namespace re2 { 24 25 typedef signed int Rune; /* Code-point values in Unicode 4.0 are 21 bits wide.*/ 26 27 enum 28 { 29 UTFmax = 4, /* maximum bytes per rune */ 30 Runesync = 0x80, /* cannot represent part of a UTF sequence (<) */ 31 Runeself = 0x80, /* rune and UTF sequences are the same (<) */ 32 Runeerror = 0xFFFD, /* decoding error in UTF */ 33 Runemax = 0x10FFFF, /* maximum rune value */ 34 }; 35 36 int runetochar(char* s, const Rune* r); 37 int chartorune(Rune* r, const char* s); 38 int fullrune(const char* s, int n); 39 int utflen(const char* s); 40 char* utfrune(const char*, Rune); 41 42 } // namespace re2 43 44 #endif // UTIL_UTF_H_ 45