// Copyright 2011 the V8 project authors. All rights reserved.
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions are
// met:
//
//     * Redistributions of source code must retain the above copyright
//       notice, this list of conditions and the following disclaimer.
//     * Redistributions in binary form must reproduce the above
//       copyright notice, this list of conditions and the following
//       disclaimer in the documentation and/or other materials provided
//       with the distribution.
//     * Neither the name of Google Inc. nor the names of its
//       contributors may be used to endorse or promote products derived
//       from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
// A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
// OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
// SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
// LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
// DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
// THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
// (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
// OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.

#ifndef V8_SCANNER_CHARACTER_STREAMS_H_
#define V8_SCANNER_CHARACTER_STREAMS_H_

#include "scanner.h"

namespace v8 {
namespace internal {

// A buffered character stream based on a random access character
// source (ReadBlock can be called with pos_ pointing to any position,
// even positions before the current).
39 class BufferedUtf16CharacterStream: public Utf16CharacterStream { 40 public: 41 BufferedUtf16CharacterStream(); 42 virtual ~BufferedUtf16CharacterStream(); 43 44 virtual void PushBack(uc32 character); 45 46 protected: 47 static const unsigned kBufferSize = 512; 48 static const unsigned kPushBackStepSize = 16; 49 50 virtual unsigned SlowSeekForward(unsigned delta); 51 virtual bool ReadBlock(); 52 virtual void SlowPushBack(uc16 character); 53 54 virtual unsigned BufferSeekForward(unsigned delta) = 0; 55 virtual unsigned FillBuffer(unsigned position, unsigned length) = 0; 56 57 const uc16* pushback_limit_; 58 uc16 buffer_[kBufferSize]; 59 }; 60 61 62 // Generic string stream. 63 class GenericStringUtf16CharacterStream: public BufferedUtf16CharacterStream { 64 public: 65 GenericStringUtf16CharacterStream(Handle<String> data, 66 unsigned start_position, 67 unsigned end_position); 68 virtual ~GenericStringUtf16CharacterStream(); 69 70 protected: 71 virtual unsigned BufferSeekForward(unsigned delta); 72 virtual unsigned FillBuffer(unsigned position, unsigned length); 73 74 Handle<String> string_; 75 unsigned start_position_; 76 unsigned length_; 77 }; 78 79 80 // Utf16 stream based on a literal UTF-8 string. 81 class Utf8ToUtf16CharacterStream: public BufferedUtf16CharacterStream { 82 public: 83 Utf8ToUtf16CharacterStream(const byte* data, unsigned length); 84 virtual ~Utf8ToUtf16CharacterStream(); 85 86 protected: 87 virtual unsigned BufferSeekForward(unsigned delta); 88 virtual unsigned FillBuffer(unsigned char_position, unsigned length); 89 void SetRawPosition(unsigned char_position); 90 91 const byte* raw_data_; 92 unsigned raw_data_length_; // Measured in bytes, not characters. 93 unsigned raw_data_pos_; 94 // The character position of the character at raw_data[raw_data_pos_]. 95 // Not necessarily the same as pos_. 96 unsigned raw_character_position_; 97 }; 98 99 100 // UTF16 buffer to read characters from an external string. 
101 class ExternalTwoByteStringUtf16CharacterStream: public Utf16CharacterStream { 102 public: 103 ExternalTwoByteStringUtf16CharacterStream(Handle<ExternalTwoByteString> data, 104 int start_position, 105 int end_position); 106 virtual ~ExternalTwoByteStringUtf16CharacterStream(); 107 PushBack(uc32 character)108 virtual void PushBack(uc32 character) { 109 ASSERT(buffer_cursor_ > raw_data_); 110 buffer_cursor_--; 111 pos_--; 112 } 113 114 protected: SlowSeekForward(unsigned delta)115 virtual unsigned SlowSeekForward(unsigned delta) { 116 // Fast case always handles seeking. 117 return 0; 118 } ReadBlock()119 virtual bool ReadBlock() { 120 // Entire string is read at start. 121 return false; 122 } 123 Handle<ExternalTwoByteString> source_; 124 const uc16* raw_data_; // Pointer to the actual array of characters. 125 }; 126 127 } } // namespace v8::internal 128 129 #endif // V8_SCANNER_CHARACTER_STREAMS_H_ 130