1 //===- BitstreamReader.cpp - BitstreamReader implementation ---------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9
10 #include "llvm/Bitcode/BitstreamReader.h"
11 #include "llvm/ADT/StringRef.h"
12 #include <cassert>
13 #include <string>
14
15 using namespace llvm;
16
17 //===----------------------------------------------------------------------===//
18 // BitstreamCursor implementation
19 //===----------------------------------------------------------------------===//
20
21 /// EnterSubBlock - Having read the ENTER_SUBBLOCK abbrevid, enter
22 /// the block, and return true if the block has an error.
EnterSubBlock(unsigned BlockID,unsigned * NumWordsP)23 bool BitstreamCursor::EnterSubBlock(unsigned BlockID, unsigned *NumWordsP) {
24 // Save the current block's state on BlockScope.
25 BlockScope.push_back(Block(CurCodeSize));
26 BlockScope.back().PrevAbbrevs.swap(CurAbbrevs);
27
28 // Add the abbrevs specific to this block to the CurAbbrevs list.
29 if (BlockInfo) {
30 if (const BitstreamBlockInfo::BlockInfo *Info =
31 BlockInfo->getBlockInfo(BlockID)) {
32 CurAbbrevs.insert(CurAbbrevs.end(), Info->Abbrevs.begin(),
33 Info->Abbrevs.end());
34 }
35 }
36
37 // Get the codesize of this block.
38 CurCodeSize = ReadVBR(bitc::CodeLenWidth);
39 // We can't read more than MaxChunkSize at a time
40 if (CurCodeSize > MaxChunkSize)
41 return true;
42
43 SkipToFourByteBoundary();
44 unsigned NumWords = Read(bitc::BlockSizeWidth);
45 if (NumWordsP) *NumWordsP = NumWords;
46
47 // Validate that this block is sane.
48 return CurCodeSize == 0 || AtEndOfStream();
49 }
50
readAbbreviatedField(BitstreamCursor & Cursor,const BitCodeAbbrevOp & Op)51 static uint64_t readAbbreviatedField(BitstreamCursor &Cursor,
52 const BitCodeAbbrevOp &Op) {
53 assert(!Op.isLiteral() && "Not to be used with literals!");
54
55 // Decode the value as we are commanded.
56 switch (Op.getEncoding()) {
57 case BitCodeAbbrevOp::Array:
58 case BitCodeAbbrevOp::Blob:
59 llvm_unreachable("Should not reach here");
60 case BitCodeAbbrevOp::Fixed:
61 assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
62 return Cursor.Read((unsigned)Op.getEncodingData());
63 case BitCodeAbbrevOp::VBR:
64 assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
65 return Cursor.ReadVBR64((unsigned)Op.getEncodingData());
66 case BitCodeAbbrevOp::Char6:
67 return BitCodeAbbrevOp::DecodeChar6(Cursor.Read(6));
68 }
69 llvm_unreachable("invalid abbreviation encoding");
70 }
71
skipAbbreviatedField(BitstreamCursor & Cursor,const BitCodeAbbrevOp & Op)72 static void skipAbbreviatedField(BitstreamCursor &Cursor,
73 const BitCodeAbbrevOp &Op) {
74 assert(!Op.isLiteral() && "Not to be used with literals!");
75
76 // Decode the value as we are commanded.
77 switch (Op.getEncoding()) {
78 case BitCodeAbbrevOp::Array:
79 case BitCodeAbbrevOp::Blob:
80 llvm_unreachable("Should not reach here");
81 case BitCodeAbbrevOp::Fixed:
82 assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
83 Cursor.Read((unsigned)Op.getEncodingData());
84 break;
85 case BitCodeAbbrevOp::VBR:
86 assert((unsigned)Op.getEncodingData() <= Cursor.MaxChunkSize);
87 Cursor.ReadVBR64((unsigned)Op.getEncodingData());
88 break;
89 case BitCodeAbbrevOp::Char6:
90 Cursor.Read(6);
91 break;
92 }
93 }
94
95 /// skipRecord - Read the current record and discard it.
skipRecord(unsigned AbbrevID)96 unsigned BitstreamCursor::skipRecord(unsigned AbbrevID) {
97 // Skip unabbreviated records by reading past their entries.
98 if (AbbrevID == bitc::UNABBREV_RECORD) {
99 unsigned Code = ReadVBR(6);
100 unsigned NumElts = ReadVBR(6);
101 for (unsigned i = 0; i != NumElts; ++i)
102 (void)ReadVBR64(6);
103 return Code;
104 }
105
106 const BitCodeAbbrev *Abbv = getAbbrev(AbbrevID);
107 const BitCodeAbbrevOp &CodeOp = Abbv->getOperandInfo(0);
108 unsigned Code;
109 if (CodeOp.isLiteral())
110 Code = CodeOp.getLiteralValue();
111 else {
112 if (CodeOp.getEncoding() == BitCodeAbbrevOp::Array ||
113 CodeOp.getEncoding() == BitCodeAbbrevOp::Blob)
114 report_fatal_error("Abbreviation starts with an Array or a Blob");
115 Code = readAbbreviatedField(*this, CodeOp);
116 }
117
118 for (unsigned i = 1, e = Abbv->getNumOperandInfos(); i < e; ++i) {
119 const BitCodeAbbrevOp &Op = Abbv->getOperandInfo(i);
120 if (Op.isLiteral())
121 continue;
122
123 if (Op.getEncoding() != BitCodeAbbrevOp::Array &&
124 Op.getEncoding() != BitCodeAbbrevOp::Blob) {
125 skipAbbreviatedField(*this, Op);
126 continue;
127 }
128
129 if (Op.getEncoding() == BitCodeAbbrevOp::Array) {
130 // Array case. Read the number of elements as a vbr6.
131 unsigned NumElts = ReadVBR(6);
132
133 // Get the element encoding.
134 assert(i+2 == e && "array op not second to last?");
135 const BitCodeAbbrevOp &EltEnc = Abbv->getOperandInfo(++i);
136
137 // Read all the elements.
138 // Decode the value as we are commanded.
139 switch (EltEnc.getEncoding()) {
140 default:
141 report_fatal_error("Array element type can't be an Array or a Blob");
142 case BitCodeAbbrevOp::Fixed:
143 assert((unsigned)EltEnc.getEncodingData() <= MaxChunkSize);
144 JumpToBit(GetCurrentBitNo() + NumElts * EltEnc.getEncodingData());
145 break;
146 case BitCodeAbbrevOp::VBR:
147 assert((unsigned)EltEnc.getEncodingData() <= MaxChunkSize);
148 for (; NumElts; --NumElts)
149 ReadVBR64((unsigned)EltEnc.getEncodingData());
150 break;
151 case BitCodeAbbrevOp::Char6:
152 JumpToBit(GetCurrentBitNo() + NumElts * 6);
153 break;
154 }
155 continue;
156 }
157
158 assert(Op.getEncoding() == BitCodeAbbrevOp::Blob);
159 // Blob case. Read the number of bytes as a vbr6.
160 unsigned NumElts = ReadVBR(6);
161 SkipToFourByteBoundary(); // 32-bit alignment
162
163 // Figure out where the end of this blob will be including tail padding.
164 size_t NewEnd = GetCurrentBitNo()+((NumElts+3)&~3)*8;
165
166 // If this would read off the end of the bitcode file, just set the
167 // record to empty and return.
168 if (!canSkipToPos(NewEnd/8)) {
169 skipToEnd();
170 break;
171 }
172
173 // Skip over the blob.
174 JumpToBit(NewEnd);
175 }
176 return Code;
177 }
178
readRecord(unsigned AbbrevID,SmallVectorImpl<uint64_t> & Vals,StringRef * Blob)179 unsigned BitstreamCursor::readRecord(unsigned AbbrevID,
180 SmallVectorImpl<uint64_t> &Vals,
181 StringRef *Blob) {
182 if (AbbrevID == bitc::UNABBREV_RECORD) {
183 unsigned Code = ReadVBR(6);
184 unsigned NumElts = ReadVBR(6);
185 for (unsigned i = 0; i != NumElts; ++i)
186 Vals.push_back(ReadVBR64(6));
187 return Code;
188 }
189
190 const BitCodeAbbrev *Abbv = getAbbrev(AbbrevID);
191
192 // Read the record code first.
193 assert(Abbv->getNumOperandInfos() != 0 && "no record code in abbreviation?");
194 const BitCodeAbbrevOp &CodeOp = Abbv->getOperandInfo(0);
195 unsigned Code;
196 if (CodeOp.isLiteral())
197 Code = CodeOp.getLiteralValue();
198 else {
199 if (CodeOp.getEncoding() == BitCodeAbbrevOp::Array ||
200 CodeOp.getEncoding() == BitCodeAbbrevOp::Blob)
201 report_fatal_error("Abbreviation starts with an Array or a Blob");
202 Code = readAbbreviatedField(*this, CodeOp);
203 }
204
205 for (unsigned i = 1, e = Abbv->getNumOperandInfos(); i != e; ++i) {
206 const BitCodeAbbrevOp &Op = Abbv->getOperandInfo(i);
207 if (Op.isLiteral()) {
208 Vals.push_back(Op.getLiteralValue());
209 continue;
210 }
211
212 if (Op.getEncoding() != BitCodeAbbrevOp::Array &&
213 Op.getEncoding() != BitCodeAbbrevOp::Blob) {
214 Vals.push_back(readAbbreviatedField(*this, Op));
215 continue;
216 }
217
218 if (Op.getEncoding() == BitCodeAbbrevOp::Array) {
219 // Array case. Read the number of elements as a vbr6.
220 unsigned NumElts = ReadVBR(6);
221
222 // Get the element encoding.
223 if (i + 2 != e)
224 report_fatal_error("Array op not second to last");
225 const BitCodeAbbrevOp &EltEnc = Abbv->getOperandInfo(++i);
226 if (!EltEnc.isEncoding())
227 report_fatal_error(
228 "Array element type has to be an encoding of a type");
229
230 // Read all the elements.
231 switch (EltEnc.getEncoding()) {
232 default:
233 report_fatal_error("Array element type can't be an Array or a Blob");
234 case BitCodeAbbrevOp::Fixed:
235 for (; NumElts; --NumElts)
236 Vals.push_back(Read((unsigned)EltEnc.getEncodingData()));
237 break;
238 case BitCodeAbbrevOp::VBR:
239 for (; NumElts; --NumElts)
240 Vals.push_back(ReadVBR64((unsigned)EltEnc.getEncodingData()));
241 break;
242 case BitCodeAbbrevOp::Char6:
243 for (; NumElts; --NumElts)
244 Vals.push_back(BitCodeAbbrevOp::DecodeChar6(Read(6)));
245 }
246 continue;
247 }
248
249 assert(Op.getEncoding() == BitCodeAbbrevOp::Blob);
250 // Blob case. Read the number of bytes as a vbr6.
251 unsigned NumElts = ReadVBR(6);
252 SkipToFourByteBoundary(); // 32-bit alignment
253
254 // Figure out where the end of this blob will be including tail padding.
255 size_t CurBitPos = GetCurrentBitNo();
256 size_t NewEnd = CurBitPos+((NumElts+3)&~3)*8;
257
258 // If this would read off the end of the bitcode file, just set the
259 // record to empty and return.
260 if (!canSkipToPos(NewEnd/8)) {
261 Vals.append(NumElts, 0);
262 skipToEnd();
263 break;
264 }
265
266 // Otherwise, inform the streamer that we need these bytes in memory. Skip
267 // over tail padding first, in case jumping to NewEnd invalidates the Blob
268 // pointer.
269 JumpToBit(NewEnd);
270 const char *Ptr = (const char *)getPointerToBit(CurBitPos, NumElts);
271
272 // If we can return a reference to the data, do so to avoid copying it.
273 if (Blob) {
274 *Blob = StringRef(Ptr, NumElts);
275 } else {
276 // Otherwise, unpack into Vals with zero extension.
277 for (; NumElts; --NumElts)
278 Vals.push_back((unsigned char)*Ptr++);
279 }
280 }
281
282 return Code;
283 }
284
ReadAbbrevRecord()285 void BitstreamCursor::ReadAbbrevRecord() {
286 auto Abbv = std::make_shared<BitCodeAbbrev>();
287 unsigned NumOpInfo = ReadVBR(5);
288 for (unsigned i = 0; i != NumOpInfo; ++i) {
289 bool IsLiteral = Read(1);
290 if (IsLiteral) {
291 Abbv->Add(BitCodeAbbrevOp(ReadVBR64(8)));
292 continue;
293 }
294
295 BitCodeAbbrevOp::Encoding E = (BitCodeAbbrevOp::Encoding)Read(3);
296 if (BitCodeAbbrevOp::hasEncodingData(E)) {
297 uint64_t Data = ReadVBR64(5);
298
299 // As a special case, handle fixed(0) (i.e., a fixed field with zero bits)
300 // and vbr(0) as a literal zero. This is decoded the same way, and avoids
301 // a slow path in Read() to have to handle reading zero bits.
302 if ((E == BitCodeAbbrevOp::Fixed || E == BitCodeAbbrevOp::VBR) &&
303 Data == 0) {
304 Abbv->Add(BitCodeAbbrevOp(0));
305 continue;
306 }
307
308 if ((E == BitCodeAbbrevOp::Fixed || E == BitCodeAbbrevOp::VBR) &&
309 Data > MaxChunkSize)
310 report_fatal_error(
311 "Fixed or VBR abbrev record with size > MaxChunkData");
312
313 Abbv->Add(BitCodeAbbrevOp(E, Data));
314 } else
315 Abbv->Add(BitCodeAbbrevOp(E));
316 }
317
318 if (Abbv->getNumOperandInfos() == 0)
319 report_fatal_error("Abbrev record with no operands");
320 CurAbbrevs.push_back(std::move(Abbv));
321 }
322
323 Optional<BitstreamBlockInfo>
ReadBlockInfoBlock(bool ReadBlockInfoNames)324 BitstreamCursor::ReadBlockInfoBlock(bool ReadBlockInfoNames) {
325 if (EnterSubBlock(bitc::BLOCKINFO_BLOCK_ID)) return None;
326
327 BitstreamBlockInfo NewBlockInfo;
328
329 SmallVector<uint64_t, 64> Record;
330 BitstreamBlockInfo::BlockInfo *CurBlockInfo = nullptr;
331
332 // Read all the records for this module.
333 while (true) {
334 BitstreamEntry Entry = advanceSkippingSubblocks(AF_DontAutoprocessAbbrevs);
335
336 switch (Entry.Kind) {
337 case llvm::BitstreamEntry::SubBlock: // Handled for us already.
338 case llvm::BitstreamEntry::Error:
339 return None;
340 case llvm::BitstreamEntry::EndBlock:
341 return std::move(NewBlockInfo);
342 case llvm::BitstreamEntry::Record:
343 // The interesting case.
344 break;
345 }
346
347 // Read abbrev records, associate them with CurBID.
348 if (Entry.ID == bitc::DEFINE_ABBREV) {
349 if (!CurBlockInfo) return None;
350 ReadAbbrevRecord();
351
352 // ReadAbbrevRecord installs the abbrev in CurAbbrevs. Move it to the
353 // appropriate BlockInfo.
354 CurBlockInfo->Abbrevs.push_back(std::move(CurAbbrevs.back()));
355 CurAbbrevs.pop_back();
356 continue;
357 }
358
359 // Read a record.
360 Record.clear();
361 switch (readRecord(Entry.ID, Record)) {
362 default: break; // Default behavior, ignore unknown content.
363 case bitc::BLOCKINFO_CODE_SETBID:
364 if (Record.size() < 1) return None;
365 CurBlockInfo = &NewBlockInfo.getOrCreateBlockInfo((unsigned)Record[0]);
366 break;
367 case bitc::BLOCKINFO_CODE_BLOCKNAME: {
368 if (!CurBlockInfo) return None;
369 if (!ReadBlockInfoNames)
370 break; // Ignore name.
371 std::string Name;
372 for (unsigned i = 0, e = Record.size(); i != e; ++i)
373 Name += (char)Record[i];
374 CurBlockInfo->Name = Name;
375 break;
376 }
377 case bitc::BLOCKINFO_CODE_SETRECORDNAME: {
378 if (!CurBlockInfo) return None;
379 if (!ReadBlockInfoNames)
380 break; // Ignore name.
381 std::string Name;
382 for (unsigned i = 1, e = Record.size(); i != e; ++i)
383 Name += (char)Record[i];
384 CurBlockInfo->RecordNames.push_back(std::make_pair((unsigned)Record[0],
385 Name));
386 break;
387 }
388 }
389 }
390 }
391