1 //===-- EDToken.cpp - LLVM Enhanced Disassembler --------------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements the Enhanced Disassembler library's token class. The
11 // token is responsible for vending information about the token, such as its
12 // type and logical value.
13 //
14 //===----------------------------------------------------------------------===//
15
16 #include "EDToken.h"
17 #include "EDDisassembler.h"
18 #include "llvm/MC/MCParser/MCAsmLexer.h"
19 #include "llvm/MC/MCParser/MCParsedAsmOperand.h"
20 #include "llvm/ADT/SmallVector.h"
21 using namespace llvm;
22
EDToken(StringRef str,enum tokenType type,uint64_t localType,EDDisassembler & disassembler)23 EDToken::EDToken(StringRef str,
24 enum tokenType type,
25 uint64_t localType,
26 EDDisassembler &disassembler) :
27 Disassembler(disassembler),
28 Str(str),
29 Type(type),
30 LocalType(localType),
31 OperandID(-1) {
32 }
33
~EDToken()34 EDToken::~EDToken() {
35 }
36
makeLiteral(bool sign,uint64_t absoluteValue)37 void EDToken::makeLiteral(bool sign, uint64_t absoluteValue) {
38 Type = kTokenLiteral;
39 LiteralSign = sign;
40 LiteralAbsoluteValue = absoluteValue;
41 }
42
makeRegister(unsigned registerID)43 void EDToken::makeRegister(unsigned registerID) {
44 Type = kTokenRegister;
45 RegisterID = registerID;
46 }
47
setOperandID(int operandID)48 void EDToken::setOperandID(int operandID) {
49 OperandID = operandID;
50 }
51
type() const52 enum EDToken::tokenType EDToken::type() const {
53 return Type;
54 }
55
localType() const56 uint64_t EDToken::localType() const {
57 return LocalType;
58 }
59
string() const60 StringRef EDToken::string() const {
61 return Str;
62 }
63
operandID() const64 int EDToken::operandID() const {
65 return OperandID;
66 }
67
literalSign() const68 int EDToken::literalSign() const {
69 if (Type != kTokenLiteral)
70 return -1;
71 return (LiteralSign ? 1 : 0);
72 }
73
literalAbsoluteValue(uint64_t & value) const74 int EDToken::literalAbsoluteValue(uint64_t &value) const {
75 if (Type != kTokenLiteral)
76 return -1;
77 value = LiteralAbsoluteValue;
78 return 0;
79 }
80
registerID(unsigned & registerID) const81 int EDToken::registerID(unsigned ®isterID) const {
82 if (Type != kTokenRegister)
83 return -1;
84 registerID = RegisterID;
85 return 0;
86 }
87
tokenize(std::vector<EDToken * > & tokens,std::string & str,const signed char * operandOrder,EDDisassembler & disassembler)88 int EDToken::tokenize(std::vector<EDToken*> &tokens,
89 std::string &str,
90 const signed char *operandOrder,
91 EDDisassembler &disassembler) {
92 SmallVector<MCParsedAsmOperand*, 5> parsedOperands;
93 SmallVector<AsmToken, 10> asmTokens;
94
95 if (disassembler.parseInst(parsedOperands, asmTokens, str))
96 {
97 for (unsigned i = 0, e = parsedOperands.size(); i != e; ++i)
98 delete parsedOperands[i];
99 return -1;
100 }
101
102 SmallVectorImpl<MCParsedAsmOperand*>::iterator operandIterator;
103 unsigned int operandIndex;
104 SmallVectorImpl<AsmToken>::iterator tokenIterator;
105
106 operandIterator = parsedOperands.begin();
107 operandIndex = 0;
108
109 bool readOpcode = false;
110
111 const char *wsPointer = asmTokens.begin()->getLoc().getPointer();
112
113 for (tokenIterator = asmTokens.begin();
114 tokenIterator != asmTokens.end();
115 ++tokenIterator) {
116 SMLoc tokenLoc = tokenIterator->getLoc();
117
118 const char *tokenPointer = tokenLoc.getPointer();
119
120 if (tokenPointer > wsPointer) {
121 unsigned long wsLength = tokenPointer - wsPointer;
122
123 EDToken *whitespaceToken = new EDToken(StringRef(wsPointer, wsLength),
124 EDToken::kTokenWhitespace,
125 0,
126 disassembler);
127
128 tokens.push_back(whitespaceToken);
129 }
130
131 wsPointer = tokenPointer + tokenIterator->getString().size();
132
133 while (operandIterator != parsedOperands.end() &&
134 tokenLoc.getPointer() >
135 (*operandIterator)->getEndLoc().getPointer()) {
136 ++operandIterator;
137 ++operandIndex;
138 }
139
140 EDToken *token;
141
142 switch (tokenIterator->getKind()) {
143 case AsmToken::Identifier:
144 if (!readOpcode) {
145 token = new EDToken(tokenIterator->getString(),
146 EDToken::kTokenOpcode,
147 (uint64_t)tokenIterator->getKind(),
148 disassembler);
149 readOpcode = true;
150 break;
151 }
152 // any identifier that isn't an opcode is mere punctuation; so we fall
153 // through
154 default:
155 token = new EDToken(tokenIterator->getString(),
156 EDToken::kTokenPunctuation,
157 (uint64_t)tokenIterator->getKind(),
158 disassembler);
159 break;
160 case AsmToken::Integer:
161 {
162 token = new EDToken(tokenIterator->getString(),
163 EDToken::kTokenLiteral,
164 (uint64_t)tokenIterator->getKind(),
165 disassembler);
166
167 int64_t intVal = tokenIterator->getIntVal();
168
169 if (intVal < 0)
170 token->makeLiteral(true, -intVal);
171 else
172 token->makeLiteral(false, intVal);
173 break;
174 }
175 case AsmToken::Register:
176 {
177 token = new EDToken(tokenIterator->getString(),
178 EDToken::kTokenLiteral,
179 (uint64_t)tokenIterator->getKind(),
180 disassembler);
181
182 token->makeRegister((unsigned)tokenIterator->getRegVal());
183 break;
184 }
185 }
186
187 if (operandIterator != parsedOperands.end() &&
188 tokenLoc.getPointer() >=
189 (*operandIterator)->getStartLoc().getPointer()) {
190 /// operandIndex == 0 means the operand is the instruction (which the
191 /// AsmParser treats as an operand but edis does not). We therefore skip
192 /// operandIndex == 0 and subtract 1 from all other operand indices.
193
194 if (operandIndex > 0)
195 token->setOperandID(operandOrder[operandIndex - 1]);
196 }
197
198 tokens.push_back(token);
199 }
200
201 // Free any parsed operands.
202 for (unsigned i = 0, e = parsedOperands.size(); i != e; ++i)
203 delete parsedOperands[i];
204
205 return 0;
206 }
207
getString(const char * & buf)208 int EDToken::getString(const char*& buf) {
209 if (PermStr.length() == 0) {
210 PermStr = Str.str();
211 }
212 buf = PermStr.c_str();
213 return 0;
214 }
215