1 // Copyright (c) 1994-2006 Sun Microsystems Inc.
2 // All Rights Reserved.
3 //
4 // Redistribution and use in source and binary forms, with or without
5 // modification, are permitted provided that the following conditions are
6 // met:
7 //
8 // - Redistributions of source code must retain the above copyright notice,
9 // this list of conditions and the following disclaimer.
10 //
11 // - Redistribution in binary form must reproduce the above copyright
12 // notice, this list of conditions and the following disclaimer in the
13 // documentation and/or other materials provided with the distribution.
14 //
15 // - Neither the name of Sun Microsystems or the names of contributors may
16 // be used to endorse or promote products derived from this software without
17 // specific prior written permission.
18 //
19 // THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS
20 // IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO,
21 // THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
22 // PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
23 // CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
24 // EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
25 // PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
26 // PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
27 // LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
28 // NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
29 // SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
30
31 // The original source code covered by the above license above has been
32 // modified significantly by Google Inc.
33 // Copyright 2012 the V8 project authors. All rights reserved.
34
35 // A lightweight X64 Assembler.
36
37 #ifndef V8_X64_ASSEMBLER_X64_H_
38 #define V8_X64_ASSEMBLER_X64_H_
39
40 #include "serialize.h"
41
42 namespace v8 {
43 namespace internal {
44
45 // Utility functions
46
47 // Test whether a 64-bit value is in a specific range.
is_uint32(int64_t x)48 inline bool is_uint32(int64_t x) {
49 static const uint64_t kMaxUInt32 = V8_UINT64_C(0xffffffff);
50 return static_cast<uint64_t>(x) <= kMaxUInt32;
51 }
52
is_int32(int64_t x)53 inline bool is_int32(int64_t x) {
54 static const int64_t kMinInt32 = -V8_INT64_C(0x80000000);
55 return is_uint32(x - kMinInt32);
56 }
57
uint_is_int32(uint64_t x)58 inline bool uint_is_int32(uint64_t x) {
59 static const uint64_t kMaxInt32 = V8_UINT64_C(0x7fffffff);
60 return x <= kMaxInt32;
61 }
62
is_uint32(uint64_t x)63 inline bool is_uint32(uint64_t x) {
64 static const uint64_t kMaxUInt32 = V8_UINT64_C(0xffffffff);
65 return x <= kMaxUInt32;
66 }
67
68 // CPU Registers.
69 //
70 // 1) We would prefer to use an enum, but enum values are assignment-
71 // compatible with int, which has caused code-generation bugs.
72 //
73 // 2) We would prefer to use a class instead of a struct but we don't like
74 // the register initialization to depend on the particular initialization
75 // order (which appears to be different on OS X, Linux, and Windows for the
76 // installed versions of C++ we tried). Using a struct permits C-style
77 // "initialization". Also, the Register objects cannot be const as this
78 // forces initialization stubs in MSVC, making us dependent on initialization
79 // order.
80 //
81 // 3) By not using an enum, we are possibly preventing the compiler from
82 // doing certain constant folds, which may significantly reduce the
83 // code generated for some assembly instructions (because they boil down
84 // to a few constants). If this is a problem, we could change the code
85 // such that we use an enum in optimized mode, and the struct in debug
86 // mode. This way we get the compile-time error checking in debug mode
87 // and best performance in optimized code.
88 //
89
90 struct Register {
91 // The non-allocatable registers are:
92 // rsp - stack pointer
93 // rbp - frame pointer
94 // rsi - context register
95 // r10 - fixed scratch register
96 // r12 - smi constant register
97 // r13 - root register
98 static const int kNumRegisters = 16;
99 static const int kNumAllocatableRegisters = 10;
100
ToAllocationIndexRegister101 static int ToAllocationIndex(Register reg) {
102 return kAllocationIndexByRegisterCode[reg.code()];
103 }
104
FromAllocationIndexRegister105 static Register FromAllocationIndex(int index) {
106 ASSERT(index >= 0 && index < kNumAllocatableRegisters);
107 Register result = { kRegisterCodeByAllocationIndex[index] };
108 return result;
109 }
110
AllocationIndexToStringRegister111 static const char* AllocationIndexToString(int index) {
112 ASSERT(index >= 0 && index < kNumAllocatableRegisters);
113 const char* const names[] = {
114 "rax",
115 "rbx",
116 "rdx",
117 "rcx",
118 "rdi",
119 "r8",
120 "r9",
121 "r11",
122 "r14",
123 "r15"
124 };
125 return names[index];
126 }
127
from_codeRegister128 static Register from_code(int code) {
129 Register r = { code };
130 return r;
131 }
is_validRegister132 bool is_valid() const { return 0 <= code_ && code_ < kNumRegisters; }
isRegister133 bool is(Register reg) const { return code_ == reg.code_; }
134 // rax, rbx, rcx and rdx are byte registers, the rest are not.
is_byte_registerRegister135 bool is_byte_register() const { return code_ <= 3; }
codeRegister136 int code() const {
137 ASSERT(is_valid());
138 return code_;
139 }
bitRegister140 int bit() const {
141 return 1 << code_;
142 }
143
144 // Return the high bit of the register code as a 0 or 1. Used often
145 // when constructing the REX prefix byte.
high_bitRegister146 int high_bit() const {
147 return code_ >> 3;
148 }
149 // Return the 3 low bits of the register code. Used when encoding registers
150 // in modR/M, SIB, and opcode bytes.
low_bitsRegister151 int low_bits() const {
152 return code_ & 0x7;
153 }
154
155 // Unfortunately we can't make this private in a struct when initializing
156 // by assignment.
157 int code_;
158
159 private:
160 static const int kRegisterCodeByAllocationIndex[kNumAllocatableRegisters];
161 static const int kAllocationIndexByRegisterCode[kNumRegisters];
162 };
163
164 const int kRegister_rax_Code = 0;
165 const int kRegister_rcx_Code = 1;
166 const int kRegister_rdx_Code = 2;
167 const int kRegister_rbx_Code = 3;
168 const int kRegister_rsp_Code = 4;
169 const int kRegister_rbp_Code = 5;
170 const int kRegister_rsi_Code = 6;
171 const int kRegister_rdi_Code = 7;
172 const int kRegister_r8_Code = 8;
173 const int kRegister_r9_Code = 9;
174 const int kRegister_r10_Code = 10;
175 const int kRegister_r11_Code = 11;
176 const int kRegister_r12_Code = 12;
177 const int kRegister_r13_Code = 13;
178 const int kRegister_r14_Code = 14;
179 const int kRegister_r15_Code = 15;
180 const int kRegister_no_reg_Code = -1;
181
182 const Register rax = { kRegister_rax_Code };
183 const Register rcx = { kRegister_rcx_Code };
184 const Register rdx = { kRegister_rdx_Code };
185 const Register rbx = { kRegister_rbx_Code };
186 const Register rsp = { kRegister_rsp_Code };
187 const Register rbp = { kRegister_rbp_Code };
188 const Register rsi = { kRegister_rsi_Code };
189 const Register rdi = { kRegister_rdi_Code };
190 const Register r8 = { kRegister_r8_Code };
191 const Register r9 = { kRegister_r9_Code };
192 const Register r10 = { kRegister_r10_Code };
193 const Register r11 = { kRegister_r11_Code };
194 const Register r12 = { kRegister_r12_Code };
195 const Register r13 = { kRegister_r13_Code };
196 const Register r14 = { kRegister_r14_Code };
197 const Register r15 = { kRegister_r15_Code };
198 const Register no_reg = { kRegister_no_reg_Code };
199
200
201 struct XMMRegister {
202 static const int kNumRegisters = 16;
203 static const int kNumAllocatableRegisters = 15;
204
ToAllocationIndexXMMRegister205 static int ToAllocationIndex(XMMRegister reg) {
206 ASSERT(reg.code() != 0);
207 return reg.code() - 1;
208 }
209
FromAllocationIndexXMMRegister210 static XMMRegister FromAllocationIndex(int index) {
211 ASSERT(0 <= index && index < kNumAllocatableRegisters);
212 XMMRegister result = { index + 1 };
213 return result;
214 }
215
AllocationIndexToStringXMMRegister216 static const char* AllocationIndexToString(int index) {
217 ASSERT(index >= 0 && index < kNumAllocatableRegisters);
218 const char* const names[] = {
219 "xmm1",
220 "xmm2",
221 "xmm3",
222 "xmm4",
223 "xmm5",
224 "xmm6",
225 "xmm7",
226 "xmm8",
227 "xmm9",
228 "xmm10",
229 "xmm11",
230 "xmm12",
231 "xmm13",
232 "xmm14",
233 "xmm15"
234 };
235 return names[index];
236 }
237
from_codeXMMRegister238 static XMMRegister from_code(int code) {
239 ASSERT(code >= 0);
240 ASSERT(code < kNumRegisters);
241 XMMRegister r = { code };
242 return r;
243 }
is_validXMMRegister244 bool is_valid() const { return 0 <= code_ && code_ < kNumRegisters; }
isXMMRegister245 bool is(XMMRegister reg) const { return code_ == reg.code_; }
codeXMMRegister246 int code() const {
247 ASSERT(is_valid());
248 return code_;
249 }
250
251 // Return the high bit of the register code as a 0 or 1. Used often
252 // when constructing the REX prefix byte.
high_bitXMMRegister253 int high_bit() const {
254 return code_ >> 3;
255 }
256 // Return the 3 low bits of the register code. Used when encoding registers
257 // in modR/M, SIB, and opcode bytes.
low_bitsXMMRegister258 int low_bits() const {
259 return code_ & 0x7;
260 }
261
262 int code_;
263 };
264
265 const XMMRegister xmm0 = { 0 };
266 const XMMRegister xmm1 = { 1 };
267 const XMMRegister xmm2 = { 2 };
268 const XMMRegister xmm3 = { 3 };
269 const XMMRegister xmm4 = { 4 };
270 const XMMRegister xmm5 = { 5 };
271 const XMMRegister xmm6 = { 6 };
272 const XMMRegister xmm7 = { 7 };
273 const XMMRegister xmm8 = { 8 };
274 const XMMRegister xmm9 = { 9 };
275 const XMMRegister xmm10 = { 10 };
276 const XMMRegister xmm11 = { 11 };
277 const XMMRegister xmm12 = { 12 };
278 const XMMRegister xmm13 = { 13 };
279 const XMMRegister xmm14 = { 14 };
280 const XMMRegister xmm15 = { 15 };
281
282
283 typedef XMMRegister DoubleRegister;
284
285
286 enum Condition {
287 // any value < 0 is considered no_condition
288 no_condition = -1,
289
290 overflow = 0,
291 no_overflow = 1,
292 below = 2,
293 above_equal = 3,
294 equal = 4,
295 not_equal = 5,
296 below_equal = 6,
297 above = 7,
298 negative = 8,
299 positive = 9,
300 parity_even = 10,
301 parity_odd = 11,
302 less = 12,
303 greater_equal = 13,
304 less_equal = 14,
305 greater = 15,
306
307 // Fake conditions that are handled by the
308 // opcodes using them.
309 always = 16,
310 never = 17,
311 // aliases
312 carry = below,
313 not_carry = above_equal,
314 zero = equal,
315 not_zero = not_equal,
316 sign = negative,
317 not_sign = positive,
318 last_condition = greater
319 };
320
321
322 // Returns the equivalent of !cc.
323 // Negation of the default no_condition (-1) results in a non-default
324 // no_condition value (-2). As long as tests for no_condition check
325 // for condition < 0, this will work as expected.
NegateCondition(Condition cc)326 inline Condition NegateCondition(Condition cc) {
327 return static_cast<Condition>(cc ^ 1);
328 }
329
330
331 // Corresponds to transposing the operands of a comparison.
ReverseCondition(Condition cc)332 inline Condition ReverseCondition(Condition cc) {
333 switch (cc) {
334 case below:
335 return above;
336 case above:
337 return below;
338 case above_equal:
339 return below_equal;
340 case below_equal:
341 return above_equal;
342 case less:
343 return greater;
344 case greater:
345 return less;
346 case greater_equal:
347 return less_equal;
348 case less_equal:
349 return greater_equal;
350 default:
351 return cc;
352 };
353 }
354
355
356 // -----------------------------------------------------------------------------
357 // Machine instruction Immediates
358
359 class Immediate BASE_EMBEDDED {
360 public:
Immediate(int32_t value)361 explicit Immediate(int32_t value) : value_(value) {}
362
363 private:
364 int32_t value_;
365
366 friend class Assembler;
367 };
368
369
370 // -----------------------------------------------------------------------------
371 // Machine instruction Operands
372
373 enum ScaleFactor {
374 times_1 = 0,
375 times_2 = 1,
376 times_4 = 2,
377 times_8 = 3,
378 times_int_size = times_4,
379 times_pointer_size = times_8
380 };
381
382
383 class Operand BASE_EMBEDDED {
384 public:
385 // [base + disp/r]
386 Operand(Register base, int32_t disp);
387
388 // [base + index*scale + disp/r]
389 Operand(Register base,
390 Register index,
391 ScaleFactor scale,
392 int32_t disp);
393
394 // [index*scale + disp/r]
395 Operand(Register index,
396 ScaleFactor scale,
397 int32_t disp);
398
399 // Offset from existing memory operand.
400 // Offset is added to existing displacement as 32-bit signed values and
401 // this must not overflow.
402 Operand(const Operand& base, int32_t offset);
403
404 // Checks whether either base or index register is the given register.
405 // Does not check the "reg" part of the Operand.
406 bool AddressUsesRegister(Register reg) const;
407
408 // Queries related to the size of the generated instruction.
409 // Whether the generated instruction will have a REX prefix.
requires_rex()410 bool requires_rex() const { return rex_ != 0; }
411 // Size of the ModR/M, SIB and displacement parts of the generated
412 // instruction.
operand_size()413 int operand_size() const { return len_; }
414
415 private:
416 byte rex_;
417 byte buf_[6];
418 // The number of bytes of buf_ in use.
419 byte len_;
420
421 // Set the ModR/M byte without an encoded 'reg' register. The
422 // register is encoded later as part of the emit_operand operation.
423 // set_modrm can be called before or after set_sib and set_disp*.
424 inline void set_modrm(int mod, Register rm);
425
426 // Set the SIB byte if one is needed. Sets the length to 2 rather than 1.
427 inline void set_sib(ScaleFactor scale, Register index, Register base);
428
429 // Adds operand displacement fields (offsets added to the memory address).
430 // Needs to be called after set_sib, not before it.
431 inline void set_disp8(int disp);
432 inline void set_disp32(int disp);
433
434 friend class Assembler;
435 };
436
437
438 // CpuFeatures keeps track of which features are supported by the target CPU.
439 // Supported features must be enabled by a Scope before use.
440 // Example:
441 // if (CpuFeatures::IsSupported(SSE3)) {
442 // CpuFeatures::Scope fscope(SSE3);
443 // // Generate SSE3 floating point code.
444 // } else {
445 // // Generate standard x87 or SSE2 floating point code.
446 // }
447 class CpuFeatures : public AllStatic {
448 public:
449 // Detect features of the target CPU. Set safe defaults if the serializer
450 // is enabled (snapshots must be portable).
451 static void Probe();
452
453 // Check whether a feature is supported by the target CPU.
IsSupported(CpuFeature f)454 static bool IsSupported(CpuFeature f) {
455 ASSERT(initialized_);
456 if (f == SSE2 && !FLAG_enable_sse2) return false;
457 if (f == SSE3 && !FLAG_enable_sse3) return false;
458 if (f == CMOV && !FLAG_enable_cmov) return false;
459 if (f == RDTSC && !FLAG_enable_rdtsc) return false;
460 if (f == SAHF && !FLAG_enable_sahf) return false;
461 return (supported_ & (V8_UINT64_C(1) << f)) != 0;
462 }
463
464 #ifdef DEBUG
465 // Check whether a feature is currently enabled.
IsEnabled(CpuFeature f)466 static bool IsEnabled(CpuFeature f) {
467 ASSERT(initialized_);
468 Isolate* isolate = Isolate::UncheckedCurrent();
469 if (isolate == NULL) {
470 // When no isolate is available, work as if we're running in
471 // release mode.
472 return IsSupported(f);
473 }
474 uint64_t enabled = isolate->enabled_cpu_features();
475 return (enabled & (V8_UINT64_C(1) << f)) != 0;
476 }
477 #endif
478
479 // Enable a specified feature within a scope.
480 class Scope BASE_EMBEDDED {
481 #ifdef DEBUG
482
483 public:
Scope(CpuFeature f)484 explicit Scope(CpuFeature f) {
485 uint64_t mask = V8_UINT64_C(1) << f;
486 ASSERT(CpuFeatures::IsSupported(f));
487 ASSERT(!Serializer::enabled() ||
488 (CpuFeatures::found_by_runtime_probing_ & mask) == 0);
489 isolate_ = Isolate::UncheckedCurrent();
490 old_enabled_ = 0;
491 if (isolate_ != NULL) {
492 old_enabled_ = isolate_->enabled_cpu_features();
493 isolate_->set_enabled_cpu_features(old_enabled_ | mask);
494 }
495 }
~Scope()496 ~Scope() {
497 ASSERT_EQ(Isolate::UncheckedCurrent(), isolate_);
498 if (isolate_ != NULL) {
499 isolate_->set_enabled_cpu_features(old_enabled_);
500 }
501 }
502
503 private:
504 Isolate* isolate_;
505 uint64_t old_enabled_;
506 #else
507
508 public:
509 explicit Scope(CpuFeature f) {}
510 #endif
511 };
512
513 private:
514 // Safe defaults include SSE2 and CMOV for X64. It is always available, if
515 // anyone checks, but they shouldn't need to check.
516 // The required user mode extensions in X64 are (from AMD64 ABI Table A.1):
517 // fpu, tsc, cx8, cmov, mmx, sse, sse2, fxsr, syscall
518 static const uint64_t kDefaultCpuFeatures = (1 << SSE2 | 1 << CMOV);
519
520 #ifdef DEBUG
521 static bool initialized_;
522 #endif
523 static uint64_t supported_;
524 static uint64_t found_by_runtime_probing_;
525
526 DISALLOW_COPY_AND_ASSIGN(CpuFeatures);
527 };
528
529
530 class Assembler : public AssemblerBase {
531 private:
532 // We check before assembling an instruction that there is sufficient
533 // space to write an instruction and its relocation information.
534 // The relocation writer's position must be kGap bytes above the end of
535 // the generated instructions. This leaves enough space for the
536 // longest possible x64 instruction, 15 bytes, and the longest possible
537 // relocation information encoding, RelocInfoWriter::kMaxLength == 16.
538 // (There is a 15 byte limit on x64 instruction length that rules out some
539 // otherwise valid instructions.)
540 // This allows for a single, fast space check per instruction.
541 static const int kGap = 32;
542
543 public:
544 // Create an assembler. Instructions and relocation information are emitted
545 // into a buffer, with the instructions starting from the beginning and the
546 // relocation information starting from the end of the buffer. See CodeDesc
547 // for a detailed comment on the layout (globals.h).
548 //
549 // If the provided buffer is NULL, the assembler allocates and grows its own
550 // buffer, and buffer_size determines the initial buffer size. The buffer is
551 // owned by the assembler and deallocated upon destruction of the assembler.
552 //
553 // If the provided buffer is not NULL, the assembler uses the provided buffer
554 // for code generation and assumes its size to be buffer_size. If the buffer
555 // is too small, a fatal error occurs. No deallocation of the buffer is done
556 // upon destruction of the assembler.
557 Assembler(Isolate* isolate, void* buffer, int buffer_size);
558 ~Assembler();
559
560 // Overrides the default provided by FLAG_debug_code.
set_emit_debug_code(bool value)561 void set_emit_debug_code(bool value) { emit_debug_code_ = value; }
562
563 // GetCode emits any pending (non-emitted) code and fills the descriptor
564 // desc. GetCode() is idempotent; it returns the same result if no other
565 // Assembler functions are invoked in between GetCode() calls.
566 void GetCode(CodeDesc* desc);
567
568 // Read/Modify the code target in the relative branch/call instruction at pc.
569 // On the x64 architecture, we use relative jumps with a 32-bit displacement
570 // to jump to other Code objects in the Code space in the heap.
571 // Jumps to C functions are done indirectly through a 64-bit register holding
572 // the absolute address of the target.
573 // These functions convert between absolute Addresses of Code objects and
574 // the relative displacements stored in the code.
575 static inline Address target_address_at(Address pc);
576 static inline void set_target_address_at(Address pc, Address target);
577
578 // This sets the branch destination (which is in the instruction on x64).
579 // This is for calls and branches within generated code.
deserialization_set_special_target_at(Address instruction_payload,Address target)580 inline static void deserialization_set_special_target_at(
581 Address instruction_payload, Address target) {
582 set_target_address_at(instruction_payload, target);
583 }
584
585 // This sets the branch destination (which is a load instruction on x64).
586 // This is for calls and branches to runtime code.
set_external_target_at(Address instruction_payload,Address target)587 inline static void set_external_target_at(Address instruction_payload,
588 Address target) {
589 *reinterpret_cast<Address*>(instruction_payload) = target;
590 }
591
592 inline Handle<Object> code_target_object_handle_at(Address pc);
593 // Number of bytes taken up by the branch target in the code.
594 static const int kSpecialTargetSize = 4; // Use 32-bit displacement.
595 // Distance between the address of the code target in the call instruction
596 // and the return address pushed on the stack.
597 static const int kCallTargetAddressOffset = 4; // Use 32-bit displacement.
598 // Distance between the start of the JS return sequence and where the
599 // 32-bit displacement of a near call would be, relative to the pushed
600 // return address. TODO: Use return sequence length instead.
601 // Should equal Debug::kX64JSReturnSequenceLength - kCallTargetAddressOffset;
602 static const int kPatchReturnSequenceAddressOffset = 13 - 4;
603 // Distance between start of patched debug break slot and where the
604 // 32-bit displacement of a near call would be, relative to the pushed
605 // return address. TODO: Use return sequence length instead.
606 // Should equal Debug::kX64JSReturnSequenceLength - kCallTargetAddressOffset;
607 static const int kPatchDebugBreakSlotAddressOffset = 13 - 4;
608 // TODO(X64): Rename this, removing the "Real", after changing the above.
609 static const int kRealPatchReturnSequenceAddressOffset = 2;
610
611 // Some x64 JS code is padded with int3 to make it large
612 // enough to hold an instruction when the debugger patches it.
613 static const int kJumpInstructionLength = 13;
614 static const int kCallInstructionLength = 13;
615 static const int kJSReturnSequenceLength = 13;
616 static const int kShortCallInstructionLength = 5;
617
618 // The debug break slot must be able to contain a call instruction.
619 static const int kDebugBreakSlotLength = kCallInstructionLength;
620
621 // One byte opcode for test eax,0xXXXXXXXX.
622 static const byte kTestEaxByte = 0xA9;
623 // One byte opcode for test al, 0xXX.
624 static const byte kTestAlByte = 0xA8;
625 // One byte opcode for nop.
626 static const byte kNopByte = 0x90;
627
628 // One byte prefix for a short conditional jump.
629 static const byte kJccShortPrefix = 0x70;
630 static const byte kJncShortOpcode = kJccShortPrefix | not_carry;
631 static const byte kJcShortOpcode = kJccShortPrefix | carry;
632
633
634
635 // ---------------------------------------------------------------------------
636 // Code generation
637 //
638 // Function names correspond one-to-one to x64 instruction mnemonics.
639 // Unless specified otherwise, instructions operate on 64-bit operands.
640 //
641 // If we need versions of an assembly instruction that operate on different
642 // width arguments, we add a single-letter suffix specifying the width.
643 // This is done for the following instructions: mov, cmp, inc, dec,
644 // add, sub, and test.
645 // There are no versions of these instructions without the suffix.
646 // - Instructions on 8-bit (byte) operands/registers have a trailing 'b'.
647 // - Instructions on 16-bit (word) operands/registers have a trailing 'w'.
648 // - Instructions on 32-bit (doubleword) operands/registers use 'l'.
649 // - Instructions on 64-bit (quadword) operands/registers use 'q'.
650 //
651 // Some mnemonics, such as "and", are the same as C++ keywords.
652 // Naming conflicts with C++ keywords are resolved by adding a trailing '_'.
653
654 // Insert the smallest number of nop instructions
655 // possible to align the pc offset to a multiple
656 // of m, where m must be a power of 2.
657 void Align(int m);
658 void Nop(int bytes = 1);
659 // Aligns code to something that's optimal for a jump target for the platform.
660 void CodeTargetAlign();
661
662 // Stack
663 void pushfq();
664 void popfq();
665
666 void push(Immediate value);
667 // Push a 32 bit integer, and guarantee that it is actually pushed as a
668 // 32 bit value, the normal push will optimize the 8 bit case.
669 void push_imm32(int32_t imm32);
670 void push(Register src);
671 void push(const Operand& src);
672
673 void pop(Register dst);
674 void pop(const Operand& dst);
675
676 void enter(Immediate size);
677 void leave();
678
679 // Moves
680 void movb(Register dst, const Operand& src);
681 void movb(Register dst, Immediate imm);
682 void movb(const Operand& dst, Register src);
683
684 // Move the low 16 bits of a 64-bit register value to a 16-bit
685 // memory location.
686 void movw(const Operand& dst, Register src);
687
688 void movl(Register dst, Register src);
689 void movl(Register dst, const Operand& src);
690 void movl(const Operand& dst, Register src);
691 void movl(const Operand& dst, Immediate imm);
692 // Load a 32-bit immediate value, zero-extended to 64 bits.
693 void movl(Register dst, Immediate imm32);
694
695 // Move 64 bit register value to 64-bit memory location.
696 void movq(const Operand& dst, Register src);
697 // Move 64 bit memory location to 64-bit register value.
698 void movq(Register dst, const Operand& src);
699 void movq(Register dst, Register src);
700 // Sign extends immediate 32-bit value to 64 bits.
701 void movq(Register dst, Immediate x);
702 // Move the offset of the label location relative to the current
703 // position (after the move) to the destination.
704 void movl(const Operand& dst, Label* src);
705
706 // Move sign extended immediate to memory location.
707 void movq(const Operand& dst, Immediate value);
708 // Instructions to load a 64-bit immediate into a register.
709 // All 64-bit immediates must have a relocation mode.
710 void movq(Register dst, void* ptr, RelocInfo::Mode rmode);
711 void movq(Register dst, int64_t value, RelocInfo::Mode rmode);
712 void movq(Register dst, const char* s, RelocInfo::Mode rmode);
713 // Moves the address of the external reference into the register.
714 void movq(Register dst, ExternalReference ext);
715 void movq(Register dst, Handle<Object> handle, RelocInfo::Mode rmode);
716
717 void movsxbq(Register dst, const Operand& src);
718 void movsxwq(Register dst, const Operand& src);
719 void movsxlq(Register dst, Register src);
720 void movsxlq(Register dst, const Operand& src);
721 void movzxbq(Register dst, const Operand& src);
722 void movzxbl(Register dst, const Operand& src);
723 void movzxwq(Register dst, const Operand& src);
724 void movzxwl(Register dst, const Operand& src);
725
726 // Repeated moves.
727
728 void repmovsb();
729 void repmovsw();
730 void repmovsl();
731 void repmovsq();
732
733 // Instruction to load from an immediate 64-bit pointer into RAX.
734 void load_rax(void* ptr, RelocInfo::Mode rmode);
735 void load_rax(ExternalReference ext);
736
737 // Conditional moves.
738 void cmovq(Condition cc, Register dst, Register src);
739 void cmovq(Condition cc, Register dst, const Operand& src);
740 void cmovl(Condition cc, Register dst, Register src);
741 void cmovl(Condition cc, Register dst, const Operand& src);
742
743 // Exchange two registers
744 void xchg(Register dst, Register src);
745
746 // Arithmetics
addl(Register dst,Register src)747 void addl(Register dst, Register src) {
748 arithmetic_op_32(0x03, dst, src);
749 }
750
addl(Register dst,Immediate src)751 void addl(Register dst, Immediate src) {
752 immediate_arithmetic_op_32(0x0, dst, src);
753 }
754
addl(Register dst,const Operand & src)755 void addl(Register dst, const Operand& src) {
756 arithmetic_op_32(0x03, dst, src);
757 }
758
addl(const Operand & dst,Immediate src)759 void addl(const Operand& dst, Immediate src) {
760 immediate_arithmetic_op_32(0x0, dst, src);
761 }
762
addl(const Operand & dst,Register src)763 void addl(const Operand& dst, Register src) {
764 arithmetic_op_32(0x01, src, dst);
765 }
766
addq(Register dst,Register src)767 void addq(Register dst, Register src) {
768 arithmetic_op(0x03, dst, src);
769 }
770
addq(Register dst,const Operand & src)771 void addq(Register dst, const Operand& src) {
772 arithmetic_op(0x03, dst, src);
773 }
774
addq(const Operand & dst,Register src)775 void addq(const Operand& dst, Register src) {
776 arithmetic_op(0x01, src, dst);
777 }
778
addq(Register dst,Immediate src)779 void addq(Register dst, Immediate src) {
780 immediate_arithmetic_op(0x0, dst, src);
781 }
782
addq(const Operand & dst,Immediate src)783 void addq(const Operand& dst, Immediate src) {
784 immediate_arithmetic_op(0x0, dst, src);
785 }
786
sbbl(Register dst,Register src)787 void sbbl(Register dst, Register src) {
788 arithmetic_op_32(0x1b, dst, src);
789 }
790
sbbq(Register dst,Register src)791 void sbbq(Register dst, Register src) {
792 arithmetic_op(0x1b, dst, src);
793 }
794
cmpb(Register dst,Immediate src)795 void cmpb(Register dst, Immediate src) {
796 immediate_arithmetic_op_8(0x7, dst, src);
797 }
798
799 void cmpb_al(Immediate src);
800
cmpb(Register dst,Register src)801 void cmpb(Register dst, Register src) {
802 arithmetic_op(0x3A, dst, src);
803 }
804
cmpb(Register dst,const Operand & src)805 void cmpb(Register dst, const Operand& src) {
806 arithmetic_op(0x3A, dst, src);
807 }
808
cmpb(const Operand & dst,Register src)809 void cmpb(const Operand& dst, Register src) {
810 arithmetic_op(0x38, src, dst);
811 }
812
cmpb(const Operand & dst,Immediate src)813 void cmpb(const Operand& dst, Immediate src) {
814 immediate_arithmetic_op_8(0x7, dst, src);
815 }
816
cmpw(const Operand & dst,Immediate src)817 void cmpw(const Operand& dst, Immediate src) {
818 immediate_arithmetic_op_16(0x7, dst, src);
819 }
820
cmpw(Register dst,Immediate src)821 void cmpw(Register dst, Immediate src) {
822 immediate_arithmetic_op_16(0x7, dst, src);
823 }
824
cmpw(Register dst,const Operand & src)825 void cmpw(Register dst, const Operand& src) {
826 arithmetic_op_16(0x3B, dst, src);
827 }
828
cmpw(Register dst,Register src)829 void cmpw(Register dst, Register src) {
830 arithmetic_op_16(0x3B, dst, src);
831 }
832
cmpw(const Operand & dst,Register src)833 void cmpw(const Operand& dst, Register src) {
834 arithmetic_op_16(0x39, src, dst);
835 }
836
cmpl(Register dst,Register src)837 void cmpl(Register dst, Register src) {
838 arithmetic_op_32(0x3B, dst, src);
839 }
840
cmpl(Register dst,const Operand & src)841 void cmpl(Register dst, const Operand& src) {
842 arithmetic_op_32(0x3B, dst, src);
843 }
844
cmpl(const Operand & dst,Register src)845 void cmpl(const Operand& dst, Register src) {
846 arithmetic_op_32(0x39, src, dst);
847 }
848
cmpl(Register dst,Immediate src)849 void cmpl(Register dst, Immediate src) {
850 immediate_arithmetic_op_32(0x7, dst, src);
851 }
852
cmpl(const Operand & dst,Immediate src)853 void cmpl(const Operand& dst, Immediate src) {
854 immediate_arithmetic_op_32(0x7, dst, src);
855 }
856
cmpq(Register dst,Register src)857 void cmpq(Register dst, Register src) {
858 arithmetic_op(0x3B, dst, src);
859 }
860
cmpq(Register dst,const Operand & src)861 void cmpq(Register dst, const Operand& src) {
862 arithmetic_op(0x3B, dst, src);
863 }
864
cmpq(const Operand & dst,Register src)865 void cmpq(const Operand& dst, Register src) {
866 arithmetic_op(0x39, src, dst);
867 }
868
cmpq(Register dst,Immediate src)869 void cmpq(Register dst, Immediate src) {
870 immediate_arithmetic_op(0x7, dst, src);
871 }
872
cmpq(const Operand & dst,Immediate src)873 void cmpq(const Operand& dst, Immediate src) {
874 immediate_arithmetic_op(0x7, dst, src);
875 }
876
and_(Register dst,Register src)877 void and_(Register dst, Register src) {
878 arithmetic_op(0x23, dst, src);
879 }
880
and_(Register dst,const Operand & src)881 void and_(Register dst, const Operand& src) {
882 arithmetic_op(0x23, dst, src);
883 }
884
and_(const Operand & dst,Register src)885 void and_(const Operand& dst, Register src) {
886 arithmetic_op(0x21, src, dst);
887 }
888
and_(Register dst,Immediate src)889 void and_(Register dst, Immediate src) {
890 immediate_arithmetic_op(0x4, dst, src);
891 }
892
and_(const Operand & dst,Immediate src)893 void and_(const Operand& dst, Immediate src) {
894 immediate_arithmetic_op(0x4, dst, src);
895 }
896
andl(Register dst,Immediate src)897 void andl(Register dst, Immediate src) {
898 immediate_arithmetic_op_32(0x4, dst, src);
899 }
900
andl(Register dst,Register src)901 void andl(Register dst, Register src) {
902 arithmetic_op_32(0x23, dst, src);
903 }
904
andl(Register dst,const Operand & src)905 void andl(Register dst, const Operand& src) {
906 arithmetic_op_32(0x23, dst, src);
907 }
908
andb(Register dst,Immediate src)909 void andb(Register dst, Immediate src) {
910 immediate_arithmetic_op_8(0x4, dst, src);
911 }
912
913 void decq(Register dst);
914 void decq(const Operand& dst);
915 void decl(Register dst);
916 void decl(const Operand& dst);
917 void decb(Register dst);
918 void decb(const Operand& dst);
919
920 // Sign-extends rax into rdx:rax.
921 void cqo();
922 // Sign-extends eax into edx:eax.
923 void cdq();
924
925 // Divide rdx:rax by src. Quotient in rax, remainder in rdx.
926 void idivq(Register src);
927 // Divide edx:eax by lower 32 bits of src. Quotient in eax, rem. in edx.
928 void idivl(Register src);
929
930 // Signed multiply instructions.
931 void imul(Register src); // rdx:rax = rax * src.
932 void imul(Register dst, Register src); // dst = dst * src.
933 void imul(Register dst, const Operand& src); // dst = dst * src.
934 void imul(Register dst, Register src, Immediate imm); // dst = src * imm.
935 // Signed 32-bit multiply instructions.
936 void imull(Register dst, Register src); // dst = dst * src.
937 void imull(Register dst, const Operand& src); // dst = dst * src.
938 void imull(Register dst, Register src, Immediate imm); // dst = src * imm.
939
940 void incq(Register dst);
941 void incq(const Operand& dst);
942 void incl(Register dst);
943 void incl(const Operand& dst);
944
945 void lea(Register dst, const Operand& src);
946 void leal(Register dst, const Operand& src);
947
948 // Multiply rax by src, put the result in rdx:rax.
949 void mul(Register src);
950
951 void neg(Register dst);
952 void neg(const Operand& dst);
953 void negl(Register dst);
954
955 void not_(Register dst);
956 void not_(const Operand& dst);
957 void notl(Register dst);
958
or_(Register dst,Register src)959 void or_(Register dst, Register src) {
960 arithmetic_op(0x0B, dst, src);
961 }
962
orl(Register dst,Register src)963 void orl(Register dst, Register src) {
964 arithmetic_op_32(0x0B, dst, src);
965 }
966
or_(Register dst,const Operand & src)967 void or_(Register dst, const Operand& src) {
968 arithmetic_op(0x0B, dst, src);
969 }
970
orl(Register dst,const Operand & src)971 void orl(Register dst, const Operand& src) {
972 arithmetic_op_32(0x0B, dst, src);
973 }
974
or_(const Operand & dst,Register src)975 void or_(const Operand& dst, Register src) {
976 arithmetic_op(0x09, src, dst);
977 }
978
or_(Register dst,Immediate src)979 void or_(Register dst, Immediate src) {
980 immediate_arithmetic_op(0x1, dst, src);
981 }
982
orl(Register dst,Immediate src)983 void orl(Register dst, Immediate src) {
984 immediate_arithmetic_op_32(0x1, dst, src);
985 }
986
or_(const Operand & dst,Immediate src)987 void or_(const Operand& dst, Immediate src) {
988 immediate_arithmetic_op(0x1, dst, src);
989 }
990
orl(const Operand & dst,Immediate src)991 void orl(const Operand& dst, Immediate src) {
992 immediate_arithmetic_op_32(0x1, dst, src);
993 }
994
995
rcl(Register dst,Immediate imm8)996 void rcl(Register dst, Immediate imm8) {
997 shift(dst, imm8, 0x2);
998 }
999
rol(Register dst,Immediate imm8)1000 void rol(Register dst, Immediate imm8) {
1001 shift(dst, imm8, 0x0);
1002 }
1003
rcr(Register dst,Immediate imm8)1004 void rcr(Register dst, Immediate imm8) {
1005 shift(dst, imm8, 0x3);
1006 }
1007
ror(Register dst,Immediate imm8)1008 void ror(Register dst, Immediate imm8) {
1009 shift(dst, imm8, 0x1);
1010 }
1011
1012 // Shifts dst:src left by cl bits, affecting only dst.
1013 void shld(Register dst, Register src);
1014
1015 // Shifts src:dst right by cl bits, affecting only dst.
1016 void shrd(Register dst, Register src);
1017
1018 // Shifts dst right, duplicating sign bit, by shift_amount bits.
1019 // Shifting by 1 is handled efficiently.
sar(Register dst,Immediate shift_amount)1020 void sar(Register dst, Immediate shift_amount) {
1021 shift(dst, shift_amount, 0x7);
1022 }
1023
1024 // Shifts dst right, duplicating sign bit, by shift_amount bits.
1025 // Shifting by 1 is handled efficiently.
sarl(Register dst,Immediate shift_amount)1026 void sarl(Register dst, Immediate shift_amount) {
1027 shift_32(dst, shift_amount, 0x7);
1028 }
1029
1030 // Shifts dst right, duplicating sign bit, by cl % 64 bits.
sar_cl(Register dst)1031 void sar_cl(Register dst) {
1032 shift(dst, 0x7);
1033 }
1034
1035 // Shifts dst right, duplicating sign bit, by cl % 64 bits.
sarl_cl(Register dst)1036 void sarl_cl(Register dst) {
1037 shift_32(dst, 0x7);
1038 }
1039
shl(Register dst,Immediate shift_amount)1040 void shl(Register dst, Immediate shift_amount) {
1041 shift(dst, shift_amount, 0x4);
1042 }
1043
shl_cl(Register dst)1044 void shl_cl(Register dst) {
1045 shift(dst, 0x4);
1046 }
1047
shll_cl(Register dst)1048 void shll_cl(Register dst) {
1049 shift_32(dst, 0x4);
1050 }
1051
shll(Register dst,Immediate shift_amount)1052 void shll(Register dst, Immediate shift_amount) {
1053 shift_32(dst, shift_amount, 0x4);
1054 }
1055
shr(Register dst,Immediate shift_amount)1056 void shr(Register dst, Immediate shift_amount) {
1057 shift(dst, shift_amount, 0x5);
1058 }
1059
shr_cl(Register dst)1060 void shr_cl(Register dst) {
1061 shift(dst, 0x5);
1062 }
1063
shrl_cl(Register dst)1064 void shrl_cl(Register dst) {
1065 shift_32(dst, 0x5);
1066 }
1067
shrl(Register dst,Immediate shift_amount)1068 void shrl(Register dst, Immediate shift_amount) {
1069 shift_32(dst, shift_amount, 0x5);
1070 }
1071
1072 void store_rax(void* dst, RelocInfo::Mode mode);
1073 void store_rax(ExternalReference ref);
1074
subq(Register dst,Register src)1075 void subq(Register dst, Register src) {
1076 arithmetic_op(0x2B, dst, src);
1077 }
1078
subq(Register dst,const Operand & src)1079 void subq(Register dst, const Operand& src) {
1080 arithmetic_op(0x2B, dst, src);
1081 }
1082
subq(const Operand & dst,Register src)1083 void subq(const Operand& dst, Register src) {
1084 arithmetic_op(0x29, src, dst);
1085 }
1086
subq(Register dst,Immediate src)1087 void subq(Register dst, Immediate src) {
1088 immediate_arithmetic_op(0x5, dst, src);
1089 }
1090
subq(const Operand & dst,Immediate src)1091 void subq(const Operand& dst, Immediate src) {
1092 immediate_arithmetic_op(0x5, dst, src);
1093 }
1094
subl(Register dst,Register src)1095 void subl(Register dst, Register src) {
1096 arithmetic_op_32(0x2B, dst, src);
1097 }
1098
subl(Register dst,const Operand & src)1099 void subl(Register dst, const Operand& src) {
1100 arithmetic_op_32(0x2B, dst, src);
1101 }
1102
subl(const Operand & dst,Immediate src)1103 void subl(const Operand& dst, Immediate src) {
1104 immediate_arithmetic_op_32(0x5, dst, src);
1105 }
1106
subl(Register dst,Immediate src)1107 void subl(Register dst, Immediate src) {
1108 immediate_arithmetic_op_32(0x5, dst, src);
1109 }
1110
subb(Register dst,Immediate src)1111 void subb(Register dst, Immediate src) {
1112 immediate_arithmetic_op_8(0x5, dst, src);
1113 }
1114
1115 void testb(Register dst, Register src);
1116 void testb(Register reg, Immediate mask);
1117 void testb(const Operand& op, Immediate mask);
1118 void testb(const Operand& op, Register reg);
1119 void testl(Register dst, Register src);
1120 void testl(Register reg, Immediate mask);
1121 void testl(const Operand& op, Immediate mask);
1122 void testq(const Operand& op, Register reg);
1123 void testq(Register dst, Register src);
1124 void testq(Register dst, Immediate mask);
1125
xor_(Register dst,Register src)1126 void xor_(Register dst, Register src) {
1127 if (dst.code() == src.code()) {
1128 arithmetic_op_32(0x33, dst, src);
1129 } else {
1130 arithmetic_op(0x33, dst, src);
1131 }
1132 }
1133
xorl(Register dst,Register src)1134 void xorl(Register dst, Register src) {
1135 arithmetic_op_32(0x33, dst, src);
1136 }
1137
xorl(Register dst,const Operand & src)1138 void xorl(Register dst, const Operand& src) {
1139 arithmetic_op_32(0x33, dst, src);
1140 }
1141
xorl(Register dst,Immediate src)1142 void xorl(Register dst, Immediate src) {
1143 immediate_arithmetic_op_32(0x6, dst, src);
1144 }
1145
xorl(const Operand & dst,Immediate src)1146 void xorl(const Operand& dst, Immediate src) {
1147 immediate_arithmetic_op_32(0x6, dst, src);
1148 }
1149
xor_(Register dst,const Operand & src)1150 void xor_(Register dst, const Operand& src) {
1151 arithmetic_op(0x33, dst, src);
1152 }
1153
xor_(const Operand & dst,Register src)1154 void xor_(const Operand& dst, Register src) {
1155 arithmetic_op(0x31, src, dst);
1156 }
1157
xor_(Register dst,Immediate src)1158 void xor_(Register dst, Immediate src) {
1159 immediate_arithmetic_op(0x6, dst, src);
1160 }
1161
xor_(const Operand & dst,Immediate src)1162 void xor_(const Operand& dst, Immediate src) {
1163 immediate_arithmetic_op(0x6, dst, src);
1164 }
1165
1166 // Bit operations.
1167 void bt(const Operand& dst, Register src);
1168 void bts(const Operand& dst, Register src);
1169
1170 // Miscellaneous
1171 void clc();
1172 void cld();
1173 void cpuid();
1174 void hlt();
1175 void int3();
1176 void nop();
1177 void rdtsc();
1178 void ret(int imm16);
1179 void setcc(Condition cc, Register reg);
1180
1181 // Label operations & relative jumps (PPUM Appendix D)
1182 //
1183 // Takes a branch opcode (cc) and a label (L) and generates
1184 // either a backward branch or a forward branch and links it
1185 // to the label fixup chain. Usage:
1186 //
1187 // Label L; // unbound label
1188 // j(cc, &L); // forward branch to unbound label
1189 // bind(&L); // bind label to the current pc
1190 // j(cc, &L); // backward branch to bound label
1191 // bind(&L); // illegal: a label may be bound only once
1192 //
1193 // Note: The same Label can be used for forward and backward branches
1194 // but it may be bound only once.
1195
1196 void bind(Label* L); // binds an unbound label L to the current code position
1197
1198 // Calls
1199 // Call near relative 32-bit displacement, relative to next instruction.
1200 void call(Label* L);
1201 void call(Handle<Code> target,
1202 RelocInfo::Mode rmode = RelocInfo::CODE_TARGET,
1203 unsigned ast_id = kNoASTId);
1204
1205 // Calls directly to the given address using a relative offset.
1206 // Should only ever be used in Code objects for calls within the
1207 // same Code object. Should not be used when generating new code (use labels),
1208 // but only when patching existing code.
1209 void call(Address target);
1210
1211 // Call near absolute indirect, address in register
1212 void call(Register adr);
1213
1214 // Call near indirect
1215 void call(const Operand& operand);
1216
1217 // Jumps
1218 // Jump short or near relative.
1219 // Use a 32-bit signed displacement.
1220 // Unconditional jump to L
1221 void jmp(Label* L, Label::Distance distance = Label::kFar);
1222 void jmp(Handle<Code> target, RelocInfo::Mode rmode);
1223
1224 // Jump near absolute indirect (r64)
1225 void jmp(Register adr);
1226
1227 // Jump near absolute indirect (m64)
1228 void jmp(const Operand& src);
1229
1230 // Conditional jumps
1231 void j(Condition cc,
1232 Label* L,
1233 Label::Distance distance = Label::kFar);
1234 void j(Condition cc, Handle<Code> target, RelocInfo::Mode rmode);
1235
1236 // Floating-point operations
1237 void fld(int i);
1238
1239 void fld1();
1240 void fldz();
1241 void fldpi();
1242 void fldln2();
1243
1244 void fld_s(const Operand& adr);
1245 void fld_d(const Operand& adr);
1246
1247 void fstp_s(const Operand& adr);
1248 void fstp_d(const Operand& adr);
1249 void fstp(int index);
1250
1251 void fild_s(const Operand& adr);
1252 void fild_d(const Operand& adr);
1253
1254 void fist_s(const Operand& adr);
1255
1256 void fistp_s(const Operand& adr);
1257 void fistp_d(const Operand& adr);
1258
1259 void fisttp_s(const Operand& adr);
1260 void fisttp_d(const Operand& adr);
1261
1262 void fabs();
1263 void fchs();
1264
1265 void fadd(int i);
1266 void fsub(int i);
1267 void fmul(int i);
1268 void fdiv(int i);
1269
1270 void fisub_s(const Operand& adr);
1271
1272 void faddp(int i = 1);
1273 void fsubp(int i = 1);
1274 void fsubrp(int i = 1);
1275 void fmulp(int i = 1);
1276 void fdivp(int i = 1);
1277 void fprem();
1278 void fprem1();
1279
1280 void fxch(int i = 1);
1281 void fincstp();
1282 void ffree(int i = 0);
1283
1284 void ftst();
1285 void fucomp(int i);
1286 void fucompp();
1287 void fucomi(int i);
1288 void fucomip();
1289
1290 void fcompp();
1291 void fnstsw_ax();
1292 void fwait();
1293 void fnclex();
1294
1295 void fsin();
1296 void fcos();
1297 void fptan();
1298 void fyl2x();
1299 void f2xm1();
1300 void fscale();
1301 void fninit();
1302
1303 void frndint();
1304
1305 void sahf();
1306
1307 // SSE2 instructions
1308 void movd(XMMRegister dst, Register src);
1309 void movd(Register dst, XMMRegister src);
1310 void movq(XMMRegister dst, Register src);
1311 void movq(Register dst, XMMRegister src);
1312 void movq(XMMRegister dst, XMMRegister src);
1313 void extractps(Register dst, XMMRegister src, byte imm8);
1314
1315 // Don't use this unless it's important to keep the
1316 // top half of the destination register unchanged.
1317 // Used movaps when moving double values and movq for integer
1318 // values in xmm registers.
1319 void movsd(XMMRegister dst, XMMRegister src);
1320
1321 void movsd(const Operand& dst, XMMRegister src);
1322 void movsd(XMMRegister dst, const Operand& src);
1323
1324 void movdqa(const Operand& dst, XMMRegister src);
1325 void movdqa(XMMRegister dst, const Operand& src);
1326
1327 void movapd(XMMRegister dst, XMMRegister src);
1328 void movaps(XMMRegister dst, XMMRegister src);
1329
1330 void movss(XMMRegister dst, const Operand& src);
1331 void movss(const Operand& dst, XMMRegister src);
1332
1333 void cvttss2si(Register dst, const Operand& src);
1334 void cvttss2si(Register dst, XMMRegister src);
1335 void cvttsd2si(Register dst, const Operand& src);
1336 void cvttsd2si(Register dst, XMMRegister src);
1337 void cvttsd2siq(Register dst, XMMRegister src);
1338
1339 void cvtlsi2sd(XMMRegister dst, const Operand& src);
1340 void cvtlsi2sd(XMMRegister dst, Register src);
1341 void cvtqsi2sd(XMMRegister dst, const Operand& src);
1342 void cvtqsi2sd(XMMRegister dst, Register src);
1343
1344 void cvtlsi2ss(XMMRegister dst, Register src);
1345
1346 void cvtss2sd(XMMRegister dst, XMMRegister src);
1347 void cvtss2sd(XMMRegister dst, const Operand& src);
1348 void cvtsd2ss(XMMRegister dst, XMMRegister src);
1349
1350 void cvtsd2si(Register dst, XMMRegister src);
1351 void cvtsd2siq(Register dst, XMMRegister src);
1352
1353 void addsd(XMMRegister dst, XMMRegister src);
1354 void subsd(XMMRegister dst, XMMRegister src);
1355 void mulsd(XMMRegister dst, XMMRegister src);
1356 void divsd(XMMRegister dst, XMMRegister src);
1357
1358 void andpd(XMMRegister dst, XMMRegister src);
1359 void orpd(XMMRegister dst, XMMRegister src);
1360 void xorpd(XMMRegister dst, XMMRegister src);
1361 void xorps(XMMRegister dst, XMMRegister src);
1362 void sqrtsd(XMMRegister dst, XMMRegister src);
1363
1364 void ucomisd(XMMRegister dst, XMMRegister src);
1365 void ucomisd(XMMRegister dst, const Operand& src);
1366
1367 enum RoundingMode {
1368 kRoundToNearest = 0x0,
1369 kRoundDown = 0x1,
1370 kRoundUp = 0x2,
1371 kRoundToZero = 0x3
1372 };
1373
1374 void roundsd(XMMRegister dst, XMMRegister src, RoundingMode mode);
1375
1376 void movmskpd(Register dst, XMMRegister src);
1377
1378 // The first argument is the reg field, the second argument is the r/m field.
1379 void emit_sse_operand(XMMRegister dst, XMMRegister src);
1380 void emit_sse_operand(XMMRegister reg, const Operand& adr);
1381 void emit_sse_operand(XMMRegister dst, Register src);
1382 void emit_sse_operand(Register dst, XMMRegister src);
1383
1384 // Debugging
1385 void Print();
1386
1387 // Check the code size generated from label to here.
SizeOfCodeGeneratedSince(Label * label)1388 int SizeOfCodeGeneratedSince(Label* label) {
1389 return pc_offset() - label->pos();
1390 }
1391
1392 // Mark address of the ExitJSFrame code.
1393 void RecordJSReturn();
1394
1395 // Mark address of a debug break slot.
1396 void RecordDebugBreakSlot();
1397
1398 // Record a comment relocation entry that can be used by a disassembler.
1399 // Use --code-comments to enable.
1400 void RecordComment(const char* msg, bool force = false);
1401
1402 // Writes a single word of data in the code stream.
1403 // Used for inline tables, e.g., jump-tables.
1404 void db(uint8_t data);
1405 void dd(uint32_t data);
1406
pc_offset()1407 int pc_offset() const { return static_cast<int>(pc_ - buffer_); }
1408
positions_recorder()1409 PositionsRecorder* positions_recorder() { return &positions_recorder_; }
1410
1411 // Check if there is less than kGap bytes available in the buffer.
1412 // If this is the case, we need to grow the buffer before emitting
1413 // an instruction or relocation information.
buffer_overflow()1414 inline bool buffer_overflow() const {
1415 return pc_ >= reloc_info_writer.pos() - kGap;
1416 }
1417
1418 // Get the number of bytes available in the buffer.
available_space()1419 inline int available_space() const {
1420 return static_cast<int>(reloc_info_writer.pos() - pc_);
1421 }
1422
1423 static bool IsNop(Address addr);
1424
1425 // Avoid overflows for displacements etc.
1426 static const int kMaximalBufferSize = 512*MB;
1427 static const int kMinimalBufferSize = 4*KB;
1428
byte_at(int pos)1429 byte byte_at(int pos) { return buffer_[pos]; }
set_byte_at(int pos,byte value)1430 void set_byte_at(int pos, byte value) { buffer_[pos] = value; }
1431
1432 protected:
emit_debug_code()1433 bool emit_debug_code() const { return emit_debug_code_; }
1434
1435 private:
addr_at(int pos)1436 byte* addr_at(int pos) { return buffer_ + pos; }
long_at(int pos)1437 uint32_t long_at(int pos) {
1438 return *reinterpret_cast<uint32_t*>(addr_at(pos));
1439 }
long_at_put(int pos,uint32_t x)1440 void long_at_put(int pos, uint32_t x) {
1441 *reinterpret_cast<uint32_t*>(addr_at(pos)) = x;
1442 }
1443
1444 // code emission
1445 void GrowBuffer();
1446
emit(byte x)1447 void emit(byte x) { *pc_++ = x; }
1448 inline void emitl(uint32_t x);
1449 inline void emitq(uint64_t x, RelocInfo::Mode rmode);
1450 inline void emitw(uint16_t x);
1451 inline void emit_code_target(Handle<Code> target,
1452 RelocInfo::Mode rmode,
1453 unsigned ast_id = kNoASTId);
emit(Immediate x)1454 void emit(Immediate x) { emitl(x.value_); }
1455
1456 // Emits a REX prefix that encodes a 64-bit operand size and
1457 // the top bit of both register codes.
1458 // High bit of reg goes to REX.R, high bit of rm_reg goes to REX.B.
1459 // REX.W is set.
1460 inline void emit_rex_64(XMMRegister reg, Register rm_reg);
1461 inline void emit_rex_64(Register reg, XMMRegister rm_reg);
1462 inline void emit_rex_64(Register reg, Register rm_reg);
1463
1464 // Emits a REX prefix that encodes a 64-bit operand size and
1465 // the top bit of the destination, index, and base register codes.
1466 // The high bit of reg is used for REX.R, the high bit of op's base
1467 // register is used for REX.B, and the high bit of op's index register
1468 // is used for REX.X. REX.W is set.
1469 inline void emit_rex_64(Register reg, const Operand& op);
1470 inline void emit_rex_64(XMMRegister reg, const Operand& op);
1471
1472 // Emits a REX prefix that encodes a 64-bit operand size and
1473 // the top bit of the register code.
1474 // The high bit of register is used for REX.B.
1475 // REX.W is set and REX.R and REX.X are clear.
1476 inline void emit_rex_64(Register rm_reg);
1477
1478 // Emits a REX prefix that encodes a 64-bit operand size and
1479 // the top bit of the index and base register codes.
1480 // The high bit of op's base register is used for REX.B, and the high
1481 // bit of op's index register is used for REX.X.
1482 // REX.W is set and REX.R clear.
1483 inline void emit_rex_64(const Operand& op);
1484
1485 // Emit a REX prefix that only sets REX.W to choose a 64-bit operand size.
emit_rex_64()1486 void emit_rex_64() { emit(0x48); }
1487
1488 // High bit of reg goes to REX.R, high bit of rm_reg goes to REX.B.
1489 // REX.W is clear.
1490 inline void emit_rex_32(Register reg, Register rm_reg);
1491
1492 // The high bit of reg is used for REX.R, the high bit of op's base
1493 // register is used for REX.B, and the high bit of op's index register
1494 // is used for REX.X. REX.W is cleared.
1495 inline void emit_rex_32(Register reg, const Operand& op);
1496
1497 // High bit of rm_reg goes to REX.B.
1498 // REX.W, REX.R and REX.X are clear.
1499 inline void emit_rex_32(Register rm_reg);
1500
1501 // High bit of base goes to REX.B and high bit of index to REX.X.
1502 // REX.W and REX.R are clear.
1503 inline void emit_rex_32(const Operand& op);
1504
1505 // High bit of reg goes to REX.R, high bit of rm_reg goes to REX.B.
1506 // REX.W is cleared. If no REX bits are set, no byte is emitted.
1507 inline void emit_optional_rex_32(Register reg, Register rm_reg);
1508
1509 // The high bit of reg is used for REX.R, the high bit of op's base
1510 // register is used for REX.B, and the high bit of op's index register
1511 // is used for REX.X. REX.W is cleared. If no REX bits are set, nothing
1512 // is emitted.
1513 inline void emit_optional_rex_32(Register reg, const Operand& op);
1514
1515 // As for emit_optional_rex_32(Register, Register), except that
1516 // the registers are XMM registers.
1517 inline void emit_optional_rex_32(XMMRegister reg, XMMRegister base);
1518
1519 // As for emit_optional_rex_32(Register, Register), except that
1520 // one of the registers is an XMM registers.
1521 inline void emit_optional_rex_32(XMMRegister reg, Register base);
1522
1523 // As for emit_optional_rex_32(Register, Register), except that
1524 // one of the registers is an XMM registers.
1525 inline void emit_optional_rex_32(Register reg, XMMRegister base);
1526
1527 // As for emit_optional_rex_32(Register, const Operand&), except that
1528 // the register is an XMM register.
1529 inline void emit_optional_rex_32(XMMRegister reg, const Operand& op);
1530
1531 // Optionally do as emit_rex_32(Register) if the register number has
1532 // the high bit set.
1533 inline void emit_optional_rex_32(Register rm_reg);
1534
1535 // Optionally do as emit_rex_32(const Operand&) if the operand register
1536 // numbers have a high bit set.
1537 inline void emit_optional_rex_32(const Operand& op);
1538
1539
1540 // Emit the ModR/M byte, and optionally the SIB byte and
1541 // 1- or 4-byte offset for a memory operand. Also encodes
1542 // the second operand of the operation, a register or operation
1543 // subcode, into the reg field of the ModR/M byte.
emit_operand(Register reg,const Operand & adr)1544 void emit_operand(Register reg, const Operand& adr) {
1545 emit_operand(reg.low_bits(), adr);
1546 }
1547
1548 // Emit the ModR/M byte, and optionally the SIB byte and
1549 // 1- or 4-byte offset for a memory operand. Also used to encode
1550 // a three-bit opcode extension into the ModR/M byte.
1551 void emit_operand(int rm, const Operand& adr);
1552
1553 // Emit a ModR/M byte with registers coded in the reg and rm_reg fields.
emit_modrm(Register reg,Register rm_reg)1554 void emit_modrm(Register reg, Register rm_reg) {
1555 emit(0xC0 | reg.low_bits() << 3 | rm_reg.low_bits());
1556 }
1557
1558 // Emit a ModR/M byte with an operation subcode in the reg field and
1559 // a register in the rm_reg field.
emit_modrm(int code,Register rm_reg)1560 void emit_modrm(int code, Register rm_reg) {
1561 ASSERT(is_uint3(code));
1562 emit(0xC0 | code << 3 | rm_reg.low_bits());
1563 }
1564
1565 // Emit the code-object-relative offset of the label's position
1566 inline void emit_code_relative_offset(Label* label);
1567
1568 // Emit machine code for one of the operations ADD, ADC, SUB, SBC,
1569 // AND, OR, XOR, or CMP. The encodings of these operations are all
1570 // similar, differing just in the opcode or in the reg field of the
1571 // ModR/M byte.
1572 void arithmetic_op_16(byte opcode, Register reg, Register rm_reg);
1573 void arithmetic_op_16(byte opcode, Register reg, const Operand& rm_reg);
1574 void arithmetic_op_32(byte opcode, Register reg, Register rm_reg);
1575 void arithmetic_op_32(byte opcode, Register reg, const Operand& rm_reg);
1576 void arithmetic_op(byte opcode, Register reg, Register rm_reg);
1577 void arithmetic_op(byte opcode, Register reg, const Operand& rm_reg);
1578 void immediate_arithmetic_op(byte subcode, Register dst, Immediate src);
1579 void immediate_arithmetic_op(byte subcode, const Operand& dst, Immediate src);
1580 // Operate on a byte in memory or register.
1581 void immediate_arithmetic_op_8(byte subcode,
1582 Register dst,
1583 Immediate src);
1584 void immediate_arithmetic_op_8(byte subcode,
1585 const Operand& dst,
1586 Immediate src);
1587 // Operate on a word in memory or register.
1588 void immediate_arithmetic_op_16(byte subcode,
1589 Register dst,
1590 Immediate src);
1591 void immediate_arithmetic_op_16(byte subcode,
1592 const Operand& dst,
1593 Immediate src);
1594 // Operate on a 32-bit word in memory or register.
1595 void immediate_arithmetic_op_32(byte subcode,
1596 Register dst,
1597 Immediate src);
1598 void immediate_arithmetic_op_32(byte subcode,
1599 const Operand& dst,
1600 Immediate src);
1601
1602 // Emit machine code for a shift operation.
1603 void shift(Register dst, Immediate shift_amount, int subcode);
1604 void shift_32(Register dst, Immediate shift_amount, int subcode);
1605 // Shift dst by cl % 64 bits.
1606 void shift(Register dst, int subcode);
1607 void shift_32(Register dst, int subcode);
1608
1609 void emit_farith(int b1, int b2, int i);
1610
1611 // labels
1612 // void print(Label* L);
1613 void bind_to(Label* L, int pos);
1614
1615 // record reloc info for current pc_
1616 void RecordRelocInfo(RelocInfo::Mode rmode, intptr_t data = 0);
1617
1618 friend class CodePatcher;
1619 friend class EnsureSpace;
1620 friend class RegExpMacroAssemblerX64;
1621
1622 // Code buffer:
1623 // The buffer into which code and relocation info are generated.
1624 byte* buffer_;
1625 int buffer_size_;
1626 // True if the assembler owns the buffer, false if buffer is external.
1627 bool own_buffer_;
1628
1629 // code generation
1630 byte* pc_; // the program counter; moves forward
1631 RelocInfoWriter reloc_info_writer;
1632
1633 List< Handle<Code> > code_targets_;
1634
1635 PositionsRecorder positions_recorder_;
1636
1637 bool emit_debug_code_;
1638
1639 friend class PositionsRecorder;
1640 };
1641
1642
1643 // Helper class that ensures that there is enough space for generating
1644 // instructions and relocation information. The constructor makes
1645 // sure that there is enough space and (in debug mode) the destructor
1646 // checks that we did not generate too much.
1647 class EnsureSpace BASE_EMBEDDED {
1648 public:
EnsureSpace(Assembler * assembler)1649 explicit EnsureSpace(Assembler* assembler) : assembler_(assembler) {
1650 if (assembler_->buffer_overflow()) assembler_->GrowBuffer();
1651 #ifdef DEBUG
1652 space_before_ = assembler_->available_space();
1653 #endif
1654 }
1655
1656 #ifdef DEBUG
~EnsureSpace()1657 ~EnsureSpace() {
1658 int bytes_generated = space_before_ - assembler_->available_space();
1659 ASSERT(bytes_generated < assembler_->kGap);
1660 }
1661 #endif
1662
1663 private:
1664 Assembler* assembler_;
1665 #ifdef DEBUG
1666 int space_before_;
1667 #endif
1668 };
1669
1670 } } // namespace v8::internal
1671
1672 #endif // V8_X64_ASSEMBLER_X64_H_
1673