Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1 | /* |
| 2 | * Copyright (C) 2014 The Android Open Source Project |
| 3 | * |
| 4 | * Licensed under the Apache License, Version 2.0 (the "License"); |
| 5 | * you may not use this file except in compliance with the License. |
| 6 | * You may obtain a copy of the License at |
| 7 | * |
| 8 | * http://www.apache.org/licenses/LICENSE-2.0 |
| 9 | * |
| 10 | * Unless required by applicable law or agreed to in writing, software |
| 11 | * distributed under the License is distributed on an "AS IS" BASIS, |
| 12 | * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 13 | * See the License for the specific language governing permissions and |
| 14 | * limitations under the License. |
| 15 | */ |
| 16 | |
| 17 | #ifndef ART_COMPILER_UTILS_X86_64_ASSEMBLER_X86_64_H_ |
| 18 | #define ART_COMPILER_UTILS_X86_64_ASSEMBLER_X86_64_H_ |
| 19 | |
| 20 | #include <vector> |
Vladimir Marko | 80afd02 | 2015-05-19 18:08:00 +0100 | [diff] [blame] | 21 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 22 | #include "arch/x86_64/instruction_set_features_x86_64.h" |
Vladimir Marko | 93205e3 | 2016-04-13 11:59:46 +0100 | [diff] [blame] | 23 | #include "base/arena_containers.h" |
David Brazdil | d9c9037 | 2016-09-14 16:53:55 +0100 | [diff] [blame] | 24 | #include "base/array_ref.h" |
Vladimir Marko | 80afd02 | 2015-05-19 18:08:00 +0100 | [diff] [blame] | 25 | #include "base/bit_utils.h" |
David Sehr | 1979c64 | 2018-04-26 14:41:18 -0700 | [diff] [blame] | 26 | #include "base/globals.h" |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 27 | #include "base/macros.h" |
| 28 | #include "constants_x86_64.h" |
Andreas Gampe | 09659c2 | 2017-09-18 18:23:32 -0700 | [diff] [blame] | 29 | #include "heap_poisoning.h" |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 30 | #include "managed_register_x86_64.h" |
| 31 | #include "offsets.h" |
| 32 | #include "utils/assembler.h" |
Andreas Gampe | 3b165bc | 2016-08-01 22:07:04 -0700 | [diff] [blame] | 33 | #include "utils/jni_macro_assembler.h" |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 34 | |
| 35 | namespace art { |
| 36 | namespace x86_64 { |
| 37 | |
avignate | 5408b6b | 2014-06-04 17:59:44 +0700 | [diff] [blame] | 38 | // Encodes an immediate value for operands. |
| 39 | // |
| 40 | // Note: Immediates can be 64b on x86-64 for certain instructions, but are often restricted |
| 41 | // to 32b. |
| 42 | // |
| 43 | // Note: As we support cross-compilation, the value type must be int64_t. Please be aware of |
| 44 | // conversion rules in expressions regarding negation, especially size_t on 32b. |
Ian Rogers | cf7f191 | 2014-10-22 22:06:39 -0700 | [diff] [blame] | 45 | class Immediate : public ValueObject { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 46 | public: |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 47 | explicit Immediate(int64_t value_in) : value_(value_in) {} |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 48 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 49 | int64_t value() const { return value_; } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 50 | |
Andreas Gampe | ab1eb0d | 2015-02-13 19:23:55 -0800 | [diff] [blame] | 51 | bool is_int8() const { return IsInt<8>(value_); } |
| 52 | bool is_uint8() const { return IsUint<8>(value_); } |
| 53 | bool is_int16() const { return IsInt<16>(value_); } |
| 54 | bool is_uint16() const { return IsUint<16>(value_); } |
| 55 | bool is_int32() const { return IsInt<32>(value_); } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 56 | |
| 57 | private: |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 58 | const int64_t value_; |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 59 | }; |
| 60 | |
| 61 | |
Ian Rogers | cf7f191 | 2014-10-22 22:06:39 -0700 | [diff] [blame] | 62 | class Operand : public ValueObject { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 63 | public: |
| 64 | uint8_t mod() const { |
| 65 | return (encoding_at(0) >> 6) & 3; |
| 66 | } |
| 67 | |
| 68 | Register rm() const { |
| 69 | return static_cast<Register>(encoding_at(0) & 7); |
| 70 | } |
| 71 | |
| 72 | ScaleFactor scale() const { |
| 73 | return static_cast<ScaleFactor>((encoding_at(1) >> 6) & 3); |
| 74 | } |
| 75 | |
| 76 | Register index() const { |
| 77 | return static_cast<Register>((encoding_at(1) >> 3) & 7); |
| 78 | } |
| 79 | |
| 80 | Register base() const { |
| 81 | return static_cast<Register>(encoding_at(1) & 7); |
| 82 | } |
| 83 | |
Aart Bik | f7754e8 | 2017-09-20 10:33:06 -0700 | [diff] [blame] | 84 | CpuRegister cpu_rm() const { |
| 85 | int ext = (rex_ & 1) != 0 ? x86_64::R8 : x86_64::RAX; |
| 86 | return static_cast<CpuRegister>(rm() + ext); |
| 87 | } |
| 88 | |
| 89 | CpuRegister cpu_index() const { |
| 90 | int ext = (rex_ & 2) != 0 ? x86_64::R8 : x86_64::RAX; |
| 91 | return static_cast<CpuRegister>(index() + ext); |
| 92 | } |
| 93 | |
| 94 | CpuRegister cpu_base() const { |
| 95 | int ext = (rex_ & 1) != 0 ? x86_64::R8 : x86_64::RAX; |
| 96 | return static_cast<CpuRegister>(base() + ext); |
| 97 | } |
| 98 | |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 99 | uint8_t rex() const { |
| 100 | return rex_; |
| 101 | } |
| 102 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 103 | int8_t disp8() const { |
| 104 | CHECK_GE(length_, 2); |
| 105 | return static_cast<int8_t>(encoding_[length_ - 1]); |
| 106 | } |
| 107 | |
| 108 | int32_t disp32() const { |
| 109 | CHECK_GE(length_, 5); |
| 110 | int32_t value; |
| 111 | memcpy(&value, &encoding_[length_ - 4], sizeof(value)); |
| 112 | return value; |
| 113 | } |
| 114 | |
Ulya Trafimovich | af5d304 | 2021-06-10 15:29:21 +0100 | [diff] [blame] | 115 | int32_t disp() const { |
| 116 | switch (mod()) { |
| 117 | case 0: |
| 118 | // With mod 00b RBP is special and means disp32 (either in r/m or in SIB base). |
| 119 | return (rm() == RBP || (rm() == RSP && base() == RBP)) ? disp32() : 0; |
| 120 | case 1: |
| 121 | return disp8(); |
| 122 | case 2: |
| 123 | return disp32(); |
| 124 | default: |
| 125 | // Mod 11b means reg/reg, so there is no address and consequently no displacement. |
| 126 | DCHECK(false) << "there is no displacement in x86_64 reg/reg operand"; |
| 127 | UNREACHABLE(); |
| 128 | } |
| 129 | } |
| 130 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 131 | bool IsRegister(CpuRegister reg) const { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 132 | return ((encoding_[0] & 0xF8) == 0xC0) // Addressing mode is register only. |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 133 | && ((encoding_[0] & 0x07) == reg.LowBits()) // Register codes match. |
| 134 | && (reg.NeedsRex() == ((rex_ & 1) != 0)); // REX.000B bits match. |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 135 | } |
| 136 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 137 | AssemblerFixup* GetFixup() const { |
| 138 | return fixup_; |
| 139 | } |
| 140 | |
Ulya Trafimovich | af5d304 | 2021-06-10 15:29:21 +0100 | [diff] [blame] | 141 | inline bool operator==(const Operand &op) const { |
| 142 | return rex_ == op.rex_ && |
| 143 | length_ == op.length_ && |
| 144 | memcmp(encoding_, op.encoding_, length_) == 0 && |
| 145 | fixup_ == op.fixup_; |
| 146 | } |
| 147 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 148 | protected: |
| 149 | // Operand can be sub classed (e.g: Address). |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 150 | Operand() : rex_(0), length_(0), fixup_(nullptr) { } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 151 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 152 | void SetModRM(uint8_t mod_in, CpuRegister rm_in) { |
| 153 | CHECK_EQ(mod_in & ~3, 0); |
| 154 | if (rm_in.NeedsRex()) { |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 155 | rex_ |= 0x41; // REX.000B |
| 156 | } |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 157 | encoding_[0] = (mod_in << 6) | rm_in.LowBits(); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 158 | length_ = 1; |
| 159 | } |
| 160 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 161 | void SetSIB(ScaleFactor scale_in, CpuRegister index_in, CpuRegister base_in) { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 162 | CHECK_EQ(length_, 1); |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 163 | CHECK_EQ(scale_in & ~3, 0); |
| 164 | if (base_in.NeedsRex()) { |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 165 | rex_ |= 0x41; // REX.000B |
| 166 | } |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 167 | if (index_in.NeedsRex()) { |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 168 | rex_ |= 0x42; // REX.00X0 |
| 169 | } |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 170 | encoding_[1] = (scale_in << 6) | (static_cast<uint8_t>(index_in.LowBits()) << 3) | |
| 171 | static_cast<uint8_t>(base_in.LowBits()); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 172 | length_ = 2; |
| 173 | } |
| 174 | |
| 175 | void SetDisp8(int8_t disp) { |
| 176 | CHECK(length_ == 1 || length_ == 2); |
| 177 | encoding_[length_++] = static_cast<uint8_t>(disp); |
| 178 | } |
| 179 | |
| 180 | void SetDisp32(int32_t disp) { |
| 181 | CHECK(length_ == 1 || length_ == 2); |
| 182 | int disp_size = sizeof(disp); |
| 183 | memmove(&encoding_[length_], &disp, disp_size); |
| 184 | length_ += disp_size; |
| 185 | } |
| 186 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 187 | void SetFixup(AssemblerFixup* fixup) { |
| 188 | fixup_ = fixup; |
| 189 | } |
| 190 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 191 | private: |
Ian Rogers | 790a6b7 | 2014-04-01 10:36:00 -0700 | [diff] [blame] | 192 | uint8_t rex_; |
| 193 | uint8_t length_; |
| 194 | uint8_t encoding_[6]; |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 195 | AssemblerFixup* fixup_; |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 196 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 197 | explicit Operand(CpuRegister reg) : rex_(0), length_(0), fixup_(nullptr) { SetModRM(3, reg); } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 198 | |
| 199 | // Get the operand encoding byte at the given index. |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 200 | uint8_t encoding_at(int index_in) const { |
| 201 | CHECK_GE(index_in, 0); |
| 202 | CHECK_LT(index_in, length_); |
| 203 | return encoding_[index_in]; |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 204 | } |
| 205 | |
| 206 | friend class X86_64Assembler; |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 207 | }; |
| 208 | |
| 209 | |
| 210 | class Address : public Operand { |
| 211 | public: |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 212 | Address(CpuRegister base_in, int32_t disp) { |
| 213 | Init(base_in, disp); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 214 | } |
| 215 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 216 | Address(CpuRegister base_in, Offset disp) { |
| 217 | Init(base_in, disp.Int32Value()); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 218 | } |
| 219 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 220 | Address(CpuRegister base_in, FrameOffset disp) { |
| 221 | CHECK_EQ(base_in.AsRegister(), RSP); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 222 | Init(CpuRegister(RSP), disp.Int32Value()); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 223 | } |
| 224 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 225 | Address(CpuRegister base_in, MemberOffset disp) { |
| 226 | Init(base_in, disp.Int32Value()); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 227 | } |
| 228 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 229 | void Init(CpuRegister base_in, int32_t disp) { |
Nicolas Geoffray | 784cc5c | 2014-12-18 20:25:18 +0000 | [diff] [blame] | 230 | if (disp == 0 && base_in.LowBits() != RBP) { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 231 | SetModRM(0, base_in); |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 232 | if (base_in.LowBits() == RSP) { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 233 | SetSIB(TIMES_1, CpuRegister(RSP), base_in); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 234 | } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 235 | } else if (disp >= -128 && disp <= 127) { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 236 | SetModRM(1, base_in); |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 237 | if (base_in.LowBits() == RSP) { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 238 | SetSIB(TIMES_1, CpuRegister(RSP), base_in); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 239 | } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 240 | SetDisp8(disp); |
| 241 | } else { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 242 | SetModRM(2, base_in); |
Nicolas Geoffray | 9889396 | 2015-01-21 12:32:32 +0000 | [diff] [blame] | 243 | if (base_in.LowBits() == RSP) { |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 244 | SetSIB(TIMES_1, CpuRegister(RSP), base_in); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 245 | } |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 246 | SetDisp32(disp); |
| 247 | } |
| 248 | } |
| 249 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 250 | Address(CpuRegister index_in, ScaleFactor scale_in, int32_t disp) { |
| 251 | CHECK_NE(index_in.AsRegister(), RSP); // Illegal addressing mode. |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 252 | SetModRM(0, CpuRegister(RSP)); |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 253 | SetSIB(scale_in, index_in, CpuRegister(RBP)); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 254 | SetDisp32(disp); |
| 255 | } |
| 256 | |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 257 | Address(CpuRegister base_in, CpuRegister index_in, ScaleFactor scale_in, int32_t disp) { |
| 258 | CHECK_NE(index_in.AsRegister(), RSP); // Illegal addressing mode. |
Nicolas Geoffray | 784cc5c | 2014-12-18 20:25:18 +0000 | [diff] [blame] | 259 | if (disp == 0 && base_in.LowBits() != RBP) { |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 260 | SetModRM(0, CpuRegister(RSP)); |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 261 | SetSIB(scale_in, index_in, base_in); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 262 | } else if (disp >= -128 && disp <= 127) { |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 263 | SetModRM(1, CpuRegister(RSP)); |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 264 | SetSIB(scale_in, index_in, base_in); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 265 | SetDisp8(disp); |
| 266 | } else { |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 267 | SetModRM(2, CpuRegister(RSP)); |
Andreas Gampe | 277ccbd | 2014-11-03 21:36:10 -0800 | [diff] [blame] | 268 | SetSIB(scale_in, index_in, base_in); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 269 | SetDisp32(disp); |
| 270 | } |
| 271 | } |
| 272 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 273 | // If no_rip is true then the Absolute address isn't RIP relative. |
Ian Rogers | 1373595 | 2014-10-08 12:43:28 -0700 | [diff] [blame] | 274 | static Address Absolute(uintptr_t addr, bool no_rip = false) { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 275 | Address result; |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 276 | if (no_rip) { |
| 277 | result.SetModRM(0, CpuRegister(RSP)); |
| 278 | result.SetSIB(TIMES_1, CpuRegister(RSP), CpuRegister(RBP)); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 279 | result.SetDisp32(addr); |
| 280 | } else { |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 281 | // RIP addressing is done using RBP as the base register. |
| 282 | // The value in RBP isn't used. Instead the offset is added to RIP. |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 283 | result.SetModRM(0, CpuRegister(RBP)); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 284 | result.SetDisp32(addr); |
| 285 | } |
| 286 | return result; |
| 287 | } |
| 288 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 289 | // An RIP relative address that will be fixed up later. |
| 290 | static Address RIP(AssemblerFixup* fixup) { |
| 291 | Address result; |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 292 | // RIP addressing is done using RBP as the base register. |
| 293 | // The value in RBP isn't used. Instead the offset is added to RIP. |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 294 | result.SetModRM(0, CpuRegister(RBP)); |
| 295 | result.SetDisp32(0); |
| 296 | result.SetFixup(fixup); |
| 297 | return result; |
| 298 | } |
| 299 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 300 | // If no_rip is true then the Absolute address isn't RIP relative. |
Andreas Gampe | 542451c | 2016-07-26 09:02:02 -0700 | [diff] [blame] | 301 | static Address Absolute(ThreadOffset64 addr, bool no_rip = false) { |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 302 | return Absolute(addr.Int32Value(), no_rip); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 303 | } |
| 304 | |
Ulya Trafimovich | af5d304 | 2021-06-10 15:29:21 +0100 | [diff] [blame] | 305 | // Break the address into pieces and reassemble it again with a new displacement. |
| 306 | // Note that it may require a new addressing mode if displacement size is changed. |
| 307 | static Address displace(const Address &addr, int32_t disp) { |
| 308 | const int32_t new_disp = addr.disp() + disp; |
| 309 | const bool sib = addr.rm() == RSP; |
| 310 | const bool rbp = RBP == (sib ? addr.base() : addr.rm()); |
| 311 | Address new_addr; |
| 312 | if (addr.mod() == 0 && rbp) { |
| 313 | // Special case: mod 00b and RBP in r/m or SIB base => 32-bit displacement. |
| 314 | // This case includes RIP-relative addressing. |
| 315 | new_addr.SetModRM(0, addr.cpu_rm()); |
| 316 | if (sib) { |
| 317 | new_addr.SetSIB(addr.scale(), addr.cpu_index(), addr.cpu_base()); |
| 318 | } |
| 319 | new_addr.SetDisp32(new_disp); |
| 320 | } else if (new_disp == 0 && !rbp) { |
| 321 | // Mod 00b (excluding a special case for RBP) => no displacement. |
| 322 | new_addr.SetModRM(0, addr.cpu_rm()); |
| 323 | if (sib) { |
| 324 | new_addr.SetSIB(addr.scale(), addr.cpu_index(), addr.cpu_base()); |
| 325 | } |
| 326 | } else if (new_disp >= -128 && new_disp <= 127) { |
| 327 | // Mod 01b => 8-bit displacement. |
| 328 | new_addr.SetModRM(1, addr.cpu_rm()); |
| 329 | if (sib) { |
| 330 | new_addr.SetSIB(addr.scale(), addr.cpu_index(), addr.cpu_base()); |
| 331 | } |
| 332 | new_addr.SetDisp8(new_disp); |
| 333 | } else { |
| 334 | // Mod 10b => 32-bit displacement. |
| 335 | new_addr.SetModRM(2, addr.cpu_rm()); |
| 336 | if (sib) { |
| 337 | new_addr.SetSIB(addr.scale(), addr.cpu_index(), addr.cpu_base()); |
| 338 | } |
| 339 | new_addr.SetDisp32(new_disp); |
| 340 | } |
| 341 | new_addr.SetFixup(addr.GetFixup()); |
| 342 | return new_addr; |
| 343 | } |
| 344 | |
| 345 | inline bool operator==(const Address& addr) const { |
| 346 | return static_cast<const Operand&>(*this) == static_cast<const Operand&>(addr); |
| 347 | } |
| 348 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 349 | private: |
| 350 | Address() {} |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 351 | }; |
| 352 | |
Aart Bik | f7754e8 | 2017-09-20 10:33:06 -0700 | [diff] [blame] | 353 | std::ostream& operator<<(std::ostream& os, const Address& addr); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 354 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 355 | /** |
| 356 | * Class to handle constant area values. |
| 357 | */ |
| 358 | class ConstantArea { |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 359 | public: |
Vladimir Marko | e764d2e | 2017-10-05 14:35:55 +0100 | [diff] [blame] | 360 | explicit ConstantArea(ArenaAllocator* allocator) |
| 361 | : buffer_(allocator->Adapter(kArenaAllocAssembler)) {} |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 362 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 363 | // Add a double to the constant area, returning the offset into |
| 364 | // the constant area where the literal resides. |
| 365 | size_t AddDouble(double v); |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 366 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 367 | // Add a float to the constant area, returning the offset into |
| 368 | // the constant area where the literal resides. |
| 369 | size_t AddFloat(float v); |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 370 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 371 | // Add an int32_t to the constant area, returning the offset into |
| 372 | // the constant area where the literal resides. |
| 373 | size_t AddInt32(int32_t v); |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 374 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 375 | // Add an int32_t to the end of the constant area, returning the offset into |
| 376 | // the constant area where the literal resides. |
| 377 | size_t AppendInt32(int32_t v); |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 378 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 379 | // Add an int64_t to the constant area, returning the offset into |
| 380 | // the constant area where the literal resides. |
| 381 | size_t AddInt64(int64_t v); |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 382 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 383 | size_t GetSize() const { |
| 384 | return buffer_.size() * elem_size_; |
| 385 | } |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 386 | |
Vladimir Marko | 93205e3 | 2016-04-13 11:59:46 +0100 | [diff] [blame] | 387 | ArrayRef<const int32_t> GetBuffer() const { |
| 388 | return ArrayRef<const int32_t>(buffer_); |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 389 | } |
| 390 | |
| 391 | private: |
| 392 | static constexpr size_t elem_size_ = sizeof(int32_t); |
Vladimir Marko | 93205e3 | 2016-04-13 11:59:46 +0100 | [diff] [blame] | 393 | ArenaVector<int32_t> buffer_; |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 394 | }; |
| 395 | |
| 396 | |
Mark Mendell | 73f455e | 2015-08-21 09:30:05 -0400 | [diff] [blame] | 397 | // This is equivalent to the Label class, used in a slightly different context. We |
| 398 | // inherit the functionality of the Label class, but prevent unintended |
| 399 | // derived-to-base conversions by making the base class private. |
| 400 | class NearLabel : private Label { |
| 401 | public: |
| 402 | NearLabel() : Label() {} |
| 403 | |
| 404 | // Expose the Label routines that we need. |
| 405 | using Label::Position; |
| 406 | using Label::LinkPosition; |
| 407 | using Label::IsBound; |
| 408 | using Label::IsUnused; |
| 409 | using Label::IsLinked; |
| 410 | |
| 411 | private: |
| 412 | using Label::BindTo; |
| 413 | using Label::LinkTo; |
| 414 | |
| 415 | friend class x86_64::X86_64Assembler; |
| 416 | |
| 417 | DISALLOW_COPY_AND_ASSIGN(NearLabel); |
| 418 | }; |
| 419 | |
| 420 | |
Roland Levillain | bbc6e7e | 2018-08-24 16:58:47 +0100 | [diff] [blame] | 421 | class X86_64Assembler final : public Assembler { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 422 | public: |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 423 | explicit X86_64Assembler(ArenaAllocator* allocator, |
| 424 | const X86_64InstructionSetFeatures* instruction_set_features = nullptr) |
| 425 | : Assembler(allocator), |
| 426 | constant_area_(allocator), |
| 427 | has_AVX_(instruction_set_features != nullptr ? instruction_set_features->HasAVX(): false), |
| 428 | has_AVX2_(instruction_set_features != nullptr ? instruction_set_features->HasAVX2() : false) {} |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 429 | virtual ~X86_64Assembler() {} |
| 430 | |
| 431 | /* |
| 432 | * Emit Machine Instructions. |
| 433 | */ |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 434 | void call(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 435 | void call(const Address& address); |
| 436 | void call(Label* label); |
| 437 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 438 | void pushq(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 439 | void pushq(const Address& address); |
| 440 | void pushq(const Immediate& imm); |
| 441 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 442 | void popq(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 443 | void popq(const Address& address); |
| 444 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 445 | void movq(CpuRegister dst, const Immediate& src); |
| 446 | void movl(CpuRegister dst, const Immediate& src); |
| 447 | void movq(CpuRegister dst, CpuRegister src); |
| 448 | void movl(CpuRegister dst, CpuRegister src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 449 | |
Mark Mendell | 7a08fb5 | 2015-07-15 14:09:35 -0400 | [diff] [blame] | 450 | void movntl(const Address& dst, CpuRegister src); |
| 451 | void movntq(const Address& dst, CpuRegister src); |
| 452 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 453 | void movq(CpuRegister dst, const Address& src); |
| 454 | void movl(CpuRegister dst, const Address& src); |
| 455 | void movq(const Address& dst, CpuRegister src); |
Mark Mendell | cfa410b | 2015-05-25 16:02:44 -0400 | [diff] [blame] | 456 | void movq(const Address& dst, const Immediate& imm); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 457 | void movl(const Address& dst, CpuRegister src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 458 | void movl(const Address& dst, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 459 | |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 460 | void cmov(Condition c, CpuRegister dst, CpuRegister src); // This is the 64b version. |
| 461 | void cmov(Condition c, CpuRegister dst, CpuRegister src, bool is64bit); |
Mark Mendell | abdac47 | 2016-02-12 13:49:03 -0500 | [diff] [blame] | 462 | void cmov(Condition c, CpuRegister dst, const Address& src, bool is64bit); |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 463 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 464 | void movzxb(CpuRegister dst, CpuRegister src); |
| 465 | void movzxb(CpuRegister dst, const Address& src); |
| 466 | void movsxb(CpuRegister dst, CpuRegister src); |
| 467 | void movsxb(CpuRegister dst, const Address& src); |
| 468 | void movb(CpuRegister dst, const Address& src); |
| 469 | void movb(const Address& dst, CpuRegister src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 470 | void movb(const Address& dst, const Immediate& imm); |
| 471 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 472 | void movzxw(CpuRegister dst, CpuRegister src); |
| 473 | void movzxw(CpuRegister dst, const Address& src); |
| 474 | void movsxw(CpuRegister dst, CpuRegister src); |
| 475 | void movsxw(CpuRegister dst, const Address& src); |
| 476 | void movw(CpuRegister dst, const Address& src); |
| 477 | void movw(const Address& dst, CpuRegister src); |
Nicolas Geoffray | 26a25ef | 2014-09-30 13:54:09 +0100 | [diff] [blame] | 478 | void movw(const Address& dst, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 479 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 480 | void leaq(CpuRegister dst, const Address& src); |
Nicolas Geoffray | 748f140 | 2015-01-27 08:17:54 +0000 | [diff] [blame] | 481 | void leal(CpuRegister dst, const Address& src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 482 | |
Aart Bik | c778226 | 2017-01-13 16:20:08 -0800 | [diff] [blame] | 483 | void movaps(XmmRegister dst, XmmRegister src); // move |
| 484 | void movaps(XmmRegister dst, const Address& src); // load aligned |
| 485 | void movups(XmmRegister dst, const Address& src); // load unaligned |
| 486 | void movaps(const Address& dst, XmmRegister src); // store aligned |
| 487 | void movups(const Address& dst, XmmRegister src); // store unaligned |
Nicolas Geoffray | 7fb49da | 2014-10-06 09:12:41 +0100 | [diff] [blame] | 488 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 489 | void vmovaps(XmmRegister dst, XmmRegister src); // move |
| 490 | void vmovaps(XmmRegister dst, const Address& src); // load aligned |
| 491 | void vmovaps(const Address& dst, XmmRegister src); // store aligned |
| 492 | void vmovups(XmmRegister dst, const Address& src); // load unaligned |
| 493 | void vmovups(const Address& dst, XmmRegister src); // store unaligned |
| 494 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 495 | void movss(XmmRegister dst, const Address& src); |
| 496 | void movss(const Address& dst, XmmRegister src); |
| 497 | void movss(XmmRegister dst, XmmRegister src); |
| 498 | |
Roland Levillain | dff1f28 | 2014-11-05 14:15:05 +0000 | [diff] [blame] | 499 | void movsxd(CpuRegister dst, CpuRegister src); |
| 500 | void movsxd(CpuRegister dst, const Address& src); |
| 501 | |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 502 | void movd(XmmRegister dst, CpuRegister src); // Note: this is the r64 version, formally movq. |
| 503 | void movd(CpuRegister dst, XmmRegister src); // Note: this is the r64 version, formally movq. |
| 504 | void movd(XmmRegister dst, CpuRegister src, bool is64bit); |
| 505 | void movd(CpuRegister dst, XmmRegister src, bool is64bit); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 506 | |
| 507 | void addss(XmmRegister dst, XmmRegister src); |
| 508 | void addss(XmmRegister dst, const Address& src); |
| 509 | void subss(XmmRegister dst, XmmRegister src); |
| 510 | void subss(XmmRegister dst, const Address& src); |
| 511 | void mulss(XmmRegister dst, XmmRegister src); |
| 512 | void mulss(XmmRegister dst, const Address& src); |
| 513 | void divss(XmmRegister dst, XmmRegister src); |
| 514 | void divss(XmmRegister dst, const Address& src); |
| 515 | |
Aart Bik | c778226 | 2017-01-13 16:20:08 -0800 | [diff] [blame] | 516 | void addps(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 517 | void subps(XmmRegister dst, XmmRegister src); |
| 518 | void mulps(XmmRegister dst, XmmRegister src); |
| 519 | void divps(XmmRegister dst, XmmRegister src); |
| 520 | |
Shalini Salomi Bodapati | b45a435 | 2019-07-10 16:09:41 +0530 | [diff] [blame] | 521 | void vmulps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 522 | void vmulpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 523 | void vdivps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 524 | void vdivpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 525 | |
Shalini Salomi Bodapati | 81d15be | 2019-05-30 11:00:42 +0530 | [diff] [blame] | 526 | void vaddps(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 527 | void vsubps(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 528 | void vsubpd(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 529 | void vaddpd(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 530 | |
Shalini Salomi Bodapati | 6545ee3 | 2021-11-02 20:01:06 +0530 | [diff] [blame] | 531 | void vfmadd213ss(XmmRegister accumulator, XmmRegister left, XmmRegister right); |
| 532 | void vfmadd213sd(XmmRegister accumulator, XmmRegister left, XmmRegister right); |
| 533 | |
Aart Bik | c778226 | 2017-01-13 16:20:08 -0800 | [diff] [blame] | 534 | void movapd(XmmRegister dst, XmmRegister src); // move |
| 535 | void movapd(XmmRegister dst, const Address& src); // load aligned |
| 536 | void movupd(XmmRegister dst, const Address& src); // load unaligned |
| 537 | void movapd(const Address& dst, XmmRegister src); // store aligned |
| 538 | void movupd(const Address& dst, XmmRegister src); // store unaligned |
| 539 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 540 | void vmovapd(XmmRegister dst, XmmRegister src); // move |
| 541 | void vmovapd(XmmRegister dst, const Address& src); // load aligned |
| 542 | void vmovapd(const Address& dst, XmmRegister src); // store aligned |
| 543 | void vmovupd(XmmRegister dst, const Address& src); // load unaligned |
| 544 | void vmovupd(const Address& dst, XmmRegister src); // store unaligned |
| 545 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 546 | void movsd(XmmRegister dst, const Address& src); |
| 547 | void movsd(const Address& dst, XmmRegister src); |
| 548 | void movsd(XmmRegister dst, XmmRegister src); |
| 549 | |
| 550 | void addsd(XmmRegister dst, XmmRegister src); |
| 551 | void addsd(XmmRegister dst, const Address& src); |
| 552 | void subsd(XmmRegister dst, XmmRegister src); |
| 553 | void subsd(XmmRegister dst, const Address& src); |
| 554 | void mulsd(XmmRegister dst, XmmRegister src); |
| 555 | void mulsd(XmmRegister dst, const Address& src); |
| 556 | void divsd(XmmRegister dst, XmmRegister src); |
| 557 | void divsd(XmmRegister dst, const Address& src); |
| 558 | |
Aart Bik | c778226 | 2017-01-13 16:20:08 -0800 | [diff] [blame] | 559 | void addpd(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 560 | void subpd(XmmRegister dst, XmmRegister src); |
| 561 | void mulpd(XmmRegister dst, XmmRegister src); |
| 562 | void divpd(XmmRegister dst, XmmRegister src); |
| 563 | |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 564 | void movdqa(XmmRegister dst, XmmRegister src); // move |
| 565 | void movdqa(XmmRegister dst, const Address& src); // load aligned |
| 566 | void movdqu(XmmRegister dst, const Address& src); // load unaligned |
| 567 | void movdqa(const Address& dst, XmmRegister src); // store aligned |
| 568 | void movdqu(const Address& dst, XmmRegister src); // store unaligned |
| 569 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 570 | void vmovdqa(XmmRegister dst, XmmRegister src); // move |
| 571 | void vmovdqa(XmmRegister dst, const Address& src); // load aligned |
| 572 | void vmovdqa(const Address& dst, XmmRegister src); // store aligned |
| 573 | void vmovdqu(XmmRegister dst, const Address& src); // load unaligned |
| 574 | void vmovdqu(const Address& dst, XmmRegister src); // store unaligned |
| 575 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 576 | void paddb(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 577 | void psubb(XmmRegister dst, XmmRegister src); |
| 578 | |
Shalini Salomi Bodapati | 81d15be | 2019-05-30 11:00:42 +0530 | [diff] [blame] | 579 | void vpaddb(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 580 | void vpaddw(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 581 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 582 | void paddw(XmmRegister dst, XmmRegister src); |
| 583 | void psubw(XmmRegister dst, XmmRegister src); |
| 584 | void pmullw(XmmRegister dst, XmmRegister src); |
Shalini Salomi Bodapati | b45a435 | 2019-07-10 16:09:41 +0530 | [diff] [blame] | 585 | void vpmullw(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 586 | |
Shalini Salomi Bodapati | 81d15be | 2019-05-30 11:00:42 +0530 | [diff] [blame] | 587 | void vpsubb(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 588 | void vpsubw(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 589 | void vpsubd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 590 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 591 | void paddd(XmmRegister dst, XmmRegister src); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 592 | void psubd(XmmRegister dst, XmmRegister src); |
| 593 | void pmulld(XmmRegister dst, XmmRegister src); |
Shalini Salomi Bodapati | b45a435 | 2019-07-10 16:09:41 +0530 | [diff] [blame] | 594 | void vpmulld(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 595 | |
Shalini Salomi Bodapati | 81d15be | 2019-05-30 11:00:42 +0530 | [diff] [blame] | 596 | void vpaddd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 597 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 598 | void paddq(XmmRegister dst, XmmRegister src); |
| 599 | void psubq(XmmRegister dst, XmmRegister src); |
| 600 | |
Shalini Salomi Bodapati | 81d15be | 2019-05-30 11:00:42 +0530 | [diff] [blame] | 601 | void vpaddq(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 602 | void vpsubq(XmmRegister dst, XmmRegister add_left, XmmRegister add_right); |
| 603 | |
Aart Bik | 4ca1735 | 2018-03-07 15:47:39 -0800 | [diff] [blame] | 604 | void paddusb(XmmRegister dst, XmmRegister src); |
| 605 | void paddsb(XmmRegister dst, XmmRegister src); |
| 606 | void paddusw(XmmRegister dst, XmmRegister src); |
| 607 | void paddsw(XmmRegister dst, XmmRegister src); |
| 608 | void psubusb(XmmRegister dst, XmmRegister src); |
| 609 | void psubsb(XmmRegister dst, XmmRegister src); |
| 610 | void psubusw(XmmRegister dst, XmmRegister src); |
| 611 | void psubsw(XmmRegister dst, XmmRegister src); |
| 612 | |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 613 | void cvtsi2ss(XmmRegister dst, CpuRegister src); // Note: this is the r/m32 version. |
Roland Levillain | 6d0e483 | 2014-11-27 18:31:21 +0000 | [diff] [blame] | 614 | void cvtsi2ss(XmmRegister dst, CpuRegister src, bool is64bit); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 615 | void cvtsi2ss(XmmRegister dst, const Address& src, bool is64bit); |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 616 | void cvtsi2sd(XmmRegister dst, CpuRegister src); // Note: this is the r/m32 version. |
Roland Levillain | 647b9ed | 2014-11-27 12:06:00 +0000 | [diff] [blame] | 617 | void cvtsi2sd(XmmRegister dst, CpuRegister src, bool is64bit); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 618 | void cvtsi2sd(XmmRegister dst, const Address& src, bool is64bit); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 619 | |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 620 | void cvtss2si(CpuRegister dst, XmmRegister src); // Note: this is the r32 version. |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 621 | void cvtss2sd(XmmRegister dst, XmmRegister src); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 622 | void cvtss2sd(XmmRegister dst, const Address& src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 623 | |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 624 | void cvtsd2si(CpuRegister dst, XmmRegister src); // Note: this is the r32 version. |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 625 | void cvtsd2ss(XmmRegister dst, XmmRegister src); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 626 | void cvtsd2ss(XmmRegister dst, const Address& src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 627 | |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 628 | void cvttss2si(CpuRegister dst, XmmRegister src); // Note: this is the r32 version. |
Roland Levillain | 624279f | 2014-12-04 11:54:28 +0000 | [diff] [blame] | 629 | void cvttss2si(CpuRegister dst, XmmRegister src, bool is64bit); |
Andreas Gampe | 851df20 | 2014-11-12 14:05:46 -0800 | [diff] [blame] | 630 | void cvttsd2si(CpuRegister dst, XmmRegister src); // Note: this is the r32 version. |
Roland Levillain | 4c0b61f | 2014-12-05 12:06:01 +0000 | [diff] [blame] | 631 | void cvttsd2si(CpuRegister dst, XmmRegister src, bool is64bit); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 632 | |
Aart Bik | 3ae3b59 | 2017-02-24 14:09:15 -0800 | [diff] [blame] | 633 | void cvtdq2ps(XmmRegister dst, XmmRegister src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 634 | void cvtdq2pd(XmmRegister dst, XmmRegister src); |
| 635 | |
| 636 | void comiss(XmmRegister a, XmmRegister b); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 637 | void comiss(XmmRegister a, const Address& b); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 638 | void comisd(XmmRegister a, XmmRegister b); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 639 | void comisd(XmmRegister a, const Address& b); |
Calin Juravle | ddb7df2 | 2014-11-25 20:56:51 +0000 | [diff] [blame] | 640 | void ucomiss(XmmRegister a, XmmRegister b); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 641 | void ucomiss(XmmRegister a, const Address& b); |
Calin Juravle | ddb7df2 | 2014-11-25 20:56:51 +0000 | [diff] [blame] | 642 | void ucomisd(XmmRegister a, XmmRegister b); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 643 | void ucomisd(XmmRegister a, const Address& b); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 644 | |
Mark Mendell | fb8d279 | 2015-03-31 22:16:59 -0400 | [diff] [blame] | 645 | void roundsd(XmmRegister dst, XmmRegister src, const Immediate& imm); |
| 646 | void roundss(XmmRegister dst, XmmRegister src, const Immediate& imm); |
| 647 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 648 | void sqrtsd(XmmRegister dst, XmmRegister src); |
| 649 | void sqrtss(XmmRegister dst, XmmRegister src); |
| 650 | |
| 651 | void xorpd(XmmRegister dst, const Address& src); |
| 652 | void xorpd(XmmRegister dst, XmmRegister src); |
| 653 | void xorps(XmmRegister dst, const Address& src); |
| 654 | void xorps(XmmRegister dst, XmmRegister src); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 655 | void pxor(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
Neeraj Solanki | 48349ad | 2019-08-05 23:16:56 +0530 | [diff] [blame] | 656 | void vpxor(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 657 | void vxorps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 658 | void vxorpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 659 | |
| 660 | void andpd(XmmRegister dst, const Address& src); |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 661 | void andpd(XmmRegister dst, XmmRegister src); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 662 | void andps(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 663 | void pand(XmmRegister dst, XmmRegister src); |
Neeraj Solanki | 48349ad | 2019-08-05 23:16:56 +0530 | [diff] [blame] | 664 | void vpand(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 665 | void vandps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 666 | void vandpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 667 | |
Shalini Salomi Bodapati | 8e5bc2d | 2018-10-24 11:50:56 +0530 | [diff] [blame] | 668 | void andn(CpuRegister dst, CpuRegister src1, CpuRegister src2); |
Aart Bik | 21c580b | 2017-03-13 11:52:07 -0700 | [diff] [blame] | 669 | void andnpd(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 670 | void andnps(XmmRegister dst, XmmRegister src); |
| 671 | void pandn(XmmRegister dst, XmmRegister src); |
Neeraj Solanki | 48349ad | 2019-08-05 23:16:56 +0530 | [diff] [blame] | 672 | void vpandn(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 673 | void vandnps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 674 | void vandnpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Aart Bik | 21c580b | 2017-03-13 11:52:07 -0700 | [diff] [blame] | 675 | |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 676 | void orpd(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 677 | void orps(XmmRegister dst, XmmRegister src); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 678 | void por(XmmRegister dst, XmmRegister src); |
Neeraj Solanki | 48349ad | 2019-08-05 23:16:56 +0530 | [diff] [blame] | 679 | void vpor(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 680 | void vorps(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
| 681 | void vorpd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 682 | |
Aart Bik | 67d3fd7 | 2017-03-31 15:11:53 -0700 | [diff] [blame] | 683 | void pavgb(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 684 | void pavgw(XmmRegister dst, XmmRegister src); |
Aart Bik | 6005a87 | 2017-07-24 13:33:39 -0700 | [diff] [blame] | 685 | void psadbw(XmmRegister dst, XmmRegister src); |
| 686 | void pmaddwd(XmmRegister dst, XmmRegister src); |
Alex Light | 43f2f75 | 2019-12-04 17:48:45 +0000 | [diff] [blame] | 687 | void vpmaddwd(XmmRegister dst, XmmRegister src1, XmmRegister src2); |
Aart Bik | 6005a87 | 2017-07-24 13:33:39 -0700 | [diff] [blame] | 688 | void phaddw(XmmRegister dst, XmmRegister src); |
| 689 | void phaddd(XmmRegister dst, XmmRegister src); |
| 690 | void haddps(XmmRegister dst, XmmRegister src); |
| 691 | void haddpd(XmmRegister dst, XmmRegister src); |
| 692 | void phsubw(XmmRegister dst, XmmRegister src); |
| 693 | void phsubd(XmmRegister dst, XmmRegister src); |
| 694 | void hsubps(XmmRegister dst, XmmRegister src); |
| 695 | void hsubpd(XmmRegister dst, XmmRegister src); |
Aart Bik | 67d3fd7 | 2017-03-31 15:11:53 -0700 | [diff] [blame] | 696 | |
Aart Bik | c8e93c7 | 2017-05-10 10:49:22 -0700 | [diff] [blame] | 697 | void pminsb(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 698 | void pmaxsb(XmmRegister dst, XmmRegister src); |
| 699 | void pminsw(XmmRegister dst, XmmRegister src); |
| 700 | void pmaxsw(XmmRegister dst, XmmRegister src); |
| 701 | void pminsd(XmmRegister dst, XmmRegister src); |
| 702 | void pmaxsd(XmmRegister dst, XmmRegister src); |
| 703 | |
| 704 | void pminub(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 705 | void pmaxub(XmmRegister dst, XmmRegister src); |
| 706 | void pminuw(XmmRegister dst, XmmRegister src); |
| 707 | void pmaxuw(XmmRegister dst, XmmRegister src); |
| 708 | void pminud(XmmRegister dst, XmmRegister src); |
| 709 | void pmaxud(XmmRegister dst, XmmRegister src); |
| 710 | |
| 711 | void minps(XmmRegister dst, XmmRegister src); // no addr variant (for now) |
| 712 | void maxps(XmmRegister dst, XmmRegister src); |
| 713 | void minpd(XmmRegister dst, XmmRegister src); |
| 714 | void maxpd(XmmRegister dst, XmmRegister src); |
| 715 | |
Aart Bik | 4b45533 | 2017-03-15 11:19:35 -0700 | [diff] [blame] | 716 | void pcmpeqb(XmmRegister dst, XmmRegister src); |
| 717 | void pcmpeqw(XmmRegister dst, XmmRegister src); |
| 718 | void pcmpeqd(XmmRegister dst, XmmRegister src); |
| 719 | void pcmpeqq(XmmRegister dst, XmmRegister src); |
| 720 | |
Aart Bik | 8939c64 | 2017-04-03 14:09:01 -0700 | [diff] [blame] | 721 | void pcmpgtb(XmmRegister dst, XmmRegister src); |
| 722 | void pcmpgtw(XmmRegister dst, XmmRegister src); |
| 723 | void pcmpgtd(XmmRegister dst, XmmRegister src); |
| 724 | void pcmpgtq(XmmRegister dst, XmmRegister src); // SSE4.2 |
| 725 | |
Aart Bik | 12e06ed | 2017-01-31 16:11:24 -0800 | [diff] [blame] | 726 | void shufpd(XmmRegister dst, XmmRegister src, const Immediate& imm); |
| 727 | void shufps(XmmRegister dst, XmmRegister src, const Immediate& imm); |
Aart Bik | 68555e9 | 2017-02-13 14:28:45 -0800 | [diff] [blame] | 728 | void pshufd(XmmRegister dst, XmmRegister src, const Immediate& imm); |
Aart Bik | 12e06ed | 2017-01-31 16:11:24 -0800 | [diff] [blame] | 729 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 730 | void punpcklbw(XmmRegister dst, XmmRegister src); |
| 731 | void punpcklwd(XmmRegister dst, XmmRegister src); |
| 732 | void punpckldq(XmmRegister dst, XmmRegister src); |
| 733 | void punpcklqdq(XmmRegister dst, XmmRegister src); |
| 734 | |
Aart Bik | 3332db8 | 2017-08-11 15:10:30 -0700 | [diff] [blame] | 735 | void punpckhbw(XmmRegister dst, XmmRegister src); |
| 736 | void punpckhwd(XmmRegister dst, XmmRegister src); |
| 737 | void punpckhdq(XmmRegister dst, XmmRegister src); |
| 738 | void punpckhqdq(XmmRegister dst, XmmRegister src); |
| 739 | |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 740 | void psllw(XmmRegister reg, const Immediate& shift_count); |
| 741 | void pslld(XmmRegister reg, const Immediate& shift_count); |
| 742 | void psllq(XmmRegister reg, const Immediate& shift_count); |
| 743 | |
| 744 | void psraw(XmmRegister reg, const Immediate& shift_count); |
| 745 | void psrad(XmmRegister reg, const Immediate& shift_count); |
| 746 | // no psraq |
| 747 | |
| 748 | void psrlw(XmmRegister reg, const Immediate& shift_count); |
| 749 | void psrld(XmmRegister reg, const Immediate& shift_count); |
| 750 | void psrlq(XmmRegister reg, const Immediate& shift_count); |
Aart Bik | 3332db8 | 2017-08-11 15:10:30 -0700 | [diff] [blame] | 751 | void psrldq(XmmRegister reg, const Immediate& shift_count); |
Aart Bik | e69d7a9 | 2017-02-17 11:48:23 -0800 | [diff] [blame] | 752 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 753 | void flds(const Address& src); |
| 754 | void fstps(const Address& dst); |
Mark Mendell | 24f2dfa | 2015-01-14 19:51:45 -0500 | [diff] [blame] | 755 | void fsts(const Address& dst); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 756 | |
| 757 | void fldl(const Address& src); |
| 758 | void fstpl(const Address& dst); |
Mark Mendell | 24f2dfa | 2015-01-14 19:51:45 -0500 | [diff] [blame] | 759 | void fstl(const Address& dst); |
| 760 | |
| 761 | void fstsw(); |
| 762 | |
| 763 | void fucompp(); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 764 | |
| 765 | void fnstcw(const Address& dst); |
| 766 | void fldcw(const Address& src); |
| 767 | |
| 768 | void fistpl(const Address& dst); |
| 769 | void fistps(const Address& dst); |
| 770 | void fildl(const Address& src); |
Roland Levillain | 0a18601 | 2015-04-13 17:00:20 +0100 | [diff] [blame] | 771 | void filds(const Address& src); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 772 | |
| 773 | void fincstp(); |
| 774 | void ffree(const Immediate& index); |
| 775 | |
| 776 | void fsin(); |
| 777 | void fcos(); |
| 778 | void fptan(); |
Mark Mendell | 24f2dfa | 2015-01-14 19:51:45 -0500 | [diff] [blame] | 779 | void fprem(); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 780 | |
Ulya Trafimovich | cd8286f | 2021-07-12 16:40:16 +0100 | [diff] [blame] | 781 | void xchgb(CpuRegister dst, CpuRegister src); |
| 782 | void xchgb(CpuRegister reg, const Address& address); |
| 783 | |
| 784 | void xchgw(CpuRegister dst, CpuRegister src); |
| 785 | void xchgw(CpuRegister reg, const Address& address); |
| 786 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 787 | void xchgl(CpuRegister dst, CpuRegister src); |
| 788 | void xchgl(CpuRegister reg, const Address& address); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 789 | |
Ulya Trafimovich | cd8286f | 2021-07-12 16:40:16 +0100 | [diff] [blame] | 790 | void xchgq(CpuRegister dst, CpuRegister src); |
| 791 | void xchgq(CpuRegister reg, const Address& address); |
| 792 | |
Ulya Trafimovich | 5d446a3 | 2021-07-20 15:51:48 +0100 | [diff] [blame] | 793 | void xaddb(CpuRegister dst, CpuRegister src); |
| 794 | void xaddb(const Address& address, CpuRegister reg); |
| 795 | |
| 796 | void xaddw(CpuRegister dst, CpuRegister src); |
| 797 | void xaddw(const Address& address, CpuRegister reg); |
| 798 | |
| 799 | void xaddl(CpuRegister dst, CpuRegister src); |
| 800 | void xaddl(const Address& address, CpuRegister reg); |
| 801 | |
| 802 | void xaddq(CpuRegister dst, CpuRegister src); |
| 803 | void xaddq(const Address& address, CpuRegister reg); |
| 804 | |
Serguei Katkov | 3b62593 | 2016-05-06 10:24:17 +0600 | [diff] [blame] | 805 | void cmpb(const Address& address, const Immediate& imm); |
Nicolas Geoffray | 3c04974 | 2014-09-24 18:10:46 +0100 | [diff] [blame] | 806 | void cmpw(const Address& address, const Immediate& imm); |
| 807 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 808 | void cmpl(CpuRegister reg, const Immediate& imm); |
| 809 | void cmpl(CpuRegister reg0, CpuRegister reg1); |
| 810 | void cmpl(CpuRegister reg, const Address& address); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 811 | void cmpl(const Address& address, CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 812 | void cmpl(const Address& address, const Immediate& imm); |
| 813 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 814 | void cmpq(CpuRegister reg0, CpuRegister reg1); |
Nicolas Geoffray | 96f89a2 | 2014-07-11 10:57:49 +0100 | [diff] [blame] | 815 | void cmpq(CpuRegister reg0, const Immediate& imm); |
| 816 | void cmpq(CpuRegister reg0, const Address& address); |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 817 | void cmpq(const Address& address, const Immediate& imm); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 818 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 819 | void testl(CpuRegister reg1, CpuRegister reg2); |
Calin Juravle | cd6dffe | 2015-01-08 17:35:35 +0000 | [diff] [blame] | 820 | void testl(CpuRegister reg, const Address& address); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 821 | void testl(CpuRegister reg, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 822 | |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 823 | void testq(CpuRegister reg1, CpuRegister reg2); |
Nicolas Geoffray | f12feb8 | 2014-07-17 18:32:41 +0100 | [diff] [blame] | 824 | void testq(CpuRegister reg, const Address& address); |
| 825 | |
Vladimir Marko | 953437b | 2016-08-24 08:30:46 +0000 | [diff] [blame] | 826 | void testb(const Address& address, const Immediate& imm); |
| 827 | void testl(const Address& address, const Immediate& imm); |
| 828 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 829 | void andl(CpuRegister dst, const Immediate& imm); |
| 830 | void andl(CpuRegister dst, CpuRegister src); |
Nicolas Geoffray | 9574c4b | 2014-11-12 13:19:37 +0000 | [diff] [blame] | 831 | void andl(CpuRegister reg, const Address& address); |
Nicolas Geoffray | 412f10c | 2014-06-19 10:00:34 +0100 | [diff] [blame] | 832 | void andq(CpuRegister dst, const Immediate& imm); |
Nicolas Geoffray | 9574c4b | 2014-11-12 13:19:37 +0000 | [diff] [blame] | 833 | void andq(CpuRegister dst, CpuRegister src); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 834 | void andq(CpuRegister reg, const Address& address); |
Nicolas Geoffray | 9e5ad47 | 2020-08-26 15:27:38 +0100 | [diff] [blame] | 835 | void andw(const Address& address, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 836 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 837 | void orl(CpuRegister dst, const Immediate& imm); |
| 838 | void orl(CpuRegister dst, CpuRegister src); |
Nicolas Geoffray | 9574c4b | 2014-11-12 13:19:37 +0000 | [diff] [blame] | 839 | void orl(CpuRegister reg, const Address& address); |
| 840 | void orq(CpuRegister dst, CpuRegister src); |
Mark Mendell | 3f6c7f6 | 2015-03-13 13:47:53 -0400 | [diff] [blame] | 841 | void orq(CpuRegister dst, const Immediate& imm); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 842 | void orq(CpuRegister reg, const Address& address); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 843 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 844 | void xorl(CpuRegister dst, CpuRegister src); |
Nicolas Geoffray | 9574c4b | 2014-11-12 13:19:37 +0000 | [diff] [blame] | 845 | void xorl(CpuRegister dst, const Immediate& imm); |
| 846 | void xorl(CpuRegister reg, const Address& address); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 847 | void xorq(CpuRegister dst, const Immediate& imm); |
Nicolas Geoffray | 412f10c | 2014-06-19 10:00:34 +0100 | [diff] [blame] | 848 | void xorq(CpuRegister dst, CpuRegister src); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 849 | void xorq(CpuRegister reg, const Address& address); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 850 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 851 | void addl(CpuRegister dst, CpuRegister src); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 852 | void addl(CpuRegister reg, const Immediate& imm); |
| 853 | void addl(CpuRegister reg, const Address& address); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 854 | void addl(const Address& address, CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 855 | void addl(const Address& address, const Immediate& imm); |
Nicolas Geoffray | ded5594 | 2018-01-26 16:33:41 +0000 | [diff] [blame] | 856 | void addw(const Address& address, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 857 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 858 | void addq(CpuRegister reg, const Immediate& imm); |
| 859 | void addq(CpuRegister dst, CpuRegister src); |
Nicolas Geoffray | 96f89a2 | 2014-07-11 10:57:49 +0100 | [diff] [blame] | 860 | void addq(CpuRegister dst, const Address& address); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 861 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 862 | void subl(CpuRegister dst, CpuRegister src); |
| 863 | void subl(CpuRegister reg, const Immediate& imm); |
| 864 | void subl(CpuRegister reg, const Address& address); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 865 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 866 | void subq(CpuRegister reg, const Immediate& imm); |
| 867 | void subq(CpuRegister dst, CpuRegister src); |
Nicolas Geoffray | 96f89a2 | 2014-07-11 10:57:49 +0100 | [diff] [blame] | 868 | void subq(CpuRegister dst, const Address& address); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 869 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 870 | void cdq(); |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 871 | void cqo(); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 872 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 873 | void idivl(CpuRegister reg); |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 874 | void idivq(CpuRegister reg); |
Vladimir Marko | be7fe3b | 2020-07-09 10:58:12 +0100 | [diff] [blame] | 875 | void divl(CpuRegister reg); |
| 876 | void divq(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 877 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 878 | void imull(CpuRegister dst, CpuRegister src); |
| 879 | void imull(CpuRegister reg, const Immediate& imm); |
Mark Mendell | 4a2aa4a | 2015-07-27 16:13:10 -0400 | [diff] [blame] | 880 | void imull(CpuRegister dst, CpuRegister src, const Immediate& imm); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 881 | void imull(CpuRegister reg, const Address& address); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 882 | |
Guillaume Sanchez | 0f88e87 | 2015-03-30 17:55:45 +0100 | [diff] [blame] | 883 | void imulq(CpuRegister src); |
Calin Juravle | 34bacdf | 2014-10-07 20:23:36 +0100 | [diff] [blame] | 884 | void imulq(CpuRegister dst, CpuRegister src); |
| 885 | void imulq(CpuRegister reg, const Immediate& imm); |
| 886 | void imulq(CpuRegister reg, const Address& address); |
Mark Mendell | 3f6c7f6 | 2015-03-13 13:47:53 -0400 | [diff] [blame] | 887 | void imulq(CpuRegister dst, CpuRegister reg, const Immediate& imm); |
Calin Juravle | 34bacdf | 2014-10-07 20:23:36 +0100 | [diff] [blame] | 888 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 889 | void imull(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 890 | void imull(const Address& address); |
| 891 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 892 | void mull(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 893 | void mull(const Address& address); |
| 894 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 895 | void shll(CpuRegister reg, const Immediate& imm); |
| 896 | void shll(CpuRegister operand, CpuRegister shifter); |
| 897 | void shrl(CpuRegister reg, const Immediate& imm); |
| 898 | void shrl(CpuRegister operand, CpuRegister shifter); |
| 899 | void sarl(CpuRegister reg, const Immediate& imm); |
| 900 | void sarl(CpuRegister operand, CpuRegister shifter); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 901 | |
Calin Juravle | 9aec02f | 2014-11-18 23:06:35 +0000 | [diff] [blame] | 902 | void shlq(CpuRegister reg, const Immediate& imm); |
| 903 | void shlq(CpuRegister operand, CpuRegister shifter); |
Nicolas Geoffray | 1a43dd7 | 2014-07-17 15:15:34 +0100 | [diff] [blame] | 904 | void shrq(CpuRegister reg, const Immediate& imm); |
Calin Juravle | 9aec02f | 2014-11-18 23:06:35 +0000 | [diff] [blame] | 905 | void shrq(CpuRegister operand, CpuRegister shifter); |
| 906 | void sarq(CpuRegister reg, const Immediate& imm); |
| 907 | void sarq(CpuRegister operand, CpuRegister shifter); |
Nicolas Geoffray | 1a43dd7 | 2014-07-17 15:15:34 +0100 | [diff] [blame] | 908 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 909 | void negl(CpuRegister reg); |
Roland Levillain | 2e07b4f | 2014-10-23 18:12:09 +0100 | [diff] [blame] | 910 | void negq(CpuRegister reg); |
Roland Levillain | 7056643 | 2014-10-24 16:20:17 +0100 | [diff] [blame] | 911 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 912 | void notl(CpuRegister reg); |
Roland Levillain | 7056643 | 2014-10-24 16:20:17 +0100 | [diff] [blame] | 913 | void notq(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 914 | |
| 915 | void enter(const Immediate& imm); |
| 916 | void leave(); |
| 917 | |
| 918 | void ret(); |
| 919 | void ret(const Immediate& imm); |
| 920 | |
| 921 | void nop(); |
| 922 | void int3(); |
| 923 | void hlt(); |
| 924 | |
| 925 | void j(Condition condition, Label* label); |
Mark Mendell | 73f455e | 2015-08-21 09:30:05 -0400 | [diff] [blame] | 926 | void j(Condition condition, NearLabel* label); |
| 927 | void jrcxz(NearLabel* label); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 928 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 929 | void jmp(CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 930 | void jmp(const Address& address); |
| 931 | void jmp(Label* label); |
Mark Mendell | 73f455e | 2015-08-21 09:30:05 -0400 | [diff] [blame] | 932 | void jmp(NearLabel* label); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 933 | |
| 934 | X86_64Assembler* lock(); |
Ulya Trafimovich | 5b8eb16 | 2021-06-28 12:38:20 +0100 | [diff] [blame] | 935 | void cmpxchgb(const Address& address, CpuRegister reg); |
| 936 | void cmpxchgw(const Address& address, CpuRegister reg); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 937 | void cmpxchgl(const Address& address, CpuRegister reg); |
Mark Mendell | 58d25fd | 2015-04-03 14:52:31 -0400 | [diff] [blame] | 938 | void cmpxchgq(const Address& address, CpuRegister reg); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 939 | |
| 940 | void mfence(); |
| 941 | |
| 942 | X86_64Assembler* gs(); |
| 943 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 944 | void setcc(Condition condition, CpuRegister dst); |
| 945 | |
Andreas Gampe | 71fb52f | 2014-12-29 17:43:08 -0800 | [diff] [blame] | 946 | void bswapl(CpuRegister dst); |
| 947 | void bswapq(CpuRegister dst); |
| 948 | |
Mark Mendell | bcee092 | 2015-09-15 21:45:01 -0400 | [diff] [blame] | 949 | void bsfl(CpuRegister dst, CpuRegister src); |
| 950 | void bsfl(CpuRegister dst, const Address& src); |
| 951 | void bsfq(CpuRegister dst, CpuRegister src); |
| 952 | void bsfq(CpuRegister dst, const Address& src); |
| 953 | |
Shalini Salomi Bodapati | 8e5bc2d | 2018-10-24 11:50:56 +0530 | [diff] [blame] | 954 | void blsi(CpuRegister dst, CpuRegister src); // no addr variant (for now) |
| 955 | void blsmsk(CpuRegister dst, CpuRegister src); // no addr variant (for now) |
| 956 | void blsr(CpuRegister dst, CpuRegister src); // no addr variant (for now) |
| 957 | |
Mark Mendell | 8ae3ffb | 2015-08-12 21:16:41 -0400 | [diff] [blame] | 958 | void bsrl(CpuRegister dst, CpuRegister src); |
| 959 | void bsrl(CpuRegister dst, const Address& src); |
| 960 | void bsrq(CpuRegister dst, CpuRegister src); |
| 961 | void bsrq(CpuRegister dst, const Address& src); |
| 962 | |
Aart Bik | 3f67e69 | 2016-01-15 14:35:12 -0800 | [diff] [blame] | 963 | void popcntl(CpuRegister dst, CpuRegister src); |
| 964 | void popcntl(CpuRegister dst, const Address& src); |
| 965 | void popcntq(CpuRegister dst, CpuRegister src); |
| 966 | void popcntq(CpuRegister dst, const Address& src); |
| 967 | |
Mark Mendell | bcee092 | 2015-09-15 21:45:01 -0400 | [diff] [blame] | 968 | void rorl(CpuRegister reg, const Immediate& imm); |
| 969 | void rorl(CpuRegister operand, CpuRegister shifter); |
| 970 | void roll(CpuRegister reg, const Immediate& imm); |
| 971 | void roll(CpuRegister operand, CpuRegister shifter); |
| 972 | |
| 973 | void rorq(CpuRegister reg, const Immediate& imm); |
| 974 | void rorq(CpuRegister operand, CpuRegister shifter); |
| 975 | void rolq(CpuRegister reg, const Immediate& imm); |
| 976 | void rolq(CpuRegister operand, CpuRegister shifter); |
| 977 | |
jessicahandojo | b03d640 | 2016-09-07 12:16:53 -0700 | [diff] [blame] | 978 | void repne_scasb(); |
Andreas Gampe | 21030dd | 2015-05-07 14:46:15 -0700 | [diff] [blame] | 979 | void repne_scasw(); |
agicsaki | 71311f8 | 2015-07-27 11:34:13 -0700 | [diff] [blame] | 980 | void repe_cmpsw(); |
agicsaki | 970abfb | 2015-07-31 10:31:14 -0700 | [diff] [blame] | 981 | void repe_cmpsl(); |
agicsaki | 3fd0e6a | 2015-08-03 20:14:29 -0700 | [diff] [blame] | 982 | void repe_cmpsq(); |
Mark Mendell | b9c4bbe | 2015-07-01 14:26:52 -0400 | [diff] [blame] | 983 | void rep_movsw(); |
Shalini Salomi Bodapati | 927a996 | 2022-02-11 18:01:22 +0530 | [diff] [blame] | 984 | void rep_movsb(); |
| 985 | void rep_movsl(); |
Andreas Gampe | 21030dd | 2015-05-07 14:46:15 -0700 | [diff] [blame] | 986 | |
Ulya Trafimovich | 06ed744 | 2021-11-19 12:22:49 +0000 | [diff] [blame] | 987 | void ud2(); |
| 988 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 989 | // |
| 990 | // Macros for High-level operations. |
| 991 | // |
| 992 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 993 | void AddImmediate(CpuRegister reg, const Immediate& imm); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 994 | |
| 995 | void LoadDoubleConstant(XmmRegister dst, double value); |
| 996 | |
Ulya Trafimovich | 5b8eb16 | 2021-06-28 12:38:20 +0100 | [diff] [blame] | 997 | void LockCmpxchgb(const Address& address, CpuRegister reg) { |
| 998 | lock()->cmpxchgb(address, reg); |
| 999 | } |
| 1000 | |
| 1001 | void LockCmpxchgw(const Address& address, CpuRegister reg) { |
| 1002 | AssemblerBuffer::EnsureCapacity ensured(&buffer_); |
| 1003 | // We make sure that the operand size override bytecode is emited before the lock bytecode. |
| 1004 | // We test against clang which enforces this bytecode order. |
| 1005 | EmitOperandSizeOverride(); |
| 1006 | EmitUint8(0xF0); |
| 1007 | EmitOptionalRex32(reg, address); |
| 1008 | EmitUint8(0x0F); |
| 1009 | EmitUint8(0xB1); |
| 1010 | EmitOperand(reg.LowBits(), address); |
| 1011 | } |
| 1012 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1013 | void LockCmpxchgl(const Address& address, CpuRegister reg) { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1014 | lock()->cmpxchgl(address, reg); |
| 1015 | } |
| 1016 | |
Mark Mendell | 58d25fd | 2015-04-03 14:52:31 -0400 | [diff] [blame] | 1017 | void LockCmpxchgq(const Address& address, CpuRegister reg) { |
| 1018 | lock()->cmpxchgq(address, reg); |
| 1019 | } |
| 1020 | |
Ulya Trafimovich | 244f22b | 2021-07-20 16:56:30 +0100 | [diff] [blame] | 1021 | void LockXaddb(const Address& address, CpuRegister reg) { |
| 1022 | lock()->xaddb(address, reg); |
| 1023 | } |
| 1024 | |
| 1025 | void LockXaddw(const Address& address, CpuRegister reg) { |
| 1026 | AssemblerBuffer::EnsureCapacity ensured(&buffer_); |
| 1027 | // We make sure that the operand size override bytecode is emited before the lock bytecode. |
| 1028 | // We test against clang which enforces this bytecode order. |
| 1029 | EmitOperandSizeOverride(); |
| 1030 | EmitUint8(0xF0); |
| 1031 | EmitOptionalRex32(reg, address); |
| 1032 | EmitUint8(0x0F); |
| 1033 | EmitUint8(0xC1); |
| 1034 | EmitOperand(reg.LowBits(), address); |
| 1035 | } |
| 1036 | |
| 1037 | void LockXaddl(const Address& address, CpuRegister reg) { |
| 1038 | lock()->xaddl(address, reg); |
| 1039 | } |
| 1040 | |
| 1041 | void LockXaddq(const Address& address, CpuRegister reg) { |
| 1042 | lock()->xaddq(address, reg); |
| 1043 | } |
| 1044 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1045 | // |
| 1046 | // Misc. functionality |
| 1047 | // |
| 1048 | int PreferredLoopAlignment() { return 16; } |
| 1049 | void Align(int alignment, int offset); |
Roland Levillain | bbc6e7e | 2018-08-24 16:58:47 +0100 | [diff] [blame] | 1050 | void Bind(Label* label) override; |
| 1051 | void Jump(Label* label) override { |
Andreas Gampe | 85b62f2 | 2015-09-09 13:15:38 -0700 | [diff] [blame] | 1052 | jmp(label); |
| 1053 | } |
Mark Mendell | 73f455e | 2015-08-21 09:30:05 -0400 | [diff] [blame] | 1054 | void Bind(NearLabel* label); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1055 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1056 | // Add a double to the constant area, returning the offset into |
| 1057 | // the constant area where the literal resides. |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 1058 | size_t AddDouble(double v) { return constant_area_.AddDouble(v); } |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1059 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1060 | // Add a float to the constant area, returning the offset into |
| 1061 | // the constant area where the literal resides. |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 1062 | size_t AddFloat(float v) { return constant_area_.AddFloat(v); } |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1063 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1064 | // Add an int32_t to the constant area, returning the offset into |
| 1065 | // the constant area where the literal resides. |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 1066 | size_t AddInt32(int32_t v) { |
| 1067 | return constant_area_.AddInt32(v); |
| 1068 | } |
| 1069 | |
| 1070 | // Add an int32_t to the end of the constant area, returning the offset into |
| 1071 | // the constant area where the literal resides. |
| 1072 | size_t AppendInt32(int32_t v) { |
| 1073 | return constant_area_.AppendInt32(v); |
| 1074 | } |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1075 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1076 | // Add an int64_t to the constant area, returning the offset into |
| 1077 | // the constant area where the literal resides. |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 1078 | size_t AddInt64(int64_t v) { return constant_area_.AddInt64(v); } |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1079 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1080 | // Add the contents of the constant area to the assembler buffer. |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1081 | void AddConstantArea(); |
| 1082 | |
Mark Mendell | 39dcf55 | 2015-04-09 20:42:42 -0400 | [diff] [blame] | 1083 | // Is the constant area empty? Return true if there are no literals in the constant area. |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1084 | bool IsConstantAreaEmpty() const { return constant_area_.GetSize() == 0; } |
| 1085 | |
Mark Mendell | 9c86b48 | 2015-09-18 13:36:07 -0400 | [diff] [blame] | 1086 | // Return the current size of the constant area. |
| 1087 | size_t ConstantAreaSize() const { return constant_area_.GetSize(); } |
| 1088 | |
Roland Levillain | 4d02711 | 2015-07-01 15:41:14 +0100 | [diff] [blame] | 1089 | // |
| 1090 | // Heap poisoning. |
| 1091 | // |
| 1092 | |
| 1093 | // Poison a heap reference contained in `reg`. |
| 1094 | void PoisonHeapReference(CpuRegister reg) { negl(reg); } |
| 1095 | // Unpoison a heap reference contained in `reg`. |
| 1096 | void UnpoisonHeapReference(CpuRegister reg) { negl(reg); } |
Roland Levillain | 0b671c0 | 2016-08-19 12:02:34 +0100 | [diff] [blame] | 1097 | // Poison a heap reference contained in `reg` if heap poisoning is enabled. |
| 1098 | void MaybePoisonHeapReference(CpuRegister reg) { |
| 1099 | if (kPoisonHeapReferences) { |
| 1100 | PoisonHeapReference(reg); |
| 1101 | } |
| 1102 | } |
Roland Levillain | 4d02711 | 2015-07-01 15:41:14 +0100 | [diff] [blame] | 1103 | // Unpoison a heap reference contained in `reg` if heap poisoning is enabled. |
| 1104 | void MaybeUnpoisonHeapReference(CpuRegister reg) { |
| 1105 | if (kPoisonHeapReferences) { |
| 1106 | UnpoisonHeapReference(reg); |
| 1107 | } |
| 1108 | } |
| 1109 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 1110 | bool CpuHasAVXorAVX2FeatureFlag(); |
| 1111 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1112 | private: |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1113 | void EmitUint8(uint8_t value); |
| 1114 | void EmitInt32(int32_t value); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 1115 | void EmitInt64(int64_t value); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1116 | void EmitRegisterOperand(uint8_t rm, uint8_t reg); |
| 1117 | void EmitXmmRegisterOperand(uint8_t rm, XmmRegister reg); |
| 1118 | void EmitFixup(AssemblerFixup* fixup); |
| 1119 | void EmitOperandSizeOverride(); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1120 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1121 | void EmitOperand(uint8_t rm, const Operand& operand); |
Nicolas Geoffray | ded5594 | 2018-01-26 16:33:41 +0000 | [diff] [blame] | 1122 | void EmitImmediate(const Immediate& imm, bool is_16_op = false); |
| 1123 | void EmitComplex( |
| 1124 | uint8_t rm, const Operand& operand, const Immediate& immediate, bool is_16_op = false); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1125 | void EmitLabel(Label* label, int instruction_size); |
| 1126 | void EmitLabelLink(Label* label); |
Mark Mendell | 73f455e | 2015-08-21 09:30:05 -0400 | [diff] [blame] | 1127 | void EmitLabelLink(NearLabel* label); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1128 | |
Nicolas Geoffray | 1a43dd7 | 2014-07-17 15:15:34 +0100 | [diff] [blame] | 1129 | void EmitGenericShift(bool wide, int rm, CpuRegister reg, const Immediate& imm); |
Calin Juravle | 9aec02f | 2014-11-18 23:06:35 +0000 | [diff] [blame] | 1130 | void EmitGenericShift(bool wide, int rm, CpuRegister operand, CpuRegister shifter); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1131 | |
| 1132 | // If any input is not false, output the necessary rex prefix. |
| 1133 | void EmitOptionalRex(bool force, bool w, bool r, bool x, bool b); |
| 1134 | |
| 1135 | // Emit a rex prefix byte if necessary for reg. ie if reg is a register in the range R8 to R15. |
| 1136 | void EmitOptionalRex32(CpuRegister reg); |
| 1137 | void EmitOptionalRex32(CpuRegister dst, CpuRegister src); |
| 1138 | void EmitOptionalRex32(XmmRegister dst, XmmRegister src); |
| 1139 | void EmitOptionalRex32(CpuRegister dst, XmmRegister src); |
| 1140 | void EmitOptionalRex32(XmmRegister dst, CpuRegister src); |
| 1141 | void EmitOptionalRex32(const Operand& operand); |
| 1142 | void EmitOptionalRex32(CpuRegister dst, const Operand& operand); |
| 1143 | void EmitOptionalRex32(XmmRegister dst, const Operand& operand); |
| 1144 | |
| 1145 | // Emit a REX.W prefix plus necessary register bit encodings. |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 1146 | void EmitRex64(); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1147 | void EmitRex64(CpuRegister reg); |
Calin Juravle | d6fb6cf | 2014-11-11 19:07:44 +0000 | [diff] [blame] | 1148 | void EmitRex64(const Operand& operand); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1149 | void EmitRex64(CpuRegister dst, CpuRegister src); |
| 1150 | void EmitRex64(CpuRegister dst, const Operand& operand); |
Mark Mendell | 40741f3 | 2015-04-20 22:10:34 -0400 | [diff] [blame] | 1151 | void EmitRex64(XmmRegister dst, const Operand& operand); |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 1152 | void EmitRex64(XmmRegister dst, CpuRegister src); |
Roland Levillain | 624279f | 2014-12-04 11:54:28 +0000 | [diff] [blame] | 1153 | void EmitRex64(CpuRegister dst, XmmRegister src); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1154 | |
| 1155 | // Emit a REX prefix to normalize byte registers plus necessary register bit encodings. |
Ulya Trafimovich | cd8286f | 2021-07-12 16:40:16 +0100 | [diff] [blame] | 1156 | // `normalize_both` parameter controls if the REX prefix is checked only for the `src` register |
| 1157 | // (which is the case for instructions like `movzxb rax, bpl`), or for both `src` and `dst` |
| 1158 | // registers (which is the case of instructions like `xchg bpl, al`). By default only `src` is |
| 1159 | // used to decide if REX is needed. |
| 1160 | void EmitOptionalByteRegNormalizingRex32(CpuRegister dst, |
| 1161 | CpuRegister src, |
| 1162 | bool normalize_both = false); |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1163 | void EmitOptionalByteRegNormalizingRex32(CpuRegister dst, const Operand& operand); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1164 | |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 1165 | uint8_t EmitVexPrefixByteZero(bool is_twobyte_form); |
| 1166 | uint8_t EmitVexPrefixByteOne(bool R, bool X, bool B, int SET_VEX_M); |
| 1167 | uint8_t EmitVexPrefixByteOne(bool R, |
| 1168 | X86_64ManagedRegister operand, |
| 1169 | int SET_VEX_L, |
| 1170 | int SET_VEX_PP); |
| 1171 | uint8_t EmitVexPrefixByteTwo(bool W, |
| 1172 | X86_64ManagedRegister operand, |
| 1173 | int SET_VEX_L, |
| 1174 | int SET_VEX_PP); |
| 1175 | uint8_t EmitVexPrefixByteTwo(bool W, |
| 1176 | int SET_VEX_L, |
| 1177 | int SET_VEX_PP); |
Ulya Trafimovich | cd8286f | 2021-07-12 16:40:16 +0100 | [diff] [blame] | 1178 | |
| 1179 | // Helper function to emit a shorter variant of XCHG if at least one operand is RAX/EAX/AX. |
| 1180 | bool try_xchg_rax(CpuRegister dst, |
| 1181 | CpuRegister src, |
| 1182 | void (X86_64Assembler::*prefix_fn)(CpuRegister)); |
| 1183 | |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1184 | ConstantArea constant_area_; |
jaishank | 20d1c94 | 2019-03-08 15:08:17 +0530 | [diff] [blame] | 1185 | bool has_AVX_; // x86 256bit SIMD AVX. |
| 1186 | bool has_AVX2_; // x86 256bit SIMD AVX 2.0. |
Mark Mendell | f55c3e0 | 2015-03-26 21:07:46 -0400 | [diff] [blame] | 1187 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1188 | DISALLOW_COPY_AND_ASSIGN(X86_64Assembler); |
| 1189 | }; |
| 1190 | |
| 1191 | inline void X86_64Assembler::EmitUint8(uint8_t value) { |
| 1192 | buffer_.Emit<uint8_t>(value); |
| 1193 | } |
| 1194 | |
| 1195 | inline void X86_64Assembler::EmitInt32(int32_t value) { |
| 1196 | buffer_.Emit<int32_t>(value); |
| 1197 | } |
| 1198 | |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 1199 | inline void X86_64Assembler::EmitInt64(int64_t value) { |
Roland Levillain | 55dcfb5 | 2014-10-24 18:09:09 +0100 | [diff] [blame] | 1200 | // Write this 64-bit value as two 32-bit words for alignment reasons |
| 1201 | // (this is essentially when running on ARM, which does not allow |
| 1202 | // 64-bit unaligned accesses). We assume little-endianness here. |
| 1203 | EmitInt32(Low32Bits(value)); |
| 1204 | EmitInt32(High32Bits(value)); |
Andreas Gampe | 5a4fa82 | 2014-03-31 16:50:12 -0700 | [diff] [blame] | 1205 | } |
| 1206 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1207 | inline void X86_64Assembler::EmitRegisterOperand(uint8_t rm, uint8_t reg) { |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1208 | CHECK_GE(rm, 0); |
| 1209 | CHECK_LT(rm, 8); |
Nicolas Geoffray | 102cbed | 2014-10-15 18:31:05 +0100 | [diff] [blame] | 1210 | buffer_.Emit<uint8_t>((0xC0 | (reg & 7)) + (rm << 3)); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1211 | } |
| 1212 | |
Ian Rogers | dd7624d | 2014-03-14 17:43:00 -0700 | [diff] [blame] | 1213 | inline void X86_64Assembler::EmitXmmRegisterOperand(uint8_t rm, XmmRegister reg) { |
| 1214 | EmitRegisterOperand(rm, static_cast<uint8_t>(reg.AsFloatRegister())); |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1215 | } |
| 1216 | |
| 1217 | inline void X86_64Assembler::EmitFixup(AssemblerFixup* fixup) { |
| 1218 | buffer_.EmitFixup(fixup); |
| 1219 | } |
| 1220 | |
| 1221 | inline void X86_64Assembler::EmitOperandSizeOverride() { |
| 1222 | EmitUint8(0x66); |
| 1223 | } |
| 1224 | |
Dmitry Petrochenko | fca8220 | 2014-03-21 11:21:37 +0700 | [diff] [blame] | 1225 | } // namespace x86_64 |
| 1226 | } // namespace art |
| 1227 | |
| 1228 | #endif // ART_COMPILER_UTILS_X86_64_ASSEMBLER_X86_64_H_ |