| /* |
| * Copyright (C) 2011 The Android Open Source Project |
| * |
| * Licensed under the Apache License, Version 2.0 (the "License"); |
| * you may not use this file except in compliance with the License. |
| * You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| #include "codegen_arm64.h" |
| |
| #include "arch/arm64/instruction_set_features_arm64.h" |
| #include "arm64_lir.h" |
| #include "base/logging.h" |
| #include "dex/compiler_ir.h" |
| #include "dex/quick/mir_to_lir-inl.h" |
| #include "driver/compiler_driver.h" |
| |
| namespace art { |
| |
// The macros below are exclusively used in the encoding map.
//
// Every *_VARIANTS macro expands to exactly two comma-separated instruction skeletons: the
// skeleton given by the caller, followed by the skeleton of the wide variant. The derived
// macros parenthesize their parameter before OR-ing in the variant bits, so that an argument
// which is itself an expression (e.g. a conditional) is combined with the mask as a whole.

// Most generic way of providing two variants for one instruction.
#define CUSTOM_VARIANTS(variant1, variant2) variant1, variant2

// Used for instructions which do not have a wide variant (the wide skeleton is 0).
#define NO_VARIANTS(variant) \
  CUSTOM_VARIANTS(variant, 0)

// Used for instructions which have a wide variant with the sf bit set to 1 (mask 0x80000000).
#define SF_VARIANTS(sf0_skeleton) \
  CUSTOM_VARIANTS(sf0_skeleton, ((sf0_skeleton) | 0x80000000))

// Used for instructions which have a wide variant with the size bits set to either x0 or x1
// (mask 0x40000000).
#define SIZE_VARIANTS(sizex0_skeleton) \
  CUSTOM_VARIANTS(sizex0_skeleton, ((sizex0_skeleton) | 0x40000000))

// Used for instructions which have a wide variant with the sf and n bits set to 1
// (mask 0x80400000).
#define SF_N_VARIANTS(sf0_n0_skeleton) \
  CUSTOM_VARIANTS(sf0_n0_skeleton, ((sf0_n0_skeleton) | 0x80400000))

// Used for FP instructions which have single and double precision variants, with the type bits
// set to either 00 or 01 (mask 0x00400000).
#define FLOAT_VARIANTS(type00_skeleton) \
  CUSTOM_VARIANTS(type00_skeleton, ((type00_skeleton) | 0x00400000))
| |
| /* |
| * Builds one brace-enclosed initializer for an entry of the encoding map. |
| * |
| * opcode: A64Opcode enum |
| * variants: instruction skeletons supplied via CUSTOM_VARIANTS or derived macros. |
| * a{n}k: key to applying argument {n} \ |
| * a{n}s: argument {n} start bit position | n = 0, 1, 2, 3 |
| * a{n}e: argument {n} end bit position / |
| * flags: instruction attributes (used in optimization) |
| * name: mnemonic name |
| * fmt: for pretty-printing |
| * fixup: used for second-pass fixes (e.g. address fixups in branch instructions). |
| * |
| * The expansion lists its values positionally: the variants first, then the four |
| * {key, start, end} argument triples grouped in one nested brace list, then opcode, flags, |
| * name, fmt, the literal 4 and finally fixup. Note that this differs from the parameter |
| * order, where opcode comes before variants. |
| * NOTE(review): the literal 4 is presumably the instruction size in bytes; confirm against |
| * the A64EncodingMap declaration, which is not visible in this file. |
| */ |
| #define ENCODING_MAP(opcode, variants, a0k, a0s, a0e, a1k, a1s, a1e, a2k, a2s, a2e, \ |
| a3k, a3s, a3e, flags, name, fmt, fixup) \ |
| {variants, {{a0k, a0s, a0e}, {a1k, a1s, a1e}, {a2k, a2s, a2e}, \ |
| {a3k, a3s, a3e}}, opcode, flags, name, fmt, 4, fixup} |
| |
| /* Instruction dump string format keys: !pf, where "!" is the start |
| * of the key, "p" is which numeric operand to use and "f" is the |
| * print format. |
| * |
| * [p]ositions: |
| * 0 -> operands[0] (dest) |
| * 1 -> operands[1] (src1) |
| * 2 -> operands[2] (src2) |
| * 3 -> operands[3] (extra) |
| * |
| * [f]ormats: |
| * d -> decimal |
| * D -> decimal*4 or decimal*8 depending on the instruction width |
| * E -> decimal*4 |
| * F -> decimal*2 |
| * G -> ", lsl #2" or ", lsl #3" depending on the instruction width |
| * c -> branch condition (eq, ne, etc.) |
| * t -> pc-relative target |
| * p -> pc-relative address |
| * s -> single precision floating point register |
| * S -> double precision floating point register |
| * f -> single or double precision register (depending on instruction width) |
| * I -> 8-bit immediate floating point number |
| * l -> logical immediate |
| * M -> 16-bit shift expression ("" or ", lsl #16" or ", lsl #32"...) |
| * B -> dmb option string (sy, st, ish, ishst, nsh, nshst) |
| * H -> operand shift |
| * h -> 6-bit shift immediate |
| * T -> register shift (either ", lsl #0" or ", lsl #12") |
| * e -> register extend (e.g. uxtb #1) |
| * o -> register shift (e.g. lsl #1) for Word registers |
| * w -> word (32-bit) register wn, or wzr |
| * W -> word (32-bit) register wn, or wsp |
| * x -> extended (64-bit) register xn, or xzr |
| * X -> extended (64-bit) register xn, or sp |
| * r -> register with same width as instruction, r31 -> wzr, xzr |
| * R -> register with same width as instruction, r31 -> wsp, sp |
| * |
| * [!] escape. To insert "!", use "!!" |
| */ |
| /* NOTE: must be kept in sync with enum A64Opcode from arm64_lir.h */ |
| const A64EncodingMap Arm64Mir2Lir::EncodingMap[kA64Last] = { |
| ENCODING_MAP(WIDE(kA64Adc3rrr), SF_VARIANTS(0x1a000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | USES_CCODES, |
| "adc", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Add4RRdT), SF_VARIANTS(0x11000000), |
| kFmtRegROrSp, 4, 0, kFmtRegROrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtBitBlt, 23, 22, IS_QUAD_OP | REG_DEF0_USE1, |
| "add", "!0R, !1R, #!2d!3T", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Add4rrro), SF_VARIANTS(0x0b000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtShift, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "add", "!0r, !1r, !2r!3o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Add4RRre), SF_VARIANTS(0x0b200000), |
| kFmtRegROrSp, 4, 0, kFmtRegROrSp, 9, 5, kFmtRegR, 20, 16, |
| kFmtExtend, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "add", "!0r, !1r, !2r!3e", kFixupNone), |
| // Note: adr is binary, but declared as tertiary. The third argument is used while doing the |
| // fixups and contains information to identify the adr label. |
| ENCODING_MAP(kA64Adr2xd, NO_VARIANTS(0x10000000), |
| kFmtRegX, 4, 0, kFmtImm21, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0 | NEEDS_FIXUP, |
| "adr", "!0x, #!1d", kFixupAdr), |
| ENCODING_MAP(kA64Adrp2xd, NO_VARIANTS(0x90000000), |
| kFmtRegX, 4, 0, kFmtImm21, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0 | NEEDS_FIXUP, |
| "adrp", "!0x, #!1d", kFixupLabel), |
| ENCODING_MAP(WIDE(kA64And3Rrl), SF_VARIANTS(0x12000000), |
| kFmtRegROrSp, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 22, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "and", "!0R, !1r, #!2l", kFixupNone), |
| ENCODING_MAP(WIDE(kA64And4rrro), SF_VARIANTS(0x0a000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtShift, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "and", "!0r, !1r, !2r!3o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Asr3rrd), CUSTOM_VARIANTS(0x13007c00, 0x9340fc00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 21, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "asr", "!0r, !1r, #!2d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Asr3rrr), SF_VARIANTS(0x1ac02800), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "asr", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(kA64B2ct, NO_VARIANTS(0x54000000), |
| kFmtBitBlt, 3, 0, kFmtBitBlt, 23, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | IS_BRANCH | USES_CCODES | |
| NEEDS_FIXUP, "b.!0c", "!1t", kFixupCondBranch), |
| ENCODING_MAP(kA64Blr1x, NO_VARIANTS(0xd63f0000), |
| kFmtRegX, 9, 5, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, |
| IS_UNARY_OP | REG_USE0 | IS_BRANCH | REG_DEF_LR, |
| "blr", "!0x", kFixupNone), |
| ENCODING_MAP(kA64Br1x, NO_VARIANTS(0xd61f0000), |
| kFmtRegX, 9, 5, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | REG_USE0 | IS_BRANCH, |
| "br", "!0x", kFixupNone), |
| ENCODING_MAP(kA64Bl1t, NO_VARIANTS(0x94000000), |
| kFmtBitBlt, 25, 0, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | IS_BRANCH | REG_DEF_LR | NEEDS_FIXUP, |
| "bl", "!0T", kFixupLabel), |
| ENCODING_MAP(kA64Brk1d, NO_VARIANTS(0xd4200000), |
| kFmtBitBlt, 20, 5, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | IS_BRANCH, |
| "brk", "!0d", kFixupNone), |
| ENCODING_MAP(kA64B1t, NO_VARIANTS(0x14000000), |
| kFmtBitBlt, 25, 0, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | IS_BRANCH | NEEDS_FIXUP, |
| "b", "!0t", kFixupT1Branch), |
| ENCODING_MAP(WIDE(kA64Cbnz2rt), SF_VARIANTS(0x35000000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 23, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, |
| IS_BINARY_OP | REG_USE0 | IS_BRANCH | NEEDS_FIXUP, |
| "cbnz", "!0r, !1t", kFixupCBxZ), |
| ENCODING_MAP(WIDE(kA64Cbz2rt), SF_VARIANTS(0x34000000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 23, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, |
| IS_BINARY_OP | REG_USE0 | IS_BRANCH | NEEDS_FIXUP, |
| "cbz", "!0r, !1t", kFixupCBxZ), |
| ENCODING_MAP(WIDE(kA64Cmn3rro), SF_VARIANTS(0x2b00001f), |
| kFmtRegR, 9, 5, kFmtRegR, 20, 16, kFmtShift, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | SETS_CCODES, |
| "cmn", "!0r, !1r!2o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Cmn3Rre), SF_VARIANTS(0x2b20001f), |
| kFmtRegROrSp, 9, 5, kFmtRegR, 20, 16, kFmtExtend, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | SETS_CCODES, |
| "cmn", "!0R, !1r!2e", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Cmn3RdT), SF_VARIANTS(0x3100001f), |
| kFmtRegROrSp, 9, 5, kFmtBitBlt, 21, 10, kFmtBitBlt, 23, 22, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE0 | SETS_CCODES, |
| "cmn", "!0R, #!1d!2T", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Cmp3rro), SF_VARIANTS(0x6b00001f), |
| kFmtRegR, 9, 5, kFmtRegR, 20, 16, kFmtShift, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | SETS_CCODES, |
| "cmp", "!0r, !1r!2o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Cmp3Rre), SF_VARIANTS(0x6b20001f), |
| kFmtRegROrSp, 9, 5, kFmtRegR, 20, 16, kFmtExtend, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | SETS_CCODES, |
| "cmp", "!0R, !1r!2e", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Cmp3RdT), SF_VARIANTS(0x7100001f), |
| kFmtRegROrSp, 9, 5, kFmtBitBlt, 21, 10, kFmtBitBlt, 23, 22, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE0 | SETS_CCODES, |
| "cmp", "!0R, #!1d!2T", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Csel4rrrc), SF_VARIANTS(0x1a800000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtBitBlt, 15, 12, IS_QUAD_OP | REG_DEF0_USE12 | USES_CCODES, |
| "csel", "!0r, !1r, !2r, !3c", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Csinc4rrrc), SF_VARIANTS(0x1a800400), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtBitBlt, 15, 12, IS_QUAD_OP | REG_DEF0_USE12 | USES_CCODES, |
| "csinc", "!0r, !1r, !2r, !3c", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Csinv4rrrc), SF_VARIANTS(0x5a800000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtBitBlt, 15, 12, IS_QUAD_OP | REG_DEF0_USE12 | USES_CCODES, |
| "csinv", "!0r, !1r, !2r, !3c", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Csneg4rrrc), SF_VARIANTS(0x5a800400), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtBitBlt, 15, 12, IS_QUAD_OP | REG_DEF0_USE12 | USES_CCODES, |
| "csneg", "!0r, !1r, !2r, !3c", kFixupNone), |
| ENCODING_MAP(kA64Dmb1B, NO_VARIANTS(0xd50330bf), |
| kFmtBitBlt, 11, 8, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | IS_VOLATILE, |
| "dmb", "#!0B", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Eor3Rrl), SF_VARIANTS(0x52000000), |
| kFmtRegROrSp, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 22, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "eor", "!0R, !1r, #!2l", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Eor4rrro), SF_VARIANTS(0x4a000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtShift, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "eor", "!0r, !1r, !2r!3o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Extr4rrrd), SF_N_VARIANTS(0x13800000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtBitBlt, 15, 10, IS_QUAD_OP | REG_DEF0_USE12, |
| "extr", "!0r, !1r, !2r, #!3d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fabs2ff), FLOAT_VARIANTS(0x1e20c000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP| REG_DEF0_USE1, |
| "fabs", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fadd3fff), FLOAT_VARIANTS(0x1e202800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fadd", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fcmp1f), FLOAT_VARIANTS(0x1e202008), |
| kFmtRegF, 9, 5, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_UNARY_OP | REG_USE0 | SETS_CCODES, |
| "fcmp", "!0f, #0", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fcmp2ff), FLOAT_VARIANTS(0x1e202000), |
| kFmtRegF, 9, 5, kFmtRegF, 20, 16, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_USE01 | SETS_CCODES, |
| "fcmp", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fcvtzs2wf), FLOAT_VARIANTS(0x1e380000), |
| kFmtRegW, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvtzs", "!0w, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fcvtzs2xf), FLOAT_VARIANTS(0x9e380000), |
| kFmtRegX, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvtzs", "!0x, !1f", kFixupNone), |
| ENCODING_MAP(kA64Fcvt2Ss, NO_VARIANTS(0x1e22C000), |
| kFmtRegD, 4, 0, kFmtRegS, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvt", "!0S, !1s", kFixupNone), |
| ENCODING_MAP(kA64Fcvt2sS, NO_VARIANTS(0x1e624000), |
| kFmtRegS, 4, 0, kFmtRegD, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvt", "!0s, !1S", kFixupNone), |
| ENCODING_MAP(kA64Fcvtms2ws, NO_VARIANTS(0x1e300000), |
| kFmtRegW, 4, 0, kFmtRegS, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvtms", "!0w, !1s", kFixupNone), |
| ENCODING_MAP(kA64Fcvtms2xS, NO_VARIANTS(0x9e700000), |
| kFmtRegX, 4, 0, kFmtRegD, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fcvtms", "!0x, !1S", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fdiv3fff), FLOAT_VARIANTS(0x1e201800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fdiv", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fmax3fff), FLOAT_VARIANTS(0x1e204800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fmax", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fmin3fff), FLOAT_VARIANTS(0x1e205800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fmin", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fmov2ff), FLOAT_VARIANTS(0x1e204000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1 | IS_MOVE, |
| "fmov", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fmov2fI), FLOAT_VARIANTS(0x1e201000), |
| kFmtRegF, 4, 0, kFmtBitBlt, 20, 13, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0, |
| "fmov", "!0f, #!1I", kFixupNone), |
| ENCODING_MAP(kA64Fmov2sw, NO_VARIANTS(0x1e270000), |
| kFmtRegS, 4, 0, kFmtRegW, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fmov", "!0s, !1w", kFixupNone), |
| ENCODING_MAP(kA64Fmov2Sx, NO_VARIANTS(0x9e670000), |
| kFmtRegD, 4, 0, kFmtRegX, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fmov", "!0S, !1x", kFixupNone), |
| ENCODING_MAP(kA64Fmov2ws, NO_VARIANTS(0x1e260000), |
| kFmtRegW, 4, 0, kFmtRegS, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fmov", "!0w, !1s", kFixupNone), |
| ENCODING_MAP(kA64Fmov2xS, NO_VARIANTS(0x9e660000), |
| kFmtRegX, 4, 0, kFmtRegD, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fmov", "!0x, !1S", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fmul3fff), FLOAT_VARIANTS(0x1e200800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fmul", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fneg2ff), FLOAT_VARIANTS(0x1e214000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fneg", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Frintp2ff), FLOAT_VARIANTS(0x1e24c000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "frintp", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Frintm2ff), FLOAT_VARIANTS(0x1e254000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "frintm", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Frintn2ff), FLOAT_VARIANTS(0x1e244000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "frintn", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Frintz2ff), FLOAT_VARIANTS(0x1e25c000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "frintz", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fsqrt2ff), FLOAT_VARIANTS(0x1e61c000), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "fsqrt", "!0f, !1f", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Fsub3fff), FLOAT_VARIANTS(0x1e203800), |
| kFmtRegF, 4, 0, kFmtRegF, 9, 5, kFmtRegF, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "fsub", "!0f, !1f, !2f", kFixupNone), |
| ENCODING_MAP(kA64Ldrb3wXd, NO_VARIANTS(0x39400000), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldrb", "!0w, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(kA64Ldrb3wXx, NO_VARIANTS(0x38606800), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | IS_LOAD, |
| "ldrb", "!0w, [!1X, !2x]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldrsb3rXd), CUSTOM_VARIANTS(0x39c00000, 0x39800000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldrsb", "!0r, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldrsb3rXx), CUSTOM_VARIANTS(0x38e06800, 0x38a06800), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | IS_LOAD, |
| "ldrsb", "!0r, [!1X, !2x]", kFixupNone), |
| ENCODING_MAP(kA64Ldrh3wXF, NO_VARIANTS(0x79400000), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldrh", "!0w, [!1X, #!2F]", kFixupNone), |
| ENCODING_MAP(kA64Ldrh4wXxd, NO_VARIANTS(0x78606800), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_DEF0_USE12 | IS_LOAD_OFF, |
| "ldrh", "!0w, [!1X, !2x, lsl #!3d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldrsh3rXF), CUSTOM_VARIANTS(0x79c00000, 0x79800000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldrsh", "!0r, [!1X, #!2F]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldrsh4rXxd), CUSTOM_VARIANTS(0x78e06800, 0x78906800), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_DEF0_USE12 | IS_LOAD_OFF, |
| "ldrsh", "!0r, [!1X, !2x, lsl #!3d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldr2fp), SIZE_VARIANTS(0x1c000000), |
| kFmtRegF, 4, 0, kFmtBitBlt, 23, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, |
| IS_BINARY_OP | REG_DEF0 | REG_USE_PC | IS_LOAD | NEEDS_FIXUP, |
| "ldr", "!0f, !1p", kFixupLoad), |
| ENCODING_MAP(WIDE(kA64Ldr2rp), SIZE_VARIANTS(0x18000000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 23, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, |
| IS_BINARY_OP | REG_DEF0 | REG_USE_PC | IS_LOAD | NEEDS_FIXUP, |
| "ldr", "!0r, !1p", kFixupLoad), |
| ENCODING_MAP(WIDE(kA64Ldr3fXD), SIZE_VARIANTS(0xbd400000), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldr", "!0f, [!1X, #!2D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldr3rXD), SIZE_VARIANTS(0xb9400000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD_OFF, |
| "ldr", "!0r, [!1X, #!2D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldr4fXxG), SIZE_VARIANTS(0xbc606800), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_DEF0_USE12 | IS_LOAD, |
| "ldr", "!0f, [!1X, !2x!3G]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldr4rXxG), SIZE_VARIANTS(0xb8606800), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_DEF0_USE12 | IS_LOAD, |
| "ldr", "!0r, [!1X, !2x!3G]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64LdrPost3rXd), SIZE_VARIANTS(0xb8400400), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF01 | REG_USE1 | IS_LOAD, |
| "ldr", "!0r, [!1X], #!2d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldp4ffXD), CUSTOM_VARIANTS(0x2d400000, 0x6d400000), |
| kFmtRegF, 4, 0, kFmtRegF, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_USE2 | REG_DEF01 | IS_LOAD_OFF, |
| "ldp", "!0f, !1f, [!2X, #!3D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldp4rrXD), SF_VARIANTS(0x29400000), |
| kFmtRegR, 4, 0, kFmtRegR, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_USE2 | REG_DEF01 | IS_LOAD_OFF, |
| "ldp", "!0r, !1r, [!2X, #!3D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64LdpPost4rrXD), CUSTOM_VARIANTS(0x28c00000, 0xa8c00000), |
| kFmtRegR, 4, 0, kFmtRegR, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_USE2 | REG_DEF012 | IS_LOAD, |
| "ldp", "!0r, !1r, [!2X], #!3D", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldur3fXd), CUSTOM_VARIANTS(0xbc400000, 0xfc400000), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD, |
| "ldur", "!0f, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldur3rXd), SIZE_VARIANTS(0xb8400000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | IS_LOAD, |
| "ldur", "!0r, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldxr2rX), SIZE_VARIANTS(0x885f7c00), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1 | IS_LOADX, |
| "ldxr", "!0r, [!1X]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ldaxr2rX), SIZE_VARIANTS(0x885ffc00), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1 | IS_LOADX, |
| "ldaxr", "!0r, [!1X]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Lsl3rrr), SF_VARIANTS(0x1ac02000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "lsl", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Lsr3rrd), CUSTOM_VARIANTS(0x53007c00, 0xd340fc00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 21, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "lsr", "!0r, !1r, #!2d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Lsr3rrr), SF_VARIANTS(0x1ac02400), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "lsr", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Madd4rrrr), SF_VARIANTS(0x1b000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtRegR, 14, 10, IS_QUAD_OP | REG_DEF0_USE123 | NEEDS_FIXUP, |
| "madd", "!0r, !1r, !2r, !3r", kFixupA53Erratum835769), |
| ENCODING_MAP(WIDE(kA64Movk3rdM), SF_VARIANTS(0x72800000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 20, 5, kFmtBitBlt, 22, 21, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE0, |
| "movk", "!0r, #!1d!2M", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Movn3rdM), SF_VARIANTS(0x12800000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 20, 5, kFmtBitBlt, 22, 21, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0, |
| "movn", "!0r, #!1d!2M", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Movz3rdM), SF_VARIANTS(0x52800000), |
| kFmtRegR, 4, 0, kFmtBitBlt, 20, 5, kFmtBitBlt, 22, 21, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0, |
| "movz", "!0r, #!1d!2M", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Mov2rr), SF_VARIANTS(0x2a0003e0), |
| kFmtRegR, 4, 0, kFmtRegR, 20, 16, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1 | IS_MOVE, |
| "mov", "!0r, !1r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Mvn2rr), SF_VARIANTS(0x2a2003e0), |
| kFmtRegR, 4, 0, kFmtRegR, 20, 16, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "mvn", "!0r, !1r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Mul3rrr), SF_VARIANTS(0x1b007c00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "mul", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Msub4rrrr), SF_VARIANTS(0x1b008000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtRegR, 14, 10, IS_QUAD_OP | REG_DEF0_USE123 | NEEDS_FIXUP, |
| "msub", "!0r, !1r, !2r, !3r", kFixupA53Erratum835769), |
| ENCODING_MAP(WIDE(kA64Neg3rro), SF_VARIANTS(0x4b0003e0), |
| kFmtRegR, 4, 0, kFmtRegR, 20, 16, kFmtShift, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "neg", "!0r, !1r!2o", kFixupNone), |
| ENCODING_MAP(kA64Nop0, NO_VARIANTS(0xd503201f), |
| kFmtUnused, -1, -1, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, NO_OPERAND, |
| "nop", "", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Orr3Rrl), SF_VARIANTS(0x32000000), |
| kFmtRegROrSp, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 22, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1, |
| "orr", "!0R, !1r, #!2l", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Orr4rrro), SF_VARIANTS(0x2a000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtShift, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "orr", "!0r, !1r, !2r!3o", kFixupNone), |
| ENCODING_MAP(kA64Ret, NO_VARIANTS(0xd65f03c0), |
| kFmtUnused, -1, -1, kFmtUnused, -1, -1, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, NO_OPERAND | IS_BRANCH, |
| "ret", "", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Rbit2rr), SF_VARIANTS(0x5ac00000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "rbit", "!0r, !1r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Rev2rr), CUSTOM_VARIANTS(0x5ac00800, 0xdac00c00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "rev", "!0r, !1r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Rev162rr), SF_VARIANTS(0x5ac00400), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "rev16", "!0r, !1r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Ror3rrr), SF_VARIANTS(0x1ac02c00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "ror", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sbc3rrr), SF_VARIANTS(0x5a000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | USES_CCODES, |
| "sbc", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sbfm4rrdd), SF_N_VARIANTS(0x13000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 21, 16, |
| kFmtBitBlt, 15, 10, IS_QUAD_OP | REG_DEF0_USE1, |
| "sbfm", "!0r, !1r, #!2d, #!3d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Scvtf2fw), FLOAT_VARIANTS(0x1e220000), |
| kFmtRegF, 4, 0, kFmtRegW, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "scvtf", "!0f, !1w", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Scvtf2fx), FLOAT_VARIANTS(0x9e220000), |
| kFmtRegF, 4, 0, kFmtRegX, 9, 5, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_BINARY_OP | REG_DEF0_USE1, |
| "scvtf", "!0f, !1x", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sdiv3rrr), SF_VARIANTS(0x1ac00c00), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "sdiv", "!0r, !1r, !2r", kFixupNone), |
| ENCODING_MAP(kA64Smull3xww, NO_VARIANTS(0x9b207c00), |
| kFmtRegX, 4, 0, kFmtRegW, 9, 5, kFmtRegW, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "smull", "!0x, !1w, !2w", kFixupNone), |
| ENCODING_MAP(kA64Smulh3xxx, NO_VARIANTS(0x9b407c00), |
| kFmtRegX, 4, 0, kFmtRegX, 9, 5, kFmtRegX, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12, |
| "smulh", "!0x, !1x, !2x", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stp4ffXD), CUSTOM_VARIANTS(0x2d000000, 0x6d000000), |
| kFmtRegF, 4, 0, kFmtRegF, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_USE012 | IS_STORE_OFF, |
| "stp", "!0f, !1f, [!2X, #!3D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stp4rrXD), SF_VARIANTS(0x29000000), |
| kFmtRegR, 4, 0, kFmtRegR, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_USE012 | IS_STORE_OFF, |
| "stp", "!0r, !1r, [!2X, #!3D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64StpPost4rrXD), CUSTOM_VARIANTS(0x28800000, 0xa8800000), |
| kFmtRegR, 4, 0, kFmtRegR, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_DEF2 | REG_USE012 | IS_STORE, |
| "stp", "!0r, !1r, [!2X], #!3D", kFixupNone), |
| ENCODING_MAP(WIDE(kA64StpPre4ffXD), CUSTOM_VARIANTS(0x2d800000, 0x6d800000), |
| kFmtRegF, 4, 0, kFmtRegF, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_DEF2 | REG_USE012 | IS_STORE, |
| "stp", "!0f, !1f, [!2X, #!3D]!!", kFixupNone), |
| ENCODING_MAP(WIDE(kA64StpPre4rrXD), CUSTOM_VARIANTS(0x29800000, 0xa9800000), |
| kFmtRegR, 4, 0, kFmtRegR, 14, 10, kFmtRegXOrSp, 9, 5, |
| kFmtBitBlt, 21, 15, IS_QUAD_OP | REG_DEF2 | REG_USE012 | IS_STORE, |
| "stp", "!0r, !1r, [!2X, #!3D]!!", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Str3fXD), CUSTOM_VARIANTS(0xbd000000, 0xfd000000), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE_OFF, |
| "str", "!0f, [!1X, #!2D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Str4fXxG), CUSTOM_VARIANTS(0xbc206800, 0xfc206800), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_USE012 | IS_STORE, |
| "str", "!0f, [!1X, !2x!3G]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Str3rXD), SIZE_VARIANTS(0xb9000000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE_OFF, |
| "str", "!0r, [!1X, #!2D]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Str4rXxG), SIZE_VARIANTS(0xb8206800), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_USE012 | IS_STORE, |
| "str", "!0r, [!1X, !2x!3G]", kFixupNone), |
| ENCODING_MAP(kA64Strb3wXd, NO_VARIANTS(0x39000000), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE_OFF, |
| "strb", "!0w, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(kA64Strb3wXx, NO_VARIANTS(0x38206800), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE012 | IS_STORE, |
| "strb", "!0w, [!1X, !2x]", kFixupNone), |
| ENCODING_MAP(kA64Strh3wXF, NO_VARIANTS(0x79000000), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE_OFF, |
| "strh", "!0w, [!1X, #!2F]", kFixupNone), |
| ENCODING_MAP(kA64Strh4wXxd, NO_VARIANTS(0x78206800), |
| kFmtRegW, 4, 0, kFmtRegXOrSp, 9, 5, kFmtRegX, 20, 16, |
| kFmtBitBlt, 12, 12, IS_QUAD_OP | REG_USE012 | IS_STORE, |
| "strh", "!0w, [!1X, !2x, lsl #!3d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64StrPost3rXd), SIZE_VARIANTS(0xb8000400), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | REG_DEF1 | IS_STORE, |
| "str", "!0r, [!1X], #!2d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stur3fXd), CUSTOM_VARIANTS(0xbc000000, 0xfc000000), |
| kFmtRegF, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE, |
| "stur", "!0f, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stur3rXd), SIZE_VARIANTS(0xb8000000), |
| kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, kFmtBitBlt, 20, 12, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | IS_STORE, |
| "stur", "!0r, [!1X, #!2d]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stxr3wrX), SIZE_VARIANTS(0x88007c00), |
| kFmtRegW, 20, 16, kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | IS_STOREX, |
| "stxr", "!0w, !1r, [!2X]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Stlxr3wrX), SIZE_VARIANTS(0x8800fc00), |
| kFmtRegW, 20, 16, kFmtRegR, 4, 0, kFmtRegXOrSp, 9, 5, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE12 | IS_STOREX, |
| "stlxr", "!0w, !1r, [!2X]", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sub4RRdT), SF_VARIANTS(0x51000000), |
| kFmtRegROrSp, 4, 0, kFmtRegROrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtBitBlt, 23, 22, IS_QUAD_OP | REG_DEF0_USE1, |
| "sub", "!0R, !1R, #!2d!3T", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sub4rrro), SF_VARIANTS(0x4b000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtRegR, 20, 16, |
| kFmtShift, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "sub", "!0r, !1r, !2r!3o", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Sub4RRre), SF_VARIANTS(0x4b200000), |
| kFmtRegROrSp, 4, 0, kFmtRegROrSp, 9, 5, kFmtRegR, 20, 16, |
| kFmtExtend, -1, -1, IS_QUAD_OP | REG_DEF0_USE12, |
| "sub", "!0r, !1r, !2r!3e", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Subs3rRd), SF_VARIANTS(0x71000000), |
| kFmtRegR, 4, 0, kFmtRegROrSp, 9, 5, kFmtBitBlt, 21, 10, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_DEF0_USE1 | SETS_CCODES, |
| "subs", "!0r, !1R, #!2d", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Tst2rl), SF_VARIANTS(0x7200001f), |
| kFmtRegR, 9, 5, kFmtBitBlt, 22, 10, kFmtUnused, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE0 | SETS_CCODES, |
| "tst", "!0r, !1l", kFixupNone), |
| ENCODING_MAP(WIDE(kA64Tst3rro), SF_VARIANTS(0x6a00001f), |
| kFmtRegR, 9, 5, kFmtRegR, 20, 16, kFmtShift, -1, -1, |
| kFmtUnused, -1, -1, IS_TERTIARY_OP | REG_USE01 | SETS_CCODES, |
| "tst", "!0r, !1r!2o", kFixupNone), |
| // NOTE: Tbz/Tbnz does not require SETS_CCODES, but it may be replaced by some other LIRs |
| // which require SETS_CCODES in the fix-up stage. |
| ENCODING_MAP(WIDE(kA64Tbnz3rht), CUSTOM_VARIANTS(0x37000000, 0x37000000), |
| kFmtRegR, 4, 0, kFmtImm6Shift, -1, -1, kFmtBitBlt, 18, 5, kFmtUnused, -1, -1, |
| IS_TERTIARY_OP | REG_USE0 | IS_BRANCH | NEEDS_FIXUP | SETS_CCODES, |
| "tbnz", "!0r, #!1h, !2t", kFixupTBxZ), |
| ENCODING_MAP(WIDE(kA64Tbz3rht), CUSTOM_VARIANTS(0x36000000, 0x36000000), |
| kFmtRegR, 4, 0, kFmtImm6Shift, -1, -1, kFmtBitBlt, 18, 5, kFmtUnused, -1, -1, |
| IS_TERTIARY_OP | REG_USE0 | IS_BRANCH | NEEDS_FIXUP | SETS_CCODES, |
| "tbz", "!0r, #!1h, !2t", kFixupTBxZ), |
| ENCODING_MAP(WIDE(kA64Ubfm4rrdd), SF_N_VARIANTS(0x53000000), |
| kFmtRegR, 4, 0, kFmtRegR, 9, 5, kFmtBitBlt, 21, 16, |
| kFmtBitBlt, 15, 10, IS_QUAD_OP | REG_DEF0_USE1, |
| "ubfm", "!0r, !1r, !2d, !3d", kFixupNone), |
| }; |
| |
| // new_lir replaces orig_lir in the pcrel_fixup list. |
| void Arm64Mir2Lir::ReplaceFixup(LIR* prev_lir, LIR* orig_lir, LIR* new_lir) { |
| new_lir->u.a.pcrel_next = orig_lir->u.a.pcrel_next; |
| if (UNLIKELY(prev_lir == nullptr)) { |
| first_fixup_ = new_lir; |
| } else { |
| prev_lir->u.a.pcrel_next = new_lir; |
| } |
| orig_lir->flags.fixup = kFixupNone; |
| } |
| |
| // new_lir is inserted before orig_lir in the pcrel_fixup list. |
| void Arm64Mir2Lir::InsertFixupBefore(LIR* prev_lir, LIR* orig_lir, LIR* new_lir) { |
| new_lir->u.a.pcrel_next = orig_lir; |
| if (UNLIKELY(prev_lir == nullptr)) { |
| first_fixup_ = new_lir; |
| } else { |
| DCHECK(prev_lir->u.a.pcrel_next == orig_lir); |
| prev_lir->u.a.pcrel_next = new_lir; |
| } |
| } |
| |
// Encoding of the A64 "nop" instruction (an alias of "hint #0"), used for aligning code.
#define PADDING_NOP (UINT32_C(0xD503201F))
| |
| uint8_t* Arm64Mir2Lir::EncodeLIRs(uint8_t* write_pos, LIR* lir) { |
| uint8_t* const write_buffer = write_pos; |
| for (; lir != nullptr; lir = NEXT_LIR(lir)) { |
| lir->offset = (write_pos - write_buffer); |
| bool opcode_is_wide = IS_WIDE(lir->opcode); |
| A64Opcode opcode = UNWIDE(lir->opcode); |
| |
| if (UNLIKELY(IsPseudoLirOp(opcode))) { |
| continue; |
| } |
| |
| if (LIKELY(!lir->flags.is_nop)) { |
| const A64EncodingMap *encoder = &EncodingMap[opcode]; |
| |
| // Select the right variant of the skeleton. |
| uint32_t bits = opcode_is_wide ? encoder->xskeleton : encoder->wskeleton; |
| DCHECK(!opcode_is_wide || IS_WIDE(encoder->opcode)); |
| |
| for (int i = 0; i < 4; i++) { |
| A64EncodingKind kind = encoder->field_loc[i].kind; |
| uint32_t operand = lir->operands[i]; |
| uint32_t value; |
| |
| if (LIKELY(static_cast<unsigned>(kind) <= kFmtBitBlt)) { |
| // Note: this will handle kFmtReg* and kFmtBitBlt. |
| |
| if (static_cast<unsigned>(kind) < kFmtBitBlt) { |
| bool is_zero = A64_REG_IS_ZR(operand); |
| |
| if (kIsDebugBuild && (kFailOnSizeError || kReportSizeError)) { |
| // Register usage checks: First establish register usage requirements based on the |
| // format in `kind'. |
| bool want_float = false; // Want a float (rather than core) register. |
| bool want_64_bit = false; // Want a 64-bit (rather than 32-bit) register. |
| bool want_var_size = true; // Want register with variable size (kFmtReg{R,F}). |
| bool want_zero = false; // Want the zero (rather than sp) register. |
| switch (kind) { |
| case kFmtRegX: |
| want_64_bit = true; |
| FALLTHROUGH_INTENDED; |
| case kFmtRegW: |
| want_var_size = false; |
| FALLTHROUGH_INTENDED; |
| case kFmtRegR: |
| want_zero = true; |
| break; |
| case kFmtRegXOrSp: |
| want_64_bit = true; |
| FALLTHROUGH_INTENDED; |
| case kFmtRegWOrSp: |
| want_var_size = false; |
| break; |
| case kFmtRegROrSp: |
| break; |
| case kFmtRegD: |
| want_64_bit = true; |
| FALLTHROUGH_INTENDED; |
| case kFmtRegS: |
| want_var_size = false; |
| FALLTHROUGH_INTENDED; |
| case kFmtRegF: |
| want_float = true; |
| break; |
| default: |
| LOG(FATAL) << "Bad fmt for arg n. " << i << " of " << encoder->name |
| << " (" << kind << ")"; |
| break; |
| } |
| |
| // want_var_size == true means kind == kFmtReg{R,F}. In these two cases, we want |
| // the register size to be coherent with the instruction width. |
| if (want_var_size) { |
| want_64_bit = opcode_is_wide; |
| } |
| |
| // Now check that the requirements are satisfied. |
| RegStorage reg(operand | RegStorage::kValid); |
| const char *expected = nullptr; |
| if (want_float) { |
| if (!reg.IsFloat()) { |
| expected = "float register"; |
| } else if (reg.IsDouble() != want_64_bit) { |
| expected = (want_64_bit) ? "double register" : "single register"; |
| } |
| } else { |
| if (reg.IsFloat()) { |
| expected = "core register"; |
| } else if (reg.Is64Bit() != want_64_bit) { |
| expected = (want_64_bit) ? "x-register" : "w-register"; |
| } else if (A64_REGSTORAGE_IS_SP_OR_ZR(reg) && is_zero != want_zero) { |
| expected = (want_zero) ? "zero-register" : "sp-register"; |
| } |
| } |
| |
| // Fail, if `expected' contains an unsatisfied requirement. |
| if (expected != nullptr) { |
| LOG(WARNING) << "Method: " << PrettyMethod(cu_->method_idx, *cu_->dex_file) |
| << " @ 0x" << std::hex << lir->dalvik_offset; |
| if (kFailOnSizeError) { |
| LOG(FATAL) << "Bad argument n. " << i << " of " << encoder->name |
| << "(" << UNWIDE(encoder->opcode) << ", " << encoder->fmt << ")" |
| << ". Expected " << expected << ", got 0x" << std::hex << operand; |
| } else { |
| LOG(WARNING) << "Bad argument n. " << i << " of " << encoder->name |
| << ". Expected " << expected << ", got 0x" << std::hex << operand; |
| } |
| } |
| } |
| |
| // In the lines below, we rely on (operand & 0x1f) == 31 to be true for register sp |
| // and zr. This means that these two registers do not need any special treatment, as |
| // their bottom 5 bits are correctly set to 31 == 0b11111, which is the right |
| // value for encoding both sp and zr. |
| static_assert((rxzr & 0x1f) == 0x1f, "rzr register number must be 31"); |
| static_assert((rsp & 0x1f) == 0x1f, "rsp register number must be 31"); |
| } |
| |
| value = (operand << encoder->field_loc[i].start) & |
| ((1 << (encoder->field_loc[i].end + 1)) - 1); |
| bits |= value; |
| } else { |
| switch (kind) { |
| case kFmtSkip: |
| break; // Nothing to do, but continue to next. |
| case kFmtUnused: |
| i = 4; // Done, break out of the enclosing loop. |
| break; |
| case kFmtShift: |
| // Intentional fallthrough. |
| case kFmtExtend: |
| DCHECK_EQ((operand & (1 << 6)) == 0, kind == kFmtShift); |
| value = (operand & 0x3f) << 10; |
| value |= ((operand & 0x1c0) >> 6) << 21; |
| bits |= value; |
| break; |
| case kFmtImm21: |
| value = (operand & 0x3) << 29; |
| value |= ((operand & 0x1ffffc) >> 2) << 5; |
| bits |= value; |
| break; |
| case kFmtImm6Shift: |
| value = (operand & 0x1f) << 19; |
| value |= ((operand & 0x20) >> 5) << 31; |
| bits |= value; |
| break; |
| default: |
| LOG(FATAL) << "Bad fmt for arg. " << i << " in " << encoder->name |
| << " (" << kind << ")"; |
| } |
| } |
| } |
| |
| DCHECK_EQ(encoder->size, 4); |
| write_pos[0] = (bits & 0xff); |
| write_pos[1] = ((bits >> 8) & 0xff); |
| write_pos[2] = ((bits >> 16) & 0xff); |
| write_pos[3] = ((bits >> 24) & 0xff); |
| write_pos += 4; |
| } |
| } |
| |
| return write_pos; |
| } |
| |
// Rounds `offset` up to the next multiple of 8. The data area is aligned on an 8 byte boundary
// because it only contains double-word items: word immediates are better set directly from the
// code (they require no more than 2 instructions).
#define ALIGNED_DATA_OFFSET(offset) (((offset) + 7) & ~7)
| |
| /* |
| * Get the LIR which emits the instruction preceding the given LIR. |
| * Returns nullptr, if no previous emitting insn found. |
| */ |
| static LIR* GetPrevEmittingLIR(LIR* lir) { |
| DCHECK(lir != nullptr); |
| LIR* prev_lir = lir->prev; |
| while ((prev_lir != nullptr) && |
| (prev_lir->flags.is_nop || Mir2Lir::IsPseudoLirOp(prev_lir->opcode))) { |
| prev_lir = prev_lir->prev; |
| } |
| return prev_lir; |
| } |
| |
| // Assemble the LIR into binary instruction format. |
| void Arm64Mir2Lir::AssembleLIR() { |
| LIR* lir; |
| LIR* prev_lir; |
| cu_->NewTimingSplit("Assemble"); |
| int assembler_retries = 0; |
| CodeOffset starting_offset = LinkFixupInsns(first_lir_insn_, last_lir_insn_, 0); |
| data_offset_ = ALIGNED_DATA_OFFSET(starting_offset); |
| int32_t offset_adjustment; |
| AssignDataOffsets(); |
| |
| /* |
| * Note: generation must be 1 on first pass (to distinguish from initialized state of 0 |
| * for non-visited nodes). Start at zero here, and bit will be flipped to 1 on entry to the loop. |
| */ |
| int generation = 0; |
| while (true) { |
| offset_adjustment = 0; |
| AssemblerStatus res = kSuccess; // Assume success |
| generation ^= 1; |
| // Note: nodes requiring possible fixup linked in ascending order. |
| lir = first_fixup_; |
| prev_lir = nullptr; |
| while (lir != nullptr) { |
| // NOTE: Any new non-pc_rel instructions inserted due to retry must be explicitly encoded at |
| // the time of insertion. Note that inserted instructions don't need use/def flags, but do |
| // need size and pc-rel status properly updated. |
| lir->offset += offset_adjustment; |
| // During pass, allows us to tell whether a node has been updated with offset_adjustment yet. |
| lir->flags.generation = generation; |
| switch (static_cast<FixupKind>(lir->flags.fixup)) { |
| case kFixupLabel: |
| case kFixupNone: |
| case kFixupVLoad: |
| break; |
| case kFixupT1Branch: { |
| LIR *target_lir = lir->target; |
| DCHECK(target_lir); |
| CodeOffset pc = lir->offset; |
| CodeOffset target = target_lir->offset + |
| ((target_lir->flags.generation == lir->flags.generation) ? 0 : offset_adjustment); |
| int32_t delta = target - pc; |
| DCHECK_EQ(delta & 0x3, 0); |
| if (!IS_SIGNED_IMM26(delta >> 2)) { |
| LOG(FATAL) << "Invalid jump range in kFixupT1Branch"; |
| } |
| lir->operands[0] = delta >> 2; |
| if (!(cu_->disable_opt & (1 << kSafeOptimizations)) && lir->operands[0] == 1) { |
| // Useless branch. |
| offset_adjustment -= lir->flags.size; |
| lir->flags.is_nop = true; |
| // Don't unlink - just set to do-nothing. |
| lir->flags.fixup = kFixupNone; |
| res = kRetryAll; |
| } |
| break; |
| } |
| case kFixupLoad: |
| case kFixupCBxZ: |
| case kFixupCondBranch: { |
| LIR *target_lir = lir->target; |
| DCHECK(target_lir); |
| CodeOffset pc = lir->offset; |
| CodeOffset target = target_lir->offset + |
| ((target_lir->flags.generation == lir->flags.generation) ? 0 : offset_adjustment); |
| int32_t delta = target - pc; |
| DCHECK_EQ(delta & 0x3, 0); |
| if (!IS_SIGNED_IMM19(delta >> 2)) { |
| LOG(FATAL) << "Invalid jump range in kFixupLoad"; |
| } |
| lir->operands[1] = delta >> 2; |
| break; |
| } |
| case kFixupTBxZ: { |
| int16_t opcode = lir->opcode; |
| RegStorage reg(lir->operands[0] | RegStorage::kValid); |
| int32_t imm = lir->operands[1]; |
| DCHECK_EQ(IS_WIDE(opcode), reg.Is64Bit()); |
| DCHECK_LT(imm, 64); |
| if (imm >= 32) { |
| DCHECK(IS_WIDE(opcode)); |
| } else if (kIsDebugBuild && IS_WIDE(opcode)) { |
| // "tbz/tbnz x0, #imm(<32)" is the same with "tbz/tbnz w0, #imm(<32)", but GCC/oatdump |
| // will disassemble it as "tbz/tbnz w0, #imm(<32)". So unwide the LIR to make the |
| // compiler log behave the same with those disassembler in debug build. |
| // This will also affect tst instruction if it need to be replaced, but there is no |
| // performance difference between "tst Xt" and "tst Wt". |
| lir->opcode = UNWIDE(opcode); |
| lir->operands[0] = As32BitReg(reg).GetReg(); |
| } |
| |
| // Fix-up branch offset. |
| LIR *target_lir = lir->target; |
| DCHECK(target_lir); |
| CodeOffset pc = lir->offset; |
| CodeOffset target = target_lir->offset + |
| ((target_lir->flags.generation == lir->flags.generation) ? 0 : offset_adjustment); |
| int32_t delta = target - pc; |
| DCHECK_EQ(delta & 0x3, 0); |
| // Check if branch offset can be encoded in tbz/tbnz. |
| if (!IS_SIGNED_IMM14(delta >> 2)) { |
| DexOffset dalvik_offset = lir->dalvik_offset; |
| LIR* targetLIR = lir->target; |
| // "tbz/tbnz Rt, #imm, label" -> "tst Rt, #(1<<imm)". |
| offset_adjustment -= lir->flags.size; |
| int32_t encodedImm = EncodeLogicalImmediate(IS_WIDE(opcode), 1 << lir->operands[1]); |
| DCHECK_NE(encodedImm, -1); |
| lir->opcode = IS_WIDE(opcode) ? WIDE(kA64Tst2rl) : kA64Tst2rl; |
| lir->operands[1] = encodedImm; |
| lir->target = nullptr; |
| lir->flags.fixup = EncodingMap[kA64Tst2rl].fixup; |
| lir->flags.size = EncodingMap[kA64Tst2rl].size; |
| offset_adjustment += lir->flags.size; |
| // Insert "beq/bneq label". |
| opcode = UNWIDE(opcode); |
| DCHECK(opcode == kA64Tbz3rht || opcode == kA64Tbnz3rht); |
| LIR* new_lir = RawLIR(dalvik_offset, kA64B2ct, |
| opcode == kA64Tbz3rht ? kArmCondEq : kArmCondNe, 0, 0, 0, 0, targetLIR); |
| InsertLIRAfter(lir, new_lir); |
| new_lir->offset = lir->offset + lir->flags.size; |
| new_lir->flags.generation = generation; |
| new_lir->flags.fixup = EncodingMap[kA64B2ct].fixup; |
| new_lir->flags.size = EncodingMap[kA64B2ct].size; |
| offset_adjustment += new_lir->flags.size; |
| // lir no longer pcrel, unlink and link in new_lir. |
| ReplaceFixup(prev_lir, lir, new_lir); |
| prev_lir = new_lir; // Continue with the new instruction. |
| lir = new_lir->u.a.pcrel_next; |
| res = kRetryAll; |
| continue; |
| } |
| lir->operands[2] = delta >> 2; |
| break; |
| } |
| case kFixupAdr: { |
| LIR* target_lir = lir->target; |
| int32_t delta; |
| if (target_lir) { |
| CodeOffset target_offs = ((target_lir->flags.generation == lir->flags.generation) ? |
| 0 : offset_adjustment) + target_lir->offset; |
| delta = target_offs - lir->offset; |
| } else if (lir->operands[2] >= 0) { |
| const EmbeddedData* tab = UnwrapPointer<EmbeddedData>(lir->operands[2]); |
| delta = tab->offset + offset_adjustment - lir->offset; |
| } else { |
| // No fixup: this usage allows to retrieve the current PC. |
| delta = lir->operands[1]; |
| } |
| if (!IS_SIGNED_IMM21(delta)) { |
| LOG(FATAL) << "Jump range above 1MB in kFixupAdr"; |
| } |
| lir->operands[1] = delta; |
| break; |
| } |
| case kFixupA53Erratum835769: |
| // Avoid emitting code that could trigger Cortex A53's erratum 835769. |
| // This fixup should be carried out for all multiply-accumulate instructions: madd, msub, |
| // smaddl, smsubl, umaddl and umsubl. |
| if (cu_->compiler_driver->GetInstructionSetFeatures()->AsArm64InstructionSetFeatures() |
| ->NeedFixCortexA53_835769()) { |
| // Check that this is a 64-bit multiply-accumulate. |
| if (IS_WIDE(lir->opcode)) { |
| LIR* prev_insn = GetPrevEmittingLIR(lir); |
| if (prev_insn == nullptr) { |
| break; |
| } |
| uint64_t prev_insn_flags = EncodingMap[UNWIDE(prev_insn->opcode)].flags; |
| // Check that the instruction preceding the multiply-accumulate is a load or store. |
| if ((prev_insn_flags & IS_LOAD) != 0 || (prev_insn_flags & IS_STORE) != 0) { |
| // insert a NOP between the load/store and the multiply-accumulate. |
| LIR* new_lir = RawLIR(lir->dalvik_offset, kA64Nop0, 0, 0, 0, 0, 0, nullptr); |
| new_lir->offset = lir->offset; |
| new_lir->flags.fixup = kFixupNone; |
| new_lir->flags.size = EncodingMap[kA64Nop0].size; |
| InsertLIRBefore(lir, new_lir); |
| lir->offset += new_lir->flags.size; |
| offset_adjustment += new_lir->flags.size; |
| res = kRetryAll; |
| } |
| } |
| } |
| break; |
| default: |
| LOG(FATAL) << "Unexpected case " << lir->flags.fixup; |
| } |
| prev_lir = lir; |
| lir = lir->u.a.pcrel_next; |
| } |
| |
| if (res == kSuccess) { |
| DCHECK_EQ(offset_adjustment, 0); |
| break; |
| } else { |
| assembler_retries++; |
| if (assembler_retries > MAX_ASSEMBLER_RETRIES) { |
| CodegenDump(); |
| LOG(FATAL) << "Assembler error - too many retries"; |
| } |
| starting_offset += offset_adjustment; |
| data_offset_ = ALIGNED_DATA_OFFSET(starting_offset); |
| AssignDataOffsets(); |
| } |
| } |
| |
| // Build the CodeBuffer. |
| DCHECK_LE(data_offset_, total_size_); |
| code_buffer_.reserve(total_size_); |
| code_buffer_.resize(starting_offset); |
| uint8_t* write_pos = &code_buffer_[0]; |
| write_pos = EncodeLIRs(write_pos, first_lir_insn_); |
| DCHECK_EQ(static_cast<CodeOffset>(write_pos - &code_buffer_[0]), starting_offset); |
| |
| DCHECK_EQ(data_offset_, ALIGNED_DATA_OFFSET(code_buffer_.size())); |
| |
| // Install literals |
| InstallLiteralPools(); |
| |
| // Install switch tables |
| InstallSwitchTables(); |
| |
| // Install fill array data |
| InstallFillArrayData(); |
| |
| // Create the mapping table and native offset to reference map. |
| cu_->NewTimingSplit("PcMappingTable"); |
| CreateMappingTables(); |
| |
| cu_->NewTimingSplit("GcMap"); |
| CreateNativeGcMap(); |
| } |
| |
| size_t Arm64Mir2Lir::GetInsnSize(LIR* lir) { |
| A64Opcode opcode = UNWIDE(lir->opcode); |
| DCHECK(!IsPseudoLirOp(opcode)); |
| return EncodingMap[opcode].size; |
| } |
| |
| // Encode instruction bit pattern and assign offsets. |
| uint32_t Arm64Mir2Lir::LinkFixupInsns(LIR* head_lir, LIR* tail_lir, uint32_t offset) { |
| LIR* end_lir = tail_lir->next; |
| |
| LIR* last_fixup = nullptr; |
| for (LIR* lir = head_lir; lir != end_lir; lir = NEXT_LIR(lir)) { |
| A64Opcode opcode = UNWIDE(lir->opcode); |
| if (!lir->flags.is_nop) { |
| if (lir->flags.fixup != kFixupNone) { |
| if (!IsPseudoLirOp(opcode)) { |
| lir->flags.size = EncodingMap[opcode].size; |
| lir->flags.fixup = EncodingMap[opcode].fixup; |
| } else { |
| DCHECK_NE(static_cast<int>(opcode), kPseudoPseudoAlign4); |
| lir->flags.size = 0; |
| lir->flags.fixup = kFixupLabel; |
| } |
| // Link into the fixup chain. |
| lir->flags.use_def_invalid = true; |
| lir->u.a.pcrel_next = nullptr; |
| if (first_fixup_ == nullptr) { |
| first_fixup_ = lir; |
| } else { |
| last_fixup->u.a.pcrel_next = lir; |
| } |
| last_fixup = lir; |
| lir->offset = offset; |
| } |
| offset += lir->flags.size; |
| } |
| } |
| return offset; |
| } |
| |
| void Arm64Mir2Lir::AssignDataOffsets() { |
| /* Set up offsets for literals */ |
| CodeOffset offset = data_offset_; |
| |
| offset = AssignLiteralOffset(offset); |
| |
| offset = AssignSwitchTablesOffset(offset); |
| |
| total_size_ = AssignFillArrayDataOffset(offset); |
| } |
| |
| } // namespace art |