blob: 23bdd87239421decd615fe66e08d0ed725d645e2 [file] [log] [blame]
/*
* Copyright (C) 2013 The Android Open Source Project
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#ifndef ART_COMPILER_DEX_MIR_GRAPH_H_
#define ART_COMPILER_DEX_MIR_GRAPH_H_
#include <stdint.h>
#include "compiler_ir.h"
#include "dex_file.h"
#include "dex_instruction.h"
#include "driver/dex_compilation_unit.h"
#include "invoke_type.h"
#include "mir_field_info.h"
#include "mir_method_info.h"
#include "utils/arena_bit_vector.h"
#include "utils/arena_containers.h"
#include "utils/scoped_arena_containers.h"
#include "reg_location.h"
#include "reg_storage.h"
namespace art {
class DexFileMethodInliner;
class GlobalValueNumbering;
enum DataFlowAttributePos {
kUA = 0,
kUB,
kUC,
kAWide,
kBWide,
kCWide,
kDA,
kIsMove,
kSetsConst,
kFormat35c,
kFormat3rc,
kFormatExtended, // Extended format for extended MIRs.
kNullCheckA, // Null check of A.
kNullCheckB, // Null check of B.
kNullCheckOut0, // Null check out outgoing arg0.
kDstNonNull, // May assume dst is non-null.
kRetNonNull, // May assume retval is non-null.
kNullTransferSrc0, // Object copy src[0] -> dst.
kNullTransferSrcN, // Phi null check state transfer.
kRangeCheckC, // Range check of C.
kFPA,
kFPB,
kFPC,
kCoreA,
kCoreB,
kCoreC,
kRefA,
kRefB,
kRefC,
kUsesMethodStar, // Implicit use of Method*.
kUsesIField, // Accesses an instance field (IGET/IPUT).
kUsesSField, // Accesses a static field (SGET/SPUT).
kCanInitializeClass, // Can trigger class initialization (SGET/SPUT/INVOKE_STATIC).
kDoLVN, // Worth computing local value numbers.
};
#define DF_NOP UINT64_C(0)
#define DF_UA (UINT64_C(1) << kUA)
#define DF_UB (UINT64_C(1) << kUB)
#define DF_UC (UINT64_C(1) << kUC)
#define DF_A_WIDE (UINT64_C(1) << kAWide)
#define DF_B_WIDE (UINT64_C(1) << kBWide)
#define DF_C_WIDE (UINT64_C(1) << kCWide)
#define DF_DA (UINT64_C(1) << kDA)
#define DF_IS_MOVE (UINT64_C(1) << kIsMove)
#define DF_SETS_CONST (UINT64_C(1) << kSetsConst)
#define DF_FORMAT_35C (UINT64_C(1) << kFormat35c)
#define DF_FORMAT_3RC (UINT64_C(1) << kFormat3rc)
#define DF_FORMAT_EXTENDED (UINT64_C(1) << kFormatExtended)
#define DF_NULL_CHK_A (UINT64_C(1) << kNullCheckA)
#define DF_NULL_CHK_B (UINT64_C(1) << kNullCheckB)
#define DF_NULL_CHK_OUT0 (UINT64_C(1) << kNullCheckOut0)
#define DF_NON_NULL_DST (UINT64_C(1) << kDstNonNull)
#define DF_NON_NULL_RET (UINT64_C(1) << kRetNonNull)
#define DF_NULL_TRANSFER_0 (UINT64_C(1) << kNullTransferSrc0)
#define DF_NULL_TRANSFER_N (UINT64_C(1) << kNullTransferSrcN)
#define DF_RANGE_CHK_C (UINT64_C(1) << kRangeCheckC)
#define DF_FP_A (UINT64_C(1) << kFPA)
#define DF_FP_B (UINT64_C(1) << kFPB)
#define DF_FP_C (UINT64_C(1) << kFPC)
#define DF_CORE_A (UINT64_C(1) << kCoreA)
#define DF_CORE_B (UINT64_C(1) << kCoreB)
#define DF_CORE_C (UINT64_C(1) << kCoreC)
#define DF_REF_A (UINT64_C(1) << kRefA)
#define DF_REF_B (UINT64_C(1) << kRefB)
#define DF_REF_C (UINT64_C(1) << kRefC)
#define DF_UMS (UINT64_C(1) << kUsesMethodStar)
#define DF_IFIELD (UINT64_C(1) << kUsesIField)
#define DF_SFIELD (UINT64_C(1) << kUsesSField)
#define DF_CLINIT (UINT64_C(1) << kCanInitializeClass)
#define DF_LVN (UINT64_C(1) << kDoLVN)
#define DF_HAS_USES (DF_UA | DF_UB | DF_UC)
#define DF_HAS_DEFS (DF_DA)
#define DF_HAS_NULL_CHKS (DF_NULL_CHK_A | \
DF_NULL_CHK_B | \
DF_NULL_CHK_OUT0)
#define DF_HAS_RANGE_CHKS (DF_RANGE_CHK_C)
#define DF_HAS_NR_CHKS (DF_HAS_NULL_CHKS | \
DF_HAS_RANGE_CHKS)
#define DF_A_IS_REG (DF_UA | DF_DA)
#define DF_B_IS_REG (DF_UB)
#define DF_C_IS_REG (DF_UC)
#define DF_USES_FP (DF_FP_A | DF_FP_B | DF_FP_C)
#define DF_NULL_TRANSFER (DF_NULL_TRANSFER_0 | DF_NULL_TRANSFER_N)
#define DF_IS_INVOKE (DF_FORMAT_35C | DF_FORMAT_3RC)
enum OatMethodAttributes {
kIsLeaf, // Method is leaf.
};
#define METHOD_IS_LEAF (1 << kIsLeaf)
// Minimum field size to contain Dalvik v_reg number.
#define VREG_NUM_WIDTH 16
#define INVALID_SREG (-1)
#define INVALID_VREG (0xFFFFU)
#define INVALID_OFFSET (0xDEADF00FU)
#define MIR_IGNORE_NULL_CHECK (1 << kMIRIgnoreNullCheck)
#define MIR_IGNORE_RANGE_CHECK (1 << kMIRIgnoreRangeCheck)
#define MIR_STORE_NON_NULL_VALUE (1 << kMIRStoreNonNullValue)
#define MIR_CLASS_IS_INITIALIZED (1 << kMIRClassIsInitialized)
#define MIR_CLASS_IS_IN_DEX_CACHE (1 << kMIRClassIsInDexCache)
#define MIR_IGNORE_DIV_ZERO_CHECK (1 << kMirIgnoreDivZeroCheck)
#define MIR_INLINED (1 << kMIRInlined)
#define MIR_INLINED_PRED (1 << kMIRInlinedPred)
#define MIR_CALLEE (1 << kMIRCallee)
#define MIR_IGNORE_SUSPEND_CHECK (1 << kMIRIgnoreSuspendCheck)
#define MIR_DUP (1 << kMIRDup)
#define MIR_MARK (1 << kMIRMark)
#define MIR_STORE_NON_TEMPORAL (1 << kMIRStoreNonTemporal)
#define BLOCK_NAME_LEN 80
typedef uint16_t BasicBlockId;
static const BasicBlockId NullBasicBlockId = 0;
static constexpr bool kLeafOptimization = false;
/*
* In general, vreg/sreg describe Dalvik registers that originated with dx. However,
* it is useful to have compiler-generated temporary registers and have them treated
* in the same manner as dx-generated virtual registers. This struct records the SSA
* name of compiler-introduced temporaries.
*/
struct CompilerTemp {
int32_t v_reg; // Virtual register number for temporary.
int32_t s_reg_low; // SSA name for low Dalvik word.
};
enum CompilerTempType {
kCompilerTempVR, // A virtual register temporary.
kCompilerTempSpecialMethodPtr, // Temporary that keeps track of current method pointer.
kCompilerTempBackend, // Temporary that is used by backend.
};
// When debug option enabled, records effectiveness of null and range check elimination.
struct Checkstats {
int32_t null_checks;
int32_t null_checks_eliminated;
int32_t range_checks;
int32_t range_checks_eliminated;
};
// Dataflow attributes of a basic block.
struct BasicBlockDataFlow {
ArenaBitVector* use_v;
ArenaBitVector* def_v;
ArenaBitVector* live_in_v;
int32_t* vreg_to_ssa_map_exit;
};
/*
* Normalized use/def for a MIR operation using SSA names rather than vregs. Note that
* uses/defs retain the Dalvik convention that long operations operate on a pair of 32-bit
* vregs. For example, "ADD_LONG v0, v2, v3" would have 2 defs (v0/v1) and 4 uses (v2/v3, v4/v5).
* Following SSA renaming, this is the primary struct used by code generators to locate
* operand and result registers. This is a somewhat confusing and unhelpful convention that
* we may want to revisit in the future.
*
* TODO:
* 1. Add accessors for uses/defs and make data private
* 2. Change fp_use/fp_def to a bit array (could help memory usage)
* 3. Combine array storage into internal array and handled via accessors from 1.
*/
struct SSARepresentation {
int32_t* uses;
bool* fp_use;
int32_t* defs;
bool* fp_def;
int16_t num_uses_allocated;
int16_t num_defs_allocated;
int16_t num_uses;
int16_t num_defs;
static uint32_t GetStartUseIndex(Instruction::Code opcode);
};
/*
* The Midlevel Intermediate Representation node, which may be largely considered a
* wrapper around a Dalvik byte code.
*/
class MIR : public ArenaObject<kArenaAllocMIR> {
public:
/*
* TODO: remove embedded DecodedInstruction to save space, keeping only opcode. Recover
* additional fields on as-needed basis. Question: how to support MIR Pseudo-ops; probably
* need to carry aux data pointer.
*/
struct DecodedInstruction {
uint32_t vA;
uint32_t vB;
uint64_t vB_wide; /* for k51l */
uint32_t vC;
uint32_t arg[5]; /* vC/D/E/F/G in invoke or filled-new-array */
Instruction::Code opcode;
explicit DecodedInstruction():vA(0), vB(0), vB_wide(0), vC(0), opcode(Instruction::NOP) {
}
/*
* Given a decoded instruction representing a const bytecode, it updates
* the out arguments with proper values as dictated by the constant bytecode.
*/
bool GetConstant(int64_t* ptr_value, bool* wide) const;
static bool IsPseudoMirOp(Instruction::Code opcode) {
return static_cast<int>(opcode) >= static_cast<int>(kMirOpFirst);
}
static bool IsPseudoMirOp(int opcode) {
return opcode >= static_cast<int>(kMirOpFirst);
}
bool IsInvoke() const {
return ((FlagsOf() & Instruction::kInvoke) == Instruction::kInvoke);
}
bool IsStore() const {
return ((FlagsOf() & Instruction::kStore) == Instruction::kStore);
}
bool IsLoad() const {
return ((FlagsOf() & Instruction::kLoad) == Instruction::kLoad);
}
bool IsConditionalBranch() const {
return (FlagsOf() == (Instruction::kContinue | Instruction::kBranch));
}
/**
* @brief Is the register C component of the decoded instruction a constant?
*/
bool IsCFieldOrConstant() const {
return ((FlagsOf() & Instruction::kRegCFieldOrConstant) == Instruction::kRegCFieldOrConstant);
}
/**
* @brief Is the register C component of the decoded instruction a constant?
*/
bool IsBFieldOrConstant() const {
return ((FlagsOf() & Instruction::kRegBFieldOrConstant) == Instruction::kRegBFieldOrConstant);
}
bool IsCast() const {
return ((FlagsOf() & Instruction::kCast) == Instruction::kCast);
}
/**
* @brief Does the instruction clobber memory?
* @details Clobber means that the instruction changes the memory not in a punctual way.
* Therefore any supposition on memory aliasing or memory contents should be disregarded
* when crossing such an instruction.
*/
bool Clobbers() const {
return ((FlagsOf() & Instruction::kClobber) == Instruction::kClobber);
}
bool IsLinear() const {
return (FlagsOf() & (Instruction::kAdd | Instruction::kSubtract)) != 0;
}
int FlagsOf() const;
} dalvikInsn;
NarrowDexOffset offset; // Offset of the instruction in code units.
uint16_t optimization_flags;
int16_t m_unit_index; // From which method was this MIR included
BasicBlockId bb;
MIR* next;
SSARepresentation* ssa_rep;
union {
// Incoming edges for phi node.
BasicBlockId* phi_incoming;
// Establish link from check instruction (kMirOpCheck) to the actual throwing instruction.
MIR* throw_insn;
// Branch condition for fused cmp or select.
ConditionCode ccode;
// IGET/IPUT lowering info index, points to MIRGraph::ifield_lowering_infos_. Due to limit on
// the number of code points (64K) and size of IGET/IPUT insn (2), this will never exceed 32K.
uint32_t ifield_lowering_info;
// SGET/SPUT lowering info index, points to MIRGraph::sfield_lowering_infos_. Due to limit on
// the number of code points (64K) and size of SGET/SPUT insn (2), this will never exceed 32K.
uint32_t sfield_lowering_info;
// INVOKE data index, points to MIRGraph::method_lowering_infos_.
uint32_t method_lowering_info;
} meta;
explicit MIR() : offset(0), optimization_flags(0), m_unit_index(0), bb(NullBasicBlockId),
next(nullptr), ssa_rep(nullptr) {
memset(&meta, 0, sizeof(meta));
}
uint32_t GetStartUseIndex() const {
return SSARepresentation::GetStartUseIndex(dalvikInsn.opcode);
}
MIR* Copy(CompilationUnit *c_unit);
MIR* Copy(MIRGraph* mir_Graph);
};
struct SuccessorBlockInfo;
class BasicBlock : public DeletableArenaObject<kArenaAllocBB> {
public:
BasicBlock(BasicBlockId block_id, BBType type, ArenaAllocator* allocator)
: id(block_id),
dfs_id(), start_offset(), fall_through(), taken(), i_dom(), nesting_depth(),
block_type(type),
successor_block_list_type(kNotUsed),
visited(), hidden(), catch_entry(), explicit_throw(), conditional_branch(),
terminated_by_return(), dominates_return(), use_lvn(), first_mir_insn(),
last_mir_insn(), data_flow_info(), dominators(), i_dominated(), dom_frontier(),
predecessors(allocator->Adapter(kArenaAllocBBPredecessors)),
successor_blocks(allocator->Adapter(kArenaAllocSuccessor)) {
}
BasicBlockId id;
BasicBlockId dfs_id;
NarrowDexOffset start_offset; // Offset in code units.
BasicBlockId fall_through;
BasicBlockId taken;
BasicBlockId i_dom; // Immediate dominator.
uint16_t nesting_depth;
BBType block_type:4;
BlockListType successor_block_list_type:4;
bool visited:1;
bool hidden:1;
bool catch_entry:1;
bool explicit_throw:1;
bool conditional_branch:1;
bool terminated_by_return:1; // Block ends with a Dalvik return opcode.
bool dominates_return:1; // Is a member of return extended basic block.
bool use_lvn:1; // Run local value numbering on this block.
MIR* first_mir_insn;
MIR* last_mir_insn;
BasicBlockDataFlow* data_flow_info;
ArenaBitVector* dominators;
ArenaBitVector* i_dominated; // Set nodes being immediately dominated.
ArenaBitVector* dom_frontier; // Dominance frontier.
ArenaVector<BasicBlockId> predecessors;
ArenaVector<SuccessorBlockInfo*> successor_blocks;
void AppendMIR(MIR* mir);
void AppendMIRList(MIR* first_list_mir, MIR* last_list_mir);
void AppendMIRList(const std::vector<MIR*>& insns);
void PrependMIR(MIR* mir);
void PrependMIRList(MIR* first_list_mir, MIR* last_list_mir);
void PrependMIRList(const std::vector<MIR*>& to_add);
void InsertMIRAfter(MIR* current_mir, MIR* new_mir);
void InsertMIRListAfter(MIR* insert_after, MIR* first_list_mir, MIR* last_list_mir);
MIR* FindPreviousMIR(MIR* mir);
void InsertMIRBefore(MIR* insert_before, MIR* list);
void InsertMIRListBefore(MIR* insert_before, MIR* first_list_mir, MIR* last_list_mir);
bool RemoveMIR(MIR* mir);
bool RemoveMIRList(MIR* first_list_mir, MIR* last_list_mir);
BasicBlock* Copy(CompilationUnit* c_unit);
BasicBlock* Copy(MIRGraph* mir_graph);
/**
* @brief Reset the optimization_flags field of each MIR.
*/
void ResetOptimizationFlags(uint16_t reset_flags);
/**
* @brief Kill the BasicBlock.
* @details Unlink predecessors and successors, remove all MIRs, set the block type to kDead
* and set hidden to true.
*/
void Kill(MIRGraph* mir_graph);
/**
* @brief Is ssa_reg the last SSA definition of that VR in the block?
*/
bool IsSSALiveOut(const CompilationUnit* c_unit, int ssa_reg);
/**
* @brief Replace the edge going to old_bb to now go towards new_bb.
*/
bool ReplaceChild(BasicBlockId old_bb, BasicBlockId new_bb);
/**
* @brief Erase the predecessor old_pred.
*/
void ErasePredecessor(BasicBlockId old_pred);
/**
* @brief Update the predecessor array from old_pred to new_pred.
*/
void UpdatePredecessor(BasicBlockId old_pred, BasicBlockId new_pred);
/**
* @brief Return first non-Phi insn.
*/
MIR* GetFirstNonPhiInsn();
/**
* @brief Used to obtain the next MIR that follows unconditionally.
* @details The implementation does not guarantee that a MIR does not
* follow even if this method returns nullptr.
* @param mir_graph the MIRGraph.
* @param current The MIR for which to find an unconditional follower.
* @return Returns the following MIR if one can be found.
*/
MIR* GetNextUnconditionalMir(MIRGraph* mir_graph, MIR* current);
bool IsExceptionBlock() const;
private:
DISALLOW_COPY_AND_ASSIGN(BasicBlock);
};
/*
* The "blocks" field in "successor_block_list" points to an array of elements with the type
* "SuccessorBlockInfo". For catch blocks, key is type index for the exception. For switch
* blocks, key is the case value.
*/
struct SuccessorBlockInfo {
BasicBlockId block;
int key;
};
/**
* @class ChildBlockIterator
* @brief Enable an easy iteration of the children.
*/
class ChildBlockIterator {
public:
/**
* @brief Constructs a child iterator.
* @param bb The basic whose children we need to iterate through.
* @param mir_graph The MIRGraph used to get the basic block during iteration.
*/
ChildBlockIterator(BasicBlock* bb, MIRGraph* mir_graph);
BasicBlock* Next();
private:
BasicBlock* basic_block_;
MIRGraph* mir_graph_;
bool visited_fallthrough_;
bool visited_taken_;
bool have_successors_;
ArenaVector<SuccessorBlockInfo*>::const_iterator successor_iter_;
};
/*
* Collection of information describing an invoke, and the destination of
* the subsequent MOVE_RESULT (if applicable). Collected as a unit to enable
* more efficient invoke code generation.
*/
struct CallInfo {
int num_arg_words; // Note: word count, not arg count.
RegLocation* args; // One for each word of arguments.
RegLocation result; // Eventual target of MOVE_RESULT.
int opt_flags;
InvokeType type;
uint32_t dex_idx;
uint32_t index; // Method idx for invokes, type idx for FilledNewArray.
uintptr_t direct_code;
uintptr_t direct_method;
RegLocation target; // Target of following move_result.
bool skip_this;
bool is_range;
DexOffset offset; // Offset in code units.
MIR* mir;
};
const RegLocation bad_loc = {kLocDalvikFrame, 0, 0, 0, 0, 0, 0, 0, 0, RegStorage(), INVALID_SREG,
INVALID_SREG};
class MIRGraph {
public:
MIRGraph(CompilationUnit* cu, ArenaAllocator* arena);
virtual ~MIRGraph();
/*
* Examine the graph to determine whether it's worthwile to spend the time compiling
* this method.
*/
bool SkipCompilation(std::string* skip_message);
/*
* Should we skip the compilation of this method based on its name?
*/
bool SkipCompilationByName(const std::string& methodname);
/*
* Parse dex method and add MIR at current insert point. Returns id (which is
* actually the index of the method in the m_units_ array).
*/
void InlineMethod(const DexFile::CodeItem* code_item, uint32_t access_flags,
InvokeType invoke_type, uint16_t class_def_idx,
uint32_t method_idx, jobject class_loader, const DexFile& dex_file);
/* Find existing block */
BasicBlock* FindBlock(DexOffset code_offset) {
return FindBlock(code_offset, false, NULL);
}
const uint16_t* GetCurrentInsns() const {
return current_code_item_->insns_;
}
/**
* @brief Used to obtain the raw dex bytecode instruction pointer.
* @param m_unit_index The method index in MIRGraph (caused by having multiple methods).
* This is guaranteed to contain index 0 which is the base method being compiled.
* @return Returns the raw instruction pointer.
*/
const uint16_t* GetInsns(int m_unit_index) const {
return m_units_[m_unit_index]->GetCodeItem()->insns_;
}
/**
* @brief Used to obtain the raw data table.
* @param mir sparse switch, packed switch, of fill-array-data
* @param table_offset The table offset from start of method.
* @return Returns the raw table pointer.
*/
const uint16_t* GetTable(MIR* mir, uint32_t table_offset) const {
return GetInsns(mir->m_unit_index) + mir->offset + static_cast<int32_t>(table_offset);
}
unsigned int GetNumBlocks() const {
return block_list_.size();
}
/**
* @brief Provides the total size in code units of all instructions in MIRGraph.
* @details Includes the sizes of all methods in compilation unit.
* @return Returns the cumulative sum of all insn sizes (in code units).
*/
size_t GetNumDalvikInsns() const;
ArenaBitVector* GetTryBlockAddr() const {
return try_block_addr_;
}
BasicBlock* GetEntryBlock() const {
return entry_block_;
}
BasicBlock* GetExitBlock() const {
return exit_block_;
}
BasicBlock* GetBasicBlock(unsigned int block_id) const {
DCHECK_LT(block_id, block_list_.size()); // NOTE: NullBasicBlockId is 0.
return (block_id == NullBasicBlockId) ? NULL : block_list_[block_id];
}
size_t GetBasicBlockListCount() const {
return block_list_.size();
}
const ArenaVector<BasicBlock*>& GetBlockList() {
return block_list_;
}
const ArenaVector<BasicBlockId>& GetDfsOrder() {
return dfs_order_;
}
const ArenaVector<BasicBlockId>& GetDfsPostOrder() {
return dfs_post_order_;
}
const ArenaVector<BasicBlockId>& GetDomPostOrder() {
return dom_post_order_traversal_;
}
int GetDefCount() const {
return def_count_;
}
ArenaAllocator* GetArena() const {
return arena_;
}
void EnableOpcodeCounting() {
opcode_count_ = static_cast<int*>(arena_->Alloc(kNumPackedOpcodes * sizeof(int),
kArenaAllocMisc));
}
void ShowOpcodeStats();
DexCompilationUnit* GetCurrentDexCompilationUnit() const {
return m_units_[current_method_];
}
/**
* @brief Dump a CFG into a dot file format.
* @param dir_prefix the directory the file will be created in.
* @param all_blocks does the dumper use all the basic blocks or use the reachable blocks.
* @param suffix does the filename require a suffix or not (default = nullptr).
*/
void DumpCFG(const char* dir_prefix, bool all_blocks, const char* suffix = nullptr);
bool HasFieldAccess() const {
return (merged_df_flags_ & (DF_IFIELD | DF_SFIELD)) != 0u;
}
bool HasStaticFieldAccess() const {
return (merged_df_flags_ & DF_SFIELD) != 0u;
}
bool HasInvokes() const {
// NOTE: These formats include the rare filled-new-array/range.
return (merged_df_flags_ & (DF_FORMAT_35C | DF_FORMAT_3RC)) != 0u;
}
void DoCacheFieldLoweringInfo();
const MirIFieldLoweringInfo& GetIFieldLoweringInfo(MIR* mir) const {
return GetIFieldLoweringInfo(mir->meta.ifield_lowering_info);
}
const MirIFieldLoweringInfo& GetIFieldLoweringInfo(uint32_t lowering_info) const {
DCHECK_LT(lowering_info, ifield_lowering_infos_.size());
return ifield_lowering_infos_[lowering_info];
}
size_t GetIFieldLoweringInfoCount() const {
return ifield_lowering_infos_.size();
}
const MirSFieldLoweringInfo& GetSFieldLoweringInfo(MIR* mir) const {
return GetSFieldLoweringInfo(mir->meta.sfield_lowering_info);
}
const MirSFieldLoweringInfo& GetSFieldLoweringInfo(uint32_t lowering_info) const {
DCHECK_LT(lowering_info, sfield_lowering_infos_.size());
return sfield_lowering_infos_[lowering_info];
}
size_t GetSFieldLoweringInfoCount() const {
return sfield_lowering_infos_.size();
}
void DoCacheMethodLoweringInfo();
const MirMethodLoweringInfo& GetMethodLoweringInfo(MIR* mir) {
DCHECK_LT(mir->meta.method_lowering_info, method_lowering_infos_.size());
return method_lowering_infos_[mir->meta.method_lowering_info];
}
void ComputeInlineIFieldLoweringInfo(uint16_t field_idx, MIR* invoke, MIR* iget_or_iput);
void InitRegLocations();
void RemapRegLocations();
void DumpRegLocTable(RegLocation* table, int count);
void BasicBlockOptimizationStart();
void BasicBlockOptimization();
void BasicBlockOptimizationEnd();
const ArenaVector<BasicBlockId>& GetTopologicalSortOrder() {
DCHECK(!topological_order_.empty());
return topological_order_;
}
const ArenaVector<BasicBlockId>& GetTopologicalSortOrderLoopEnds() {
DCHECK(!topological_order_loop_ends_.empty());
return topological_order_loop_ends_;
}
const ArenaVector<BasicBlockId>& GetTopologicalSortOrderIndexes() {
DCHECK(!topological_order_indexes_.empty());
return topological_order_indexes_;
}
ArenaVector<std::pair<uint16_t, bool>>* GetTopologicalSortOrderLoopHeadStack() {
DCHECK(!topological_order_.empty()); // Checking the main array, not the stack.
return &topological_order_loop_head_stack_;
}
size_t GetMaxNestedLoops() const {
return max_nested_loops_;
}
bool IsLoopHead(BasicBlockId bb_id) {
return topological_order_loop_ends_[topological_order_indexes_[bb_id]] != 0u;
}
bool IsConst(int32_t s_reg) const {
return is_constant_v_->IsBitSet(s_reg);
}
bool IsConst(RegLocation loc) const {
return loc.orig_sreg < 0 ? false : IsConst(loc.orig_sreg);
}
int32_t ConstantValue(RegLocation loc) const {
DCHECK(IsConst(loc));
return constant_values_[loc.orig_sreg];
}
int32_t ConstantValue(int32_t s_reg) const {
DCHECK(IsConst(s_reg));
return constant_values_[s_reg];
}
/**
* @brief Used to obtain 64-bit value of a pair of ssa registers.
* @param s_reg_low The ssa register representing the low bits.
* @param s_reg_high The ssa register representing the high bits.
* @return Retusn the 64-bit constant value.
*/
int64_t ConstantValueWide(int32_t s_reg_low, int32_t s_reg_high) const {
DCHECK(IsConst(s_reg_low));
DCHECK(IsConst(s_reg_high));
return (static_cast<int64_t>(constant_values_[s_reg_high]) << 32) |
Low32Bits(static_cast<int64_t>(constant_values_[s_reg_low]));
}
int64_t ConstantValueWide(RegLocation loc) const {
DCHECK(IsConst(loc));
DCHECK(!loc.high_word); // Do not allow asking for the high partner.
DCHECK_LT(loc.orig_sreg + 1, GetNumSSARegs());
return (static_cast<int64_t>(constant_values_[loc.orig_sreg + 1]) << 32) |
Low32Bits(static_cast<int64_t>(constant_values_[loc.orig_sreg]));
}
/**
* @brief Used to mark ssa register as being constant.
* @param ssa_reg The ssa register.
* @param value The constant value of ssa register.
*/
void SetConstant(int32_t ssa_reg, int32_t value);
/**
* @brief Used to mark ssa register and its wide counter-part as being constant.
* @param ssa_reg The ssa register.
* @param value The 64-bit constant value of ssa register and its pair.
*/
void SetConstantWide(int32_t ssa_reg, int64_t value);
bool IsConstantNullRef(RegLocation loc) const {
return loc.ref && loc.is_const && (ConstantValue(loc) == 0);
}
int GetNumSSARegs() const {
return num_ssa_regs_;
}
void SetNumSSARegs(int new_num) {
/*
* TODO: It's theoretically possible to exceed 32767, though any cases which did
* would be filtered out with current settings. When orig_sreg field is removed
* from RegLocation, expand s_reg_low to handle all possible cases and remove DCHECK().
*/
CHECK_EQ(new_num, static_cast<int16_t>(new_num));
num_ssa_regs_ = new_num;
}
unsigned int GetNumReachableBlocks() const {
return num_reachable_blocks_;
}
uint32_t GetUseCount(int sreg) const {
DCHECK_LT(static_cast<size_t>(sreg), use_counts_.size());
return use_counts_[sreg];
}
uint32_t GetRawUseCount(int sreg) const {
DCHECK_LT(static_cast<size_t>(sreg), raw_use_counts_.size());
return raw_use_counts_[sreg];
}
int GetSSASubscript(int ssa_reg) const {
DCHECK_LT(static_cast<size_t>(ssa_reg), ssa_subscripts_.size());
return ssa_subscripts_[ssa_reg];
}
RegLocation GetRawSrc(MIR* mir, int num) {
DCHECK(num < mir->ssa_rep->num_uses);
RegLocation res = reg_location_[mir->ssa_rep->uses[num]];
return res;
}
RegLocation GetRawDest(MIR* mir) {
DCHECK_GT(mir->ssa_rep->num_defs, 0);
RegLocation res = reg_location_[mir->ssa_rep->defs[0]];
return res;
}
RegLocation GetDest(MIR* mir) {
RegLocation res = GetRawDest(mir);
DCHECK(!res.wide);
return res;
}
RegLocation GetSrc(MIR* mir, int num) {
RegLocation res = GetRawSrc(mir, num);
DCHECK(!res.wide);
return res;
}
RegLocation GetDestWide(MIR* mir) {
RegLocation res = GetRawDest(mir);
DCHECK(res.wide);
return res;
}
RegLocation GetSrcWide(MIR* mir, int low) {
RegLocation res = GetRawSrc(mir, low);
DCHECK(res.wide);
return res;
}
RegLocation GetBadLoc() {
return bad_loc;
}
int GetMethodSReg() const {
return method_sreg_;
}
/**
* @brief Used to obtain the number of compiler temporaries being used.
* @return Returns the number of compiler temporaries.
*/
size_t GetNumUsedCompilerTemps() const {
// Assume that the special temps will always be used.
return GetNumNonSpecialCompilerTemps() + max_available_special_compiler_temps_;
}
/**
* @brief Used to obtain number of bytes needed for special temps.
* @details This space is always needed because temps have special location on stack.
* @return Returns number of bytes for the special temps.
*/
size_t GetNumBytesForSpecialTemps() const;
/**
* @brief Used by backend as a hint for maximum number of bytes for non-special temps.
* @details Returns 4 bytes for each temp because that is the maximum amount needed
* for storing each temp. The BE could be smarter though and allocate a smaller
* spill region.
* @return Returns the maximum number of bytes needed for non-special temps.
*/
size_t GetMaximumBytesForNonSpecialTemps() const {
return GetNumNonSpecialCompilerTemps() * sizeof(uint32_t);
}
/**
* @brief Used to obtain the number of non-special compiler temporaries being used.
* @return Returns the number of non-special compiler temporaries.
*/
size_t GetNumNonSpecialCompilerTemps() const {
return num_non_special_compiler_temps_;
}
/**
* @brief Used to set the total number of available non-special compiler temporaries.
* @details Can fail setting the new max if there are more temps being used than the new_max.
* @param new_max The new maximum number of non-special compiler temporaries.
* @return Returns true if the max was set and false if failed to set.
*/
bool SetMaxAvailableNonSpecialCompilerTemps(size_t new_max) {
// Make sure that enough temps still exist for backend and also that the
// new max can still keep around all of the already requested temps.
if (new_max < (GetNumNonSpecialCompilerTemps() + reserved_temps_for_backend_)) {
return false;
} else {
max_available_non_special_compiler_temps_ = new_max;
return true;
}
}
/**
* @brief Provides the number of non-special compiler temps available for use by ME.
* @details Even if this returns zero, special compiler temps are guaranteed to be available.
* Additionally, this makes sure to not use any temps reserved for BE only.
* @return Returns the number of available temps.
*/
size_t GetNumAvailableVRTemps();
/**
* @brief Used to obtain the maximum number of compiler temporaries that can be requested.
* @return Returns the maximum number of compiler temporaries, whether used or not.
*/
size_t GetMaxPossibleCompilerTemps() const {
return max_available_special_compiler_temps_ + max_available_non_special_compiler_temps_;
}
/**
* @brief Used to signal that the compiler temps have been committed.
* @details This should be used once the number of temps can no longer change,
* such as after frame size is committed and cannot be changed.
*/
void CommitCompilerTemps() {
compiler_temps_committed_ = true;
}
/**
* @brief Used to obtain a new unique compiler temporary.
* @details Two things are done for convenience when allocating a new compiler
* temporary. The ssa register is automatically requested and the information
* about reg location is filled. This helps when the temp is requested post
* ssa initialization, such as when temps are requested by the backend.
* @warning If the temp requested will be used for ME and have multiple versions,
* the sreg provided by the temp will be invalidated on next ssa recalculation.
* @param ct_type Type of compiler temporary requested.
* @param wide Whether we should allocate a wide temporary.
* @return Returns the newly created compiler temporary.
*/
CompilerTemp* GetNewCompilerTemp(CompilerTempType ct_type, bool wide);
bool MethodIsLeaf() {
return attributes_ & METHOD_IS_LEAF;
}
RegLocation GetRegLocation(int index) {
DCHECK((index >= 0) && (index < num_ssa_regs_));
return reg_location_[index];
}
RegLocation GetMethodLoc() {
return reg_location_[method_sreg_];
}
bool IsBackEdge(BasicBlock* branch_bb, BasicBlockId target_bb_id) {
DCHECK_NE(target_bb_id, NullBasicBlockId);
DCHECK_LT(target_bb_id, topological_order_indexes_.size());
DCHECK_LT(branch_bb->id, topological_order_indexes_.size());
return topological_order_indexes_[target_bb_id] <= topological_order_indexes_[branch_bb->id];
}
bool IsSuspendCheckEdge(BasicBlock* branch_bb, BasicBlockId target_bb_id) {
if (!IsBackEdge(branch_bb, target_bb_id)) {
return false;
}
if (suspend_checks_in_loops_ == nullptr) {
// We didn't run suspend check elimination.
return true;
}
uint16_t target_depth = GetBasicBlock(target_bb_id)->nesting_depth;
return (suspend_checks_in_loops_[branch_bb->id] & (1u << (target_depth - 1u))) == 0;
}
void CountBranch(DexOffset target_offset) {
if (target_offset <= current_offset_) {
backward_branches_++;
} else {
forward_branches_++;
}
}
int GetBranchCount() {
return backward_branches_ + forward_branches_;
}
// Is this vreg in the in set?
bool IsInVReg(uint32_t vreg) {
return (vreg >= GetFirstInVR()) && (vreg < GetFirstTempVR());
}
uint32_t GetNumOfCodeVRs() const {
return current_code_item_->registers_size_;
}
uint32_t GetNumOfCodeAndTempVRs() const {
// Include all of the possible temps so that no structures overflow when initialized.
return GetNumOfCodeVRs() + GetMaxPossibleCompilerTemps();
}
uint32_t GetNumOfLocalCodeVRs() const {
// This also refers to the first "in" VR.
return GetNumOfCodeVRs() - current_code_item_->ins_size_;
}
uint32_t GetNumOfInVRs() const {
return current_code_item_->ins_size_;
}
uint32_t GetNumOfOutVRs() const {
return current_code_item_->outs_size_;
}
uint32_t GetFirstInVR() const {
return GetNumOfLocalCodeVRs();
}
uint32_t GetFirstTempVR() const {
// Temp VRs immediately follow code VRs.
return GetNumOfCodeVRs();
}
uint32_t GetFirstSpecialTempVR() const {
// Special temps appear first in the ordering before non special temps.
return GetFirstTempVR();
}
uint32_t GetFirstNonSpecialTempVR() const {
// We always leave space for all the special temps before the non-special ones.
return GetFirstSpecialTempVR() + max_available_special_compiler_temps_;
}
bool HasTryCatchBlocks() const {
return current_code_item_->tries_size_ != 0;
}
void DumpCheckStats();
MIR* FindMoveResult(BasicBlock* bb, MIR* mir);
int SRegToVReg(int ssa_reg) const;
void VerifyDataflow();
void CheckForDominanceFrontier(BasicBlock* dom_bb, const BasicBlock* succ_bb);
bool EliminateNullChecksGate();
bool EliminateNullChecks(BasicBlock* bb);
void EliminateNullChecksEnd();
bool InferTypes(BasicBlock* bb);
bool EliminateClassInitChecksGate();
bool EliminateClassInitChecks(BasicBlock* bb);
void EliminateClassInitChecksEnd();
bool ApplyGlobalValueNumberingGate();
bool ApplyGlobalValueNumbering(BasicBlock* bb);
void ApplyGlobalValueNumberingEnd();
bool EliminateSuspendChecksGate();
bool EliminateSuspendChecks(BasicBlock* bb);
void EliminateSuspendChecksEnd();
uint16_t GetGvnIFieldId(MIR* mir) const {
DCHECK(IsInstructionIGetOrIPut(mir->dalvikInsn.opcode));
DCHECK_LT(mir->meta.ifield_lowering_info, ifield_lowering_infos_.size());
DCHECK(temp_.gvn.ifield_ids_ != nullptr);
return temp_.gvn.ifield_ids_[mir->meta.ifield_lowering_info];
}
uint16_t GetGvnSFieldId(MIR* mir) const {
DCHECK(IsInstructionSGetOrSPut(mir->dalvikInsn.opcode));
DCHECK_LT(mir->meta.sfield_lowering_info, sfield_lowering_infos_.size());
DCHECK(temp_.gvn.sfield_ids_ != nullptr);
return temp_.gvn.sfield_ids_[mir->meta.sfield_lowering_info];
}
/*
* Type inference handling helpers. Because Dalvik's bytecode is not fully typed,
* we have to do some work to figure out the sreg type. For some operations it is
* clear based on the opcode (i.e. ADD_FLOAT v0, v1, v2), but for others (MOVE), we
* may never know the "real" type.
*
* We perform the type inference operation by using an iterative walk over
* the graph, propagating types "defined" by typed opcodes to uses and defs in
* non-typed opcodes (such as MOVE). The Setxx(index) helpers are used to set defined
* types on typed opcodes (such as ADD_INT). The Setxx(index, is_xx) form is used to
* propagate types through non-typed opcodes such as PHI and MOVE. The is_xx flag
* tells whether our guess of the type is based on a previously typed definition.
* If so, the defined type takes precedence. Note that it's possible to have the same sreg
* show multiple defined types because dx treats constants as untyped bit patterns.
* The return value of the Setxx() helpers says whether or not the Setxx() action changed
* the current guess, and is used to know when to terminate the iterative walk.
*/
bool SetFp(int index, bool is_fp);
bool SetFp(int index);
bool SetCore(int index, bool is_core);
bool SetCore(int index);
bool SetRef(int index, bool is_ref);
bool SetRef(int index);
bool SetWide(int index, bool is_wide);
bool SetWide(int index);
bool SetHigh(int index, bool is_high);
bool SetHigh(int index);
bool PuntToInterpreter() {
return punt_to_interpreter_;
}
void SetPuntToInterpreter(bool val) {
punt_to_interpreter_ = val;
}
void DisassembleExtendedInstr(const MIR* mir, std::string* decoded_mir);
char* GetDalvikDisassembly(const MIR* mir);
void ReplaceSpecialChars(std::string& str);
std::string GetSSAName(int ssa_reg);
std::string GetSSANameWithConst(int ssa_reg, bool singles_only);
void GetBlockName(BasicBlock* bb, char* name);
const char* GetShortyFromTargetIdx(int);
const char* GetShortyFromMethodReference(const MethodReference& target_method);
void DumpMIRGraph();
CallInfo* NewMemCallInfo(BasicBlock* bb, MIR* mir, InvokeType type, bool is_range);
BasicBlock* NewMemBB(BBType block_type, int block_id);
MIR* NewMIR();
MIR* AdvanceMIR(BasicBlock** p_bb, MIR* mir);
BasicBlock* NextDominatedBlock(BasicBlock* bb);
bool LayoutBlocks(BasicBlock* bb);
void ComputeTopologicalSortOrder();
BasicBlock* CreateNewBB(BBType block_type);
bool InlineSpecialMethodsGate();
void InlineSpecialMethodsStart();
void InlineSpecialMethods(BasicBlock* bb);
void InlineSpecialMethodsEnd();
/**
* @brief Perform the initial preparation for the Method Uses.
*/
void InitializeMethodUses();
/**
* @brief Perform the initial preparation for the Constant Propagation.
*/
void InitializeConstantPropagation();
/**
* @brief Perform the initial preparation for the SSA Transformation.
*/
void SSATransformationStart();
/**
* @brief Insert a the operands for the Phi nodes.
* @param bb the considered BasicBlock.
* @return true
*/
bool InsertPhiNodeOperands(BasicBlock* bb);
/**
* @brief Perform the cleanup after the SSA Transformation.
*/
void SSATransformationEnd();
/**
* @brief Perform constant propagation on a BasicBlock.
* @param bb the considered BasicBlock.
*/
void DoConstantPropagation(BasicBlock* bb);
/**
* @brief Count the uses in the BasicBlock
* @param bb the BasicBlock
*/
void CountUses(BasicBlock* bb);
static uint64_t GetDataFlowAttributes(Instruction::Code opcode);
static uint64_t GetDataFlowAttributes(MIR* mir);
/**
* @brief Combine BasicBlocks
* @param the BasicBlock we are considering
*/
void CombineBlocks(BasicBlock* bb);
void ClearAllVisitedFlags();
void AllocateSSAUseData(MIR *mir, int num_uses);
void AllocateSSADefData(MIR *mir, int num_defs);
void CalculateBasicBlockInformation();
void ComputeDFSOrders();
void ComputeDefBlockMatrix();
void ComputeDominators();
void CompilerInitializeSSAConversion();
virtual void InitializeBasicBlockDataFlow();
void InsertPhiNodes();
void DoDFSPreOrderSSARename(BasicBlock* block);
bool DfsOrdersUpToDate() const {
return dfs_orders_up_to_date_;
}
bool DominationUpToDate() const {
return domination_up_to_date_;
}
bool MirSsaRepUpToDate() const {
return mir_ssa_rep_up_to_date_;
}
bool TopologicalOrderUpToDate() const {
return topological_order_up_to_date_;
}
/*
* IsDebugBuild sanity check: keep track of the Dex PCs for catch entries so that later on
* we can verify that all catch entries have native PC entries.
*/
std::set<uint32_t> catches_;
// TODO: make these private.
RegLocation* reg_location_; // Map SSA names to location.
ArenaSafeMap<unsigned int, unsigned int> block_id_map_; // Block collapse lookup cache.
static const char* extended_mir_op_names_[kMirOpLast - kMirOpFirst];
void HandleSSADef(int* defs, int dalvik_reg, int reg_index);
bool InferTypeAndSize(BasicBlock* bb, MIR* mir, bool changed);
protected:
int FindCommonParent(int block1, int block2);
void ComputeSuccLineIn(ArenaBitVector* dest, const ArenaBitVector* src1,
const ArenaBitVector* src2);
void HandleLiveInUse(ArenaBitVector* use_v, ArenaBitVector* def_v,
ArenaBitVector* live_in_v, int dalvik_reg_id);
void HandleDef(ArenaBitVector* def_v, int dalvik_reg_id);
void HandleExtended(ArenaBitVector* use_v, ArenaBitVector* def_v,
ArenaBitVector* live_in_v,
const MIR::DecodedInstruction& d_insn);
bool DoSSAConversion(BasicBlock* bb);
int ParseInsn(const uint16_t* code_ptr, MIR::DecodedInstruction* decoded_instruction);
bool ContentIsInsn(const uint16_t* code_ptr);
BasicBlock* SplitBlock(DexOffset code_offset, BasicBlock* orig_block,
BasicBlock** immed_pred_block_p);
BasicBlock* FindBlock(DexOffset code_offset, bool create, BasicBlock** immed_pred_block_p);
void ProcessTryCatchBlocks();
bool IsBadMonitorExitCatch(NarrowDexOffset monitor_exit_offset, NarrowDexOffset catch_offset);
BasicBlock* ProcessCanBranch(BasicBlock* cur_block, MIR* insn, DexOffset cur_offset, int width,
int flags, const uint16_t* code_ptr, const uint16_t* code_end);
BasicBlock* ProcessCanSwitch(BasicBlock* cur_block, MIR* insn, DexOffset cur_offset, int width,
int flags);
BasicBlock* ProcessCanThrow(BasicBlock* cur_block, MIR* insn, DexOffset cur_offset, int width,
int flags, ArenaBitVector* try_block_addr, const uint16_t* code_ptr,
const uint16_t* code_end);
int AddNewSReg(int v_reg);
void HandleSSAUse(int* uses, int dalvik_reg, int reg_index);
void DataFlowSSAFormat35C(MIR* mir);
void DataFlowSSAFormat3RC(MIR* mir);
void DataFlowSSAFormatExtended(MIR* mir);
bool FindLocalLiveIn(BasicBlock* bb);
bool VerifyPredInfo(BasicBlock* bb);
BasicBlock* NeedsVisit(BasicBlock* bb);
BasicBlock* NextUnvisitedSuccessor(BasicBlock* bb);
void MarkPreOrder(BasicBlock* bb);
void RecordDFSOrders(BasicBlock* bb);
void ComputeDomPostOrderTraversal(BasicBlock* bb);
int GetSSAUseCount(int s_reg);
bool BasicBlockOpt(BasicBlock* bb);
void MultiplyAddOpt(BasicBlock* bb);
/**
* @brief Check whether the given MIR is possible to throw an exception.
* @param mir The mir to check.
* @return Returns 'true' if the given MIR might throw an exception.
*/
bool CanThrow(MIR* mir);
/**
* @brief Combine multiply and add/sub MIRs into corresponding extended MAC MIR.
* @param mul_mir The multiply MIR to be combined.
* @param add_mir The add/sub MIR to be combined.
* @param mul_is_first_addend 'true' if multiply product is the first addend of add operation.
* @param is_wide 'true' if the operations are long type.
* @param is_sub 'true' if it is a multiply-subtract operation.
*/
void CombineMultiplyAdd(MIR* mul_mir, MIR* add_mir, bool mul_is_first_addend,
bool is_wide, bool is_sub);
/*
* @brief Check whether the first MIR anti-depends on the second MIR.
* @details To check whether one of first MIR's uses of vregs is redefined by the second MIR,
* i.e. there is a write-after-read dependency.
* @param first The first MIR.
* @param second The second MIR.
* @param Returns true if there is a write-after-read dependency.
*/
bool HasAntiDependency(MIR* first, MIR* second);
bool BuildExtendedBBList(class BasicBlock* bb);
bool FillDefBlockMatrix(BasicBlock* bb);
void InitializeDominationInfo(BasicBlock* bb);
bool ComputeblockIDom(BasicBlock* bb);
bool ComputeBlockDominators(BasicBlock* bb);
bool SetDominators(BasicBlock* bb);
bool ComputeBlockLiveIns(BasicBlock* bb);
bool ComputeDominanceFrontier(BasicBlock* bb);
void CountChecks(BasicBlock* bb);
void AnalyzeBlock(BasicBlock* bb, struct MethodStats* stats);
bool ComputeSkipCompilation(struct MethodStats* stats, bool skip_default,
std::string* skip_message);
CompilationUnit* const cu_;
ArenaVector<int> ssa_base_vregs_;
ArenaVector<int> ssa_subscripts_;
ArenaBitVector* is_constant_v_; // length == num_ssa_reg
int* constant_values_; // length == num_ssa_reg
// Use counts of ssa names.
ArenaVector<uint32_t> use_counts_; // Weighted by nesting depth
ArenaVector<uint32_t> raw_use_counts_; // Not weighted
unsigned int num_reachable_blocks_;
unsigned int max_num_reachable_blocks_;
bool dfs_orders_up_to_date_;
bool domination_up_to_date_;
bool mir_ssa_rep_up_to_date_;
bool topological_order_up_to_date_;
ArenaVector<BasicBlockId> dfs_order_;
ArenaVector<BasicBlockId> dfs_post_order_;
ArenaVector<BasicBlockId> dom_post_order_traversal_;
ArenaVector<BasicBlockId> topological_order_;
// Indexes in topological_order_ need to be only as big as the BasicBlockId.
static_assert(sizeof(BasicBlockId) == sizeof(uint16_t), "Assuming 16 bit BasicBlockId");
// For each loop head, remember the past-the-end index of the end of the loop. 0 if not loop head.
ArenaVector<uint16_t> topological_order_loop_ends_;
// Map BB ids to topological_order_ indexes. 0xffff if not included (hidden or null block).
ArenaVector<uint16_t> topological_order_indexes_;
// Stack of the loop head indexes and recalculation flags for RepeatingTopologicalSortIterator.
ArenaVector<std::pair<uint16_t, bool>> topological_order_loop_head_stack_;
size_t max_nested_loops_;
int* i_dom_list_;
std::unique_ptr<ScopedArenaAllocator> temp_scoped_alloc_;
// Union of temporaries used by different passes.
union {
// Class init check elimination.
struct {
size_t num_class_bits; // 2 bits per class: class initialized and class in dex cache.
ArenaBitVector* work_classes_to_check;
ArenaBitVector** ending_classes_to_check_matrix; // num_blocks_ x num_class_bits.
uint16_t* indexes;
} cice;
// Null check elimination.
struct {
size_t num_vregs;
ArenaBitVector* work_vregs_to_check;
ArenaBitVector** ending_vregs_to_check_matrix; // num_blocks_ x num_vregs.
} nce;
// Special method inlining.
struct {
size_t num_indexes;
ArenaBitVector* processed_indexes;
uint16_t* lowering_infos;
} smi;
// SSA transformation.
struct {
size_t num_vregs;
ArenaBitVector* work_live_vregs;
ArenaBitVector** def_block_matrix; // num_vregs x num_blocks_.
// Map original Dalvik virtual reg i to the current SSA name.
int* vreg_to_ssa_map_; // length == method->registers_size
int* ssa_last_defs_; // length == method->registers_size
} ssa;
// Global value numbering.
struct {
GlobalValueNumbering* gvn;
uint16_t* ifield_ids_; // Part of GVN/LVN but cached here for LVN to avoid recalculation.
uint16_t* sfield_ids_; // Ditto.
} gvn;
// Suspend check elimination.
struct {
DexFileMethodInliner* inliner;
} sce;
} temp_;
static const int kInvalidEntry = -1;
ArenaVector<BasicBlock*> block_list_;
ArenaBitVector* try_block_addr_;
BasicBlock* entry_block_;
BasicBlock* exit_block_;
const DexFile::CodeItem* current_code_item_;
ArenaVector<uint16_t> dex_pc_to_block_map_; // FindBlock lookup cache.
ArenaVector<DexCompilationUnit*> m_units_; // List of methods included in this graph
typedef std::pair<int, int> MIRLocation; // Insert point, (m_unit_ index, offset)
ArenaVector<MIRLocation> method_stack_; // Include stack
int current_method_;
DexOffset current_offset_; // Offset in code units
int def_count_; // Used to estimate size of ssa name storage.
int* opcode_count_; // Dex opcode coverage stats.
int num_ssa_regs_; // Number of names following SSA transformation.
ArenaVector<BasicBlockId> extended_basic_blocks_; // Heads of block "traces".
int method_sreg_;
unsigned int attributes_;
Checkstats* checkstats_;
ArenaAllocator* const arena_;
int backward_branches_;
int forward_branches_;
size_t num_non_special_compiler_temps_; // Keeps track of allocated non-special compiler temps. These are VRs that are in compiler temp region on stack.
size_t max_available_non_special_compiler_temps_; // Keeps track of maximum available non-special temps.
size_t max_available_special_compiler_temps_; // Keeps track of maximum available special temps.
bool requested_backend_temp_; // Keeps track whether BE temps have been requested.
size_t reserved_temps_for_backend_; // Keeps track of the remaining temps that are reserved for BE.
bool compiler_temps_committed_; // Keeps track whether number of temps has been frozen (for example post frame size calculation).
bool punt_to_interpreter_; // Difficult or not worthwhile - just interpret.
uint64_t merged_df_flags_;
ArenaVector<MirIFieldLoweringInfo> ifield_lowering_infos_;
ArenaVector<MirSFieldLoweringInfo> sfield_lowering_infos_;
ArenaVector<MirMethodLoweringInfo> method_lowering_infos_;
// In the suspend check elimination pass we determine for each basic block and enclosing
// loop whether there's guaranteed to be a suspend check on the path from the loop head
// to this block. If so, we can eliminate the back-edge suspend check.
// The bb->id is index into suspend_checks_in_loops_ and the loop head's depth is bit index
// in a suspend_checks_in_loops_[bb->id].
uint32_t* suspend_checks_in_loops_;
static const uint64_t oat_data_flow_attributes_[kMirOpLast];
friend class MirOptimizationTest;
friend class ClassInitCheckEliminationTest;
friend class SuspendCheckEliminationTest;
friend class NullCheckEliminationTest;
friend class GlobalValueNumberingTest;
friend class LocalValueNumberingTest;
friend class TopologicalSortOrderTest;
};
} // namespace art
#endif // ART_COMPILER_DEX_MIR_GRAPH_H_