1*795d594fSAndroid Build Coastguard Worker /* 2*795d594fSAndroid Build Coastguard Worker * Copyright (C) 2018 The Android Open Source Project 3*795d594fSAndroid Build Coastguard Worker * 4*795d594fSAndroid Build Coastguard Worker * Licensed under the Apache License, Version 2.0 (the "License"); 5*795d594fSAndroid Build Coastguard Worker * you may not use this file except in compliance with the License. 6*795d594fSAndroid Build Coastguard Worker * You may obtain a copy of the License at 7*795d594fSAndroid Build Coastguard Worker * 8*795d594fSAndroid Build Coastguard Worker * http://www.apache.org/licenses/LICENSE-2.0 9*795d594fSAndroid Build Coastguard Worker * 10*795d594fSAndroid Build Coastguard Worker * Unless required by applicable law or agreed to in writing, software 11*795d594fSAndroid Build Coastguard Worker * distributed under the License is distributed on an "AS IS" BASIS, 12*795d594fSAndroid Build Coastguard Worker * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 13*795d594fSAndroid Build Coastguard Worker * See the License for the specific language governing permissions and 14*795d594fSAndroid Build Coastguard Worker * limitations under the License. 15*795d594fSAndroid Build Coastguard Worker */ 16*795d594fSAndroid Build Coastguard Worker 17*795d594fSAndroid Build Coastguard Worker #ifndef ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_ 18*795d594fSAndroid Build Coastguard Worker #define ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_ 19*795d594fSAndroid Build Coastguard Worker 20*795d594fSAndroid Build Coastguard Worker #include "base/macros.h" 21*795d594fSAndroid Build Coastguard Worker #include "nodes.h" 22*795d594fSAndroid Build Coastguard Worker 23*795d594fSAndroid Build Coastguard Worker namespace art HIDDEN { 24*795d594fSAndroid Build Coastguard Worker 25*795d594fSAndroid Build Coastguard Worker class CodeGenerator; 26*795d594fSAndroid Build Coastguard Worker class InductionVarRange; 27*795d594fSAndroid Build Coastguard Worker class LoopAnalysis; 28*795d594fSAndroid Build Coastguard Worker 29*795d594fSAndroid Build Coastguard Worker // Class to hold cached information on properties of the loop. 30*795d594fSAndroid Build Coastguard Worker class LoopAnalysisInfo : public ValueObject { 31*795d594fSAndroid Build Coastguard Worker public: 32*795d594fSAndroid Build Coastguard Worker // No loop unrolling factor (just one copy of the loop-body). 33*795d594fSAndroid Build Coastguard Worker static constexpr uint32_t kNoUnrollingFactor = 1; 34*795d594fSAndroid Build Coastguard Worker // Used for unknown and non-constant trip counts (see InductionVarRange::HasKnownTripCount). 35*795d594fSAndroid Build Coastguard Worker static constexpr int64_t kUnknownTripCount = -1; 36*795d594fSAndroid Build Coastguard Worker LoopAnalysisInfo(HLoopInformation * loop_info)37*795d594fSAndroid Build Coastguard Worker explicit LoopAnalysisInfo(HLoopInformation* loop_info) 38*795d594fSAndroid Build Coastguard Worker : trip_count_(kUnknownTripCount), 39*795d594fSAndroid Build Coastguard Worker bb_num_(0), 40*795d594fSAndroid Build Coastguard Worker instr_num_(0), 41*795d594fSAndroid Build Coastguard Worker exits_num_(0), 42*795d594fSAndroid Build Coastguard Worker invariant_exits_num_(0), 43*795d594fSAndroid Build Coastguard Worker has_instructions_preventing_scalar_peeling_(false), 44*795d594fSAndroid Build Coastguard Worker has_instructions_preventing_scalar_unrolling_(false), 45*795d594fSAndroid Build Coastguard Worker has_long_type_instructions_(false), 46*795d594fSAndroid Build Coastguard Worker loop_info_(loop_info) {} 47*795d594fSAndroid Build Coastguard Worker GetTripCount()48*795d594fSAndroid Build Coastguard Worker int64_t GetTripCount() const { return trip_count_; } GetNumberOfBasicBlocks()49*795d594fSAndroid Build Coastguard Worker size_t GetNumberOfBasicBlocks() const { return bb_num_; } GetNumberOfInstructions()50*795d594fSAndroid Build Coastguard Worker size_t GetNumberOfInstructions() const { return instr_num_; } GetNumberOfExits()51*795d594fSAndroid Build Coastguard Worker size_t GetNumberOfExits() const { return exits_num_; } GetNumberOfInvariantExits()52*795d594fSAndroid Build Coastguard Worker size_t GetNumberOfInvariantExits() const { return invariant_exits_num_; } 53*795d594fSAndroid Build Coastguard Worker HasInstructionsPreventingScalarPeeling()54*795d594fSAndroid Build Coastguard Worker bool HasInstructionsPreventingScalarPeeling() const { 55*795d594fSAndroid Build Coastguard Worker return has_instructions_preventing_scalar_peeling_; 56*795d594fSAndroid Build Coastguard Worker } 57*795d594fSAndroid Build Coastguard Worker HasInstructionsPreventingScalarUnrolling()58*795d594fSAndroid Build Coastguard Worker bool HasInstructionsPreventingScalarUnrolling() const { 59*795d594fSAndroid Build Coastguard Worker return has_instructions_preventing_scalar_unrolling_; 60*795d594fSAndroid Build Coastguard Worker } 61*795d594fSAndroid Build Coastguard Worker HasInstructionsPreventingScalarOpts()62*795d594fSAndroid Build Coastguard Worker bool HasInstructionsPreventingScalarOpts() const { 63*795d594fSAndroid Build Coastguard Worker return HasInstructionsPreventingScalarPeeling() || HasInstructionsPreventingScalarUnrolling(); 64*795d594fSAndroid Build Coastguard Worker } 65*795d594fSAndroid Build Coastguard Worker HasLongTypeInstructions()66*795d594fSAndroid Build Coastguard Worker bool HasLongTypeInstructions() const { 67*795d594fSAndroid Build Coastguard Worker return has_long_type_instructions_; 68*795d594fSAndroid Build Coastguard Worker } 69*795d594fSAndroid Build Coastguard Worker GetLoopInfo()70*795d594fSAndroid Build Coastguard Worker HLoopInformation* GetLoopInfo() const { return loop_info_; } 71*795d594fSAndroid Build Coastguard Worker 72*795d594fSAndroid Build Coastguard Worker private: 73*795d594fSAndroid Build Coastguard Worker // Trip count of the loop if known, kUnknownTripCount otherwise. 74*795d594fSAndroid Build Coastguard Worker int64_t trip_count_; 75*795d594fSAndroid Build Coastguard Worker // Number of basic blocks in the loop body. 76*795d594fSAndroid Build Coastguard Worker size_t bb_num_; 77*795d594fSAndroid Build Coastguard Worker // Number of instructions in the loop body. 78*795d594fSAndroid Build Coastguard Worker size_t instr_num_; 79*795d594fSAndroid Build Coastguard Worker // Number of loop's exits. 80*795d594fSAndroid Build Coastguard Worker size_t exits_num_; 81*795d594fSAndroid Build Coastguard Worker // Number of "if" loop exits (with HIf instruction) whose condition is loop-invariant. 82*795d594fSAndroid Build Coastguard Worker size_t invariant_exits_num_; 83*795d594fSAndroid Build Coastguard Worker // Whether the loop has instructions which make scalar loop peeling non-beneficial. 84*795d594fSAndroid Build Coastguard Worker bool has_instructions_preventing_scalar_peeling_; 85*795d594fSAndroid Build Coastguard Worker // Whether the loop has instructions which make scalar loop unrolling non-beneficial. 86*795d594fSAndroid Build Coastguard Worker bool has_instructions_preventing_scalar_unrolling_; 87*795d594fSAndroid Build Coastguard Worker // Whether the loop has instructions of primitive long type; unrolling these loop will 88*795d594fSAndroid Build Coastguard Worker // likely introduce spill/fills on 32-bit targets. 89*795d594fSAndroid Build Coastguard Worker bool has_long_type_instructions_; 90*795d594fSAndroid Build Coastguard Worker 91*795d594fSAndroid Build Coastguard Worker // Corresponding HLoopInformation. 92*795d594fSAndroid Build Coastguard Worker HLoopInformation* loop_info_; 93*795d594fSAndroid Build Coastguard Worker 94*795d594fSAndroid Build Coastguard Worker friend class LoopAnalysis; 95*795d594fSAndroid Build Coastguard Worker }; 96*795d594fSAndroid Build Coastguard Worker 97*795d594fSAndroid Build Coastguard Worker // Placeholder class for methods and routines used to analyse loops, calculate loop properties 98*795d594fSAndroid Build Coastguard Worker // and characteristics. 99*795d594fSAndroid Build Coastguard Worker class LoopAnalysis : public ValueObject { 100*795d594fSAndroid Build Coastguard Worker public: 101*795d594fSAndroid Build Coastguard Worker // Calculates loops basic properties like body size, exits number, etc. and fills 102*795d594fSAndroid Build Coastguard Worker // 'analysis_results' with this information. 103*795d594fSAndroid Build Coastguard Worker static void CalculateLoopBasicProperties(HLoopInformation* loop_info, 104*795d594fSAndroid Build Coastguard Worker LoopAnalysisInfo* analysis_results, 105*795d594fSAndroid Build Coastguard Worker int64_t trip_count); 106*795d594fSAndroid Build Coastguard Worker 107*795d594fSAndroid Build Coastguard Worker // Returns the trip count of the loop if it is known and kUnknownTripCount otherwise. 108*795d594fSAndroid Build Coastguard Worker static int64_t GetLoopTripCount(HLoopInformation* loop_info, 109*795d594fSAndroid Build Coastguard Worker const InductionVarRange* induction_range); 110*795d594fSAndroid Build Coastguard Worker 111*795d594fSAndroid Build Coastguard Worker private: 112*795d594fSAndroid Build Coastguard Worker // Returns whether an instruction makes scalar loop peeling/unrolling non-beneficial. 113*795d594fSAndroid Build Coastguard Worker // 114*795d594fSAndroid Build Coastguard Worker // If in the loop body we have a dex/runtime call then its contribution to the whole 115*795d594fSAndroid Build Coastguard Worker // loop performance will probably prevail. So peeling/unrolling optimization will not bring 116*795d594fSAndroid Build Coastguard Worker // any noticeable performance improvement. It will increase the code size. MakesScalarPeelingUnrollingNonBeneficial(HInstruction * instruction)117*795d594fSAndroid Build Coastguard Worker static bool MakesScalarPeelingUnrollingNonBeneficial(HInstruction* instruction) { 118*795d594fSAndroid Build Coastguard Worker return (instruction->IsNewArray() || 119*795d594fSAndroid Build Coastguard Worker instruction->IsNewInstance() || 120*795d594fSAndroid Build Coastguard Worker instruction->IsUnresolvedInstanceFieldGet() || 121*795d594fSAndroid Build Coastguard Worker instruction->IsUnresolvedInstanceFieldSet() || 122*795d594fSAndroid Build Coastguard Worker instruction->IsUnresolvedStaticFieldGet() || 123*795d594fSAndroid Build Coastguard Worker instruction->IsUnresolvedStaticFieldSet() || 124*795d594fSAndroid Build Coastguard Worker // TODO: Support loops with intrinsified invokes. 125*795d594fSAndroid Build Coastguard Worker instruction->IsInvoke()); 126*795d594fSAndroid Build Coastguard Worker } 127*795d594fSAndroid Build Coastguard Worker }; 128*795d594fSAndroid Build Coastguard Worker 129*795d594fSAndroid Build Coastguard Worker // 130*795d594fSAndroid Build Coastguard Worker // Helper class which holds target-dependent methods and constants needed for loop optimizations. 131*795d594fSAndroid Build Coastguard Worker // 132*795d594fSAndroid Build Coastguard Worker // To support peeling/unrolling for a new architecture one needs to create new helper class, 133*795d594fSAndroid Build Coastguard Worker // inherit it from this and add implementation for the following methods. 134*795d594fSAndroid Build Coastguard Worker // 135*795d594fSAndroid Build Coastguard Worker class ArchNoOptsLoopHelper : public ArenaObject<kArenaAllocOptimization> { 136*795d594fSAndroid Build Coastguard Worker public: ArchNoOptsLoopHelper(const CodeGenerator & codegen)137*795d594fSAndroid Build Coastguard Worker explicit ArchNoOptsLoopHelper(const CodeGenerator& codegen) : codegen_(codegen) {} ~ArchNoOptsLoopHelper()138*795d594fSAndroid Build Coastguard Worker virtual ~ArchNoOptsLoopHelper() {} 139*795d594fSAndroid Build Coastguard Worker 140*795d594fSAndroid Build Coastguard Worker // Creates an instance of specialised helper for the target or default helper if the target 141*795d594fSAndroid Build Coastguard Worker // doesn't support loop peeling and unrolling. 142*795d594fSAndroid Build Coastguard Worker static ArchNoOptsLoopHelper* Create(const CodeGenerator& codegen, ArenaAllocator* allocator); 143*795d594fSAndroid Build Coastguard Worker 144*795d594fSAndroid Build Coastguard Worker // Returns whether the loop is not beneficial for loop peeling/unrolling. 145*795d594fSAndroid Build Coastguard Worker // 146*795d594fSAndroid Build Coastguard Worker // For example, if the loop body has too many instructions then peeling/unrolling optimization 147*795d594fSAndroid Build Coastguard Worker // will not bring any noticeable performance improvement however will increase the code size. 148*795d594fSAndroid Build Coastguard Worker // 149*795d594fSAndroid Build Coastguard Worker // Returns 'true' by default, should be overridden by particular target loop helper. IsLoopNonBeneficialForScalarOpts(LoopAnalysisInfo * loop_analysis_info)150*795d594fSAndroid Build Coastguard Worker virtual bool IsLoopNonBeneficialForScalarOpts( 151*795d594fSAndroid Build Coastguard Worker [[maybe_unused]] LoopAnalysisInfo* loop_analysis_info) const { 152*795d594fSAndroid Build Coastguard Worker return true; 153*795d594fSAndroid Build Coastguard Worker } 154*795d594fSAndroid Build Coastguard Worker 155*795d594fSAndroid Build Coastguard Worker // Returns optimal scalar unrolling factor for the loop. 156*795d594fSAndroid Build Coastguard Worker // 157*795d594fSAndroid Build Coastguard Worker // Returns kNoUnrollingFactor by default, should be overridden by particular target loop helper. GetScalarUnrollingFactor(const LoopAnalysisInfo * analysis_info)158*795d594fSAndroid Build Coastguard Worker virtual uint32_t GetScalarUnrollingFactor( 159*795d594fSAndroid Build Coastguard Worker [[maybe_unused]] const LoopAnalysisInfo* analysis_info) const { 160*795d594fSAndroid Build Coastguard Worker return LoopAnalysisInfo::kNoUnrollingFactor; 161*795d594fSAndroid Build Coastguard Worker } 162*795d594fSAndroid Build Coastguard Worker 163*795d594fSAndroid Build Coastguard Worker // Returns whether scalar loop peeling is enabled, 164*795d594fSAndroid Build Coastguard Worker // 165*795d594fSAndroid Build Coastguard Worker // Returns 'false' by default, should be overridden by particular target loop helper. IsLoopPeelingEnabled()166*795d594fSAndroid Build Coastguard Worker virtual bool IsLoopPeelingEnabled() const { return false; } 167*795d594fSAndroid Build Coastguard Worker 168*795d594fSAndroid Build Coastguard Worker // Returns whether it is beneficial to fully unroll the loop. 169*795d594fSAndroid Build Coastguard Worker // 170*795d594fSAndroid Build Coastguard Worker // Returns 'false' by default, should be overridden by particular target loop helper. IsFullUnrollingBeneficial(LoopAnalysisInfo * analysis_info)171*795d594fSAndroid Build Coastguard Worker virtual bool IsFullUnrollingBeneficial([[maybe_unused]] LoopAnalysisInfo* analysis_info) const { 172*795d594fSAndroid Build Coastguard Worker return false; 173*795d594fSAndroid Build Coastguard Worker } 174*795d594fSAndroid Build Coastguard Worker 175*795d594fSAndroid Build Coastguard Worker // Returns optimal SIMD unrolling factor for the loop. 176*795d594fSAndroid Build Coastguard Worker // 177*795d594fSAndroid Build Coastguard Worker // Returns kNoUnrollingFactor by default, should be overridden by particular target loop helper. GetSIMDUnrollingFactor(HBasicBlock * block,int64_t trip_count,uint32_t max_peel,uint32_t vector_length)178*795d594fSAndroid Build Coastguard Worker virtual uint32_t GetSIMDUnrollingFactor([[maybe_unused]] HBasicBlock* block, 179*795d594fSAndroid Build Coastguard Worker [[maybe_unused]] int64_t trip_count, 180*795d594fSAndroid Build Coastguard Worker [[maybe_unused]] uint32_t max_peel, 181*795d594fSAndroid Build Coastguard Worker [[maybe_unused]] uint32_t vector_length) const { 182*795d594fSAndroid Build Coastguard Worker return LoopAnalysisInfo::kNoUnrollingFactor; 183*795d594fSAndroid Build Coastguard Worker } 184*795d594fSAndroid Build Coastguard Worker 185*795d594fSAndroid Build Coastguard Worker protected: 186*795d594fSAndroid Build Coastguard Worker const CodeGenerator& codegen_; 187*795d594fSAndroid Build Coastguard Worker }; 188*795d594fSAndroid Build Coastguard Worker 189*795d594fSAndroid Build Coastguard Worker } // namespace art 190*795d594fSAndroid Build Coastguard Worker 191*795d594fSAndroid Build Coastguard Worker #endif // ART_COMPILER_OPTIMIZING_LOOP_ANALYSIS_H_ 192