| 1 | // Copyright (c) 2018 Google LLC. |
| 2 | // |
| 3 | // Licensed under the Apache License, Version 2.0 (the "License"); |
| 4 | // you may not use this file except in compliance with the License. |
| 5 | // You may obtain a copy of the License at |
| 6 | // |
| 7 | // http://www.apache.org/licenses/LICENSE-2.0 |
| 8 | // |
| 9 | // Unless required by applicable law or agreed to in writing, software |
| 10 | // distributed under the License is distributed on an "AS IS" BASIS, |
| 11 | // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| 12 | // See the License for the specific language governing permissions and |
| 13 | // limitations under the License. |
| 14 | |
| 15 | #ifndef SOURCE_OPT_LOOP_FUSION_H_ |
| 16 | #define SOURCE_OPT_LOOP_FUSION_H_ |
| 17 | |
| 18 | #include <map> |
| 19 | #include <set> |
| 20 | #include <utility> |
| 21 | #include <vector> |
| 22 | |
| 23 | #include "source/opt/ir_context.h" |
| 24 | #include "source/opt/loop_descriptor.h" |
| 25 | #include "source/opt/loop_utils.h" |
| 26 | #include "source/opt/scalar_analysis.h" |
| 27 | |
| 28 | namespace spvtools { |
| 29 | namespace opt { |
| 30 | |
| 31 | class LoopFusion { |
| 32 | public: |
| 33 | LoopFusion(IRContext* context, Loop* loop_0, Loop* loop_1) |
| 34 | : context_(context), |
| 35 | loop_0_(loop_0), |
| 36 | loop_1_(loop_1), |
| 37 | containing_function_(loop_0->GetHeaderBlock()->GetParent()) {} |
| 38 | |
| 39 | // Checks if the |loop_0| and |loop_1| are compatible for fusion. |
| 40 | // That means: |
| 41 | // * they both have one induction variable |
| 42 | // * they have the same upper and lower bounds |
| 43 | // - same inital value |
| 44 | // - same condition |
| 45 | // * they have the same update step |
| 46 | // * they are adjacent, with |loop_0| appearing before |loop_1| |
| 47 | // * there are no break/continue in either of them |
| 48 | // * they both have pre-header blocks (required for ScalarEvolutionAnalysis |
| 49 | // and dependence checking). |
| 50 | bool AreCompatible(); |
| 51 | |
| 52 | // Checks if compatible |loop_0| and |loop_1| are legal to fuse. |
| 53 | // * fused loops do not have any dependencies with dependence distance greater |
| 54 | // than 0 that did not exist in the original loops. |
| 55 | // * there are no function calls in the loops (could have side-effects) |
| 56 | bool IsLegal(); |
| 57 | |
| 58 | // Perform the actual fusion of |loop_0_| and |loop_1_|. The loops have to be |
| 59 | // compatible and the fusion has to be legal. |
| 60 | void Fuse(); |
| 61 | |
| 62 | private: |
| 63 | // Check that the initial values are the same. |
| 64 | bool CheckInit(); |
| 65 | |
| 66 | // Check that the conditions are the same. |
| 67 | bool CheckCondition(); |
| 68 | |
| 69 | // Check that the steps are the same. |
| 70 | bool CheckStep(); |
| 71 | |
| 72 | // Returns |true| if |instruction| is used in the continue or condition block |
| 73 | // of |loop|. |
| 74 | bool UsedInContinueOrConditionBlock(Instruction* instruction, Loop* loop); |
| 75 | |
| 76 | // Remove entries in |instructions| that are not used in the continue or |
| 77 | // condition block of |loop|. |
| 78 | void RemoveIfNotUsedContinueOrConditionBlock( |
| 79 | std::vector<Instruction*>* instructions, Loop* loop); |
| 80 | |
| 81 | // Returns |true| if |instruction| is used in |loop|. |
| 82 | bool IsUsedInLoop(Instruction* instruction, Loop* loop); |
| 83 | |
| 84 | // Returns |true| if |loop| has at least one barrier or function call. |
| 85 | bool ContainsBarriersOrFunctionCalls(Loop* loop); |
| 86 | |
| 87 | // Get all instructions in the |loop| (except in the latch block) that have |
| 88 | // the opcode |opcode|. |
| 89 | std::pair<std::vector<Instruction*>, std::vector<Instruction*>> |
| 90 | GetLoadsAndStoresInLoop(Loop* loop); |
| 91 | |
| 92 | // Given a vector of memory operations (OpLoad/OpStore), constructs a map from |
| 93 | // variables to the loads/stores that those variables. |
| 94 | std::map<Instruction*, std::vector<Instruction*>> LocationToMemOps( |
| 95 | const std::vector<Instruction*>& mem_ops); |
| 96 | |
| 97 | IRContext* context_; |
| 98 | |
| 99 | // The original loops to be fused. |
| 100 | Loop* loop_0_; |
| 101 | Loop* loop_1_; |
| 102 | |
| 103 | // The function that contains |loop_0_| and |loop_1_|. |
| 104 | Function* containing_function_ = nullptr; |
| 105 | |
| 106 | // The induction variables for |loop_0_| and |loop_1_|. |
| 107 | Instruction* induction_0_ = nullptr; |
| 108 | Instruction* induction_1_ = nullptr; |
| 109 | }; |
| 110 | |
| 111 | } // namespace opt |
| 112 | } // namespace spvtools |
| 113 | |
| 114 | #endif // SOURCE_OPT_LOOP_FUSION_H_ |
| 115 | |