| // Copyright (c) 2021 Google LLC. |
| // |
| // Licensed under the Apache License, Version 2.0 (the "License"); |
| // you may not use this file except in compliance with the License. |
| // You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, software |
| // distributed under the License is distributed on an "AS IS" BASIS, |
| // WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| // See the License for the specific language governing permissions and |
| // limitations under the License. |
| |
| #ifndef SOURCE_LINT_DIVERGENCE_ANALYSIS_H_ |
| #define SOURCE_LINT_DIVERGENCE_ANALYSIS_H_ |
| |
| #include <cstdint> |
| #include <ostream> |
| #include <unordered_map> |
| |
| #include "source/opt/basic_block.h" |
| #include "source/opt/control_dependence.h" |
| #include "source/opt/dataflow.h" |
| #include "source/opt/function.h" |
| #include "source/opt/instruction.h" |
| |
| namespace spvtools { |
| namespace lint { |
| |
| // Computes the static divergence level for blocks (control flow) and values. |
| // |
| // A value is uniform if all threads that execute it are guaranteed to have the |
| // same value. Similarly, a value is partially uniform if this is true only |
| // within each derivative group. If neither apply, it is divergent. |
| // |
| // Control flow through a block is uniform if for any possible execution and |
| // point in time, all threads are executing it, or no threads are executing it. |
| // In particular, it is never possible for some threads to be inside the block |
| // and some threads not executing. |
| // TODO(kuhar): Clarify the difference between uniform, divergent, and |
| // partially-uniform execution in this analysis. |
| // |
| // Caveat: |
| // As we use control dependence to determine how divergence is propagated, this |
| // analysis can be overly permissive when the merge block for a conditional |
| // branch or switch is later than (strictly postdominates) the expected merge |
| // block, which is the immediate postdominator. However, this is not expected to |
| // be a problem in practice, given that SPIR-V is generally output by compilers |
| // and other automated tools, which would assign the earliest possible merge |
| // block, rather than written by hand. |
| // TODO(kuhar): Handle late merges. |
| class DivergenceAnalysis : public opt::ForwardDataFlowAnalysis { |
| public: |
| // The tightest (most uniform) level of divergence that can be determined |
| // statically for a value or control flow for a block. |
| // |
| // The values are ordered such that A > B means that A is potentially more |
| // divergent than B. |
| // TODO(kuhar): Rename |PartiallyUniform' to something less confusing. For |
| // example, the enum could be based on scopes. |
| enum class DivergenceLevel { |
| // The value or control flow is uniform across the entire invocation group. |
| kUniform = 0, |
| // The value or control flow is uniform across the derivative group, but not |
| // the invocation group. |
| kPartiallyUniform = 1, |
| // The value or control flow is not statically uniform. |
| kDivergent = 2, |
| }; |
| |
| DivergenceAnalysis(opt::IRContext& context) |
| : ForwardDataFlowAnalysis(context, LabelPosition::kLabelsAtEnd) {} |
| |
| // Returns the divergence level for the given value (non-label instructions), |
| // or control flow for the given block. |
| DivergenceLevel GetDivergenceLevel(uint32_t id) { |
| auto it = divergence_.find(id); |
| if (it == divergence_.end()) { |
| return DivergenceLevel::kUniform; |
| } |
| return it->second; |
| } |
| |
| // Returns the divergence source for the given id. The following types of |
| // divergence flows from A to B are possible: |
| // |
| // data -> data: A is used as an operand in the definition of B. |
| // data -> control: B is control-dependent on a branch with condition A. |
| // control -> data: B is a OpPhi instruction in which A is a block operand. |
| // control -> control: B is control-dependent on A. |
| uint32_t GetDivergenceSource(uint32_t id) { |
| auto it = divergence_source_.find(id); |
| if (it == divergence_source_.end()) { |
| return 0; |
| } |
| return it->second; |
| } |
| |
| // Returns the dependence source for the control dependence for the given id. |
| // This only exists for data -> control edges. |
| // |
| // In other words, if block 2 is dependent on block 1 due to value 3 (e.g. |
| // block 1 terminates with OpBranchConditional %3 %2 %4): |
| // * GetDivergenceSource(2) = 3 |
| // * GetDivergenceDependenceSource(2) = 1 |
| // |
| // Returns 0 if not applicable. |
| uint32_t GetDivergenceDependenceSource(uint32_t id) { |
| auto it = divergence_dependence_source_.find(id); |
| if (it == divergence_dependence_source_.end()) { |
| return 0; |
| } |
| return it->second; |
| } |
| |
| void InitializeWorklist(opt::Function* function, |
| bool is_first_iteration) override { |
| // Since |EnqueueSuccessors| is complete, we only need one pass. |
| if (is_first_iteration) { |
| Setup(function); |
| opt::ForwardDataFlowAnalysis::InitializeWorklist(function, true); |
| } |
| } |
| |
| void EnqueueSuccessors(opt::Instruction* inst) override; |
| |
| VisitResult Visit(opt::Instruction* inst) override; |
| |
| private: |
| VisitResult VisitBlock(uint32_t id); |
| VisitResult VisitInstruction(opt::Instruction* inst); |
| |
| // Computes the divergence level for the result of the given instruction |
| // based on the current state of the analysis. This is always an |
| // underapproximation, which will be improved as the analysis proceeds. |
| DivergenceLevel ComputeInstructionDivergence(opt::Instruction* inst); |
| |
| // Computes the divergence level for a variable, which is used for loads. |
| DivergenceLevel ComputeVariableDivergence(opt::Instruction* var); |
| |
| // Initializes data structures for performing dataflow on the given function. |
| void Setup(opt::Function* function); |
| |
| std::unordered_map<uint32_t, DivergenceLevel> divergence_; |
| std::unordered_map<uint32_t, uint32_t> divergence_source_; |
| std::unordered_map<uint32_t, uint32_t> divergence_dependence_source_; |
| |
| // Stores the result of following unconditional branches starting from the |
| // given block. This is used to detect when reconvergence needs to be |
| // accounted for. |
| std::unordered_map<uint32_t, uint32_t> follow_unconditional_branches_; |
| |
| opt::ControlDependenceAnalysis cd_; |
| }; |
| |
| std::ostream& operator<<(std::ostream& os, |
| DivergenceAnalysis::DivergenceLevel level); |
| |
| } // namespace lint |
| } // namespace spvtools |
| |
| #endif // SOURCE_LINT_DIVERGENCE_ANALYSIS_H_ |