Mercurial > hg > CbC > CbC_llvm
view mlir/lib/Transforms/ParallelLoopCollapsing.cpp @ 201:a96fbbdf2d0f
...
author | Shinji KONO <kono@ie.u-ryukyu.ac.jp> |
---|---|
date | Fri, 04 Jun 2021 21:07:06 +0900 |
parents | 0572611fdcc8 |
children |
line wrap: on
line source
//===- ParallelLoopCollapsing.cpp - Pass collapsing parallel loop indices -===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// #include "PassDetail.h" #include "mlir/Dialect/SCF/SCF.h" #include "mlir/Transforms/LoopUtils.h" #include "mlir/Transforms/Passes.h" #include "mlir/Transforms/RegionUtils.h" #include "llvm/Support/CommandLine.h" #include "llvm/Support/Debug.h" #define DEBUG_TYPE "parallel-loop-collapsing" using namespace mlir; namespace { struct ParallelLoopCollapsing : public ParallelLoopCollapsingBase<ParallelLoopCollapsing> { void runOnOperation() override { Operation *module = getOperation(); module->walk([&](scf::ParallelOp op) { // The common case for GPU dialect will be simplifying the ParallelOp to 3 // arguments, so we do that here to simplify things. llvm::SmallVector<std::vector<unsigned>, 3> combinedLoops; if (clCollapsedIndices0.size()) combinedLoops.push_back(clCollapsedIndices0); if (clCollapsedIndices1.size()) combinedLoops.push_back(clCollapsedIndices1); if (clCollapsedIndices2.size()) combinedLoops.push_back(clCollapsedIndices2); collapseParallelLoops(op, combinedLoops); }); } }; } // namespace std::unique_ptr<Pass> mlir::createParallelLoopCollapsingPass() { return std::make_unique<ParallelLoopCollapsing>(); }