-
Notifications
You must be signed in to change notification settings - Fork 10.8k
/
NVVMAttachTarget.cpp
86 lines (76 loc) · 2.94 KB
/
NVVMAttachTarget.cpp
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
//===- NVVMAttachTarget.cpp - Attach an NVVM target -----------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file implements the `GpuNVVMAttachTarget` pass, attaching `#nvvm.target`
// attributes to GPU modules.
//
//===----------------------------------------------------------------------===//
#include "mlir/Dialect/GPU/Transforms/Passes.h"
#include "mlir/Dialect/GPU/IR/GPUDialect.h"
#include "mlir/Dialect/LLVMIR/NVVMDialect.h"
#include "mlir/IR/Builders.h"
#include "mlir/Pass/Pass.h"
#include "mlir/Target/LLVM/NVVM/Target.h"
#include "llvm/Support/Regex.h"
namespace mlir {
#define GEN_PASS_DEF_GPUNVVMATTACHTARGET
#include "mlir/Dialect/GPU/Transforms/Passes.h.inc"
} // namespace mlir
using namespace mlir;
using namespace mlir::NVVM;
namespace {
struct NVVMAttachTarget
: public impl::GpuNVVMAttachTargetBase<NVVMAttachTarget> {
using Base::Base;
DictionaryAttr getFlags(OpBuilder &builder) const;
void runOnOperation() override;
void getDependentDialects(DialectRegistry ®istry) const override {
registry.insert<NVVM::NVVMDialect>();
}
};
} // namespace
DictionaryAttr NVVMAttachTarget::getFlags(OpBuilder &builder) const {
UnitAttr unitAttr = builder.getUnitAttr();
SmallVector<NamedAttribute, 2> flags;
auto addFlag = [&](StringRef flag) {
flags.push_back(builder.getNamedAttr(flag, unitAttr));
};
if (fastFlag)
addFlag("fast");
if (ftzFlag)
addFlag("ftz");
if (!flags.empty())
return builder.getDictionaryAttr(flags);
return nullptr;
}
void NVVMAttachTarget::runOnOperation() {
OpBuilder builder(&getContext());
ArrayRef<std::string> libs(linkLibs);
SmallVector<StringRef> filesToLink(libs.begin(), libs.end());
auto target = builder.getAttr<NVVMTargetAttr>(
optLevel, triple, chip, features, getFlags(builder),
filesToLink.empty() ? nullptr : builder.getStrArrayAttr(filesToLink));
llvm::Regex matcher(moduleMatcher);
for (Region ®ion : getOperation()->getRegions())
for (Block &block : region.getBlocks())
for (auto module : block.getOps<gpu::GPUModuleOp>()) {
// Check if the name of the module matches.
if (!moduleMatcher.empty() && !matcher.match(module.getName()))
continue;
// Create the target array.
SmallVector<Attribute> targets;
if (std::optional<ArrayAttr> attrs = module.getTargets())
targets.append(attrs->getValue().begin(), attrs->getValue().end());
targets.push_back(target);
// Remove any duplicate targets.
targets.erase(std::unique(targets.begin(), targets.end()),
targets.end());
// Update the target attribute array.
module.setTargetsAttr(builder.getArrayAttr(targets));
}
}