1 | //===- OpToFuncCallLowering.h - GPU ops lowering to custom calls *- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | #ifndef MLIR_CONVERSION_GPUCOMMON_OPTOFUNCCALLLOWERING_H_ |
9 | #define MLIR_CONVERSION_GPUCOMMON_OPTOFUNCCALLLOWERING_H_ |
10 | |
11 | #include "mlir/Conversion/LLVMCommon/Pattern.h" |
12 | #include "mlir/Dialect/GPU/IR/GPUDialect.h" |
13 | #include "mlir/Dialect/LLVMIR/LLVMDialect.h" |
14 | #include "mlir/IR/Builders.h" |
15 | |
16 | namespace mlir { |
17 | |
18 | /// Rewriting that replace SourceOp with a CallOp to `f32Func` or `f64Func` |
19 | /// depending on the element type that Op operates upon. The function |
20 | /// declaration is added in case it was not added before. |
21 | /// |
22 | /// If the input values are of f16 type, the value is first casted to f32, the |
23 | /// function called and then the result casted back. |
24 | /// |
25 | /// Example with NVVM: |
26 | /// %exp_f32 = math.exp %arg_f32 : f32 |
27 | /// |
28 | /// will be transformed into |
29 | /// llvm.call @__nv_expf(%arg_f32) : (f32) -> f32 |
30 | template <typename SourceOp> |
31 | struct OpToFuncCallLowering : public ConvertOpToLLVMPattern<SourceOp> { |
32 | public: |
33 | explicit OpToFuncCallLowering(LLVMTypeConverter &lowering, StringRef f32Func, |
34 | StringRef f64Func) |
35 | : ConvertOpToLLVMPattern<SourceOp>(lowering), f32Func(f32Func), |
36 | f64Func(f64Func) {} |
37 | |
38 | LogicalResult |
39 | matchAndRewrite(SourceOp op, typename SourceOp::Adaptor adaptor, |
40 | ConversionPatternRewriter &rewriter) const override { |
41 | using LLVM::LLVMFuncOp; |
42 | |
43 | static_assert( |
44 | std::is_base_of<OpTrait::OneResult<SourceOp>, SourceOp>::value, |
45 | "expected single result op" ); |
46 | |
47 | static_assert(std::is_base_of<OpTrait::SameOperandsAndResultType<SourceOp>, |
48 | SourceOp>::value, |
49 | "expected op with same operand and result types" ); |
50 | |
51 | SmallVector<Value, 1> castedOperands; |
52 | for (Value operand : adaptor.getOperands()) |
53 | castedOperands.push_back(Elt: maybeCast(operand, rewriter)); |
54 | |
55 | Type resultType = castedOperands.front().getType(); |
56 | Type funcType = getFunctionType(resultType, operands: castedOperands); |
57 | StringRef funcName = |
58 | getFunctionName(type: cast<LLVM::LLVMFunctionType>(funcType).getReturnType()); |
59 | if (funcName.empty()) |
60 | return failure(); |
61 | |
62 | LLVMFuncOp funcOp = appendOrGetFuncOp(funcName, funcType, op); |
63 | auto callOp = |
64 | rewriter.create<LLVM::CallOp>(op->getLoc(), funcOp, castedOperands); |
65 | |
66 | if (resultType == adaptor.getOperands().front().getType()) { |
67 | rewriter.replaceOp(op, {callOp.getResult()}); |
68 | return success(); |
69 | } |
70 | |
71 | Value truncated = rewriter.create<LLVM::FPTruncOp>( |
72 | op->getLoc(), adaptor.getOperands().front().getType(), |
73 | callOp.getResult()); |
74 | rewriter.replaceOp(op, {truncated}); |
75 | return success(); |
76 | } |
77 | |
78 | private: |
79 | Value maybeCast(Value operand, PatternRewriter &rewriter) const { |
80 | Type type = operand.getType(); |
81 | if (!isa<Float16Type>(type)) |
82 | return operand; |
83 | |
84 | return rewriter.create<LLVM::FPExtOp>( |
85 | operand.getLoc(), Float32Type::get(rewriter.getContext()), operand); |
86 | } |
87 | |
88 | Type getFunctionType(Type resultType, ValueRange operands) const { |
89 | SmallVector<Type> operandTypes(operands.getTypes()); |
90 | return LLVM::LLVMFunctionType::get(resultType, operandTypes); |
91 | } |
92 | |
93 | StringRef getFunctionName(Type type) const { |
94 | if (isa<Float32Type>(type)) |
95 | return f32Func; |
96 | if (isa<Float64Type>(type)) |
97 | return f64Func; |
98 | return "" ; |
99 | } |
100 | |
101 | LLVM::LLVMFuncOp appendOrGetFuncOp(StringRef funcName, Type funcType, |
102 | Operation *op) const { |
103 | using LLVM::LLVMFuncOp; |
104 | |
105 | auto funcAttr = StringAttr::get(op->getContext(), funcName); |
106 | Operation *funcOp = SymbolTable::lookupNearestSymbolFrom(op, funcAttr); |
107 | if (funcOp) |
108 | return cast<LLVMFuncOp>(*funcOp); |
109 | |
110 | mlir::OpBuilder b(op->getParentOfType<FunctionOpInterface>()); |
111 | return b.create<LLVMFuncOp>(op->getLoc(), funcName, funcType); |
112 | } |
113 | |
114 | const std::string f32Func; |
115 | const std::string f64Func; |
116 | }; |
117 | |
118 | } // namespace mlir |
119 | |
120 | #endif // MLIR_CONVERSION_GPUCOMMON_OPTOFUNCCALLLOWERING_H_ |
121 | |