| 1 | //===----- CGHLSLRuntime.cpp - Interface to HLSL Runtimes -----------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This provides an abstract class for HLSL code generation. Concrete |
| 10 | // subclasses of this implement code generation for specific HLSL |
| 11 | // runtime libraries. |
| 12 | // |
| 13 | //===----------------------------------------------------------------------===// |
| 14 | |
| 15 | #include "CGHLSLRuntime.h" |
| 16 | #include "CGDebugInfo.h" |
| 17 | #include "CodeGenFunction.h" |
| 18 | #include "CodeGenModule.h" |
| 19 | #include "TargetInfo.h" |
| 20 | #include "clang/AST/ASTContext.h" |
| 21 | #include "clang/AST/Decl.h" |
| 22 | #include "clang/AST/RecursiveASTVisitor.h" |
| 23 | #include "clang/AST/Type.h" |
| 24 | #include "clang/Basic/TargetOptions.h" |
| 25 | #include "llvm/ADT/SmallVector.h" |
| 26 | #include "llvm/Frontend/HLSL/HLSLRootSignatureUtils.h" |
| 27 | #include "llvm/IR/Constants.h" |
| 28 | #include "llvm/IR/DerivedTypes.h" |
| 29 | #include "llvm/IR/GlobalVariable.h" |
| 30 | #include "llvm/IR/LLVMContext.h" |
| 31 | #include "llvm/IR/Metadata.h" |
| 32 | #include "llvm/IR/Module.h" |
| 33 | #include "llvm/IR/Type.h" |
| 34 | #include "llvm/IR/Value.h" |
| 35 | #include "llvm/Support/Alignment.h" |
| 36 | #include "llvm/Support/ErrorHandling.h" |
| 37 | #include "llvm/Support/FormatVariadic.h" |
| 38 | #include <utility> |
| 39 | |
| 40 | using namespace clang; |
| 41 | using namespace CodeGen; |
| 42 | using namespace clang::hlsl; |
| 43 | using namespace llvm; |
| 44 | |
| 45 | using llvm::hlsl::CBufferRowSizeInBytes; |
| 46 | |
| 47 | namespace { |
| 48 | |
| 49 | void addDxilValVersion(StringRef ValVersionStr, llvm::Module &M) { |
| 50 | // The validation of ValVersionStr is done at HLSLToolChain::TranslateArgs. |
| 51 | // Assume ValVersionStr is legal here. |
| 52 | VersionTuple Version; |
| 53 | if (Version.tryParse(string: ValVersionStr) || Version.getBuild() || |
| 54 | Version.getSubminor() || !Version.getMinor()) { |
| 55 | return; |
| 56 | } |
| 57 | |
| 58 | uint64_t Major = Version.getMajor(); |
| 59 | uint64_t Minor = *Version.getMinor(); |
| 60 | |
| 61 | auto &Ctx = M.getContext(); |
| 62 | IRBuilder<> B(M.getContext()); |
| 63 | MDNode *Val = MDNode::get(Context&: Ctx, MDs: {ConstantAsMetadata::get(C: B.getInt32(C: Major)), |
| 64 | ConstantAsMetadata::get(C: B.getInt32(C: Minor))}); |
| 65 | StringRef DXILValKey = "dx.valver" ; |
| 66 | auto *DXILValMD = M.getOrInsertNamedMetadata(Name: DXILValKey); |
| 67 | DXILValMD->addOperand(M: Val); |
| 68 | } |
| 69 | |
| 70 | void addRootSignature(ArrayRef<llvm::hlsl::rootsig::RootElement> Elements, |
| 71 | llvm::Function *Fn, llvm::Module &M) { |
| 72 | auto &Ctx = M.getContext(); |
| 73 | |
| 74 | llvm::hlsl::rootsig::MetadataBuilder Builder(Ctx, Elements); |
| 75 | MDNode *RootSignature = Builder.BuildRootSignature(); |
| 76 | MDNode *FnPairing = |
| 77 | MDNode::get(Context&: Ctx, MDs: {ValueAsMetadata::get(V: Fn), RootSignature}); |
| 78 | |
| 79 | StringRef RootSignatureValKey = "dx.rootsignatures" ; |
| 80 | auto *RootSignatureValMD = M.getOrInsertNamedMetadata(Name: RootSignatureValKey); |
| 81 | RootSignatureValMD->addOperand(M: FnPairing); |
| 82 | } |
| 83 | |
| 84 | } // namespace |
| 85 | |
| 86 | llvm::Type * |
| 87 | CGHLSLRuntime::convertHLSLSpecificType(const Type *T, |
| 88 | SmallVector<int32_t> *Packoffsets) { |
| 89 | assert(T->isHLSLSpecificType() && "Not an HLSL specific type!" ); |
| 90 | |
| 91 | // Check if the target has a specific translation for this type first. |
| 92 | if (llvm::Type *TargetTy = |
| 93 | CGM.getTargetCodeGenInfo().getHLSLType(CGM, T, Packoffsets)) |
| 94 | return TargetTy; |
| 95 | |
| 96 | llvm_unreachable("Generic handling of HLSL types is not supported." ); |
| 97 | } |
| 98 | |
| 99 | llvm::Triple::ArchType CGHLSLRuntime::getArch() { |
| 100 | return CGM.getTarget().getTriple().getArch(); |
| 101 | } |
| 102 | |
| 103 | // Returns true if the type is an HLSL resource class or an array of them |
| 104 | static bool isResourceRecordTypeOrArrayOf(const clang::Type *Ty) { |
| 105 | while (const ConstantArrayType *CAT = dyn_cast<ConstantArrayType>(Val: Ty)) |
| 106 | Ty = CAT->getArrayElementTypeNoTypeQual(); |
| 107 | return Ty->isHLSLResourceRecord(); |
| 108 | } |
| 109 | |
| 110 | // Emits constant global variables for buffer constants declarations |
| 111 | // and creates metadata linking the constant globals with the buffer global. |
| 112 | void CGHLSLRuntime::emitBufferGlobalsAndMetadata(const HLSLBufferDecl *BufDecl, |
| 113 | llvm::GlobalVariable *BufGV) { |
| 114 | LLVMContext &Ctx = CGM.getLLVMContext(); |
| 115 | |
| 116 | // get the layout struct from constant buffer target type |
| 117 | llvm::Type *BufType = BufGV->getValueType(); |
| 118 | llvm::Type *BufLayoutType = |
| 119 | cast<llvm::TargetExtType>(Val: BufType)->getTypeParameter(i: 0); |
| 120 | llvm::StructType *LayoutStruct = cast<llvm::StructType>( |
| 121 | Val: cast<llvm::TargetExtType>(Val: BufLayoutType)->getTypeParameter(i: 0)); |
| 122 | |
| 123 | // Start metadata list associating the buffer global variable with its |
| 124 | // constatns |
| 125 | SmallVector<llvm::Metadata *> BufGlobals; |
| 126 | BufGlobals.push_back(Elt: ValueAsMetadata::get(V: BufGV)); |
| 127 | |
| 128 | const auto *ElemIt = LayoutStruct->element_begin(); |
| 129 | for (Decl *D : BufDecl->buffer_decls()) { |
| 130 | if (isa<CXXRecordDecl, EmptyDecl>(Val: D)) |
| 131 | // Nothing to do for this declaration. |
| 132 | continue; |
| 133 | if (isa<FunctionDecl>(Val: D)) { |
| 134 | // A function within an cbuffer is effectively a top-level function. |
| 135 | CGM.EmitTopLevelDecl(D); |
| 136 | continue; |
| 137 | } |
| 138 | VarDecl *VD = dyn_cast<VarDecl>(Val: D); |
| 139 | if (!VD) |
| 140 | continue; |
| 141 | |
| 142 | QualType VDTy = VD->getType(); |
| 143 | if (VDTy.getAddressSpace() != LangAS::hlsl_constant) { |
| 144 | if (VD->getStorageClass() == SC_Static || |
| 145 | VDTy.getAddressSpace() == LangAS::hlsl_groupshared || |
| 146 | isResourceRecordTypeOrArrayOf(Ty: VDTy.getTypePtr())) { |
| 147 | // Emit static and groupshared variables and resource classes inside |
| 148 | // cbuffer as regular globals |
| 149 | CGM.EmitGlobal(D: VD); |
| 150 | } else { |
| 151 | // Anything else that is not in the hlsl_constant address space must be |
| 152 | // an empty struct or a zero-sized array and can be ignored |
| 153 | assert(BufDecl->getASTContext().getTypeSize(VDTy) == 0 && |
| 154 | "constant buffer decl with non-zero sized type outside of " |
| 155 | "hlsl_constant address space" ); |
| 156 | } |
| 157 | continue; |
| 158 | } |
| 159 | |
| 160 | assert(ElemIt != LayoutStruct->element_end() && |
| 161 | "number of elements in layout struct does not match" ); |
| 162 | llvm::Type *LayoutType = *ElemIt++; |
| 163 | |
| 164 | // FIXME: handle resources inside user defined structs |
| 165 | // (llvm/wg-hlsl#175) |
| 166 | |
| 167 | // create global variable for the constant and to metadata list |
| 168 | GlobalVariable *ElemGV = |
| 169 | cast<GlobalVariable>(Val: CGM.GetAddrOfGlobalVar(D: VD, Ty: LayoutType)); |
| 170 | BufGlobals.push_back(Elt: ValueAsMetadata::get(V: ElemGV)); |
| 171 | } |
| 172 | assert(ElemIt == LayoutStruct->element_end() && |
| 173 | "number of elements in layout struct does not match" ); |
| 174 | |
| 175 | // add buffer metadata to the module |
| 176 | CGM.getModule() |
| 177 | .getOrInsertNamedMetadata(Name: "hlsl.cbs" ) |
| 178 | ->addOperand(M: MDNode::get(Context&: Ctx, MDs: BufGlobals)); |
| 179 | } |
| 180 | |
| 181 | // Creates resource handle type for the HLSL buffer declaration |
| 182 | static const clang::HLSLAttributedResourceType * |
| 183 | createBufferHandleType(const HLSLBufferDecl *BufDecl) { |
| 184 | ASTContext &AST = BufDecl->getASTContext(); |
| 185 | QualType QT = AST.getHLSLAttributedResourceType( |
| 186 | Wrapped: AST.HLSLResourceTy, |
| 187 | Contained: QualType(BufDecl->getLayoutStruct()->getTypeForDecl(), 0), |
| 188 | Attrs: HLSLAttributedResourceType::Attributes(ResourceClass::CBuffer)); |
| 189 | return cast<HLSLAttributedResourceType>(Val: QT.getTypePtr()); |
| 190 | } |
| 191 | |
| 192 | // Iterates over all declarations in the HLSL buffer and based on the |
| 193 | // packoffset or register(c#) annotations it fills outs the Layout |
| 194 | // vector with the user-specified layout offsets. |
| 195 | // The buffer offsets can be specified 2 ways: |
| 196 | // 1. declarations in cbuffer {} block can have a packoffset annotation |
| 197 | // (translates to HLSLPackOffsetAttr) |
| 198 | // 2. default constant buffer declarations at global scope can have |
| 199 | // register(c#) annotations (translates to HLSLResourceBindingAttr with |
| 200 | // RegisterType::C) |
| 201 | // It is not guaranteed that all declarations in a buffer have an annotation. |
| 202 | // For those where it is not specified a -1 value is added to the Layout |
| 203 | // vector. In the final layout these declarations will be placed at the end |
| 204 | // of the HLSL buffer after all of the elements with specified offset. |
| 205 | static void fillPackoffsetLayout(const HLSLBufferDecl *BufDecl, |
| 206 | SmallVector<int32_t> &Layout) { |
| 207 | assert(Layout.empty() && "expected empty vector for layout" ); |
| 208 | assert(BufDecl->hasValidPackoffset()); |
| 209 | |
| 210 | for (Decl *D : BufDecl->buffer_decls()) { |
| 211 | if (isa<CXXRecordDecl, EmptyDecl>(Val: D) || isa<FunctionDecl>(Val: D)) { |
| 212 | continue; |
| 213 | } |
| 214 | VarDecl *VD = dyn_cast<VarDecl>(Val: D); |
| 215 | if (!VD || VD->getType().getAddressSpace() != LangAS::hlsl_constant) |
| 216 | continue; |
| 217 | |
| 218 | if (!VD->hasAttrs()) { |
| 219 | Layout.push_back(Elt: -1); |
| 220 | continue; |
| 221 | } |
| 222 | |
| 223 | int32_t Offset = -1; |
| 224 | for (auto *Attr : VD->getAttrs()) { |
| 225 | if (auto *POA = dyn_cast<HLSLPackOffsetAttr>(Attr)) { |
| 226 | Offset = POA->getOffsetInBytes(); |
| 227 | break; |
| 228 | } |
| 229 | auto *RBA = dyn_cast<HLSLResourceBindingAttr>(Attr); |
| 230 | if (RBA && |
| 231 | RBA->getRegisterType() == HLSLResourceBindingAttr::RegisterType::C) { |
| 232 | Offset = RBA->getSlotNumber() * CBufferRowSizeInBytes; |
| 233 | break; |
| 234 | } |
| 235 | } |
| 236 | Layout.push_back(Elt: Offset); |
| 237 | } |
| 238 | } |
| 239 | |
| 240 | std::pair<llvm::Intrinsic::ID, bool> |
| 241 | CGHLSLRuntime::getCreateHandleFromBindingIntrinsic() { |
| 242 | switch (getArch()) { |
| 243 | case llvm::Triple::dxil: |
| 244 | return std::pair(llvm::Intrinsic::dx_resource_handlefrombinding, true); |
| 245 | case llvm::Triple::spirv: |
| 246 | return std::pair(llvm::Intrinsic::spv_resource_handlefrombinding, false); |
| 247 | default: |
| 248 | llvm_unreachable("Intrinsic resource_handlefrombinding not supported by " |
| 249 | "target architecture" ); |
| 250 | } |
| 251 | } |
| 252 | |
| 253 | std::pair<llvm::Intrinsic::ID, bool> |
| 254 | CGHLSLRuntime::getCreateHandleFromImplicitBindingIntrinsic() { |
| 255 | switch (getArch()) { |
| 256 | case llvm::Triple::dxil: |
| 257 | return std::pair(llvm::Intrinsic::dx_resource_handlefromimplicitbinding, |
| 258 | true); |
| 259 | case llvm::Triple::spirv: |
| 260 | return std::pair(llvm::Intrinsic::spv_resource_handlefromimplicitbinding, |
| 261 | false); |
| 262 | default: |
| 263 | llvm_unreachable( |
| 264 | "Intrinsic resource_handlefromimplicitbinding not supported by " |
| 265 | "target architecture" ); |
| 266 | } |
| 267 | } |
| 268 | |
| 269 | // Codegen for HLSLBufferDecl |
| 270 | void CGHLSLRuntime::addBuffer(const HLSLBufferDecl *BufDecl) { |
| 271 | |
| 272 | assert(BufDecl->isCBuffer() && "tbuffer codegen is not supported yet" ); |
| 273 | |
| 274 | // create resource handle type for the buffer |
| 275 | const clang::HLSLAttributedResourceType *ResHandleTy = |
| 276 | createBufferHandleType(BufDecl); |
| 277 | |
| 278 | // empty constant buffer is ignored |
| 279 | if (ResHandleTy->getContainedType()->getAsCXXRecordDecl()->isEmpty()) |
| 280 | return; |
| 281 | |
| 282 | // create global variable for the constant buffer |
| 283 | SmallVector<int32_t> Layout; |
| 284 | if (BufDecl->hasValidPackoffset()) |
| 285 | fillPackoffsetLayout(BufDecl, Layout); |
| 286 | |
| 287 | llvm::TargetExtType *TargetTy = |
| 288 | cast<llvm::TargetExtType>(Val: convertHLSLSpecificType( |
| 289 | ResHandleTy, BufDecl->hasValidPackoffset() ? &Layout : nullptr)); |
| 290 | llvm::GlobalVariable *BufGV = new GlobalVariable( |
| 291 | TargetTy, /*isConstant*/ false, |
| 292 | GlobalValue::LinkageTypes::ExternalLinkage, PoisonValue::get(T: TargetTy), |
| 293 | llvm::formatv("{0}{1}" , BufDecl->getName(), |
| 294 | BufDecl->isCBuffer() ? ".cb" : ".tb" ), |
| 295 | GlobalValue::NotThreadLocal); |
| 296 | CGM.getModule().insertGlobalVariable(GV: BufGV); |
| 297 | |
| 298 | // Add globals for constant buffer elements and create metadata nodes |
| 299 | emitBufferGlobalsAndMetadata(BufDecl, BufGV); |
| 300 | |
| 301 | // Initialize cbuffer from binding (implicit or explicit) |
| 302 | HLSLResourceBindingAttr *RBA = BufDecl->getAttr<HLSLResourceBindingAttr>(); |
| 303 | assert(RBA && |
| 304 | "cbuffer/tbuffer should always have resource binding attribute" ); |
| 305 | initializeBufferFromBinding(BufDecl, GV: BufGV, RBA); |
| 306 | } |
| 307 | |
| 308 | llvm::TargetExtType * |
| 309 | CGHLSLRuntime::getHLSLBufferLayoutType(const RecordType *StructType) { |
| 310 | const auto Entry = LayoutTypes.find(Val: StructType); |
| 311 | if (Entry != LayoutTypes.end()) |
| 312 | return Entry->getSecond(); |
| 313 | return nullptr; |
| 314 | } |
| 315 | |
| 316 | void CGHLSLRuntime::addHLSLBufferLayoutType(const RecordType *StructType, |
| 317 | llvm::TargetExtType *LayoutTy) { |
| 318 | assert(getHLSLBufferLayoutType(StructType) == nullptr && |
| 319 | "layout type for this struct already exist" ); |
| 320 | LayoutTypes[StructType] = LayoutTy; |
| 321 | } |
| 322 | |
| 323 | void CGHLSLRuntime::finishCodeGen() { |
| 324 | auto &TargetOpts = CGM.getTarget().getTargetOpts(); |
| 325 | auto &CodeGenOpts = CGM.getCodeGenOpts(); |
| 326 | auto &LangOpts = CGM.getLangOpts(); |
| 327 | llvm::Module &M = CGM.getModule(); |
| 328 | Triple T(M.getTargetTriple()); |
| 329 | if (T.getArch() == Triple::ArchType::dxil) |
| 330 | addDxilValVersion(ValVersionStr: TargetOpts.DxilValidatorVersion, M); |
| 331 | if (CodeGenOpts.ResMayAlias) |
| 332 | M.setModuleFlag(Behavior: llvm::Module::ModFlagBehavior::Error, Key: "dx.resmayalias" , Val: 1); |
| 333 | |
| 334 | // NativeHalfType corresponds to the -fnative-half-type clang option which is |
| 335 | // aliased by clang-dxc's -enable-16bit-types option. This option is used to |
| 336 | // set the UseNativeLowPrecision DXIL module flag in the DirectX backend |
| 337 | if (LangOpts.NativeHalfType) |
| 338 | M.setModuleFlag(Behavior: llvm::Module::ModFlagBehavior::Error, Key: "dx.nativelowprec" , |
| 339 | Val: 1); |
| 340 | |
| 341 | generateGlobalCtorDtorCalls(); |
| 342 | } |
| 343 | |
| 344 | void clang::CodeGen::CGHLSLRuntime::setHLSLEntryAttributes( |
| 345 | const FunctionDecl *FD, llvm::Function *Fn) { |
| 346 | const auto *ShaderAttr = FD->getAttr<HLSLShaderAttr>(); |
| 347 | assert(ShaderAttr && "All entry functions must have a HLSLShaderAttr" ); |
| 348 | const StringRef ShaderAttrKindStr = "hlsl.shader" ; |
| 349 | Fn->addFnAttr(ShaderAttrKindStr, |
| 350 | llvm::Triple::getEnvironmentTypeName(Kind: ShaderAttr->getType())); |
| 351 | if (HLSLNumThreadsAttr *NumThreadsAttr = FD->getAttr<HLSLNumThreadsAttr>()) { |
| 352 | const StringRef NumThreadsKindStr = "hlsl.numthreads" ; |
| 353 | std::string NumThreadsStr = |
| 354 | formatv("{0},{1},{2}" , NumThreadsAttr->getX(), NumThreadsAttr->getY(), |
| 355 | NumThreadsAttr->getZ()); |
| 356 | Fn->addFnAttr(Kind: NumThreadsKindStr, Val: NumThreadsStr); |
| 357 | } |
| 358 | if (HLSLWaveSizeAttr *WaveSizeAttr = FD->getAttr<HLSLWaveSizeAttr>()) { |
| 359 | const StringRef WaveSizeKindStr = "hlsl.wavesize" ; |
| 360 | std::string WaveSizeStr = |
| 361 | formatv("{0},{1},{2}" , WaveSizeAttr->getMin(), WaveSizeAttr->getMax(), |
| 362 | WaveSizeAttr->getPreferred()); |
| 363 | Fn->addFnAttr(Kind: WaveSizeKindStr, Val: WaveSizeStr); |
| 364 | } |
| 365 | // HLSL entry functions are materialized for module functions with |
| 366 | // HLSLShaderAttr attribute. SetLLVMFunctionAttributesForDefinition called |
| 367 | // later in the compiler-flow for such module functions is not aware of and |
| 368 | // hence not able to set attributes of the newly materialized entry functions. |
| 369 | // So, set attributes of entry function here, as appropriate. |
| 370 | if (CGM.getCodeGenOpts().OptimizationLevel == 0) |
| 371 | Fn->addFnAttr(llvm::Attribute::OptimizeNone); |
| 372 | Fn->addFnAttr(llvm::Attribute::NoInline); |
| 373 | } |
| 374 | |
| 375 | static Value *buildVectorInput(IRBuilder<> &B, Function *F, llvm::Type *Ty) { |
| 376 | if (const auto *VT = dyn_cast<FixedVectorType>(Val: Ty)) { |
| 377 | Value *Result = PoisonValue::get(T: Ty); |
| 378 | for (unsigned I = 0; I < VT->getNumElements(); ++I) { |
| 379 | Value *Elt = B.CreateCall(Callee: F, Args: {B.getInt32(C: I)}); |
| 380 | Result = B.CreateInsertElement(Vec: Result, NewElt: Elt, Idx: I); |
| 381 | } |
| 382 | return Result; |
| 383 | } |
| 384 | return B.CreateCall(Callee: F, Args: {B.getInt32(C: 0)}); |
| 385 | } |
| 386 | |
| 387 | static void addSPIRVBuiltinDecoration(llvm::GlobalVariable *GV, |
| 388 | unsigned BuiltIn) { |
| 389 | LLVMContext &Ctx = GV->getContext(); |
| 390 | IRBuilder<> B(GV->getContext()); |
| 391 | MDNode *Operands = MDNode::get( |
| 392 | Context&: Ctx, |
| 393 | MDs: {ConstantAsMetadata::get(C: B.getInt32(/* Spirv::Decoration::BuiltIn */ C: 11)), |
| 394 | ConstantAsMetadata::get(C: B.getInt32(C: BuiltIn))}); |
| 395 | MDNode *Decoration = MDNode::get(Context&: Ctx, MDs: {Operands}); |
| 396 | GV->addMetadata(Kind: "spirv.Decorations" , MD&: *Decoration); |
| 397 | } |
| 398 | |
| 399 | static llvm::Value *createSPIRVBuiltinLoad(IRBuilder<> &B, llvm::Module &M, |
| 400 | llvm::Type *Ty, const Twine &Name, |
| 401 | unsigned BuiltInID) { |
| 402 | auto *GV = new llvm::GlobalVariable( |
| 403 | M, Ty, /* isConstant= */ true, llvm::GlobalValue::ExternalLinkage, |
| 404 | /* Initializer= */ nullptr, Name, /* insertBefore= */ nullptr, |
| 405 | llvm::GlobalVariable::GeneralDynamicTLSModel, |
| 406 | /* AddressSpace */ 7, /* isExternallyInitialized= */ true); |
| 407 | addSPIRVBuiltinDecoration(GV, BuiltIn: BuiltInID); |
| 408 | return B.CreateLoad(Ty, Ptr: GV); |
| 409 | } |
| 410 | |
| 411 | llvm::Value *CGHLSLRuntime::emitInputSemantic(IRBuilder<> &B, |
| 412 | const ParmVarDecl &D, |
| 413 | llvm::Type *Ty) { |
| 414 | assert(D.hasAttrs() && "Entry parameter missing annotation attribute!" ); |
| 415 | if (D.hasAttr<HLSLSV_GroupIndexAttr>()) { |
| 416 | llvm::Function *GroupIndex = |
| 417 | CGM.getIntrinsic(IID: getFlattenedThreadIdInGroupIntrinsic()); |
| 418 | return B.CreateCall(Callee: FunctionCallee(GroupIndex)); |
| 419 | } |
| 420 | if (D.hasAttr<HLSLSV_DispatchThreadIDAttr>()) { |
| 421 | llvm::Function *ThreadIDIntrinsic = |
| 422 | CGM.getIntrinsic(IID: getThreadIdIntrinsic()); |
| 423 | return buildVectorInput(B, F: ThreadIDIntrinsic, Ty); |
| 424 | } |
| 425 | if (D.hasAttr<HLSLSV_GroupThreadIDAttr>()) { |
| 426 | llvm::Function *GroupThreadIDIntrinsic = |
| 427 | CGM.getIntrinsic(IID: getGroupThreadIdIntrinsic()); |
| 428 | return buildVectorInput(B, F: GroupThreadIDIntrinsic, Ty); |
| 429 | } |
| 430 | if (D.hasAttr<HLSLSV_GroupIDAttr>()) { |
| 431 | llvm::Function *GroupIDIntrinsic = CGM.getIntrinsic(IID: getGroupIdIntrinsic()); |
| 432 | return buildVectorInput(B, F: GroupIDIntrinsic, Ty); |
| 433 | } |
| 434 | if (D.hasAttr<HLSLSV_PositionAttr>()) { |
| 435 | if (getArch() == llvm::Triple::spirv) |
| 436 | return createSPIRVBuiltinLoad(B, M&: CGM.getModule(), Ty, Name: "sv_position" , |
| 437 | /* BuiltIn::Position */ BuiltInID: 0); |
| 438 | llvm_unreachable("SV_Position semantic not implemented for this target." ); |
| 439 | } |
| 440 | assert(false && "Unhandled parameter attribute" ); |
| 441 | return nullptr; |
| 442 | } |
| 443 | |
| 444 | void CGHLSLRuntime::emitEntryFunction(const FunctionDecl *FD, |
| 445 | llvm::Function *Fn) { |
| 446 | llvm::Module &M = CGM.getModule(); |
| 447 | llvm::LLVMContext &Ctx = M.getContext(); |
| 448 | auto *EntryTy = llvm::FunctionType::get(Result: llvm::Type::getVoidTy(C&: Ctx), isVarArg: false); |
| 449 | Function *EntryFn = |
| 450 | Function::Create(EntryTy, Function::ExternalLinkage, FD->getName(), &M); |
| 451 | |
| 452 | // Copy function attributes over, we have no argument or return attributes |
| 453 | // that can be valid on the real entry. |
| 454 | AttributeList NewAttrs = AttributeList::get(C&: Ctx, Index: AttributeList::FunctionIndex, |
| 455 | Attrs: Fn->getAttributes().getFnAttrs()); |
| 456 | EntryFn->setAttributes(NewAttrs); |
| 457 | setHLSLEntryAttributes(FD, Fn: EntryFn); |
| 458 | |
| 459 | // Set the called function as internal linkage. |
| 460 | Fn->setLinkage(GlobalValue::InternalLinkage); |
| 461 | |
| 462 | BasicBlock *BB = BasicBlock::Create(Context&: Ctx, Name: "entry" , Parent: EntryFn); |
| 463 | IRBuilder<> B(BB); |
| 464 | llvm::SmallVector<Value *> Args; |
| 465 | |
| 466 | SmallVector<OperandBundleDef, 1> OB; |
| 467 | if (CGM.shouldEmitConvergenceTokens()) { |
| 468 | assert(EntryFn->isConvergent()); |
| 469 | llvm::Value *I = |
| 470 | B.CreateIntrinsic(llvm::Intrinsic::experimental_convergence_entry, {}); |
| 471 | llvm::Value *bundleArgs[] = {I}; |
| 472 | OB.emplace_back(Args: "convergencectrl" , Args&: bundleArgs); |
| 473 | } |
| 474 | |
| 475 | // FIXME: support struct parameters where semantics are on members. |
| 476 | // See: https://github.com/llvm/llvm-project/issues/57874 |
| 477 | unsigned SRetOffset = 0; |
| 478 | for (const auto &Param : Fn->args()) { |
| 479 | if (Param.hasStructRetAttr()) { |
| 480 | // FIXME: support output. |
| 481 | // See: https://github.com/llvm/llvm-project/issues/57874 |
| 482 | SRetOffset = 1; |
| 483 | Args.emplace_back(Args: PoisonValue::get(T: Param.getType())); |
| 484 | continue; |
| 485 | } |
| 486 | const ParmVarDecl *PD = FD->getParamDecl(i: Param.getArgNo() - SRetOffset); |
| 487 | Args.push_back(Elt: emitInputSemantic(B, D: *PD, Ty: Param.getType())); |
| 488 | } |
| 489 | |
| 490 | CallInst *CI = B.CreateCall(Callee: FunctionCallee(Fn), Args, OpBundles: OB); |
| 491 | CI->setCallingConv(Fn->getCallingConv()); |
| 492 | // FIXME: Handle codegen for return type semantics. |
| 493 | // See: https://github.com/llvm/llvm-project/issues/57875 |
| 494 | B.CreateRetVoid(); |
| 495 | |
| 496 | // Add and identify root signature to function, if applicable |
| 497 | for (const Attr *Attr : FD->getAttrs()) { |
| 498 | if (const auto *RSAttr = dyn_cast<RootSignatureAttr>(Attr)) |
| 499 | addRootSignature(RSAttr->getSignatureDecl()->getRootElements(), EntryFn, |
| 500 | M); |
| 501 | } |
| 502 | } |
| 503 | |
| 504 | void CGHLSLRuntime::setHLSLFunctionAttributes(const FunctionDecl *FD, |
| 505 | llvm::Function *Fn) { |
| 506 | if (FD->isInExportDeclContext()) { |
| 507 | const StringRef ExportAttrKindStr = "hlsl.export" ; |
| 508 | Fn->addFnAttr(Kind: ExportAttrKindStr); |
| 509 | } |
| 510 | } |
| 511 | |
| 512 | static void gatherFunctions(SmallVectorImpl<Function *> &Fns, llvm::Module &M, |
| 513 | bool CtorOrDtor) { |
| 514 | const auto *GV = |
| 515 | M.getNamedGlobal(Name: CtorOrDtor ? "llvm.global_ctors" : "llvm.global_dtors" ); |
| 516 | if (!GV) |
| 517 | return; |
| 518 | const auto *CA = dyn_cast<ConstantArray>(Val: GV->getInitializer()); |
| 519 | if (!CA) |
| 520 | return; |
| 521 | // The global_ctor array elements are a struct [Priority, Fn *, COMDat]. |
| 522 | // HLSL neither supports priorities or COMDat values, so we will check those |
| 523 | // in an assert but not handle them. |
| 524 | |
| 525 | for (const auto &Ctor : CA->operands()) { |
| 526 | if (isa<ConstantAggregateZero>(Val: Ctor)) |
| 527 | continue; |
| 528 | ConstantStruct *CS = cast<ConstantStruct>(Val: Ctor); |
| 529 | |
| 530 | assert(cast<ConstantInt>(CS->getOperand(0))->getValue() == 65535 && |
| 531 | "HLSL doesn't support setting priority for global ctors." ); |
| 532 | assert(isa<ConstantPointerNull>(CS->getOperand(2)) && |
| 533 | "HLSL doesn't support COMDat for global ctors." ); |
| 534 | Fns.push_back(Elt: cast<Function>(Val: CS->getOperand(i_nocapture: 1))); |
| 535 | } |
| 536 | } |
| 537 | |
| 538 | void CGHLSLRuntime::generateGlobalCtorDtorCalls() { |
| 539 | llvm::Module &M = CGM.getModule(); |
| 540 | SmallVector<Function *> CtorFns; |
| 541 | SmallVector<Function *> DtorFns; |
| 542 | gatherFunctions(Fns&: CtorFns, M, CtorOrDtor: true); |
| 543 | gatherFunctions(Fns&: DtorFns, M, CtorOrDtor: false); |
| 544 | |
| 545 | // Insert a call to the global constructor at the beginning of the entry block |
| 546 | // to externally exported functions. This is a bit of a hack, but HLSL allows |
| 547 | // global constructors, but doesn't support driver initialization of globals. |
| 548 | for (auto &F : M.functions()) { |
| 549 | if (!F.hasFnAttribute(Kind: "hlsl.shader" )) |
| 550 | continue; |
| 551 | auto *Token = getConvergenceToken(BB&: F.getEntryBlock()); |
| 552 | Instruction *IP = &*F.getEntryBlock().begin(); |
| 553 | SmallVector<OperandBundleDef, 1> OB; |
| 554 | if (Token) { |
| 555 | llvm::Value *bundleArgs[] = {Token}; |
| 556 | OB.emplace_back(Args: "convergencectrl" , Args&: bundleArgs); |
| 557 | IP = Token->getNextNode(); |
| 558 | } |
| 559 | IRBuilder<> B(IP); |
| 560 | for (auto *Fn : CtorFns) { |
| 561 | auto CI = B.CreateCall(Callee: FunctionCallee(Fn), Args: {}, OpBundles: OB); |
| 562 | CI->setCallingConv(Fn->getCallingConv()); |
| 563 | } |
| 564 | |
| 565 | // Insert global dtors before the terminator of the last instruction |
| 566 | B.SetInsertPoint(F.back().getTerminator()); |
| 567 | for (auto *Fn : DtorFns) { |
| 568 | auto CI = B.CreateCall(Callee: FunctionCallee(Fn), Args: {}, OpBundles: OB); |
| 569 | CI->setCallingConv(Fn->getCallingConv()); |
| 570 | } |
| 571 | } |
| 572 | |
| 573 | // No need to keep global ctors/dtors for non-lib profile after call to |
| 574 | // ctors/dtors added for entry. |
| 575 | Triple T(M.getTargetTriple()); |
| 576 | if (T.getEnvironment() != Triple::EnvironmentType::Library) { |
| 577 | if (auto *GV = M.getNamedGlobal(Name: "llvm.global_ctors" )) |
| 578 | GV->eraseFromParent(); |
| 579 | if (auto *GV = M.getNamedGlobal(Name: "llvm.global_dtors" )) |
| 580 | GV->eraseFromParent(); |
| 581 | } |
| 582 | } |
| 583 | |
| 584 | static void initializeBuffer(CodeGenModule &CGM, llvm::GlobalVariable *GV, |
| 585 | Intrinsic::ID IntrID, |
| 586 | ArrayRef<llvm::Value *> Args) { |
| 587 | |
| 588 | LLVMContext &Ctx = CGM.getLLVMContext(); |
| 589 | llvm::Function *InitResFunc = llvm::Function::Create( |
| 590 | Ty: llvm::FunctionType::get(Result: CGM.VoidTy, isVarArg: false), |
| 591 | Linkage: llvm::GlobalValue::InternalLinkage, |
| 592 | N: ("_init_buffer_" + GV->getName()).str(), M&: CGM.getModule()); |
| 593 | InitResFunc->addFnAttr(llvm::Attribute::AlwaysInline); |
| 594 | |
| 595 | llvm::BasicBlock *EntryBB = |
| 596 | llvm::BasicBlock::Create(Context&: Ctx, Name: "entry" , Parent: InitResFunc); |
| 597 | CGBuilderTy Builder(CGM, Ctx); |
| 598 | const DataLayout &DL = CGM.getModule().getDataLayout(); |
| 599 | Builder.SetInsertPoint(EntryBB); |
| 600 | |
| 601 | // Make sure the global variable is buffer resource handle |
| 602 | llvm::Type *HandleTy = GV->getValueType(); |
| 603 | assert(HandleTy->isTargetExtTy() && "unexpected type of the buffer global" ); |
| 604 | |
| 605 | llvm::Value *CreateHandle = Builder.CreateIntrinsic( |
| 606 | /*ReturnType=*/RetTy: HandleTy, ID: IntrID, Args, FMFSource: nullptr, |
| 607 | Name: Twine(GV->getName()).concat(Suffix: "_h" )); |
| 608 | |
| 609 | llvm::Value *HandleRef = Builder.CreateStructGEP(Ty: GV->getValueType(), Ptr: GV, Idx: 0); |
| 610 | Builder.CreateAlignedStore(Val: CreateHandle, Ptr: HandleRef, |
| 611 | Align: HandleRef->getPointerAlignment(DL)); |
| 612 | Builder.CreateRetVoid(); |
| 613 | |
| 614 | CGM.AddCXXGlobalInit(F: InitResFunc); |
| 615 | } |
| 616 | |
| 617 | void CGHLSLRuntime::initializeBufferFromBinding(const HLSLBufferDecl *BufDecl, |
| 618 | llvm::GlobalVariable *GV, |
| 619 | HLSLResourceBindingAttr *RBA) { |
| 620 | llvm::Type *Int1Ty = llvm::Type::getInt1Ty(C&: CGM.getLLVMContext()); |
| 621 | auto *NonUniform = llvm::ConstantInt::get(Ty: Int1Ty, V: false); |
| 622 | auto *Index = llvm::ConstantInt::get(Ty: CGM.IntTy, V: 0); |
| 623 | auto *RangeSize = llvm::ConstantInt::get(Ty: CGM.IntTy, V: 1); |
| 624 | auto *Space = |
| 625 | llvm::ConstantInt::get(CGM.IntTy, RBA ? RBA->getSpaceNumber() : 0); |
| 626 | Value *Name = nullptr; |
| 627 | |
| 628 | auto [IntrinsicID, HasNameArg] = |
| 629 | RBA->hasRegisterSlot() |
| 630 | ? CGM.getHLSLRuntime().getCreateHandleFromBindingIntrinsic() |
| 631 | : CGM.getHLSLRuntime().getCreateHandleFromImplicitBindingIntrinsic(); |
| 632 | |
| 633 | if (HasNameArg) { |
| 634 | std::string Str(BufDecl->getName()); |
| 635 | std::string GlobalName(Str + ".str" ); |
| 636 | Name = CGM.GetAddrOfConstantCString(Str, GlobalName: GlobalName.c_str()).getPointer(); |
| 637 | } |
| 638 | |
| 639 | // buffer with explicit binding |
| 640 | if (RBA->hasRegisterSlot()) { |
| 641 | auto *RegSlot = llvm::ConstantInt::get(CGM.IntTy, RBA->getSlotNumber()); |
| 642 | SmallVector<Value *> Args{Space, RegSlot, RangeSize, Index, NonUniform}; |
| 643 | if (Name) |
| 644 | Args.push_back(Elt: Name); |
| 645 | initializeBuffer(CGM, GV, IntrinsicID, Args); |
| 646 | } else { |
| 647 | // buffer with implicit binding |
| 648 | auto *OrderID = |
| 649 | llvm::ConstantInt::get(CGM.IntTy, RBA->getImplicitBindingOrderID()); |
| 650 | SmallVector<Value *> Args{OrderID, Space, RangeSize, Index, NonUniform}; |
| 651 | if (Name) |
| 652 | Args.push_back(Elt: Name); |
| 653 | initializeBuffer(CGM, GV, IntrinsicID, Args); |
| 654 | } |
| 655 | } |
| 656 | |
| 657 | void CGHLSLRuntime::handleGlobalVarDefinition(const VarDecl *VD, |
| 658 | llvm::GlobalVariable *GV) { |
| 659 | if (auto Attr = VD->getAttr<HLSLVkExtBuiltinInputAttr>()) |
| 660 | addSPIRVBuiltinDecoration(GV, Attr->getBuiltIn()); |
| 661 | } |
| 662 | |
| 663 | llvm::Instruction *CGHLSLRuntime::getConvergenceToken(BasicBlock &BB) { |
| 664 | if (!CGM.shouldEmitConvergenceTokens()) |
| 665 | return nullptr; |
| 666 | |
| 667 | auto E = BB.end(); |
| 668 | for (auto I = BB.begin(); I != E; ++I) { |
| 669 | auto *II = dyn_cast<llvm::IntrinsicInst>(Val: &*I); |
| 670 | if (II && llvm::isConvergenceControlIntrinsic(IntrinsicID: II->getIntrinsicID())) { |
| 671 | return II; |
| 672 | } |
| 673 | } |
| 674 | llvm_unreachable("Convergence token should have been emitted." ); |
| 675 | return nullptr; |
| 676 | } |
| 677 | |
| 678 | class OpaqueValueVisitor : public RecursiveASTVisitor<OpaqueValueVisitor> { |
| 679 | public: |
| 680 | llvm::SmallPtrSet<OpaqueValueExpr *, 8> OVEs; |
| 681 | OpaqueValueVisitor() {} |
| 682 | |
| 683 | bool VisitOpaqueValueExpr(OpaqueValueExpr *E) { |
| 684 | OVEs.insert(Ptr: E); |
| 685 | return true; |
| 686 | } |
| 687 | }; |
| 688 | |
| 689 | void CGHLSLRuntime::emitInitListOpaqueValues(CodeGenFunction &CGF, |
| 690 | InitListExpr *E) { |
| 691 | |
| 692 | typedef CodeGenFunction::OpaqueValueMappingData OpaqueValueMappingData; |
| 693 | OpaqueValueVisitor Visitor; |
| 694 | Visitor.TraverseStmt(E); |
| 695 | for (auto *OVE : Visitor.OVEs) { |
| 696 | if (CGF.isOpaqueValueEmitted(E: OVE)) |
| 697 | continue; |
| 698 | if (OpaqueValueMappingData::shouldBindAsLValue(OVE)) { |
| 699 | LValue LV = CGF.EmitLValue(E: OVE->getSourceExpr()); |
| 700 | OpaqueValueMappingData::bind(CGF, ov: OVE, lv: LV); |
| 701 | } else { |
| 702 | RValue RV = CGF.EmitAnyExpr(E: OVE->getSourceExpr()); |
| 703 | OpaqueValueMappingData::bind(CGF, ov: OVE, rv: RV); |
| 704 | } |
| 705 | } |
| 706 | } |
| 707 | |