10#include "TargetInfo.h"
11#include "llvm/ADT/STLExtras.h"
12#include "llvm/IR/CallingConv.h"
13#include "llvm/IR/IntrinsicsNVPTX.h"
24class NVPTXTargetCodeGenInfo;
26class NVPTXABIInfo :
public ABIInfo {
27 NVPTXTargetCodeGenInfo &CGInfo;
30 NVPTXABIInfo(
CodeGenTypes &CGT, NVPTXTargetCodeGenInfo &Info)
59 return llvm::Type::getInt64Ty(
getABIInfo().getVMContext());
65 return llvm::Type::getInt64Ty(
getABIInfo().getVMContext());
69 LValue Src)
const override {
70 emitBuiltinSurfTexDeviceCopy(CGF, Dst, Src);
75 LValue Src)
const override {
76 emitBuiltinSurfTexDeviceCopy(CGF, Dst, Src);
82 static void addNVVMMetadata(llvm::GlobalValue *GV, StringRef Name,
86 addGridConstantNVVMMetadata(llvm::GlobalValue *GV,
92 llvm::Value *Handle =
nullptr;
96 if (
auto *ASC = llvm::dyn_cast_or_null<llvm::AddrSpaceCastOperator>(
C))
97 C = llvm::cast<llvm::Constant>(ASC->getPointerOperand());
98 if (
auto *GV = llvm::dyn_cast_or_null<llvm::GlobalVariable>(
C)) {
104 {GV},
"texsurf_handle");
112bool NVPTXABIInfo::isUnsupportedType(
QualType T)
const {
121 return EIT->getNumBits() >
127 return isUnsupportedType(AT->getElementType());
134 if (
const CXXRecordDecl *CXXRD = dyn_cast<CXXRecordDecl>(RD))
136 if (isUnsupportedType(I.getType()))
140 if (isUnsupportedType(I->getType()))
147 unsigned MaxSize)
const {
150 const uint64_t Alignment = getContext().getTypeAlign(Ty);
151 const unsigned Div = std::min<unsigned>(MaxSize, Alignment);
152 llvm::Type *IntType = llvm::Type::getIntNTy(getVMContext(), Div);
161 if (getContext().getLangOpts().OpenMP &&
162 getContext().getLangOpts().OpenMPIsTargetDevice &&
163 isUnsupportedType(RetTy))
164 return coerceToIntArrayWithLimit(RetTy, 64);
172 RetTy = EnumTy->getDecl()->getIntegerType();
181 Ty = EnumTy->getDecl()->getIntegerType();
187 if (getContext().getLangOpts().CUDAIsDevice) {
190 CGInfo.getCUDADeviceBuiltinSurfaceDeviceType());
193 CGInfo.getCUDADeviceBuiltinTextureDeviceType());
195 return getNaturalAlignIndirect(Ty,
true);
199 if ((EIT->getNumBits() > 128) ||
200 (!getContext().getTargetInfo().hasInt128Type() &&
201 EIT->getNumBits() > 64))
202 return getNaturalAlignIndirect(Ty,
true);
213 for (
auto &&[ArgumentsCount, I] : llvm::enumerate(FI.
arguments()))
228 getContext().getTypeInfoInChars(Ty),
233void NVPTXTargetCodeGenInfo::setTargetAttributes(
235 if (GV->isDeclaration())
237 const VarDecl *VD = dyn_cast_or_null<VarDecl>(
D);
241 addNVVMMetadata(GV,
"surface", 1);
243 addNVVMMetadata(GV,
"texture", 1);
252 llvm::Function *F = cast<llvm::Function>(GV);
258 if (FD->
hasAttr<OpenCLKernelAttr>()) {
261 F->setCallingConv(llvm::CallingConv::PTX_Kernel);
263 F->addFnAttr(llvm::Attribute::NoInline);
272 if (FD->
hasAttr<CUDAGlobalAttr>()) {
274 for (
auto IV : llvm::enumerate(FD->
parameters()))
275 if (IV.value()->hasAttr<CUDAGridConstantAttr>())
277 GCI.push_back(IV.index() + 1);
279 F->setCallingConv(llvm::CallingConv::PTX_Kernel);
280 addGridConstantNVVMMetadata(F, GCI);
282 if (CUDALaunchBoundsAttr *
Attr = FD->
getAttr<CUDALaunchBoundsAttr>())
287 if (FD->
hasAttr<NVPTXKernelAttr>()) {
288 F->setCallingConv(llvm::CallingConv::PTX_Kernel);
292void NVPTXTargetCodeGenInfo::addNVVMMetadata(llvm::GlobalValue *GV,
293 StringRef Name,
int Operand) {
294 llvm::Module *M = GV->getParent();
298 llvm::NamedMDNode *MD = M->getOrInsertNamedMetadata(
"nvvm.annotations");
301 llvm::ConstantAsMetadata::get(GV), llvm::MDString::get(Ctx, Name),
302 llvm::ConstantAsMetadata::get(
303 llvm::ConstantInt::get(llvm::Type::getInt32Ty(Ctx), Operand))};
306 MD->addOperand(llvm::MDNode::get(Ctx, MDVals));
309void NVPTXTargetCodeGenInfo::addGridConstantNVVMMetadata(
312 llvm::Module *M = GV->getParent();
313 llvm::LLVMContext &Ctx = M->getContext();
316 llvm::NamedMDNode *MD = M->getOrInsertNamedMetadata(
"nvvm.annotations");
319 if (!GridConstantArgs.empty()) {
321 for (
int I : GridConstantArgs)
322 GCM.push_back(llvm::ConstantAsMetadata::get(
323 llvm::ConstantInt::get(llvm::Type::getInt32Ty(Ctx), I)));
324 MDVals.append({llvm::MDString::get(Ctx,
"grid_constant"),
325 llvm::MDNode::get(Ctx, GCM)});
329 MD->addOperand(llvm::MDNode::get(Ctx, MDVals));
332bool NVPTXTargetCodeGenInfo::shouldEmitStaticExternCAliases()
const {
338 llvm::PointerType *PT,
341 if (PT->getAddressSpace() != Ctx.getTargetAddressSpace(LangAS::opencl_local))
342 return llvm::ConstantPointerNull::get(PT);
344 auto NPT = llvm::PointerType::get(
345 PT->getContext(), Ctx.getTargetAddressSpace(LangAS::opencl_generic));
346 return llvm::ConstantExpr::getAddrSpaceCast(
347 llvm::ConstantPointerNull::get(NPT), PT);
352 const CUDALaunchBoundsAttr *
Attr,
353 int32_t *MaxThreadsVal,
354 int32_t *MinBlocksVal,
355 int32_t *MaxClusterRankVal) {
357 llvm::APSInt MaxThreads(32);
358 MaxThreads =
Attr->getMaxThreads()->EvaluateKnownConstInt(
getContext());
359 if (MaxThreads > 0) {
361 *MaxThreadsVal = MaxThreads.getExtValue();
364 NVPTXTargetCodeGenInfo::addNVVMMetadata(F,
"maxntidx",
365 MaxThreads.getExtValue());
372 if (
Attr->getMinBlocks()) {
373 llvm::APSInt MinBlocks(32);
374 MinBlocks =
Attr->getMinBlocks()->EvaluateKnownConstInt(
getContext());
377 *MinBlocksVal = MinBlocks.getExtValue();
380 NVPTXTargetCodeGenInfo::addNVVMMetadata(F,
"minctasm",
381 MinBlocks.getExtValue());
385 if (
Attr->getMaxBlocks()) {
386 llvm::APSInt MaxBlocks(32);
387 MaxBlocks =
Attr->getMaxBlocks()->EvaluateKnownConstInt(
getContext());
389 if (MaxClusterRankVal)
390 *MaxClusterRankVal = MaxBlocks.getExtValue();
393 NVPTXTargetCodeGenInfo::addNVVMMetadata(F,
"maxclusterrank",
394 MaxBlocks.getExtValue());
400std::unique_ptr<TargetCodeGenInfo>
402 return std::make_unique<NVPTXTargetCodeGenInfo>(CGM.
getTypes());
Holds long-lived AST nodes (such as types and decls) that can be referred to throughout the semantic ...
uint64_t getTypeSize(QualType T) const
Return the size of the specified (complete) type T, in bits.
const TargetInfo & getTargetInfo() const
Attr - This represents one attribute.
A fixed int type of a specified bitwidth.
Represents a base class of a C++ class.
Represents a C++ struct/union/class.
static CharUnits fromQuantity(QuantityType Quantity)
fromQuantity - Construct a CharUnits quantity from a raw integer type.
ABIArgInfo - Helper class to encapsulate information about how a specific C type should be passed to ...
static ABIArgInfo getIgnore()
static ABIArgInfo getDirect(llvm::Type *T=nullptr, unsigned Offset=0, llvm::Type *Padding=nullptr, bool CanBeFlattened=true, unsigned Align=0)
static ABIArgInfo getExtend(QualType Ty, llvm::Type *T=nullptr)
ABIInfo - Target specific hooks for defining how a type should be passed or returned from functions.
virtual RValue EmitVAArg(CodeGen::CodeGenFunction &CGF, CodeGen::Address VAListAddr, QualType Ty, AggValueSlot Slot) const =0
EmitVAArg - Emit the target dependent code to load a value of.
virtual void computeInfo(CodeGen::CGFunctionInfo &FI) const =0
Like RawAddress, an abstract representation of an aligned address, but the pointer contained in this ...
llvm::Value * emitRawPointer(CodeGenFunction &CGF) const
Return the pointer contained in this class after authenticating it and adding offset to it if necessa...
CGFunctionInfo - Class to encapsulate the information about a function definition.
ABIArgInfo & getReturnInfo()
unsigned getCallingConvention() const
getCallingConvention - Return the user specified calling convention, which has been translated into a...
CanQualType getReturnType() const
MutableArrayRef< ArgInfo > arguments()
void setEffectiveCallingConvention(unsigned Value)
unsigned getNumRequiredArgs() const
CodeGenFunction - This class organizes the per-function state that is used while generating LLVM code...
llvm::Value * EmitLoadOfScalar(Address Addr, bool Volatile, QualType Ty, SourceLocation Loc, AlignmentSource Source=AlignmentSource::Type, bool isNontemporal=false)
EmitLoadOfScalar - Load a scalar value from an address, taking care to appropriately convert from the...
llvm::CallInst * EmitRuntimeCall(llvm::FunctionCallee callee, const Twine &name="")
void EmitStoreOfScalar(llvm::Value *Value, Address Addr, bool Volatile, QualType Ty, AlignmentSource Source=AlignmentSource::Type, bool isInit=false, bool isNontemporal=false)
EmitStoreOfScalar - Store a scalar value to an address, taking care to appropriately convert from the...
This class organizes the cross-function state that is used while generating LLVM code.
void handleCUDALaunchBoundsAttr(llvm::Function *F, const CUDALaunchBoundsAttr *A, int32_t *MaxThreadsVal=nullptr, int32_t *MinBlocksVal=nullptr, int32_t *MaxClusterRankVal=nullptr)
Emit the IR encoding to attach the CUDA launch bounds attribute to F.
const LangOptions & getLangOpts() const
CodeGenTypes & getTypes()
ASTContext & getContext() const
llvm::Function * getIntrinsic(unsigned IID, ArrayRef< llvm::Type * > Tys={})
This class organizes the cross-module state that is used while lowering AST types to LLVM types.
LValue - This represents an lvalue references.
Address getAddress() const
RValue - This trivial value class is used to represent the result of an expression that is evaluated.
TargetCodeGenInfo - This class organizes various target-specific codegeneration issues,...
virtual bool emitCUDADeviceBuiltinSurfaceDeviceCopy(CodeGenFunction &CGF, LValue Dst, LValue Src) const
Emit the device-side copy of the builtin surface type.
virtual bool emitCUDADeviceBuiltinTextureDeviceCopy(CodeGenFunction &CGF, LValue Dst, LValue Src) const
Emit the device-side copy of the builtin texture type.
virtual llvm::Type * getCUDADeviceBuiltinSurfaceDeviceType() const
Return the device-side type for the CUDA device builtin surface type.
const T & getABIInfo() const
virtual void setTargetAttributes(const Decl *D, llvm::GlobalValue *GV, CodeGen::CodeGenModule &M) const
setTargetAttributes - Provides a convenient hook to handle extra target-specific attributes for the g...
virtual llvm::Type * getCUDADeviceBuiltinTextureDeviceType() const
Return the device-side type for the CUDA device builtin texture type.
virtual llvm::Constant * getNullPointer(const CodeGen::CodeGenModule &CGM, llvm::PointerType *T, QualType QT) const
Get target specific null pointer.
virtual bool shouldEmitStaticExternCAliases() const
Decl - This represents one declaration (or definition), e.g.
A helper class that allows the use of isa/cast/dyncast to detect TagType objects of enums.
Represents a member of a struct/union/class.
Represents a function declaration or definition.
ArrayRef< ParmVarDecl * > parameters() const
A (possibly-)qualified type.
Represents a struct/union/class.
field_range fields() const
A helper class that allows the use of isa/cast/dyncast to detect TagType objects of structs/unions/cl...
Encodes a location in the source.
virtual bool hasInt128Type() const
Determine whether the __int128 type is supported on this target.
virtual bool hasFloat16Type() const
Determine whether the _Float16 type is supported on this target.
virtual bool hasFloat128Type() const
Determine whether the __float128 type is supported on this target.
bool isFloat16Type() const
bool isIntegerType() const
isIntegerType() does not include complex integers (a GCC extension).
bool isScalarType() const
bool isFloat128Type() const
bool isCUDADeviceBuiltinSurfaceType() const
Check if the type is the CUDA device builtin surface type.
bool isCUDADeviceBuiltinTextureType() const
Check if the type is the CUDA device builtin texture type.
const ArrayType * getAsArrayTypeUnsafe() const
A variant of getAs<> for array types which silently discards qualifiers from the outermost type.
bool isRealFloatingType() const
Floating point categories.
const T * getAs() const
Member-template getAs<specific type>'.
Represents a variable declaration or definition.
ABIArgInfo classifyArgumentType(CodeGenModule &CGM, CanQualType type)
Classify the rules for how to pass a particular type.
bool classifyReturnType(const CGCXXABI &CXXABI, CGFunctionInfo &FI, const ABIInfo &Info)
std::unique_ptr< TargetCodeGenInfo > createNVPTXTargetCodeGenInfo(CodeGenModule &CGM)
RValue emitVoidPtrVAArg(CodeGenFunction &CGF, Address VAListAddr, QualType ValueTy, bool IsIndirect, TypeInfoChars ValueInfo, CharUnits SlotSizeAndAlign, bool AllowHigherAlign, AggValueSlot Slot, bool ForceRightAdjust=false)
Emit va_arg for a platform using the common void* representation, where arguments are simply emitted ...
bool isAggregateTypeForABI(QualType T)
bool Div(InterpState &S, CodePtr OpPC)
1) Pops the RHS from the stack.
The JSON file list parser is used to communicate input to InstallAPI.
const FunctionProtoType * T