doxygen/NVPTX_8h_source.html

//===--- NVPTX.h - Declare NVPTX target feature support ---------*- C++ -*-===//

//

// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.

// See https://llvm.org/LICENSE.txt for license information.

// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception

//

//===----------------------------------------------------------------------===//

//

// This file declares NVPTX TargetInfo objects.

//

//===----------------------------------------------------------------------===//


#ifndef LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H

#define LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H


#include "clang/Basic/Cuda.h"

#include "clang/Basic/TargetInfo.h"

#include "clang/Basic/TargetOptions.h"

#include "llvm/Support/Compiler.h"

#include "llvm/Support/NVPTXAddrSpace.h"

#include "llvm/TargetParser/Triple.h"

#include <optional>


namespace clang {

namespace targets {


/// Address-space lookup table for the NVPTX target.
///
/// Each entry is annotated with the language address space it belongs to; the
/// value is the address-space number that language address space maps to.
/// The order of the entries is significant and must not be changed.
static const unsigned NVPTXAddrSpaceMap[] = {
    /* Default              */ 0,
    /* opencl_global        */ 1,
    /* opencl_local         */ 3,
    /* opencl_constant      */ 4,
    /* opencl_private       */ 0,
    // FIXME: generic has to be added to the target
    /* opencl_generic       */ 0,
    /* opencl_global_device */ 1,
    /* opencl_global_host   */ 1,
    /* cuda_device          */ 1,
    /* cuda_constant        */ 4,
    /* cuda_shared          */ 3,
    /* sycl_global          */ 1,
    /* sycl_global_device   */ 1,
    /* sycl_global_host     */ 1,
    /* sycl_local           */ 3,
    /* sycl_private         */ 0,
    /* ptr32_sptr           */ 0,
    /* ptr32_uptr           */ 0,
    /* ptr64                */ 0,
    /* hlsl_groupshared     */ 0,
    /* hlsl_constant        */ 0,
    /* hlsl_private         */ 0,
    /* hlsl_device          */ 0,
    /* hlsl_input           */ 0,
    /* hlsl_push_constant   */ 0,
    // Wasm address space values for this target are dummy values,
    // as it is only enabled for Wasm targets.
    /* wasm_funcref         */ 20,
};


/// The DWARF address class. Taken from
/// https://docs.nvidia.com/cuda/archive/10.0/ptx-writers-guide-to-interoperability/index.html#cuda-specific-dwarf
///
/// The table is looked up by address-space number. A negative entry is a
/// sentinel meaning that no DWARF address class is defined for that index.
static const int NVPTXDWARFAddrSpaceMap[] = {
    /* [0] Default, opencl_private or opencl_generic - not defined */ -1,
    /* [1] opencl_global                                           */ 5,
    /* [2] not defined                                             */ -1,
    /* [3] opencl_local or cuda_shared                             */ 8,
    /* [4] opencl_constant or cuda_constant                        */ 4,
};


/// TargetInfo implementation describing the NVPTX target.
///
/// The object tracks the selected GPU architecture, the PTX version and an
/// optional host target. Out-of-line members (constructor, getTargetDefines,
/// getTargetBuiltins, hasFeature, getGCCRegNames) are only declared here.
class LLVM_LIBRARY_VISIBILITY NVPTXTargetInfo : public TargetInfo {
  static const char *const GCCRegNames[];

  /// Currently selected GPU architecture; overwritten by setCPU().
  OffloadArch GPU;

  /// PTX version; exposed as the "ptx<version>" feature by initFeatureMap().
  uint32_t PTXVersion;

  /// Optional host target. When set, checkCallingConvention() defers to it.
  std::unique_ptr<TargetInfo> HostTarget;

public:
  NVPTXTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts,
                  unsigned TargetPointerWidth);

  void getTargetDefines(const LangOptions &Opts,
                        MacroBuilder &Builder) const override;

  llvm::SmallVector<Builtin::InfosShard> getTargetBuiltins() const override;

  /// This target never requests the FP16 conversion intrinsics.
  bool useFP16ConversionIntrinsics() const override { return false; }

  /// Populates \p Features with the target's default features.
  ///
  /// Enables the feature named after the selected GPU (unless the GPU is
  /// OffloadArch::UNUSED) and the "ptx<PTXVersion>" feature, then hands over
  /// to TargetInfo::initFeatureMap for the generic handling.
  ///
  /// \returns whatever TargetInfo::initFeatureMap returns.
  bool
  initFeatureMap(llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags,
                 StringRef CPU,
                 const std::vector<std::string> &FeaturesVec) const override {
    if (GPU != OffloadArch::UNUSED)
      Features[OffloadArchToString(GPU)] = true;
    Features["ptx" + std::to_string(PTXVersion)] = true;
    return TargetInfo::initFeatureMap(Features, Diags, CPU, FeaturesVec);
  }

  bool hasFeature(StringRef Feature) const override;

  /// \returns true if address space \p A is a superset of address space \p B.
  ///
  /// That holds when both are equal, or when \p A is the generic address
  /// space (LangAS::Default or the target address space
  /// ADDRESS_SPACE_GENERIC) and \p B is a target address space whose number
  /// lies in [ADDRESS_SPACE_GENERIC, ADDRESS_SPACE_LOCAL] but is not 2.
  bool isAddressSpaceSupersetOf(LangAS A, LangAS B) const override {
    // The generic address space AS(0) is a superset of all the other address
    // spaces used by the backend target.
    // NOTE(review): the value 2 is excluded explicitly — presumably it does
    // not name an address space used by the backend; confirm against
    // llvm/Support/NVPTXAddrSpace.h.
    return A == B ||
           ((A == LangAS::Default ||
             (isTargetAddressSpace(A) &&
              toTargetAddressSpace(A) ==
                  llvm::NVPTXAS::ADDRESS_SPACE_GENERIC)) &&
            isTargetAddressSpace(B) &&
            toTargetAddressSpace(B) >= llvm::NVPTXAS::ADDRESS_SPACE_GENERIC &&
            toTargetAddressSpace(B) <= llvm::NVPTXAS::ADDRESS_SPACE_LOCAL &&
            toTargetAddressSpace(B) != 2);
  }

  ArrayRef<const char *> getGCCRegNames() const override;

  /// \returns an empty list; this target defines no register aliases.
  ArrayRef<TargetInfo::GCCRegAlias> getGCCRegAliases() const override {
    // No aliases.
    return {};
  }

  /// Validates the inline-asm constraint letter at \p Name.
  ///
  /// The letters 'c', 'h', 'r', 'l', 'f', 'd' and 'q' are accepted and marked
  /// in \p Info as allowing a register; every other letter is rejected.
  ///
  /// \returns true if the constraint is accepted.
  bool validateAsmConstraint(const char *&Name,
                             TargetInfo::ConstraintInfo &Info) const override {
    switch (*Name) {
    default:
      return false;
    case 'c':
    case 'h':
    case 'r':
    case 'l':
    case 'f':
    case 'd':
    case 'q':
      Info.setAllowsRegister();
      return true;
    }
  }

  /// \returns the target-specific clobber string, which is empty here.
  std::string_view getClobbers() const override {
    // FIXME: Is this really right?
    return "";
  }

  /// \returns TargetInfo::CharPtrBuiltinVaList as the __builtin_va_list kind.
  BuiltinVaListKind getBuiltinVaListKind() const override {
    return TargetInfo::CharPtrBuiltinVaList;
  }

  /// \returns true if StringToOffloadArch recognises \p Name, i.e. does not
  /// map it to OffloadArch::UNKNOWN.
  bool isValidCPUName(StringRef Name) const override {
    return StringToOffloadArch(Name) != OffloadArch::UNKNOWN;
  }

  /// Appends to \p Values the name of every OffloadArch enumerator from SM_20
  /// up to, but not including, Generic.
  void fillValidCPUList(SmallVectorImpl<StringRef> &Values) const override {
    for (int i = static_cast<int>(OffloadArch::SM_20);
         i < static_cast<int>(OffloadArch::Generic); ++i)
      Values.emplace_back(OffloadArchToString(static_cast<OffloadArch>(i)));
  }

  /// Selects the GPU architecture named \p Name.
  ///
  /// The parsed value is stored unconditionally, so after a failed call the
  /// stored GPU is OffloadArch::UNKNOWN.
  ///
  /// \returns true if \p Name was recognised.
  bool setCPU(const std::string &Name) override {
    GPU = StringToOffloadArch(Name);
    return GPU != OffloadArch::UNKNOWN;
  }

  /// Marks the OpenCL extensions and optional core features listed below as
  /// supported.
  void setSupportedOpenCLOpts() override {
    auto &Opts = getSupportedOpenCLOpts();
    Opts["cl_clang_storage_class_specifiers"] = true;
    Opts["__cl_clang_function_pointers"] = true;
    Opts["__cl_clang_variadic_functions"] = true;
    Opts["__cl_clang_non_portable_kernel_param_types"] = true;
    Opts["__cl_clang_bitfields"] = true;

    Opts["cl_khr_fp64"] = true;
    Opts["__opencl_c_fp64"] = true;
    Opts["cl_khr_byte_addressable_store"] = true;
    Opts["cl_khr_global_int32_base_atomics"] = true;
    Opts["cl_khr_global_int32_extended_atomics"] = true;
    Opts["cl_khr_local_int32_base_atomics"] = true;
    Opts["cl_khr_local_int32_extended_atomics"] = true;

    Opts["__opencl_c_generic_address_space"] = true;
  }

  /// \returns the NVPTX grid values, llvm::omp::NVPTXGridValues.
  const llvm::omp::GV &getGridValue() const override {
    return llvm::omp::NVPTXGridValues;
  }

  /// \returns If a target requires an address within a target specific address
  /// space \p AddressSpace to be converted in order to be used, then return the
  /// corresponding target specific DWARF address space.
  ///
  /// \returns Otherwise return std::nullopt and no conversion will be emitted
  /// in the DWARF.
  std::optional<unsigned>
  getDWARFAddressSpace(unsigned AddressSpace) const override {
    // Indices past the end of the table and negative table entries both mean
    // that no DWARF address space is defined.
    if (AddressSpace >= std::size(NVPTXDWARFAddrSpaceMap) ||
        NVPTXDWARFAddrSpaceMap[AddressSpace] < 0)
      return std::nullopt;
    return NVPTXDWARFAddrSpaceMap[AddressSpace];
  }

  /// Checks whether calling convention \p CC is valid for this target.
  ///
  /// With a host target present the decision is delegated to it. Otherwise
  /// only CC_DeviceKernel is accepted; everything else yields a warning.
  CallingConvCheckResult checkCallingConvention(CallingConv CC) const override {
    // CUDA compilations support all of the host's calling conventions.
    //
    // TODO: We should warn if you apply a non-default CC to anything other than
    // a host function.
    if (HostTarget)
      return HostTarget->checkCallingConvention(CC);
    return CC == CC_DeviceKernel ? CCCR_OK : CCCR_Warning;
  }

  /// The _BitInt type is reported as supported.
  bool hasBitIntType() const override { return true; }

  /// The bfloat16 type is reported as supported.
  bool hasBFloat16Type() const override { return true; }

  /// \returns the currently selected GPU architecture.
  OffloadArch getGPU() const { return GPU; }
};


} // namespace targets

} // namespace clang

#endif // LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H

AttrFeatureKind::Feature
@ Feature
Definition LoongArch.cpp:416

hasFeature
static bool hasFeature(StringRef Feature, const LangOptions &LangOpts, const TargetInfo &Target)
Determine whether a translation unit built using the current language options has the given feature.
Definition Module.cpp:95

TargetOptions.h
Defines the clang::TargetOptions class.

clang::DiagnosticsEngine
Concrete class used by the front-end to report problems and issues.
Definition Diagnostic.h:232

clang::LangOptions
Keeps track of the various options that can be enabled, which controls the dialect of C or C++ that i...
Definition LangOptions.h:452

clang::MacroBuilder
Definition MacroBuilder.h:23

clang::TargetInfo::TargetInfo
TargetInfo(const llvm::Triple &T)
Definition TargetInfo.cpp:60

clang::TargetInfo::BuiltinVaListKind
BuiltinVaListKind
The different kinds of __builtin_va_list types defined by the target implementation.
Definition TargetInfo.h:333

clang::TargetInfo::CharPtrBuiltinVaList
@ CharPtrBuiltinVaList
typedef char* __builtin_va_list;
Definition TargetInfo.h:335

clang::TargetInfo::getSupportedOpenCLOpts
llvm::StringMap< bool > & getSupportedOpenCLOpts()
Get supported OpenCL extensions and optional core features.
Definition TargetInfo.h:1865

clang::TargetInfo::CallingConvCheckResult
CallingConvCheckResult
Definition TargetInfo.h:1760

clang::TargetInfo::CCCR_Warning
@ CCCR_Warning
Definition TargetInfo.h:1762

clang::TargetInfo::CCCR_OK
@ CCCR_OK
Definition TargetInfo.h:1761

clang::TargetInfo::initFeatureMap
virtual bool initFeatureMap(llvm::StringMap< bool > &Features, DiagnosticsEngine &Diags, StringRef CPU, const std::vector< std::string > &FeatureVec) const
Initialize the map with the default set of target features for the CPU this should include all legal ...
Definition TargetInfo.cpp:566

clang::TargetOptions
Options for controlling the target.
Definition TargetOptions.h:26

clang::targets::NVPTXTargetInfo::hasBitIntType
bool hasBitIntType() const override
Determine whether the _BitInt type is supported on this target.
Definition NVPTX.h:207

clang::targets::NVPTXTargetInfo::getBuiltinVaListKind
BuiltinVaListKind getBuiltinVaListKind() const override
Returns the kind of __builtin_va_list type that should be used with this target.
Definition NVPTX.h:141

clang::targets::NVPTXTargetInfo::getGPU
OffloadArch getGPU() const
Definition NVPTX.h:210

clang::targets::NVPTXTargetInfo::isAddressSpaceSupersetOf
virtual bool isAddressSpaceSupersetOf(LangAS A, LangAS B) const override
Returns true if an address space can be safely converted to another.
Definition NVPTX.h:98

clang::targets::NVPTXTargetInfo::NVPTXTargetInfo
NVPTXTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts, unsigned TargetPointerWidth)
Definition NVPTX.cpp:38

clang::targets::NVPTXTargetInfo::getTargetDefines
void getTargetDefines(const LangOptions &Opts, MacroBuilder &Builder) const override
//===--- Other target property query methods ---------------------------===//
Definition NVPTX.cpp:171

clang::targets::NVPTXTargetInfo::getGCCRegAliases
ArrayRef< TargetInfo::GCCRegAlias > getGCCRegAliases() const override
Definition NVPTX.h:114

clang::targets::NVPTXTargetInfo::fillValidCPUList
void fillValidCPUList(SmallVectorImpl< StringRef > &Values) const override
Fill a SmallVectorImpl with the valid values to setCPU.
Definition NVPTX.h:149

clang::targets::NVPTXTargetInfo::validateAsmConstraint
bool validateAsmConstraint(const char *&Name, TargetInfo::ConstraintInfo &Info) const override
Definition NVPTX.h:119

clang::targets::NVPTXTargetInfo::hasBFloat16Type
bool hasBFloat16Type() const override
Determine whether the _BFloat16 type is supported on this target.
Definition NVPTX.h:208

clang::targets::NVPTXTargetInfo::getClobbers
std::string_view getClobbers() const override
Returns a string of target-specific clobbers, in LLVM format.
Definition NVPTX.h:136

clang::targets::NVPTXTargetInfo::getTargetBuiltins
llvm::SmallVector< Builtin::InfosShard > getTargetBuiltins() const override
Return information about target-specific builtins for the current primary target, and info about whic...
Definition NVPTX.cpp:192

clang::targets::NVPTXTargetInfo::getDWARFAddressSpace
std::optional< unsigned > getDWARFAddressSpace(unsigned AddressSpace) const override
Definition NVPTX.h:190

clang::targets::NVPTXTargetInfo::getGridValue
const llvm::omp::GV & getGridValue() const override
Definition NVPTX.h:179

clang::targets::NVPTXTargetInfo::setCPU
bool setCPU(const std::string &Name) override
Target the specified CPU.
Definition NVPTX.h:155

clang::targets::NVPTXTargetInfo::checkCallingConvention
CallingConvCheckResult checkCallingConvention(CallingConv CC) const override
Determines whether a given calling convention is valid for the target.
Definition NVPTX.h:197

clang::targets::NVPTXTargetInfo::isValidCPUName
bool isValidCPUName(StringRef Name) const override
Determine whether this TargetInfo supports the given CPU name.
Definition NVPTX.h:145

clang::targets::NVPTXTargetInfo::useFP16ConversionIntrinsics
bool useFP16ConversionIntrinsics() const override
Check whether conversions to and from __fp16 should go through an integer bitcast with i16.
Definition NVPTX.h:84

clang::targets::NVPTXTargetInfo::initFeatureMap
bool initFeatureMap(llvm::StringMap< bool > &Features, DiagnosticsEngine &Diags, StringRef CPU, const std::vector< std::string > &FeaturesVec) const override
Initialize the map with the default set of target features for the CPU this should include all legal ...
Definition NVPTX.h:87

clang::targets::NVPTXTargetInfo::setSupportedOpenCLOpts
void setSupportedOpenCLOpts() override
Set supported OpenCL extensions and optional core features.
Definition NVPTX.h:160

llvm::ArrayRef
Definition LLVM.h:31

llvm::SmallVectorImpl
Definition Randstruct.h:18

llvm::SmallVector
Definition LLVM.h:34

Cuda.h

TargetInfo.h
Defines the clang::TargetInfo interface.

clang::targets
Definition TargetInfo.h:1964

clang::targets::NVPTXAddrSpaceMap
static const unsigned NVPTXAddrSpaceMap[]
Definition NVPTX.h:27

clang::targets::NVPTXDWARFAddrSpaceMap
static const int NVPTXDWARFAddrSpaceMap[]
The DWARF address class.
Definition NVPTX.h:61

clang
The JSON file list parser is used to communicate input to InstallAPI.
Definition CalledOnceCheck.h:17

clang::isTargetAddressSpace
bool isTargetAddressSpace(LangAS AS)
Definition AddressSpaces.h:82

clang::OffloadArch
OffloadArch
Definition OffloadArch.h:18

clang::OffloadArch::UNUSED
@ UNUSED
Definition OffloadArch.h:19

clang::OffloadArch::UNKNOWN
@ UNKNOWN
Definition OffloadArch.h:20

clang::OffloadArch::Generic
@ Generic
Definition OffloadArch.h:112

clang::OffloadArch::SM_20
@ SM_20
Definition OffloadArch.h:22

clang::toTargetAddressSpace
unsigned toTargetAddressSpace(LangAS AS)
Definition AddressSpaces.h:86

clang::StringToOffloadArch
OffloadArch StringToOffloadArch(llvm::StringRef S)
Definition OffloadArch.cpp:130

clang::LangAS
LangAS
Defines the address space values used by the address space qualifier of QualType.
Definition AddressSpaces.h:25

clang::LangAS::Default
@ Default
Definition AddressSpaces.h:28

clang::OffloadArchToString
const char * OffloadArchToString(OffloadArch A)
Definition OffloadArch.cpp:110

clang::CallingConv
CallingConv
CallingConv - Specifies the calling convention that a function uses.
Definition Specifiers.h:278

clang::CC_DeviceKernel
@ CC_DeviceKernel
Definition Specifiers.h:292

clang::TargetInfo::ConstraintInfo
Definition TargetInfo.h:1127

clang::TargetInfo::ConstraintInfo::setAllowsRegister
void setAllowsRegister()
Definition TargetInfo.h:1192