/src/llvm-project/clang/lib/Basic/Targets/NVPTX.h

Source (jump to first uncovered line)
//===--- NVPTX.h - Declare NVPTX target feature support ---------*- C++ -*-===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
//
// This file declares NVPTX TargetInfo objects.
//
//===----------------------------------------------------------------------===//

#ifndef LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H
#define LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H

#include "clang/Basic/Cuda.h"
#include "clang/Basic/TargetInfo.h"
#include "clang/Basic/TargetOptions.h"
#include "llvm/Support/Compiler.h"
#include "llvm/TargetParser/Triple.h"
#include <optional>

namespace clang {
namespace targets {

// Address-space translation table for NVPTX: one entry per language-level
// address space, in the order named by the trailing comments. Each value is
// the NVPTX target address-space number used for that language address space.
// NOTE(review): the entry order presumably has to stay in sync with clang's
// language address-space enumeration -- confirm before adding or reordering
// entries.
static const unsigned NVPTXAddrSpaceMap[] = {
    0, // Default
    1, // opencl_global
    3, // opencl_local
    4, // opencl_constant
    0, // opencl_private
    // FIXME: generic has to be added to the target
    0, // opencl_generic
    1, // opencl_global_device
    1, // opencl_global_host
    1, // cuda_device
    4, // cuda_constant
    3, // cuda_shared
    1, // sycl_global
    1, // sycl_global_device
    1, // sycl_global_host
    3, // sycl_local
    0, // sycl_private
    0, // ptr32_sptr
    0, // ptr32_uptr
    0, // ptr64
    0, // hlsl_groupshared
    // Wasm address space values for this target are dummy values,
    // as it is only enabled for Wasm targets.
    20, // wasm_funcref
};

/// The DWARF address class. Taken from
/// https://docs.nvidia.com/cuda/archive/10.0/ptx-writers-guide-to-interoperability/index.html#cuda-specific-dwarf
///
/// The table is indexed by target address-space number (the values stored in
/// NVPTXAddrSpaceMap). A negative entry means no DWARF address class is
/// defined for that address space; NVPTXTargetInfo::getDWARFAddressSpace
/// reports such entries, and any index past the end of the table, as
/// std::nullopt.
static const int NVPTXDWARFAddrSpaceMap[] = {
    -1, // Default, opencl_private or opencl_generic - not defined
    5,  // opencl_global
    -1, // target address space 2 - no entry of NVPTXAddrSpaceMap maps here
    8,  // opencl_local or cuda_shared
    4,  // opencl_constant or cuda_constant
};

/// TargetInfo implementation for NVPTX targets.
///
/// Keeps track of the selected GPU architecture and PTX version, and holds an
/// optional host TargetInfo that calling-convention checks are forwarded to.
class LLVM_LIBRARY_VISIBILITY NVPTXTargetInfo : public TargetInfo {
  static const char *const GCCRegNames[];
  /// GPU architecture; updated by setCPU().
  CudaArch GPU;
  /// PTX version; published as the "ptx<N>" feature by initFeatureMap().
  uint32_t PTXVersion;
  /// Optional host target; consulted by checkCallingConvention().
  std::unique_ptr<TargetInfo> HostTarget;

public:
  NVPTXTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts,
                  unsigned TargetPointerWidth);

  void getTargetDefines(const LangOptions &Opts,
                        MacroBuilder &Builder) const override;

  ArrayRef<Builtin::Info> getTargetBuiltins() const override;

  /// Enables the feature named after the current GPU architecture and the
  /// "ptx<version>" feature, then defers to the generic TargetInfo logic.
  ///
  /// \returns whatever TargetInfo::initFeatureMap returns.
  bool
  initFeatureMap(llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags,
                 StringRef CPU,
                 const std::vector<std::string> &FeaturesVec) const override {
    const std::string PTXFeature = "ptx" + std::to_string(PTXVersion);
    Features[CudaArchToString(GPU)] = true;
    Features[PTXFeature] = true;
    return TargetInfo::initFeatureMap(Features, Diags, CPU, FeaturesVec);
  }

  bool hasFeature(StringRef Feature) const override;

  ArrayRef<const char *> getGCCRegNames() const override;

  /// \returns an empty list: this target defines no register aliases.
  ArrayRef<TargetInfo::GCCRegAlias> getGCCRegAliases() const override {
    return {};
  }

  /// Accepts the single-letter constraints 'c', 'h', 'r', 'l', 'f' and 'd',
  /// marking each of them as allowing a register operand.
  ///
  /// \returns true if the constraint letter at \p Name is recognized.
  bool validateAsmConstraint(const char *&Name,
                             TargetInfo::ConstraintInfo &Info) const override {
    switch (*Name) {
    case 'c':
    case 'h':
    case 'r':
    case 'l':
    case 'f':
    case 'd':
      break;
    default:
      // Anything else is not a constraint this target understands.
      return false;
    }
    Info.setAllowsRegister();
    return true;
  }

  /// \returns the clobber string for inline assembly, which is empty here.
  std::string_view getClobbers() const override {
    // FIXME: Is this really right?
    return "";
  }

  /// \returns the va_list flavour used by this target (a plain char pointer).
  BuiltinVaListKind getBuiltinVaListKind() const override {
    // FIXME: implement
    return TargetInfo::CharPtrBuiltinVaList;
  }

  /// \returns true if \p Name parses to a known CUDA architecture.
  bool isValidCPUName(StringRef Name) const override {
    const CudaArch Parsed = StringToCudaArch(Name);
    return Parsed != CudaArch::UNKNOWN;
  }

  /// Appends the name of every CudaArch enumerator in the half-open range
  /// [SM_20, Generic) to \p Values.
  void fillValidCPUList(SmallVectorImpl<StringRef> &Values) const override {
    const int FirstArch = static_cast<int>(CudaArch::SM_20);
    const int EndArch = static_cast<int>(CudaArch::Generic);
    for (int ArchIdx = FirstArch; ArchIdx < EndArch; ++ArchIdx)
      Values.emplace_back(CudaArchToString(static_cast<CudaArch>(ArchIdx)));
  }

  /// Selects the GPU architecture named by \p Name.
  ///
  /// The stored architecture is overwritten even when \p Name is not
  /// recognized (it then holds CudaArch::UNKNOWN).
  ///
  /// \returns true if \p Name names a known architecture.
  bool setCPU(const std::string &Name) override {
    GPU = StringToCudaArch(Name);
    const bool IsKnownArch = GPU != CudaArch::UNKNOWN;
    return IsKnownArch;
  }

  /// Marks the OpenCL extensions and features listed below as supported.
  void setSupportedOpenCLOpts() override {
    static const char *const SupportedExtensions[] = {
        "cl_clang_storage_class_specifiers",
        "__cl_clang_function_pointers",
        "__cl_clang_variadic_functions",
        "__cl_clang_non_portable_kernel_param_types",
        "__cl_clang_bitfields",

        "cl_khr_fp64",
        "__opencl_c_fp64",
        "cl_khr_byte_addressable_store",
        "cl_khr_global_int32_base_atomics",
        "cl_khr_global_int32_extended_atomics",
        "cl_khr_local_int32_base_atomics",
        "cl_khr_local_int32_extended_atomics",
    };

    auto &Opts = getSupportedOpenCLOpts();
    for (const char *Extension : SupportedExtensions)
      Opts[Extension] = true;
  }

  /// \returns the OpenMP grid-value table for NVPTX.
  const llvm::omp::GV &getGridValue() const override {
    return llvm::omp::NVPTXGridValues;
  }

  /// Translates a target specific address space into its DWARF address space.
  ///
  /// \returns the DWARF address space recorded in NVPTXDWARFAddrSpaceMap for
  /// \p AddressSpace, or std::nullopt (no conversion is emitted in the DWARF)
  /// when \p AddressSpace lies outside the table or its entry is negative.
  std::optional<unsigned>
  getDWARFAddressSpace(unsigned AddressSpace) const override {
    if (AddressSpace >= std::size(NVPTXDWARFAddrSpaceMap))
      return std::nullopt;

    const int DWARFClass = NVPTXDWARFAddrSpaceMap[AddressSpace];
    if (DWARFClass < 0)
      return std::nullopt;
    return DWARFClass;
  }

  /// Checks whether calling convention \p CC may be used.
  ///
  /// CUDA compilations support all of the host's calling conventions, so the
  /// question is forwarded to the host target when there is one; without a
  /// host target the answer is CCCR_Warning.
  CallingConvCheckResult checkCallingConvention(CallingConv CC) const override {
    // TODO: We should warn if you apply a non-default CC to anything other than
    // a host function.
    if (!HostTarget)
      return CCCR_Warning;
    return HostTarget->checkCallingConvention(CC);
  }

  /// _BitInt types are available on this target.
  bool hasBitIntType() const override { return true; }
  /// The bfloat16 type is available on this target.
  bool hasBFloat16Type() const override { return true; }

  /// \returns the currently selected GPU architecture.
  CudaArch getGPU() const { return GPU; }
};
} // namespace targets
} // namespace clang
#endif // LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H

Line	Count	Source (jump to first uncovered line)
1		//===--- NVPTX.h - Declare NVPTX target feature support ---------*- C++ -*-===//
2		//
3		// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4		// See https://llvm.org/LICENSE.txt for license information.
5		// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6		//
7		//===----------------------------------------------------------------------===//
8		//
9		// This file declares NVPTX TargetInfo objects.
10		//
11		//===----------------------------------------------------------------------===//
12
13		#ifndef LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H
14		#define LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H
15
16		#include "clang/Basic/Cuda.h"
17		#include "clang/Basic/TargetInfo.h"
18		#include "clang/Basic/TargetOptions.h"
19		#include "llvm/Support/Compiler.h"
20		#include "llvm/TargetParser/Triple.h"
21		#include <optional>
22
23		namespace clang {
24		namespace targets {
25
26		static const unsigned NVPTXAddrSpaceMap[] = {
27		0, // Default
28		1, // opencl_global
29		3, // opencl_local
30		4, // opencl_constant
31		0, // opencl_private
32		// FIXME: generic has to be added to the target
33		0, // opencl_generic
34		1, // opencl_global_device
35		1, // opencl_global_host
36		1, // cuda_device
37		4, // cuda_constant
38		3, // cuda_shared
39		1, // sycl_global
40		1, // sycl_global_device
41		1, // sycl_global_host
42		3, // sycl_local
43		0, // sycl_private
44		0, // ptr32_sptr
45		0, // ptr32_uptr
46		0, // ptr64
47		0, // hlsl_groupshared
48		// Wasm address space values for this target are dummy values,
49		// as it is only enabled for Wasm targets.
50		20, // wasm_funcref
51		};
52
53		/// The DWARF address class. Taken from
54		/// https://docs.nvidia.com/cuda/archive/10.0/ptx-writers-guide-to-interoperability/index.html#cuda-specific-dwarf
55		static const int NVPTXDWARFAddrSpaceMap[] = {
56		-1, // Default, opencl_private or opencl_generic - not defined
57		5, // opencl_global
58		-1,
59		8, // opencl_local or cuda_shared
60		4, // opencl_constant or cuda_constant
61		};
62
63		class LLVM_LIBRARY_VISIBILITY NVPTXTargetInfo : public TargetInfo {
64		static const char *const GCCRegNames[];
65		CudaArch GPU;
66		uint32_t PTXVersion;
67		std::unique_ptr<TargetInfo> HostTarget;
68
69		public:
70		NVPTXTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts,
71		unsigned TargetPointerWidth);
72
73		void getTargetDefines(const LangOptions &Opts,
74		MacroBuilder &Builder) const override;
75
76		ArrayRef<Builtin::Info> getTargetBuiltins() const override;
77
78		bool
79		initFeatureMap(llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags,
80		StringRef CPU,
81	0	const std::vector<std::string> &FeaturesVec) const override {
82	0	Features[CudaArchToString(GPU)] = true;
83	0	Features["ptx" + std::to_string(PTXVersion)] = true;
84	0	return TargetInfo::initFeatureMap(Features, Diags, CPU, FeaturesVec);
85	0	}
86
87		bool hasFeature(StringRef Feature) const override;
88
89		ArrayRef<const char *> getGCCRegNames() const override;
90
91	0	ArrayRef<TargetInfo::GCCRegAlias> getGCCRegAliases() const override {
92		// No aliases.
93	0	return std::nullopt;
94	0	}
95
96		bool validateAsmConstraint(const char *&Name,
97	0	TargetInfo::ConstraintInfo &Info) const override {
98	0	switch (*Name) {
99	0	default:
100	0	return false;
101	0	case 'c':
102	0	case 'h':
103	0	case 'r':
104	0	case 'l':
105	0	case 'f':
106	0	case 'd':
107	0	Info.setAllowsRegister();
108	0	return true;
109	0	}
110	0	}
111
112	0	std::string_view getClobbers() const override {
113		// FIXME: Is this really right?
114	0	return "";
115	0	}
116
117	0	BuiltinVaListKind getBuiltinVaListKind() const override {
118		// FIXME: implement
119	0	return TargetInfo::CharPtrBuiltinVaList;
120	0	}
121
122	0	bool isValidCPUName(StringRef Name) const override {
123	0	return StringToCudaArch(Name) != CudaArch::UNKNOWN;
124	0	}
125
126	0	void fillValidCPUList(SmallVectorImpl<StringRef> &Values) const override {
127	0	for (int i = static_cast<int>(CudaArch::SM_20);
128	0	i < static_cast<int>(CudaArch::Generic); ++i)
129	0	Values.emplace_back(CudaArchToString(static_cast<CudaArch>(i)));
130	0	}
131
132	0	bool setCPU(const std::string &Name) override {
133	0	GPU = StringToCudaArch(Name);
134	0	return GPU != CudaArch::UNKNOWN;
135	0	}
136
137	0	void setSupportedOpenCLOpts() override {
138	0	auto &Opts = getSupportedOpenCLOpts();
139	0	Opts["cl_clang_storage_class_specifiers"] = true;
140	0	Opts["__cl_clang_function_pointers"] = true;
141	0	Opts["__cl_clang_variadic_functions"] = true;
142	0	Opts["__cl_clang_non_portable_kernel_param_types"] = true;
143	0	Opts["__cl_clang_bitfields"] = true;
144
145	0	Opts["cl_khr_fp64"] = true;
146	0	Opts["__opencl_c_fp64"] = true;
147	0	Opts["cl_khr_byte_addressable_store"] = true;
148	0	Opts["cl_khr_global_int32_base_atomics"] = true;
149	0	Opts["cl_khr_global_int32_extended_atomics"] = true;
150	0	Opts["cl_khr_local_int32_base_atomics"] = true;
151	0	Opts["cl_khr_local_int32_extended_atomics"] = true;
152	0	}
153
154	0	const llvm::omp::GV &getGridValue() const override {
155	0	return llvm::omp::NVPTXGridValues;
156	0	}
157
158		/// \returns If a target requires an address within a target specific address
159		/// space \p AddressSpace to be converted in order to be used, then return the
160		/// corresponding target specific DWARF address space.
161		///
162		/// \returns Otherwise return std::nullopt and no conversion will be emitted
163		/// in the DWARF.
164		std::optional<unsigned>
165	0	getDWARFAddressSpace(unsigned AddressSpace) const override {
166	0	if (AddressSpace >= std::size(NVPTXDWARFAddrSpaceMap) ||
167	0	NVPTXDWARFAddrSpaceMap[AddressSpace] < 0)
168	0	return std::nullopt;
169	0	return NVPTXDWARFAddrSpaceMap[AddressSpace];
170	0	}
171
172	0	CallingConvCheckResult checkCallingConvention(CallingConv CC) const override {
173		// CUDA compilations support all of the host's calling conventions.
174		//
175		// TODO: We should warn if you apply a non-default CC to anything other than
176		// a host function.
177	0	if (HostTarget)
178	0	return HostTarget->checkCallingConvention(CC);
179	0	return CCCR_Warning;
180	0	}
181
182	0	bool hasBitIntType() const override { return true; }
183	0	bool hasBFloat16Type() const override { return true; }
184
185	0	CudaArch getGPU() const { return GPU; }
186		};
187		} // namespace targets
188		} // namespace clang
189		#endif // LLVM_CLANG_LIB_BASIC_TARGETS_NVPTX_H

Coverage Report

Created: 2024-01-17 10:31