1 //===--- AMDGPU.h - Declare AMDGPU target feature support -------*- C++ -*-===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 // This file declares AMDGPU TargetInfo objects.
11 //===----------------------------------------------------------------------===//
13 #ifndef LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H
14 #define LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H
16 #include "clang/Basic/TargetInfo.h"
17 #include "clang/Basic/TargetOptions.h"
18 #include "llvm/ADT/StringSet.h"
19 #include "llvm/ADT/Triple.h"
20 #include "llvm/Support/Compiler.h"
21 #include "llvm/Support/TargetParser.h"
26 class LLVM_LIBRARY_VISIBILITY AMDGPUTargetInfo final : public TargetInfo {
28 static const Builtin::Info BuiltinInfo[];
29 static const char *const GCCRegNames[];
38 static const LangASMap AMDGPUDefIsGenMap;
39 static const LangASMap AMDGPUDefIsPrivMap;
41 llvm::AMDGPU::GPUKind GPUKind;
44 bool hasFP64() const {
45 return getTriple().getArch() == llvm::Triple::amdgcn ||
46 !!(GPUFeatures & llvm::AMDGPU::FEATURE_FP64);
50 bool hasFastFMAF() const {
51 return !!(GPUFeatures & llvm::AMDGPU::FEATURE_FAST_FMA_F32);
55 bool hasFastFMA() const {
56 return getTriple().getArch() == llvm::Triple::amdgcn;
59 bool hasFMAF() const {
60 return getTriple().getArch() == llvm::Triple::amdgcn ||
61 !!(GPUFeatures & llvm::AMDGPU::FEATURE_FMA);
64 bool hasFullRateDenormalsF32() const {
65 return !!(GPUFeatures & llvm::AMDGPU::FEATURE_FAST_DENORMAL_F32);
68 bool hasLDEXPF() const {
69 return getTriple().getArch() == llvm::Triple::amdgcn ||
70 !!(GPUFeatures & llvm::AMDGPU::FEATURE_LDEXP);
73 static bool isAMDGCN(const llvm::Triple &TT) {
74 return TT.getArch() == llvm::Triple::amdgcn;
77 static bool isR600(const llvm::Triple &TT) {
78 return TT.getArch() == llvm::Triple::r600;
82 AMDGPUTargetInfo(const llvm::Triple &Triple, const TargetOptions &Opts);
84 void setAddressSpaceMap(bool DefaultIsPrivate);
86 void adjust(LangOptions &Opts) override;
88 uint64_t getPointerWidthV(unsigned AddrSpace) const override {
89 if (isR600(getTriple()))
92 if (AddrSpace == Private || AddrSpace == Local)
98 uint64_t getPointerAlignV(unsigned AddrSpace) const override {
99 return getPointerWidthV(AddrSpace);
102 uint64_t getMaxPointerWidth() const override {
103 return getTriple().getArch() == llvm::Triple::amdgcn ? 64 : 32;
106 const char *getClobbers() const override { return ""; }
108 ArrayRef<const char *> getGCCRegNames() const override;
110 ArrayRef<TargetInfo::GCCRegAlias> getGCCRegAliases() const override {
114 /// Accepted register names: (n, m is unsigned integer, n < m)
119 /// {S} , where S is a special register name
122 bool validateAsmConstraint(const char *&Name,
123 TargetInfo::ConstraintInfo &Info) const override {
124 static const ::llvm::StringSet<> SpecialRegs({
125 "exec", "vcc", "flat_scratch", "m0", "scc", "tba", "tma",
126 "flat_scratch_lo", "flat_scratch_hi", "vcc_lo", "vcc_hi", "exec_lo",
127 "exec_hi", "tma_lo", "tma_hi", "tba_lo", "tba_hi",
131 bool HasLeftParen = false;
132 if (S.front() == '{') {
138 if (S.front() != 'v' && S.front() != 's') {
141 auto E = S.find('}');
142 if (!SpecialRegs.count(S.substr(0, E)))
144 S = S.drop_front(E + 1);
147 // Found {S} where S is a special register.
148 Info.setAllowsRegister();
157 Info.setAllowsRegister();
161 bool HasLeftBracket = false;
162 if (!S.empty() && S.front() == '[') {
163 HasLeftBracket = true;
166 unsigned long long N;
167 if (S.empty() || consumeUnsignedInteger(S, 10, N))
169 if (!S.empty() && S.front() == ':') {
173 unsigned long long M;
174 if (consumeUnsignedInteger(S, 10, M) || N >= M)
177 if (HasLeftBracket) {
178 if (S.empty() || S.front() != ']')
182 if (S.empty() || S.front() != '}')
187 // Found {vn}, {sn}, {v[n]}, {s[n]}, {v[n:m]}, or {s[n:m]}.
188 Info.setAllowsRegister();
193 // \p Constraint will be left pointing at the last character of
194 // the constraint. In practice, it won't be changed unless the
195 // constraint is longer than one character.
196 std::string convertConstraint(const char *&Constraint) const override {
197 const char *Begin = Constraint;
198 TargetInfo::ConstraintInfo Info("", "");
199 if (validateAsmConstraint(Constraint, Info))
200 return std::string(Begin).substr(0, Constraint - Begin + 1);
203 return std::string(1, *Constraint);
207 initFeatureMap(llvm::StringMap<bool> &Features, DiagnosticsEngine &Diags,
209 const std::vector<std::string> &FeatureVec) const override;
211 void adjustTargetOptions(const CodeGenOptions &CGOpts,
212 TargetOptions &TargetOpts) const override;
214 ArrayRef<Builtin::Info> getTargetBuiltins() const override;
216 void getTargetDefines(const LangOptions &Opts,
217 MacroBuilder &Builder) const override;
219 BuiltinVaListKind getBuiltinVaListKind() const override {
220 return TargetInfo::CharPtrBuiltinVaList;
223 bool isValidCPUName(StringRef Name) const override {
224 if (getTriple().getArch() == llvm::Triple::amdgcn)
225 return llvm::AMDGPU::parseArchAMDGCN(Name) != llvm::AMDGPU::GK_NONE;
226 return llvm::AMDGPU::parseArchR600(Name) != llvm::AMDGPU::GK_NONE;
229 void fillValidCPUList(SmallVectorImpl<StringRef> &Values) const override;
231 bool setCPU(const std::string &Name) override {
232 if (getTriple().getArch() == llvm::Triple::amdgcn) {
233 GPUKind = llvm::AMDGPU::parseArchAMDGCN(Name);
234 GPUFeatures = llvm::AMDGPU::getArchAttrAMDGCN(GPUKind);
236 GPUKind = llvm::AMDGPU::parseArchR600(Name);
237 GPUFeatures = llvm::AMDGPU::getArchAttrR600(GPUKind);
240 return GPUKind != llvm::AMDGPU::GK_NONE;
243 void setSupportedOpenCLOpts() override {
244 auto &Opts = getSupportedOpenCLOpts();
245 Opts.support("cl_clang_storage_class_specifiers");
246 Opts.support("cl_khr_icd");
248 bool IsAMDGCN = isAMDGCN(getTriple());
251 Opts.support("cl_khr_fp64");
253 if (IsAMDGCN || GPUKind >= llvm::AMDGPU::GK_CEDAR) {
254 Opts.support("cl_khr_byte_addressable_store");
255 Opts.support("cl_khr_global_int32_base_atomics");
256 Opts.support("cl_khr_global_int32_extended_atomics");
257 Opts.support("cl_khr_local_int32_base_atomics");
258 Opts.support("cl_khr_local_int32_extended_atomics");
262 Opts.support("cl_khr_fp16");
263 Opts.support("cl_khr_int64_base_atomics");
264 Opts.support("cl_khr_int64_extended_atomics");
265 Opts.support("cl_khr_mipmap_image");
266 Opts.support("cl_khr_subgroups");
267 Opts.support("cl_khr_3d_image_writes");
268 Opts.support("cl_amd_media_ops");
269 Opts.support("cl_amd_media_ops2");
273 LangAS getOpenCLTypeAddrSpace(OpenCLTypeKind TK) const override {
276 return LangAS::opencl_constant;
280 case OCLTK_ReserveID:
281 return LangAS::opencl_global;
284 return TargetInfo::getOpenCLTypeAddrSpace(TK);
288 LangAS getOpenCLBuiltinAddressSpace(unsigned AS) const override {
291 return LangAS::opencl_generic;
293 return LangAS::opencl_global;
295 return LangAS::opencl_local;
297 return LangAS::opencl_constant;
299 return LangAS::opencl_private;
301 return getLangASFromTargetAS(AS);
305 LangAS getCUDABuiltinAddressSpace(unsigned AS) const override {
306 return LangAS::Default;
309 llvm::Optional<LangAS> getConstantAddressSpace() const override {
310 return getLangASFromTargetAS(Constant);
313 /// \returns Target specific vtbl ptr address space.
314 unsigned getVtblPtrAddressSpace() const override {
315 return static_cast<unsigned>(Constant);
318 /// \returns If a target requires an address within a target specific address
319 /// space \p AddressSpace to be converted in order to be used, then return the
320 /// corresponding target specific DWARF address space.
322 /// \returns Otherwise return None and no conversion will be emitted in the
325 getDWARFAddressSpace(unsigned AddressSpace) const override {
326 const unsigned DWARF_Private = 1;
327 const unsigned DWARF_Local = 2;
328 if (AddressSpace == Private) {
329 return DWARF_Private;
330 } else if (AddressSpace == Local) {
337 CallingConvCheckResult checkCallingConvention(CallingConv CC) const override {
342 case CC_OpenCLKernel:
347 // In amdgcn target the null pointer in global, constant, and generic
348 // address space has value 0 but in private and local address space has
350 uint64_t getNullPointerValue(LangAS AS) const override {
351 return AS == LangAS::opencl_local ? ~0 : 0;
354 void setAuxTarget(const TargetInfo *Aux) override;
357 } // namespace targets
360 #endif // LLVM_CLANG_LIB_BASIC_TARGETS_AMDGPU_H